diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.3434, "train/learning_rate": 2.5073239436619717e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 26859, "_timestamp": 1648168203, "_step": 4502, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 8.0, 19.0, 11.0, 11.0, 18.0, 20.0, 23.0, 37.0, 21.0, 38.0, 48.0, 54.0, 42.0, 54.0, 50.0, 59.0, 50.0, 58.0, 46.0, 51.0, 35.0, 31.0, 40.0, 26.0, 30.0, 15.0, 23.0, 5.0, 10.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.145931243896484, -46.14273452758789, -45.13954162597656, -44.13634490966797, -43.133148193359375, -42.12995147705078, -41.12675476074219, -40.12356185913086, -39.120365142822266, -38.11716842651367, -37.113975524902344, -36.11077880859375, -35.107582092285156, -34.10438537597656, -33.10118865966797, -32.09799575805664, -31.094799041748047, -30.091602325439453, -29.088407516479492, -28.08521270751953, -27.082015991210938, -26.078819274902344, -25.075624465942383, -24.072429656982422, -23.069232940673828, -22.066036224365234, -21.062841415405273, -20.059646606445312, -19.05644989013672, -18.053253173828125, -17.050058364868164, -16.046863555908203, -15.04366683959961, -14.040471076965332, -13.037275314331055, -12.034079551696777, -11.0308837890625, -10.027688026428223, -9.024492263793945, -8.021296501159668, -7.018100738525391, -6.014904975891113, -5.011709213256836, -4.008513450622559, -3.0053176879882812, -2.002121925354004, -0.9989261627197266, 0.004269599914550781, 1.0074653625488281, 2.0106611251831055, 3.013856887817383, 4.01705265045166, 5.0202484130859375, 6.023444175720215, 7.026639938354492, 8.02983570098877, 9.033031463623047, 10.036227226257324, 11.039422988891602, 12.042618751525879, 13.045814514160156, 14.049010276794434, 15.052206039428711, 16.055400848388672, 17.058597564697266]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 1.0, 7.0, 14.0, 6.0, 12.0, 9.0, 16.0, 18.0, 12.0, 17.0, 25.0, 20.0, 28.0, 28.0, 26.0, 31.0, 42.0, 32.0, 27.0, 45.0, 31.0, 34.0, 30.0, 38.0, 45.0, 43.0, 32.0, 27.0, 38.0, 26.0, 31.0, 23.0, 22.0, 18.0, 16.0, 19.0, 19.0, 10.0, 16.0, 17.0, 13.0, 11.0, 2.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.34871482849121, -23.52866554260254, -22.708616256713867, -21.888566970825195, -21.068517684936523, -20.24846839904785, -19.42841911315918, -18.608369827270508, -17.788320541381836, -16.968271255493164, -16.148221969604492, -15.32817268371582, -14.508123397827148, -13.688074111938477, -12.868024826049805, -12.047975540161133, -11.227926254272461, -10.407876968383789, -9.587827682495117, -8.767778396606445, -7.947729110717773, -7.127679824829102, -6.30763053894043, -5.487581253051758, -4.667531967163086, -3.847482681274414, -3.027433395385742, -2.2073841094970703, -1.3873348236083984, -0.5672855377197266, 0.2527637481689453, 1.0728130340576172, 1.8928642272949219, 2.7129135131835938, 3.5329627990722656, 4.3530120849609375, 5.173061370849609, 5.993110656738281, 6.813159942626953, 7.633209228515625, 8.453258514404297, 9.273307800292969, 10.09335708618164, 10.913406372070312, 11.733455657958984, 12.553504943847656, 13.373554229736328, 14.193603515625, 15.013652801513672, 15.833702087402344, 16.653751373291016, 17.473800659179688, 18.29384994506836, 19.11389923095703, 19.933948516845703, 20.753997802734375, 21.574047088623047, 22.39409637451172, 23.21414566040039, 24.034194946289062, 24.854244232177734, 25.674293518066406, 26.494342803955078, 27.31439208984375, 28.134441375732422]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 8.0, 22.0, 26.0, 52.0, 82.0, 142.0, 226.0, 408.0, 652.0, 1048.0, 1850.0, 3235.0, 5480.0, 9769.0, 16576.0, 29675.0, 51925.0, 90893.0, 156444.0, 256832.0, 401361.0, 560558.0, 658964.0, 629369.0, 491966.0, 333319.0, 206527.0, 121915.0, 70879.0, 40066.0, 22798.0, 13093.0, 7371.0, 4458.0, 2564.0, 1489.0, 864.0, 550.0, 307.0, 199.0, 117.0, 63.0, 46.0, 38.0, 22.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-25.21875, -24.425048828125, -23.63134765625, -22.837646484375, -22.0439453125, -21.250244140625, -20.45654296875, -19.662841796875, -18.869140625, -18.075439453125, -17.28173828125, -16.488037109375, -15.6943359375, -14.900634765625, -14.10693359375, -13.313232421875, -12.51953125, -11.725830078125, -10.93212890625, -10.138427734375, -9.3447265625, -8.551025390625, -7.75732421875, -6.963623046875, -6.169921875, -5.376220703125, -4.58251953125, -3.788818359375, -2.9951171875, -2.201416015625, -1.40771484375, -0.614013671875, 0.1796875, 0.973388671875, 1.76708984375, 2.560791015625, 3.3544921875, 4.148193359375, 4.94189453125, 5.735595703125, 6.529296875, 7.322998046875, 8.11669921875, 8.910400390625, 9.7041015625, 10.497802734375, 11.29150390625, 12.085205078125, 12.87890625, 13.672607421875, 14.46630859375, 15.260009765625, 16.0537109375, 16.847412109375, 17.64111328125, 18.434814453125, 19.228515625, 20.022216796875, 20.81591796875, 21.609619140625, 22.4033203125, 23.197021484375, 23.99072265625, 24.784423828125, 25.578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 5.0, 8.0, 11.0, 11.0, 11.0, 19.0, 16.0, 21.0, 15.0, 30.0, 18.0, 31.0, 33.0, 28.0, 41.0, 31.0, 33.0, 49.0, 48.0, 45.0, 40.0, 36.0, 26.0, 35.0, 36.0, 29.0, 36.0, 29.0, 29.0, 27.0, 18.0, 13.0, 22.0, 11.0, 11.0, 15.0, 15.0, 9.0, 8.0, 7.0, 8.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.828125, -20.1787109375, -19.529296875, -18.8798828125, -18.23046875, -17.5810546875, -16.931640625, -16.2822265625, -15.6328125, -14.9833984375, -14.333984375, -13.6845703125, -13.03515625, -12.3857421875, -11.736328125, -11.0869140625, -10.4375, -9.7880859375, -9.138671875, -8.4892578125, -7.83984375, -7.1904296875, -6.541015625, -5.8916015625, -5.2421875, -4.5927734375, -3.943359375, -3.2939453125, -2.64453125, -1.9951171875, -1.345703125, -0.6962890625, -0.046875, 0.6025390625, 1.251953125, 1.9013671875, 2.55078125, 3.2001953125, 3.849609375, 4.4990234375, 5.1484375, 5.7978515625, 6.447265625, 7.0966796875, 7.74609375, 8.3955078125, 9.044921875, 9.6943359375, 10.34375, 10.9931640625, 11.642578125, 12.2919921875, 12.94140625, 13.5908203125, 14.240234375, 14.8896484375, 15.5390625, 16.1884765625, 16.837890625, 17.4873046875, 18.13671875, 18.7861328125, 19.435546875, 20.0849609375, 20.734375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 14.0, 31.0, 34.0, 51.0, 90.0, 107.0, 213.0, 375.0, 683.0, 1197.0, 2065.0, 3555.0, 6384.0, 11185.0, 19083.0, 33172.0, 56416.0, 92094.0, 145956.0, 222635.0, 318146.0, 423327.0, 510879.0, 545873.0, 505098.0, 414425.0, 309257.0, 214775.0, 140354.0, 88363.0, 53664.0, 31565.0, 18397.0, 10652.0, 5984.0, 3472.0, 1881.0, 1200.0, 638.0, 397.0, 209.0, 151.0, 91.0, 41.0, 39.0, 15.0, 10.0, 15.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-20.171875, -19.487060546875, -18.80224609375, -18.117431640625, -17.4326171875, -16.747802734375, -16.06298828125, -15.378173828125, -14.693359375, -14.008544921875, -13.32373046875, -12.638916015625, -11.9541015625, -11.269287109375, -10.58447265625, -9.899658203125, -9.21484375, -8.530029296875, -7.84521484375, -7.160400390625, -6.4755859375, -5.790771484375, -5.10595703125, -4.421142578125, -3.736328125, -3.051513671875, -2.36669921875, -1.681884765625, -0.9970703125, -0.312255859375, 0.37255859375, 1.057373046875, 1.7421875, 2.427001953125, 3.11181640625, 3.796630859375, 4.4814453125, 5.166259765625, 5.85107421875, 6.535888671875, 7.220703125, 7.905517578125, 8.59033203125, 9.275146484375, 9.9599609375, 10.644775390625, 11.32958984375, 12.014404296875, 12.69921875, 13.384033203125, 14.06884765625, 14.753662109375, 15.4384765625, 16.123291015625, 16.80810546875, 17.492919921875, 18.177734375, 18.862548828125, 19.54736328125, 20.232177734375, 20.9169921875, 21.601806640625, 22.28662109375, 22.971435546875, 23.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 20.0, 20.0, 29.0, 34.0, 43.0, 66.0, 68.0, 82.0, 108.0, 137.0, 156.0, 203.0, 225.0, 240.0, 290.0, 240.0, 279.0, 276.0, 233.0, 213.0, 193.0, 171.0, 131.0, 134.0, 109.0, 88.0, 61.0, 54.0, 40.0, 29.0, 23.0, 18.0, 11.0, 6.0, 5.0, 9.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.613037109375, -10.24951171875, -9.885986328125, -9.5224609375, -9.158935546875, -8.79541015625, -8.431884765625, -8.068359375, -7.704833984375, -7.34130859375, -6.977783203125, -6.6142578125, -6.250732421875, -5.88720703125, -5.523681640625, -5.16015625, -4.796630859375, -4.43310546875, -4.069580078125, -3.7060546875, -3.342529296875, -2.97900390625, -2.615478515625, -2.251953125, -1.888427734375, -1.52490234375, -1.161376953125, -0.7978515625, -0.434326171875, -0.07080078125, 0.292724609375, 0.65625, 1.019775390625, 1.38330078125, 1.746826171875, 2.1103515625, 2.473876953125, 2.83740234375, 3.200927734375, 3.564453125, 3.927978515625, 4.29150390625, 4.655029296875, 5.0185546875, 5.382080078125, 5.74560546875, 6.109130859375, 6.47265625, 6.836181640625, 7.19970703125, 7.563232421875, 7.9267578125, 8.290283203125, 8.65380859375, 9.017333984375, 9.380859375, 9.744384765625, 10.10791015625, 10.471435546875, 10.8349609375, 11.198486328125, 11.56201171875, 11.925537109375, 12.2890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 6.0, 14.0, 16.0, 21.0, 28.0, 26.0, 21.0, 30.0, 26.0, 38.0, 42.0, 56.0, 44.0, 39.0, 49.0, 48.0, 48.0, 43.0, 41.0, 48.0, 47.0, 33.0, 36.0, 31.0, 26.0, 17.0, 25.0, 10.0, 14.0, 9.0, 4.0, 4.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.54071617126465, -25.7466983795166, -24.952680587768555, -24.158662796020508, -23.364646911621094, -22.570629119873047, -21.776611328125, -20.982593536376953, -20.188575744628906, -19.39455795288086, -18.600540161132812, -17.806522369384766, -17.01250457763672, -16.218488693237305, -15.424470901489258, -14.630453109741211, -13.836435317993164, -13.042417526245117, -12.24839973449707, -11.45438289642334, -10.660365104675293, -9.866347312927246, -9.072330474853516, -8.278312683105469, -7.484294891357422, -6.690277099609375, -5.896259784698486, -5.102242469787598, -4.308224678039551, -3.514207124710083, -2.7201895713806152, -1.9261722564697266, -1.1321544647216797, -0.3381369113922119, 0.45588064193725586, 1.2498981952667236, 2.0439157485961914, 2.837933301925659, 3.631950855255127, 4.425968170166016, 5.2199859619140625, 6.014003753662109, 6.808021068572998, 7.602038383483887, 8.396056175231934, 9.19007396697998, 9.984090805053711, 10.778108596801758, 11.572126388549805, 12.366144180297852, 13.160161972045898, 13.954178810119629, 14.748196601867676, 15.542214393615723, 16.336231231689453, 17.1302490234375, 17.924266815185547, 18.718284606933594, 19.51230239868164, 20.306320190429688, 21.100337982177734, 21.89435386657715, 22.688371658325195, 23.482389450073242, 24.27640724182129]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 24.0, 25.0, 20.0, 23.0, 32.0, 25.0, 21.0, 30.0, 31.0, 38.0, 34.0, 37.0, 38.0, 44.0, 49.0, 42.0, 35.0, 38.0, 28.0, 37.0, 33.0, 32.0, 20.0, 21.0, 22.0, 18.0, 16.0, 13.0, 15.0, 10.0, 12.0, 8.0, 9.0, 14.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-23.881210327148438, -23.164676666259766, -22.448143005371094, -21.731609344482422, -21.01507568359375, -20.29854393005371, -19.58201026916504, -18.865476608276367, -18.148942947387695, -17.432409286499023, -16.71587562561035, -15.999342918395996, -15.282809257507324, -14.566275596618652, -13.849742889404297, -13.133209228515625, -12.416675567626953, -11.700141906738281, -10.98360824584961, -10.267075538635254, -9.550541877746582, -8.83400821685791, -8.117475509643555, -7.400941848754883, -6.684408187866211, -5.967874526977539, -5.251341342926025, -4.534808158874512, -3.81827449798584, -3.101741075515747, -2.3852076530456543, -1.6686744689941406, -0.9521408081054688, -0.23560738563537598, 0.4809260368347168, 1.1974594593048096, 1.9139928817749023, 2.630526304244995, 3.347059726715088, 4.063592910766602, 4.780126571655273, 5.496660232543945, 6.213193416595459, 6.929726600646973, 7.6462602615356445, 8.362793922424316, 9.079326629638672, 9.795860290527344, 10.512393951416016, 11.228927612304688, 11.94546127319336, 12.661993980407715, 13.378527641296387, 14.095061302185059, 14.811594009399414, 15.528127670288086, 16.244661331176758, 16.96119499206543, 17.6777286529541, 18.394262313842773, 19.110794067382812, 19.827327728271484, 20.543861389160156, 21.260395050048828, 21.9769287109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 16.0, 21.0, 28.0, 49.0, 93.0, 142.0, 207.0, 312.0, 495.0, 690.0, 1197.0, 1905.0, 2997.0, 4486.0, 6909.0, 10652.0, 16423.0, 24872.0, 38160.0, 57801.0, 85411.0, 118619.0, 147336.0, 148610.0, 121910.0, 87269.0, 59070.0, 39046.0, 25456.0, 17078.0, 11167.0, 7179.0, 4603.0, 2957.0, 1954.0, 1271.0, 778.0, 516.0, 311.0, 196.0, 124.0, 87.0, 54.0, 33.0, 18.0, 25.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.203125, -23.447509765625, -22.69189453125, -21.936279296875, -21.1806640625, -20.425048828125, -19.66943359375, -18.913818359375, -18.158203125, -17.402587890625, -16.64697265625, -15.891357421875, -15.1357421875, -14.380126953125, -13.62451171875, -12.868896484375, -12.11328125, -11.357666015625, -10.60205078125, -9.846435546875, -9.0908203125, -8.335205078125, -7.57958984375, -6.823974609375, -6.068359375, -5.312744140625, -4.55712890625, -3.801513671875, -3.0458984375, -2.290283203125, -1.53466796875, -0.779052734375, -0.0234375, 0.732177734375, 1.48779296875, 2.243408203125, 2.9990234375, 3.754638671875, 4.51025390625, 5.265869140625, 6.021484375, 6.777099609375, 7.53271484375, 8.288330078125, 9.0439453125, 9.799560546875, 10.55517578125, 11.310791015625, 12.06640625, 12.822021484375, 13.57763671875, 14.333251953125, 15.0888671875, 15.844482421875, 16.60009765625, 17.355712890625, 18.111328125, 18.866943359375, 19.62255859375, 20.378173828125, 21.1337890625, 21.889404296875, 22.64501953125, 23.400634765625, 24.15625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 7.0, 14.0, 12.0, 15.0, 21.0, 25.0, 18.0, 22.0, 22.0, 26.0, 33.0, 41.0, 29.0, 33.0, 32.0, 28.0, 45.0, 42.0, 55.0, 27.0, 42.0, 43.0, 31.0, 28.0, 35.0, 30.0, 27.0, 21.0, 21.0, 22.0, 20.0, 16.0, 10.0, 8.0, 13.0, 17.0, 6.0, 7.0, 6.0, 5.0, 3.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-23.53125, -22.84326171875, -22.1552734375, -21.46728515625, -20.779296875, -20.09130859375, -19.4033203125, -18.71533203125, -18.02734375, -17.33935546875, -16.6513671875, -15.96337890625, -15.275390625, -14.58740234375, -13.8994140625, -13.21142578125, -12.5234375, -11.83544921875, -11.1474609375, -10.45947265625, -9.771484375, -9.08349609375, -8.3955078125, -7.70751953125, -7.01953125, -6.33154296875, -5.6435546875, -4.95556640625, -4.267578125, -3.57958984375, -2.8916015625, -2.20361328125, -1.515625, -0.82763671875, -0.1396484375, 0.54833984375, 1.236328125, 1.92431640625, 2.6123046875, 3.30029296875, 3.98828125, 4.67626953125, 5.3642578125, 6.05224609375, 6.740234375, 7.42822265625, 8.1162109375, 8.80419921875, 9.4921875, 10.18017578125, 10.8681640625, 11.55615234375, 12.244140625, 12.93212890625, 13.6201171875, 14.30810546875, 14.99609375, 15.68408203125, 16.3720703125, 17.06005859375, 17.748046875, 18.43603515625, 19.1240234375, 19.81201171875, 20.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 12.0, 18.0, 25.0, 51.0, 75.0, 121.0, 173.0, 223.0, 362.0, 591.0, 922.0, 1352.0, 2029.0, 3039.0, 4745.0, 7222.0, 11090.0, 17712.0, 27944.0, 44362.0, 71287.0, 110192.0, 154529.0, 173421.0, 144395.0, 99952.0, 63581.0, 39595.0, 25162.0, 15667.0, 10170.0, 6456.0, 4290.0, 2632.0, 1803.0, 1174.0, 820.0, 494.0, 298.0, 224.0, 125.0, 89.0, 47.0, 29.0, 20.0, 13.0, 7.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.05859375, -19.3984375, -18.73828125, -18.078125, -17.41796875, -16.7578125, -16.09765625, -15.4375, -14.77734375, -14.1171875, -13.45703125, -12.796875, -12.13671875, -11.4765625, -10.81640625, -10.15625, -9.49609375, -8.8359375, -8.17578125, -7.515625, -6.85546875, -6.1953125, -5.53515625, -4.875, -4.21484375, -3.5546875, -2.89453125, -2.234375, -1.57421875, -0.9140625, -0.25390625, 0.40625, 1.06640625, 1.7265625, 2.38671875, 3.046875, 3.70703125, 4.3671875, 5.02734375, 5.6875, 6.34765625, 7.0078125, 7.66796875, 8.328125, 8.98828125, 9.6484375, 10.30859375, 10.96875, 11.62890625, 12.2890625, 12.94921875, 13.609375, 14.26953125, 14.9296875, 15.58984375, 16.25, 16.91015625, 17.5703125, 18.23046875, 18.890625, 19.55078125, 20.2109375, 20.87109375, 21.53125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 3.0, 2.0, 8.0, 8.0, 8.0, 12.0, 13.0, 8.0, 14.0, 13.0, 12.0, 14.0, 24.0, 31.0, 25.0, 18.0, 29.0, 45.0, 40.0, 40.0, 34.0, 41.0, 46.0, 34.0, 43.0, 41.0, 35.0, 50.0, 31.0, 39.0, 28.0, 25.0, 25.0, 31.0, 20.0, 23.0, 16.0, 20.0, 9.0, 7.0, 5.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -17.0335693359375, -16.520263671875, -16.0069580078125, -15.49365234375, -14.9803466796875, -14.467041015625, -13.9537353515625, -13.4404296875, -12.9271240234375, -12.413818359375, -11.9005126953125, -11.38720703125, -10.8739013671875, -10.360595703125, -9.8472900390625, -9.333984375, -8.8206787109375, -8.307373046875, -7.7940673828125, -7.28076171875, -6.7674560546875, -6.254150390625, -5.7408447265625, -5.2275390625, -4.7142333984375, -4.200927734375, -3.6876220703125, -3.17431640625, -2.6610107421875, -2.147705078125, -1.6343994140625, -1.12109375, -0.6077880859375, -0.094482421875, 0.4188232421875, 0.93212890625, 1.4454345703125, 1.958740234375, 2.4720458984375, 2.9853515625, 3.4986572265625, 4.011962890625, 4.5252685546875, 5.03857421875, 5.5518798828125, 6.065185546875, 6.5784912109375, 7.091796875, 7.6051025390625, 8.118408203125, 8.6317138671875, 9.14501953125, 9.6583251953125, 10.171630859375, 10.6849365234375, 11.1982421875, 11.7115478515625, 12.224853515625, 12.7381591796875, 13.25146484375, 13.7647705078125, 14.278076171875, 14.7913818359375, 15.3046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 19.0, 16.0, 27.0, 48.0, 69.0, 105.0, 140.0, 258.0, 333.0, 535.0, 905.0, 1767.0, 3794.0, 10153.0, 32774.0, 142110.0, 609087.0, 186160.0, 39673.0, 11670.0, 4311.0, 1935.0, 1009.0, 597.0, 316.0, 224.0, 133.0, 115.0, 71.0, 49.0, 41.0, 27.0, 21.0, 14.0, 11.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.75, -44.921875, -43.09375, -41.265625, -39.4375, -37.609375, -35.78125, -33.953125, -32.125, -30.296875, -28.46875, -26.640625, -24.8125, -22.984375, -21.15625, -19.328125, -17.5, -15.671875, -13.84375, -12.015625, -10.1875, -8.359375, -6.53125, -4.703125, -2.875, -1.046875, 0.78125, 2.609375, 4.4375, 6.265625, 8.09375, 9.921875, 11.75, 13.578125, 15.40625, 17.234375, 19.0625, 20.890625, 22.71875, 24.546875, 26.375, 28.203125, 30.03125, 31.859375, 33.6875, 35.515625, 37.34375, 39.171875, 41.0, 42.828125, 44.65625, 46.484375, 48.3125, 50.140625, 51.96875, 53.796875, 55.625, 57.453125, 59.28125, 61.109375, 62.9375, 64.765625, 66.59375, 68.421875, 70.25]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 8.0, 12.0, 19.0, 22.0, 46.0, 60.0, 98.0, 175.0, 213.0, 109.0, 70.0, 44.0, 23.0, 26.0, 12.0, 12.0, 11.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005031585693359375, -0.004888176918029785, -0.004744768142700195, -0.0046013593673706055, -0.004457950592041016, -0.004314541816711426, -0.004171133041381836, -0.004027724266052246, -0.0038843154907226562, -0.0037409067153930664, -0.0035974979400634766, -0.0034540891647338867, -0.003310680389404297, -0.003167271614074707, -0.003023862838745117, -0.0028804540634155273, -0.0027370452880859375, -0.0025936365127563477, -0.002450227737426758, -0.002306818962097168, -0.002163410186767578, -0.0020200014114379883, -0.0018765926361083984, -0.0017331838607788086, -0.0015897750854492188, -0.001446366310119629, -0.001302957534790039, -0.0011595487594604492, -0.0010161399841308594, -0.0008727312088012695, -0.0007293224334716797, -0.0005859136581420898, -0.0004425048828125, -0.00029909610748291016, -0.0001556873321533203, -1.2278556823730469e-05, 0.00013113021850585938, 0.0002745389938354492, 0.00041794776916503906, 0.0005613565444946289, 0.0007047653198242188, 0.0008481740951538086, 0.0009915828704833984, 0.0011349916458129883, 0.0012784004211425781, 0.001421809196472168, 0.0015652179718017578, 0.0017086267471313477, 0.0018520355224609375, 0.0019954442977905273, 0.002138853073120117, 0.002282261848449707, 0.002425670623779297, 0.0025690793991088867, 0.0027124881744384766, 0.0028558969497680664, 0.0029993057250976562, 0.003142714500427246, 0.003286123275756836, 0.0034295320510864258, 0.0035729408264160156, 0.0037163496017456055, 0.0038597583770751953, 0.004003167152404785, 0.004146575927734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 21.0, 27.0, 29.0, 48.0, 86.0, 103.0, 143.0, 220.0, 294.0, 450.0, 758.0, 1118.0, 1728.0, 2706.0, 4493.0, 7627.0, 13558.0, 23554.0, 42528.0, 77795.0, 150765.0, 247447.0, 215850.0, 115990.0, 60766.0, 34094.0, 18980.0, 10807.0, 6231.0, 3798.0, 2279.0, 1462.0, 939.0, 630.0, 415.0, 239.0, 182.0, 120.0, 73.0, 49.0, 39.0, 31.0, 24.0, 13.0, 9.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.125, -24.359130859375, -23.59326171875, -22.827392578125, -22.0615234375, -21.295654296875, -20.52978515625, -19.763916015625, -18.998046875, -18.232177734375, -17.46630859375, -16.700439453125, -15.9345703125, -15.168701171875, -14.40283203125, -13.636962890625, -12.87109375, -12.105224609375, -11.33935546875, -10.573486328125, -9.8076171875, -9.041748046875, -8.27587890625, -7.510009765625, -6.744140625, -5.978271484375, -5.21240234375, -4.446533203125, -3.6806640625, -2.914794921875, -2.14892578125, -1.383056640625, -0.6171875, 0.148681640625, 0.91455078125, 1.680419921875, 2.4462890625, 3.212158203125, 3.97802734375, 4.743896484375, 5.509765625, 6.275634765625, 7.04150390625, 7.807373046875, 8.5732421875, 9.339111328125, 10.10498046875, 10.870849609375, 11.63671875, 12.402587890625, 13.16845703125, 13.934326171875, 14.7001953125, 15.466064453125, 16.23193359375, 16.997802734375, 17.763671875, 18.529541015625, 19.29541015625, 20.061279296875, 20.8271484375, 21.593017578125, 22.35888671875, 23.124755859375, 23.890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 6.0, 5.0, 11.0, 8.0, 20.0, 9.0, 14.0, 16.0, 26.0, 36.0, 28.0, 40.0, 58.0, 71.0, 78.0, 88.0, 88.0, 65.0, 61.0, 39.0, 43.0, 29.0, 30.0, 26.0, 21.0, 18.0, 12.0, 11.0, 9.0, 11.0, 2.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.53411865234375, -10.2479248046875, -9.96173095703125, -9.675537109375, -9.38934326171875, -9.1031494140625, -8.81695556640625, -8.53076171875, -8.24456787109375, -7.9583740234375, -7.67218017578125, -7.385986328125, -7.09979248046875, -6.8135986328125, -6.52740478515625, -6.2412109375, -5.95501708984375, -5.6688232421875, -5.38262939453125, -5.096435546875, -4.81024169921875, -4.5240478515625, -4.23785400390625, -3.95166015625, -3.66546630859375, -3.3792724609375, -3.09307861328125, -2.806884765625, -2.52069091796875, -2.2344970703125, -1.94830322265625, -1.662109375, -1.37591552734375, -1.0897216796875, -0.80352783203125, -0.517333984375, -0.23114013671875, 0.0550537109375, 0.34124755859375, 0.62744140625, 0.91363525390625, 1.1998291015625, 1.48602294921875, 1.772216796875, 2.05841064453125, 2.3446044921875, 2.63079833984375, 2.9169921875, 3.20318603515625, 3.4893798828125, 3.77557373046875, 4.061767578125, 4.34796142578125, 4.6341552734375, 4.92034912109375, 5.20654296875, 5.49273681640625, 5.7789306640625, 6.06512451171875, 6.351318359375, 6.63751220703125, 6.9237060546875, 7.20989990234375, 7.49609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 15.0, 8.0, 14.0, 23.0, 18.0, 16.0, 30.0, 23.0, 44.0, 31.0, 43.0, 44.0, 45.0, 41.0, 57.0, 46.0, 48.0, 47.0, 39.0, 39.0, 40.0, 45.0, 38.0, 42.0, 15.0, 27.0, 20.0, 20.0, 18.0, 7.0, 6.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.890993118286133, -24.126096725463867, -23.3612003326416, -22.596303939819336, -21.83140754699707, -21.066511154174805, -20.30161476135254, -19.536718368530273, -18.771821975708008, -18.006925582885742, -17.242029190063477, -16.47713279724121, -15.712236404418945, -14.94734001159668, -14.182443618774414, -13.417547225952148, -12.652650833129883, -11.887754440307617, -11.122858047485352, -10.357961654663086, -9.59306526184082, -8.828168869018555, -8.063272476196289, -7.298376083374023, -6.533479690551758, -5.768583297729492, -5.003686904907227, -4.238790512084961, -3.4738941192626953, -2.7089977264404297, -1.944101333618164, -1.1792049407958984, -0.414306640625, 0.3505897521972656, 1.1154861450195312, 1.8803825378417969, 2.6452789306640625, 3.410175323486328, 4.175071716308594, 4.939968109130859, 5.704864501953125, 6.469760894775391, 7.234657287597656, 7.999553680419922, 8.764450073242188, 9.529346466064453, 10.294242858886719, 11.059139251708984, 11.82403564453125, 12.588932037353516, 13.353828430175781, 14.118724822998047, 14.883621215820312, 15.648517608642578, 16.413414001464844, 17.17831039428711, 17.943206787109375, 18.70810317993164, 19.472999572753906, 20.237895965576172, 21.002792358398438, 21.767688751220703, 22.53258514404297, 23.297481536865234, 24.0623779296875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 3.0, 8.0, 9.0, 8.0, 12.0, 11.0, 17.0, 14.0, 17.0, 19.0, 20.0, 16.0, 15.0, 19.0, 32.0, 33.0, 36.0, 22.0, 39.0, 32.0, 32.0, 44.0, 34.0, 43.0, 39.0, 38.0, 37.0, 41.0, 33.0, 31.0, 22.0, 27.0, 29.0, 17.0, 13.0, 21.0, 13.0, 21.0, 14.0, 3.0, 11.0, 3.0, 14.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.59387969970703, -19.931934356689453, -19.269987106323242, -18.608041763305664, -17.946096420288086, -17.284149169921875, -16.622203826904297, -15.960258483886719, -15.298312187194824, -14.63636589050293, -13.974420547485352, -13.312474250793457, -12.650527954101562, -11.988582611083984, -11.32663631439209, -10.664690017700195, -10.002744674682617, -9.340798377990723, -8.678853034973145, -8.01690673828125, -7.354960918426514, -6.693015098571777, -6.031068801879883, -5.3691229820251465, -4.70717716217041, -4.045231342315674, -3.3832852840423584, -2.721339225769043, -2.0593934059143066, -1.3974475860595703, -0.7355015277862549, -0.07355546951293945, 0.5883922576904297, 1.2503381967544556, 1.9122841358184814, 2.574230194091797, 3.236176013946533, 3.8981218338012695, 4.560068130493164, 5.2220139503479, 5.883959770202637, 6.545905590057373, 7.207851409912109, 7.869797706604004, 8.531744003295898, 9.193689346313477, 9.855635643005371, 10.517581939697266, 11.179527282714844, 11.841473579406738, 12.503418922424316, 13.165365219116211, 13.827310562133789, 14.489256858825684, 15.151203155517578, 15.813148498535156, 16.475093841552734, 17.137039184570312, 17.798986434936523, 18.4609317779541, 19.12287712097168, 19.78482437133789, 20.44676971435547, 21.108715057373047, 21.770662307739258]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 11.0, 17.0, 27.0, 47.0, 75.0, 148.0, 226.0, 316.0, 538.0, 780.0, 1306.0, 2014.0, 3131.0, 4899.0, 7499.0, 11257.0, 16839.0, 24721.0, 35175.0, 48171.0, 62924.0, 77916.0, 91429.0, 100068.0, 102782.0, 97844.0, 87443.0, 72676.0, 57830.0, 43387.0, 31743.0, 21891.0, 14955.0, 10128.0, 6776.0, 4087.0, 2756.0, 1742.0, 1099.0, 700.0, 463.0, 272.0, 178.0, 98.0, 60.0, 35.0, 25.0, 18.0, 13.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0], "bins": [-14.3046875, -13.8756103515625, -13.446533203125, -13.0174560546875, -12.58837890625, -12.1593017578125, -11.730224609375, -11.3011474609375, -10.8720703125, -10.4429931640625, -10.013916015625, -9.5848388671875, -9.15576171875, -8.7266845703125, -8.297607421875, -7.8685302734375, -7.439453125, -7.0103759765625, -6.581298828125, -6.1522216796875, -5.72314453125, -5.2940673828125, -4.864990234375, -4.4359130859375, -4.0068359375, -3.5777587890625, -3.148681640625, -2.7196044921875, -2.29052734375, -1.8614501953125, -1.432373046875, -1.0032958984375, -0.57421875, -0.1451416015625, 0.283935546875, 0.7130126953125, 1.14208984375, 1.5711669921875, 2.000244140625, 2.4293212890625, 2.8583984375, 3.2874755859375, 3.716552734375, 4.1456298828125, 4.57470703125, 5.0037841796875, 5.432861328125, 5.8619384765625, 6.291015625, 6.7200927734375, 7.149169921875, 7.5782470703125, 8.00732421875, 8.4364013671875, 8.865478515625, 9.2945556640625, 9.7236328125, 10.1527099609375, 10.581787109375, 11.0108642578125, 11.43994140625, 11.8690185546875, 12.298095703125, 12.7271728515625, 13.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 9.0, 17.0, 11.0, 18.0, 21.0, 13.0, 22.0, 23.0, 23.0, 31.0, 26.0, 29.0, 32.0, 36.0, 42.0, 40.0, 41.0, 41.0, 40.0, 40.0, 38.0, 44.0, 36.0, 26.0, 35.0, 22.0, 30.0, 22.0, 26.0, 17.0, 17.0, 15.0, 15.0, 12.0, 10.0, 8.0, 10.0, 7.0, 2.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.7265625, -20.015625, -19.3046875, -18.59375, -17.8828125, -17.171875, -16.4609375, -15.75, -15.0390625, -14.328125, -13.6171875, -12.90625, -12.1953125, -11.484375, -10.7734375, -10.0625, -9.3515625, -8.640625, -7.9296875, -7.21875, -6.5078125, -5.796875, -5.0859375, -4.375, -3.6640625, -2.953125, -2.2421875, -1.53125, -0.8203125, -0.109375, 0.6015625, 1.3125, 2.0234375, 2.734375, 3.4453125, 4.15625, 4.8671875, 5.578125, 6.2890625, 7.0, 7.7109375, 8.421875, 9.1328125, 9.84375, 10.5546875, 11.265625, 11.9765625, 12.6875, 13.3984375, 14.109375, 14.8203125, 15.53125, 16.2421875, 16.953125, 17.6640625, 18.375, 19.0859375, 19.796875, 20.5078125, 21.21875, 21.9296875, 22.640625, 23.3515625, 24.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 12.0, 16.0, 34.0, 42.0, 59.0, 82.0, 125.0, 168.0, 274.0, 338.0, 521.0, 763.0, 1137.0, 1768.0, 2511.0, 3889.0, 5761.0, 8976.0, 13598.0, 20132.0, 29535.0, 42356.0, 58540.0, 77329.0, 94106.0, 106920.0, 111695.0, 106994.0, 94139.0, 76747.0, 58671.0, 42215.0, 29657.0, 19826.0, 13317.0, 8758.0, 5844.0, 3873.0, 2468.0, 1733.0, 1167.0, 810.0, 516.0, 356.0, 272.0, 164.0, 106.0, 66.0, 44.0, 37.0, 36.0, 13.0, 15.0, 4.0, 9.0, 6.0, 3.0, 2.0], "bins": [-17.53125, -16.99169921875, -16.4521484375, -15.91259765625, -15.373046875, -14.83349609375, -14.2939453125, -13.75439453125, -13.21484375, -12.67529296875, -12.1357421875, -11.59619140625, -11.056640625, -10.51708984375, -9.9775390625, -9.43798828125, -8.8984375, -8.35888671875, -7.8193359375, -7.27978515625, -6.740234375, -6.20068359375, -5.6611328125, -5.12158203125, -4.58203125, -4.04248046875, -3.5029296875, -2.96337890625, -2.423828125, -1.88427734375, -1.3447265625, -0.80517578125, -0.265625, 0.27392578125, 0.8134765625, 1.35302734375, 1.892578125, 2.43212890625, 2.9716796875, 3.51123046875, 4.05078125, 4.59033203125, 5.1298828125, 5.66943359375, 6.208984375, 6.74853515625, 7.2880859375, 7.82763671875, 8.3671875, 8.90673828125, 9.4462890625, 9.98583984375, 10.525390625, 11.06494140625, 11.6044921875, 12.14404296875, 12.68359375, 13.22314453125, 13.7626953125, 14.30224609375, 14.841796875, 15.38134765625, 15.9208984375, 16.46044921875, 17.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 9.0, 13.0, 16.0, 16.0, 12.0, 13.0, 16.0, 20.0, 24.0, 30.0, 31.0, 30.0, 33.0, 36.0, 35.0, 43.0, 31.0, 32.0, 40.0, 45.0, 47.0, 45.0, 42.0, 37.0, 20.0, 31.0, 36.0, 27.0, 19.0, 23.0, 26.0, 16.0, 10.0, 13.0, 15.0, 7.0, 10.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-17.390625, -16.918701171875, -16.44677734375, -15.974853515625, -15.5029296875, -15.031005859375, -14.55908203125, -14.087158203125, -13.615234375, -13.143310546875, -12.67138671875, -12.199462890625, -11.7275390625, -11.255615234375, -10.78369140625, -10.311767578125, -9.83984375, -9.367919921875, -8.89599609375, -8.424072265625, -7.9521484375, -7.480224609375, -7.00830078125, -6.536376953125, -6.064453125, -5.592529296875, -5.12060546875, -4.648681640625, -4.1767578125, -3.704833984375, -3.23291015625, -2.760986328125, -2.2890625, -1.817138671875, -1.34521484375, -0.873291015625, -0.4013671875, 0.070556640625, 0.54248046875, 1.014404296875, 1.486328125, 1.958251953125, 2.43017578125, 2.902099609375, 3.3740234375, 3.845947265625, 4.31787109375, 4.789794921875, 5.26171875, 5.733642578125, 6.20556640625, 6.677490234375, 7.1494140625, 7.621337890625, 8.09326171875, 8.565185546875, 9.037109375, 9.509033203125, 9.98095703125, 10.452880859375, 10.9248046875, 11.396728515625, 11.86865234375, 12.340576171875, 12.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 22.0, 30.0, 42.0, 70.0, 108.0, 169.0, 239.0, 378.0, 566.0, 861.0, 1303.0, 2199.0, 3270.0, 5310.0, 8401.0, 13352.0, 21065.0, 32951.0, 49412.0, 70497.0, 94624.0, 115502.0, 127354.0, 124511.0, 108335.0, 85650.0, 62720.0, 42704.0, 28263.0, 17917.0, 11496.0, 6967.0, 4415.0, 2839.0, 1727.0, 1139.0, 705.0, 446.0, 309.0, 210.0, 136.0, 102.0, 73.0, 56.0, 24.0, 22.0, 11.0, 11.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.2734375, -6.082275390625, -5.89111328125, -5.699951171875, -5.5087890625, -5.317626953125, -5.12646484375, -4.935302734375, -4.744140625, -4.552978515625, -4.36181640625, -4.170654296875, -3.9794921875, -3.788330078125, -3.59716796875, -3.406005859375, -3.21484375, -3.023681640625, -2.83251953125, -2.641357421875, -2.4501953125, -2.259033203125, -2.06787109375, -1.876708984375, -1.685546875, -1.494384765625, -1.30322265625, -1.112060546875, -0.9208984375, -0.729736328125, -0.53857421875, -0.347412109375, -0.15625, 0.034912109375, 0.22607421875, 0.417236328125, 0.6083984375, 0.799560546875, 0.99072265625, 1.181884765625, 1.373046875, 1.564208984375, 1.75537109375, 1.946533203125, 2.1376953125, 2.328857421875, 2.52001953125, 2.711181640625, 2.90234375, 3.093505859375, 3.28466796875, 3.475830078125, 3.6669921875, 3.858154296875, 4.04931640625, 4.240478515625, 4.431640625, 4.622802734375, 4.81396484375, 5.005126953125, 5.1962890625, 5.387451171875, 5.57861328125, 5.769775390625, 5.9609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 7.0, 14.0, 19.0, 24.0, 26.0, 21.0, 23.0, 21.0, 38.0, 33.0, 53.0, 54.0, 55.0, 59.0, 46.0, 59.0, 52.0, 55.0, 55.0, 37.0, 28.0, 45.0, 31.0, 26.0, 26.0, 18.0, 10.0, 7.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007405281066894531, -0.0007174089550971985, -0.0006942898035049438, -0.0006711706519126892, -0.0006480515003204346, -0.0006249323487281799, -0.0006018131971359253, -0.0005786940455436707, -0.000555574893951416, -0.0005324557423591614, -0.0005093365907669067, -0.0004862174391746521, -0.00046309828758239746, -0.0004399791359901428, -0.0004168599843978882, -0.00039374083280563354, -0.0003706216812133789, -0.00034750252962112427, -0.00032438337802886963, -0.000301264226436615, -0.00027814507484436035, -0.0002550259232521057, -0.00023190677165985107, -0.00020878762006759644, -0.0001856684684753418, -0.00016254931688308716, -0.00013943016529083252, -0.00011631101369857788, -9.319186210632324e-05, -7.00727105140686e-05, -4.6953558921813965e-05, -2.3834407329559326e-05, -7.152557373046875e-07, 2.240389585494995e-05, 4.552304744720459e-05, 6.864219903945923e-05, 9.176135063171387e-05, 0.0001148805022239685, 0.00013799965381622314, 0.00016111880540847778, 0.00018423795700073242, 0.00020735710859298706, 0.0002304762601852417, 0.00025359541177749634, 0.000276714563369751, 0.0002998337149620056, 0.00032295286655426025, 0.0003460720181465149, 0.00036919116973876953, 0.00039231032133102417, 0.0004154294729232788, 0.00043854862451553345, 0.0004616677761077881, 0.0004847869277000427, 0.0005079060792922974, 0.000531025230884552, 0.0005541443824768066, 0.0005772635340690613, 0.0006003826856613159, 0.0006235018372535706, 0.0006466209888458252, 0.0006697401404380798, 0.0006928592920303345, 0.0007159784436225891, 0.0007390975952148438]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 13.0, 16.0, 20.0, 47.0, 53.0, 65.0, 116.0, 168.0, 227.0, 339.0, 552.0, 869.0, 1421.0, 2162.0, 3386.0, 5283.0, 8380.0, 12792.0, 19949.0, 30350.0, 43891.0, 61310.0, 81264.0, 100202.0, 114483.0, 116827.0, 110181.0, 93926.0, 73879.0, 54664.0, 38208.0, 26007.0, 16929.0, 10881.0, 7082.0, 4562.0, 2888.0, 1819.0, 1130.0, 768.0, 490.0, 316.0, 203.0, 144.0, 83.0, 63.0, 49.0, 31.0, 16.0, 22.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0], "bins": [-5.6171875, -5.443359375, -5.26953125, -5.095703125, -4.921875, -4.748046875, -4.57421875, -4.400390625, -4.2265625, -4.052734375, -3.87890625, -3.705078125, -3.53125, -3.357421875, -3.18359375, -3.009765625, -2.8359375, -2.662109375, -2.48828125, -2.314453125, -2.140625, -1.966796875, -1.79296875, -1.619140625, -1.4453125, -1.271484375, -1.09765625, -0.923828125, -0.75, -0.576171875, -0.40234375, -0.228515625, -0.0546875, 0.119140625, 0.29296875, 0.466796875, 0.640625, 0.814453125, 0.98828125, 1.162109375, 1.3359375, 1.509765625, 1.68359375, 1.857421875, 2.03125, 2.205078125, 2.37890625, 2.552734375, 2.7265625, 2.900390625, 3.07421875, 3.248046875, 3.421875, 3.595703125, 3.76953125, 3.943359375, 4.1171875, 4.291015625, 4.46484375, 4.638671875, 4.8125, 4.986328125, 5.16015625, 5.333984375, 5.5078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 13.0, 26.0, 30.0, 40.0, 32.0, 35.0, 45.0, 50.0, 54.0, 56.0, 48.0, 62.0, 57.0, 56.0, 41.0, 49.0, 45.0, 37.0, 43.0, 30.0, 31.0, 14.0, 15.0, 10.0, 6.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.44940185546875, -2.3558349609375, -2.26226806640625, -2.168701171875, -2.07513427734375, -1.9815673828125, -1.88800048828125, -1.79443359375, -1.70086669921875, -1.6072998046875, -1.51373291015625, -1.420166015625, -1.32659912109375, -1.2330322265625, -1.13946533203125, -1.0458984375, -0.95233154296875, -0.8587646484375, -0.76519775390625, -0.671630859375, -0.57806396484375, -0.4844970703125, -0.39093017578125, -0.29736328125, -0.20379638671875, -0.1102294921875, -0.01666259765625, 0.076904296875, 0.17047119140625, 0.2640380859375, 0.35760498046875, 0.451171875, 0.54473876953125, 0.6383056640625, 0.73187255859375, 0.825439453125, 0.91900634765625, 1.0125732421875, 1.10614013671875, 1.19970703125, 1.29327392578125, 1.3868408203125, 1.48040771484375, 1.573974609375, 1.66754150390625, 1.7611083984375, 1.85467529296875, 1.9482421875, 2.04180908203125, 2.1353759765625, 2.22894287109375, 2.322509765625, 2.41607666015625, 2.5096435546875, 2.60321044921875, 2.69677734375, 2.79034423828125, 2.8839111328125, 2.97747802734375, 3.071044921875, 3.16461181640625, 3.2581787109375, 3.35174560546875, 3.4453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 11.0, 7.0, 21.0, 18.0, 14.0, 19.0, 21.0, 13.0, 24.0, 29.0, 30.0, 29.0, 51.0, 45.0, 44.0, 49.0, 51.0, 38.0, 42.0, 46.0, 48.0, 37.0, 32.0, 37.0, 37.0, 28.0, 23.0, 23.0, 25.0, 16.0, 9.0, 10.0, 14.0, 7.0, 11.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.46728515625, -20.751571655273438, -20.035856246948242, -19.32014274597168, -18.604427337646484, -17.888713836669922, -17.172998428344727, -16.457284927368164, -15.741569519042969, -15.02585506439209, -14.310140609741211, -13.594426155090332, -12.878711700439453, -12.162997245788574, -11.447282791137695, -10.731569290161133, -10.015854835510254, -9.300140380859375, -8.584425926208496, -7.868711471557617, -7.152997016906738, -6.437282562255859, -5.721568584442139, -5.00585412979126, -4.290139675140381, -3.574425220489502, -2.858710765838623, -2.1429965496063232, -1.4272820949554443, -0.7115676403045654, 0.004146575927734375, 0.7198610305786133, 1.4355754852294922, 2.151289939880371, 2.86700439453125, 3.58271861076355, 4.298433303833008, 5.014147758483887, 5.729861736297607, 6.445576190948486, 7.161290645599365, 7.877005100250244, 8.592719078063965, 9.308433532714844, 10.024147987365723, 10.739862442016602, 11.45557689666748, 12.17129135131836, 12.887005805969238, 13.602720260620117, 14.318434715270996, 15.034149169921875, 15.749863624572754, 16.465578079223633, 17.181291580200195, 17.89700698852539, 18.612720489501953, 19.328433990478516, 20.04414939880371, 20.759862899780273, 21.47557830810547, 22.19129180908203, 22.907007217407227, 23.62272071838379, 24.338436126708984]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 5.0, 6.0, 7.0, 13.0, 16.0, 14.0, 19.0, 22.0, 18.0, 17.0, 28.0, 27.0, 29.0, 24.0, 36.0, 24.0, 36.0, 41.0, 31.0, 44.0, 39.0, 46.0, 37.0, 50.0, 34.0, 23.0, 37.0, 33.0, 20.0, 20.0, 22.0, 19.0, 20.0, 17.0, 21.0, 18.0, 15.0, 7.0, 11.0, 10.0, 9.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-23.3586368560791, -22.635541915893555, -21.912445068359375, -21.189350128173828, -20.46625518798828, -19.7431583404541, -19.020063400268555, -18.296966552734375, -17.573871612548828, -16.85077667236328, -16.1276798248291, -15.404584884643555, -14.681488990783691, -13.958393096923828, -13.235298156738281, -12.512202262878418, -11.789106369018555, -11.066010475158691, -10.342914581298828, -9.619819641113281, -8.896723747253418, -8.173627853393555, -7.45053243637085, -6.7274370193481445, -6.004341125488281, -5.281245231628418, -4.558149814605713, -3.8350541591644287, -3.1119585037231445, -2.3888628482818604, -1.6657671928405762, -0.9426717758178711, -0.2195758819580078, 0.5035197734832764, 1.2266154289245605, 1.9497110843658447, 2.672806739807129, 3.395902395248413, 4.118998050689697, 4.842093467712402, 5.565189361572266, 6.288285255432129, 7.011380672454834, 7.734476089477539, 8.457571983337402, 9.180667877197266, 9.903762817382812, 10.626858711242676, 11.349954605102539, 12.073050498962402, 12.796146392822266, 13.519241333007812, 14.242337226867676, 14.965433120727539, 15.688528060913086, 16.411624908447266, 17.134719848632812, 17.85781478881836, 18.58091163635254, 19.304006576538086, 20.027103424072266, 20.750198364257812, 21.47329330444336, 22.196388244628906, 22.919485092163086]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 7.0, 18.0, 45.0, 83.0, 133.0, 212.0, 370.0, 603.0, 1036.0, 1806.0, 2940.0, 5054.0, 8331.0, 14356.0, 24829.0, 42801.0, 73086.0, 123074.0, 201944.0, 311443.0, 441128.0, 555609.0, 599334.0, 551253.0, 437214.0, 307542.0, 197430.0, 120616.0, 71636.0, 41414.0, 24259.0, 14248.0, 8160.0, 4844.0, 2905.0, 1733.0, 1031.0, 635.0, 405.0, 244.0, 169.0, 98.0, 68.0, 44.0, 27.0, 21.0, 18.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.0, -17.389404296875, -16.77880859375, -16.168212890625, -15.5576171875, -14.947021484375, -14.33642578125, -13.725830078125, -13.115234375, -12.504638671875, -11.89404296875, -11.283447265625, -10.6728515625, -10.062255859375, -9.45166015625, -8.841064453125, -8.23046875, -7.619873046875, -7.00927734375, -6.398681640625, -5.7880859375, -5.177490234375, -4.56689453125, -3.956298828125, -3.345703125, -2.735107421875, -2.12451171875, -1.513916015625, -0.9033203125, -0.292724609375, 0.31787109375, 0.928466796875, 1.5390625, 2.149658203125, 2.76025390625, 3.370849609375, 3.9814453125, 4.592041015625, 5.20263671875, 5.813232421875, 6.423828125, 7.034423828125, 7.64501953125, 8.255615234375, 8.8662109375, 9.476806640625, 10.08740234375, 10.697998046875, 11.30859375, 11.919189453125, 12.52978515625, 13.140380859375, 13.7509765625, 14.361572265625, 14.97216796875, 15.582763671875, 16.193359375, 16.803955078125, 17.41455078125, 18.025146484375, 18.6357421875, 19.246337890625, 19.85693359375, 20.467529296875, 21.078125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 6.0, 12.0, 7.0, 13.0, 15.0, 11.0, 22.0, 17.0, 20.0, 21.0, 20.0, 19.0, 28.0, 32.0, 34.0, 38.0, 38.0, 36.0, 42.0, 35.0, 47.0, 26.0, 37.0, 34.0, 40.0, 28.0, 29.0, 26.0, 22.0, 19.0, 23.0, 20.0, 20.0, 18.0, 15.0, 27.0, 11.0, 15.0, 8.0, 10.0, 9.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.0, -15.460693359375, -14.92138671875, -14.382080078125, -13.8427734375, -13.303466796875, -12.76416015625, -12.224853515625, -11.685546875, -11.146240234375, -10.60693359375, -10.067626953125, -9.5283203125, -8.989013671875, -8.44970703125, -7.910400390625, -7.37109375, -6.831787109375, -6.29248046875, -5.753173828125, -5.2138671875, -4.674560546875, -4.13525390625, -3.595947265625, -3.056640625, -2.517333984375, -1.97802734375, -1.438720703125, -0.8994140625, -0.360107421875, 0.17919921875, 0.718505859375, 1.2578125, 1.797119140625, 2.33642578125, 2.875732421875, 3.4150390625, 3.954345703125, 4.49365234375, 5.032958984375, 5.572265625, 6.111572265625, 6.65087890625, 7.190185546875, 7.7294921875, 8.268798828125, 8.80810546875, 9.347412109375, 9.88671875, 10.426025390625, 10.96533203125, 11.504638671875, 12.0439453125, 12.583251953125, 13.12255859375, 13.661865234375, 14.201171875, 14.740478515625, 15.27978515625, 15.819091796875, 16.3583984375, 16.897705078125, 17.43701171875, 17.976318359375, 18.515625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 11.0, 20.0, 30.0, 51.0, 112.0, 177.0, 266.0, 468.0, 847.0, 1374.0, 2288.0, 3813.0, 6378.0, 10740.0, 17784.0, 29248.0, 47339.0, 74269.0, 114430.0, 169608.0, 240301.0, 319101.0, 398717.0, 454638.0, 474231.0, 449031.0, 388734.0, 308566.0, 229636.0, 160930.0, 108743.0, 69560.0, 43984.0, 27363.0, 16654.0, 10086.0, 5901.0, 3633.0, 2066.0, 1287.0, 693.0, 439.0, 291.0, 182.0, 109.0, 57.0, 29.0, 24.0, 20.0, 14.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.53466796875, -15.0068359375, -14.47900390625, -13.951171875, -13.42333984375, -12.8955078125, -12.36767578125, -11.83984375, -11.31201171875, -10.7841796875, -10.25634765625, -9.728515625, -9.20068359375, -8.6728515625, -8.14501953125, -7.6171875, -7.08935546875, -6.5615234375, -6.03369140625, -5.505859375, -4.97802734375, -4.4501953125, -3.92236328125, -3.39453125, -2.86669921875, -2.3388671875, -1.81103515625, -1.283203125, -0.75537109375, -0.2275390625, 0.30029296875, 0.828125, 1.35595703125, 1.8837890625, 2.41162109375, 2.939453125, 3.46728515625, 3.9951171875, 4.52294921875, 5.05078125, 5.57861328125, 6.1064453125, 6.63427734375, 7.162109375, 7.68994140625, 8.2177734375, 8.74560546875, 9.2734375, 9.80126953125, 10.3291015625, 10.85693359375, 11.384765625, 11.91259765625, 12.4404296875, 12.96826171875, 13.49609375, 14.02392578125, 14.5517578125, 15.07958984375, 15.607421875, 16.13525390625, 16.6630859375, 17.19091796875, 17.71875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 10.0, 13.0, 26.0, 16.0, 25.0, 27.0, 41.0, 51.0, 55.0, 68.0, 78.0, 88.0, 116.0, 133.0, 157.0, 173.0, 202.0, 193.0, 192.0, 203.0, 216.0, 251.0, 190.0, 212.0, 180.0, 157.0, 143.0, 151.0, 122.0, 102.0, 84.0, 69.0, 63.0, 53.0, 47.0, 39.0, 34.0, 21.0, 12.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.2578125, -7.990478515625, -7.72314453125, -7.455810546875, -7.1884765625, -6.921142578125, -6.65380859375, -6.386474609375, -6.119140625, -5.851806640625, -5.58447265625, -5.317138671875, -5.0498046875, -4.782470703125, -4.51513671875, -4.247802734375, -3.98046875, -3.713134765625, -3.44580078125, -3.178466796875, -2.9111328125, -2.643798828125, -2.37646484375, -2.109130859375, -1.841796875, -1.574462890625, -1.30712890625, -1.039794921875, -0.7724609375, -0.505126953125, -0.23779296875, 0.029541015625, 0.296875, 0.564208984375, 0.83154296875, 1.098876953125, 1.3662109375, 1.633544921875, 1.90087890625, 2.168212890625, 2.435546875, 2.702880859375, 2.97021484375, 3.237548828125, 3.5048828125, 3.772216796875, 4.03955078125, 4.306884765625, 4.57421875, 4.841552734375, 5.10888671875, 5.376220703125, 5.6435546875, 5.910888671875, 6.17822265625, 6.445556640625, 6.712890625, 6.980224609375, 7.24755859375, 7.514892578125, 7.7822265625, 8.049560546875, 8.31689453125, 8.584228515625, 8.8515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 15.0, 17.0, 8.0, 29.0, 32.0, 30.0, 39.0, 29.0, 33.0, 34.0, 48.0, 59.0, 41.0, 47.0, 55.0, 49.0, 44.0, 41.0, 42.0, 37.0, 47.0, 34.0, 26.0, 25.0, 19.0, 17.0, 17.0, 8.0, 13.0, 14.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.689062118530273, -17.978342056274414, -17.267623901367188, -16.556903839111328, -15.846183776855469, -15.135464668273926, -14.424745559692383, -13.714025497436523, -13.00330638885498, -12.292587280273438, -11.581867218017578, -10.871148109436035, -10.160429000854492, -9.449708938598633, -8.73898983001709, -8.028270721435547, -7.3175506591796875, -6.606831073760986, -5.896111488342285, -5.185392379760742, -4.474672794342041, -3.76395320892334, -3.053234100341797, -2.3425145149230957, -1.6317949295043945, -0.9210754632949829, -0.2103559970855713, 0.5003633499145508, 1.211082935333252, 1.9218025207519531, 2.632521629333496, 3.3432412147521973, 4.053962707519531, 4.764682292938232, 5.475401878356934, 6.186120986938477, 6.896840572357178, 7.607560157775879, 8.318279266357422, 9.028999328613281, 9.739718437194824, 10.450437545776367, 11.161157608032227, 11.87187671661377, 12.582595825195312, 13.293315887451172, 14.004034996032715, 14.714754104614258, 15.425474166870117, 16.136194229125977, 16.846912384033203, 17.557632446289062, 18.268352508544922, 18.97907257080078, 19.689790725708008, 20.400510787963867, 21.111228942871094, 21.821949005126953, 22.53266716003418, 23.24338722229004, 23.9541072845459, 24.664825439453125, 25.375545501708984, 26.086265563964844, 26.796985626220703]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 9.0, 7.0, 6.0, 12.0, 13.0, 18.0, 15.0, 25.0, 17.0, 30.0, 30.0, 40.0, 27.0, 30.0, 28.0, 45.0, 40.0, 44.0, 45.0, 46.0, 44.0, 34.0, 36.0, 37.0, 27.0, 35.0, 32.0, 22.0, 29.0, 18.0, 18.0, 15.0, 17.0, 22.0, 13.0, 15.0, 15.0, 13.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.43413734436035, -21.75115394592285, -21.06817054748535, -20.38518714904785, -19.70220375061035, -19.01922035217285, -18.336238861083984, -17.653255462646484, -16.970272064208984, -16.287288665771484, -15.604305267333984, -14.921321868896484, -14.238338470458984, -13.555355072021484, -12.8723726272583, -12.1893892288208, -11.506404876708984, -10.823421478271484, -10.140438079833984, -9.457454681396484, -8.774471282958984, -8.091487884521484, -7.408505439758301, -6.725522041320801, -6.042538642883301, -5.359555244445801, -4.676571846008301, -3.993588924407959, -3.310605525970459, -2.627622127532959, -1.9446392059326172, -1.2616558074951172, -0.5786724090576172, 0.10431087017059326, 0.7872941493988037, 1.4702773094177246, 2.1532607078552246, 2.8362441062927246, 3.5192270278930664, 4.202210426330566, 4.885193824768066, 5.568177223205566, 6.251160621643066, 6.934143543243408, 7.617126941680908, 8.30010986328125, 8.98309326171875, 9.66607666015625, 10.34906005859375, 11.03204345703125, 11.71502685546875, 12.39801025390625, 13.08099365234375, 13.76397705078125, 14.446959495544434, 15.129942893981934, 15.812926292419434, 16.495908737182617, 17.178892135620117, 17.861875534057617, 18.544858932495117, 19.227842330932617, 19.910825729370117, 20.593809127807617, 21.276792526245117]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 7.0, 14.0, 21.0, 36.0, 56.0, 103.0, 130.0, 225.0, 390.0, 539.0, 897.0, 1252.0, 1895.0, 3057.0, 4324.0, 6527.0, 9232.0, 13413.0, 19140.0, 26694.0, 36998.0, 51230.0, 67899.0, 88286.0, 107495.0, 118073.0, 113450.0, 97462.0, 76652.0, 57905.0, 42494.0, 30632.0, 22254.0, 15709.0, 10922.0, 7667.0, 5207.0, 3574.0, 2374.0, 1478.0, 1028.0, 630.0, 430.0, 255.0, 166.0, 135.0, 76.0, 40.0, 31.0, 23.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.6591796875, -18.974609375, -18.2900390625, -17.60546875, -16.9208984375, -16.236328125, -15.5517578125, -14.8671875, -14.1826171875, -13.498046875, -12.8134765625, -12.12890625, -11.4443359375, -10.759765625, -10.0751953125, -9.390625, -8.7060546875, -8.021484375, -7.3369140625, -6.65234375, -5.9677734375, -5.283203125, -4.5986328125, -3.9140625, -3.2294921875, -2.544921875, -1.8603515625, -1.17578125, -0.4912109375, 0.193359375, 0.8779296875, 1.5625, 2.2470703125, 2.931640625, 3.6162109375, 4.30078125, 4.9853515625, 5.669921875, 6.3544921875, 7.0390625, 7.7236328125, 8.408203125, 9.0927734375, 9.77734375, 10.4619140625, 11.146484375, 11.8310546875, 12.515625, 13.2001953125, 13.884765625, 14.5693359375, 15.25390625, 15.9384765625, 16.623046875, 17.3076171875, 17.9921875, 18.6767578125, 19.361328125, 20.0458984375, 20.73046875, 21.4150390625, 22.099609375, 22.7841796875, 23.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 5.0, 7.0, 7.0, 10.0, 13.0, 17.0, 12.0, 28.0, 17.0, 29.0, 30.0, 23.0, 27.0, 39.0, 34.0, 41.0, 34.0, 46.0, 42.0, 38.0, 45.0, 45.0, 45.0, 36.0, 29.0, 31.0, 29.0, 30.0, 28.0, 26.0, 20.0, 20.0, 22.0, 18.0, 16.0, 10.0, 14.0, 9.0, 6.0, 3.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.03125, -20.412841796875, -19.79443359375, -19.176025390625, -18.5576171875, -17.939208984375, -17.32080078125, -16.702392578125, -16.083984375, -15.465576171875, -14.84716796875, -14.228759765625, -13.6103515625, -12.991943359375, -12.37353515625, -11.755126953125, -11.13671875, -10.518310546875, -9.89990234375, -9.281494140625, -8.6630859375, -8.044677734375, -7.42626953125, -6.807861328125, -6.189453125, -5.571044921875, -4.95263671875, -4.334228515625, -3.7158203125, -3.097412109375, -2.47900390625, -1.860595703125, -1.2421875, -0.623779296875, -0.00537109375, 0.613037109375, 1.2314453125, 1.849853515625, 2.46826171875, 3.086669921875, 3.705078125, 4.323486328125, 4.94189453125, 5.560302734375, 6.1787109375, 6.797119140625, 7.41552734375, 8.033935546875, 8.65234375, 9.270751953125, 9.88916015625, 10.507568359375, 11.1259765625, 11.744384765625, 12.36279296875, 12.981201171875, 13.599609375, 14.218017578125, 14.83642578125, 15.454833984375, 16.0732421875, 16.691650390625, 17.31005859375, 17.928466796875, 18.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 11.0, 20.0, 29.0, 44.0, 71.0, 84.0, 175.0, 275.0, 428.0, 647.0, 1023.0, 1534.0, 2445.0, 3989.0, 6349.0, 9917.0, 15755.0, 25190.0, 39706.0, 62969.0, 98932.0, 145657.0, 176629.0, 156637.0, 109623.0, 70809.0, 44345.0, 27815.0, 17697.0, 10974.0, 7010.0, 4308.0, 2743.0, 1755.0, 1089.0, 702.0, 442.0, 261.0, 205.0, 108.0, 54.0, 37.0, 30.0, 14.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.015625, -28.152587890625, -27.28955078125, -26.426513671875, -25.5634765625, -24.700439453125, -23.83740234375, -22.974365234375, -22.111328125, -21.248291015625, -20.38525390625, -19.522216796875, -18.6591796875, -17.796142578125, -16.93310546875, -16.070068359375, -15.20703125, -14.343994140625, -13.48095703125, -12.617919921875, -11.7548828125, -10.891845703125, -10.02880859375, -9.165771484375, -8.302734375, -7.439697265625, -6.57666015625, -5.713623046875, -4.8505859375, -3.987548828125, -3.12451171875, -2.261474609375, -1.3984375, -0.535400390625, 0.32763671875, 1.190673828125, 2.0537109375, 2.916748046875, 3.77978515625, 4.642822265625, 5.505859375, 6.368896484375, 7.23193359375, 8.094970703125, 8.9580078125, 9.821044921875, 10.68408203125, 11.547119140625, 12.41015625, 13.273193359375, 14.13623046875, 14.999267578125, 15.8623046875, 16.725341796875, 17.58837890625, 18.451416015625, 19.314453125, 20.177490234375, 21.04052734375, 21.903564453125, 22.7666015625, 23.629638671875, 24.49267578125, 25.355712890625, 26.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 12.0, 10.0, 22.0, 19.0, 21.0, 26.0, 27.0, 20.0, 24.0, 40.0, 35.0, 35.0, 29.0, 34.0, 37.0, 38.0, 42.0, 35.0, 40.0, 43.0, 34.0, 39.0, 37.0, 31.0, 28.0, 31.0, 27.0, 24.0, 15.0, 18.0, 24.0, 5.0, 9.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.725830078125, -13.25634765625, -12.786865234375, -12.3173828125, -11.847900390625, -11.37841796875, -10.908935546875, -10.439453125, -9.969970703125, -9.50048828125, -9.031005859375, -8.5615234375, -8.092041015625, -7.62255859375, -7.153076171875, -6.68359375, -6.214111328125, -5.74462890625, -5.275146484375, -4.8056640625, -4.336181640625, -3.86669921875, -3.397216796875, -2.927734375, -2.458251953125, -1.98876953125, -1.519287109375, -1.0498046875, -0.580322265625, -0.11083984375, 0.358642578125, 0.828125, 1.297607421875, 1.76708984375, 2.236572265625, 2.7060546875, 3.175537109375, 3.64501953125, 4.114501953125, 4.583984375, 5.053466796875, 5.52294921875, 5.992431640625, 6.4619140625, 6.931396484375, 7.40087890625, 7.870361328125, 8.33984375, 8.809326171875, 9.27880859375, 9.748291015625, 10.2177734375, 10.687255859375, 11.15673828125, 11.626220703125, 12.095703125, 12.565185546875, 13.03466796875, 13.504150390625, 13.9736328125, 14.443115234375, 14.91259765625, 15.382080078125, 15.8515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 14.0, 7.0, 16.0, 21.0, 25.0, 24.0, 56.0, 74.0, 126.0, 163.0, 222.0, 314.0, 501.0, 798.0, 1127.0, 1890.0, 3131.0, 5146.0, 8695.0, 15690.0, 29482.0, 61524.0, 169305.0, 506826.0, 131857.0, 52704.0, 25372.0, 13562.0, 7837.0, 4530.0, 2700.0, 1686.0, 1070.0, 646.0, 467.0, 318.0, 197.0, 150.0, 88.0, 49.0, 44.0, 33.0, 25.0, 14.0, 15.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-66.75, -64.6240234375, -62.498046875, -60.3720703125, -58.24609375, -56.1201171875, -53.994140625, -51.8681640625, -49.7421875, -47.6162109375, -45.490234375, -43.3642578125, -41.23828125, -39.1123046875, -36.986328125, -34.8603515625, -32.734375, -30.6083984375, -28.482421875, -26.3564453125, -24.23046875, -22.1044921875, -19.978515625, -17.8525390625, -15.7265625, -13.6005859375, -11.474609375, -9.3486328125, -7.22265625, -5.0966796875, -2.970703125, -0.8447265625, 1.28125, 3.4072265625, 5.533203125, 7.6591796875, 9.78515625, 11.9111328125, 14.037109375, 16.1630859375, 18.2890625, 20.4150390625, 22.541015625, 24.6669921875, 26.79296875, 28.9189453125, 31.044921875, 33.1708984375, 35.296875, 37.4228515625, 39.548828125, 41.6748046875, 43.80078125, 45.9267578125, 48.052734375, 50.1787109375, 52.3046875, 54.4306640625, 56.556640625, 58.6826171875, 60.80859375, 62.9345703125, 65.060546875, 67.1865234375, 69.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 2.0, 8.0, 8.0, 13.0, 10.0, 14.0, 8.0, 19.0, 25.0, 43.0, 38.0, 66.0, 127.0, 221.0, 121.0, 61.0, 57.0, 37.0, 22.0, 22.0, 18.0, 14.0, 8.0, 8.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00991058349609375, -0.009652256965637207, -0.009393930435180664, -0.009135603904724121, -0.008877277374267578, -0.008618950843811035, -0.008360624313354492, -0.00810229778289795, -0.007843971252441406, -0.007585644721984863, -0.00732731819152832, -0.007068991661071777, -0.006810665130615234, -0.006552338600158691, -0.0062940120697021484, -0.0060356855392456055, -0.0057773590087890625, -0.0055190324783325195, -0.0052607059478759766, -0.005002379417419434, -0.004744052886962891, -0.004485726356506348, -0.004227399826049805, -0.003969073295593262, -0.0037107467651367188, -0.0034524202346801758, -0.003194093704223633, -0.00293576717376709, -0.002677440643310547, -0.002419114112854004, -0.002160787582397461, -0.001902461051940918, -0.001644134521484375, -0.001385807991027832, -0.001127481460571289, -0.0008691549301147461, -0.0006108283996582031, -0.00035250186920166016, -9.417533874511719e-05, 0.00016415119171142578, 0.00042247772216796875, 0.0006808042526245117, 0.0009391307830810547, 0.0011974573135375977, 0.0014557838439941406, 0.0017141103744506836, 0.0019724369049072266, 0.0022307634353637695, 0.0024890899658203125, 0.0027474164962768555, 0.0030057430267333984, 0.0032640695571899414, 0.0035223960876464844, 0.0037807226181030273, 0.00403904914855957, 0.004297375679016113, 0.004555702209472656, 0.004814028739929199, 0.005072355270385742, 0.005330681800842285, 0.005589008331298828, 0.005847334861755371, 0.006105661392211914, 0.006363987922668457, 0.006622314453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 7.0, 4.0, 17.0, 24.0, 31.0, 42.0, 57.0, 59.0, 100.0, 139.0, 212.0, 305.0, 491.0, 707.0, 1166.0, 1750.0, 2793.0, 4159.0, 6594.0, 10062.0, 15599.0, 23878.0, 37810.0, 60880.0, 114595.0, 276048.0, 238086.0, 99373.0, 55859.0, 34483.0, 22403.0, 14225.0, 9568.0, 6083.0, 3879.0, 2424.0, 1573.0, 1029.0, 684.0, 411.0, 292.0, 191.0, 137.0, 98.0, 59.0, 45.0, 27.0, 27.0, 25.0, 10.0, 12.0, 9.0, 4.0, 7.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.15625, -31.0810546875, -30.005859375, -28.9306640625, -27.85546875, -26.7802734375, -25.705078125, -24.6298828125, -23.5546875, -22.4794921875, -21.404296875, -20.3291015625, -19.25390625, -18.1787109375, -17.103515625, -16.0283203125, -14.953125, -13.8779296875, -12.802734375, -11.7275390625, -10.65234375, -9.5771484375, -8.501953125, -7.4267578125, -6.3515625, -5.2763671875, -4.201171875, -3.1259765625, -2.05078125, -0.9755859375, 0.099609375, 1.1748046875, 2.25, 3.3251953125, 4.400390625, 5.4755859375, 6.55078125, 7.6259765625, 8.701171875, 9.7763671875, 10.8515625, 11.9267578125, 13.001953125, 14.0771484375, 15.15234375, 16.2275390625, 17.302734375, 18.3779296875, 19.453125, 20.5283203125, 21.603515625, 22.6787109375, 23.75390625, 24.8291015625, 25.904296875, 26.9794921875, 28.0546875, 29.1298828125, 30.205078125, 31.2802734375, 32.35546875, 33.4306640625, 34.505859375, 35.5810546875, 36.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 5.0, 3.0, 7.0, 10.0, 9.0, 7.0, 11.0, 14.0, 12.0, 14.0, 22.0, 25.0, 24.0, 38.0, 48.0, 77.0, 100.0, 145.0, 108.0, 55.0, 50.0, 47.0, 25.0, 31.0, 25.0, 18.0, 18.0, 7.0, 13.0, 8.0, 6.0, 5.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.534423828125, -15.99072265625, -15.447021484375, -14.9033203125, -14.359619140625, -13.81591796875, -13.272216796875, -12.728515625, -12.184814453125, -11.64111328125, -11.097412109375, -10.5537109375, -10.010009765625, -9.46630859375, -8.922607421875, -8.37890625, -7.835205078125, -7.29150390625, -6.747802734375, -6.2041015625, -5.660400390625, -5.11669921875, -4.572998046875, -4.029296875, -3.485595703125, -2.94189453125, -2.398193359375, -1.8544921875, -1.310791015625, -0.76708984375, -0.223388671875, 0.3203125, 0.864013671875, 1.40771484375, 1.951416015625, 2.4951171875, 3.038818359375, 3.58251953125, 4.126220703125, 4.669921875, 5.213623046875, 5.75732421875, 6.301025390625, 6.8447265625, 7.388427734375, 7.93212890625, 8.475830078125, 9.01953125, 9.563232421875, 10.10693359375, 10.650634765625, 11.1943359375, 11.738037109375, 12.28173828125, 12.825439453125, 13.369140625, 13.912841796875, 14.45654296875, 15.000244140625, 15.5439453125, 16.087646484375, 16.63134765625, 17.175048828125, 17.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 15.0, 15.0, 16.0, 18.0, 30.0, 36.0, 29.0, 39.0, 36.0, 42.0, 51.0, 63.0, 65.0, 53.0, 52.0, 54.0, 53.0, 47.0, 59.0, 28.0, 39.0, 37.0, 35.0, 24.0, 15.0, 15.0, 8.0, 7.0, 8.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.163423538208008, -24.25939178466797, -23.355361938476562, -22.451330184936523, -21.547300338745117, -20.643268585205078, -19.739238739013672, -18.835206985473633, -17.931175231933594, -17.027143478393555, -16.12311363220215, -15.21908187866211, -14.315052032470703, -13.411020278930664, -12.506989479064941, -11.602958679199219, -10.698928833007812, -9.79489803314209, -8.890867233276367, -7.986835956573486, -7.082805156707764, -6.178774356842041, -5.27474308013916, -4.3707122802734375, -3.466681480407715, -2.562650680541992, -1.6586196422576904, -0.7545886039733887, 0.14944219589233398, 1.0534729957580566, 1.9575042724609375, 2.86153507232666, 3.7655677795410156, 4.669598579406738, 5.573629379272461, 6.477660655975342, 7.3816914558410645, 8.285722732543945, 9.189753532409668, 10.09378433227539, 10.997815132141113, 11.901845932006836, 12.805876731872559, 13.709907531738281, 14.61393928527832, 15.517969131469727, 16.422000885009766, 17.326030731201172, 18.23006248474121, 19.13409423828125, 20.038124084472656, 20.942155838012695, 21.8461856842041, 22.75021743774414, 23.654247283935547, 24.558279037475586, 25.462310791015625, 26.366342544555664, 27.27037239074707, 28.17440414428711, 29.078433990478516, 29.982465744018555, 30.886497497558594, 31.79052734375, 32.694557189941406]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 7.0, 9.0, 9.0, 9.0, 17.0, 22.0, 23.0, 17.0, 24.0, 26.0, 28.0, 27.0, 31.0, 37.0, 43.0, 38.0, 46.0, 36.0, 38.0, 39.0, 33.0, 36.0, 31.0, 34.0, 40.0, 22.0, 45.0, 30.0, 27.0, 20.0, 19.0, 19.0, 14.0, 16.0, 11.0, 11.0, 8.0, 13.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.623764038085938, -22.84136199951172, -22.0589599609375, -21.27655792236328, -20.494157791137695, -19.711755752563477, -18.929353713989258, -18.14695167541504, -17.364551544189453, -16.582149505615234, -15.799748420715332, -15.017346382141113, -14.234945297241211, -13.452543258666992, -12.670141220092773, -11.887739181518555, -11.105337142944336, -10.322935104370117, -9.540534019470215, -8.758131980895996, -7.9757304191589355, -7.193328857421875, -6.410926818847656, -5.628525257110596, -4.846123695373535, -4.063722133636475, -3.281320333480835, -2.4989185333251953, -1.7165169715881348, -0.9341154098510742, -0.15171337127685547, 0.6306881904602051, 1.4130916595458984, 2.195493221282959, 2.9778950214385986, 3.7602968215942383, 4.542698383331299, 5.325099945068359, 6.107501983642578, 6.889903545379639, 7.672305107116699, 8.454707145690918, 9.23710823059082, 10.019510269165039, 10.801912307739258, 11.58431339263916, 12.366715431213379, 13.149116516113281, 13.9315185546875, 14.713920593261719, 15.496321678161621, 16.278724670410156, 17.061124801635742, 17.84352684020996, 18.62592887878418, 19.4083309173584, 20.190731048583984, 20.973133087158203, 21.755535125732422, 22.53793716430664, 23.320337295532227, 24.102739334106445, 24.885141372680664, 25.667543411254883, 26.4499454498291]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 2.0, 15.0, 13.0, 32.0, 38.0, 54.0, 96.0, 142.0, 192.0, 332.0, 504.0, 911.0, 1353.0, 2122.0, 3414.0, 5209.0, 8205.0, 12867.0, 19678.0, 29120.0, 42396.0, 59674.0, 78535.0, 96921.0, 110631.0, 115325.0, 109482.0, 95110.0, 76323.0, 57830.0, 41448.0, 28044.0, 18821.0, 12248.0, 7782.0, 5081.0, 3145.0, 1996.0, 1256.0, 775.0, 497.0, 354.0, 234.0, 124.0, 84.0, 56.0, 33.0, 20.0, 13.0, 9.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-16.515625, -16.006591796875, -15.49755859375, -14.988525390625, -14.4794921875, -13.970458984375, -13.46142578125, -12.952392578125, -12.443359375, -11.934326171875, -11.42529296875, -10.916259765625, -10.4072265625, -9.898193359375, -9.38916015625, -8.880126953125, -8.37109375, -7.862060546875, -7.35302734375, -6.843994140625, -6.3349609375, -5.825927734375, -5.31689453125, -4.807861328125, -4.298828125, -3.789794921875, -3.28076171875, -2.771728515625, -2.2626953125, -1.753662109375, -1.24462890625, -0.735595703125, -0.2265625, 0.282470703125, 0.79150390625, 1.300537109375, 1.8095703125, 2.318603515625, 2.82763671875, 3.336669921875, 3.845703125, 4.354736328125, 4.86376953125, 5.372802734375, 5.8818359375, 6.390869140625, 6.89990234375, 7.408935546875, 7.91796875, 8.427001953125, 8.93603515625, 9.445068359375, 9.9541015625, 10.463134765625, 10.97216796875, 11.481201171875, 11.990234375, 12.499267578125, 13.00830078125, 13.517333984375, 14.0263671875, 14.535400390625, 15.04443359375, 15.553466796875, 16.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 4.0, 5.0, 3.0, 10.0, 14.0, 12.0, 17.0, 21.0, 15.0, 22.0, 24.0, 30.0, 30.0, 31.0, 41.0, 33.0, 36.0, 41.0, 35.0, 43.0, 40.0, 37.0, 26.0, 41.0, 37.0, 34.0, 48.0, 27.0, 25.0, 23.0, 18.0, 20.0, 21.0, 20.0, 15.0, 15.0, 13.0, 13.0, 8.0, 7.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.1875, -21.440185546875, -20.69287109375, -19.945556640625, -19.1982421875, -18.450927734375, -17.70361328125, -16.956298828125, -16.208984375, -15.461669921875, -14.71435546875, -13.967041015625, -13.2197265625, -12.472412109375, -11.72509765625, -10.977783203125, -10.23046875, -9.483154296875, -8.73583984375, -7.988525390625, -7.2412109375, -6.493896484375, -5.74658203125, -4.999267578125, -4.251953125, -3.504638671875, -2.75732421875, -2.010009765625, -1.2626953125, -0.515380859375, 0.23193359375, 0.979248046875, 1.7265625, 2.473876953125, 3.22119140625, 3.968505859375, 4.7158203125, 5.463134765625, 6.21044921875, 6.957763671875, 7.705078125, 8.452392578125, 9.19970703125, 9.947021484375, 10.6943359375, 11.441650390625, 12.18896484375, 12.936279296875, 13.68359375, 14.430908203125, 15.17822265625, 15.925537109375, 16.6728515625, 17.420166015625, 18.16748046875, 18.914794921875, 19.662109375, 20.409423828125, 21.15673828125, 21.904052734375, 22.6513671875, 23.398681640625, 24.14599609375, 24.893310546875, 25.640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 23.0, 34.0, 37.0, 65.0, 97.0, 171.0, 247.0, 421.0, 677.0, 1057.0, 1790.0, 2771.0, 4405.0, 7330.0, 11687.0, 19050.0, 30067.0, 46098.0, 69042.0, 94694.0, 119314.0, 135038.0, 131570.0, 113148.0, 87064.0, 61768.0, 40802.0, 26452.0, 16548.0, 10355.0, 6441.0, 3908.0, 2403.0, 1439.0, 944.0, 591.0, 332.0, 233.0, 162.0, 96.0, 70.0, 34.0, 29.0, 11.0, 11.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.763916015625, -18.09033203125, -17.416748046875, -16.7431640625, -16.069580078125, -15.39599609375, -14.722412109375, -14.048828125, -13.375244140625, -12.70166015625, -12.028076171875, -11.3544921875, -10.680908203125, -10.00732421875, -9.333740234375, -8.66015625, -7.986572265625, -7.31298828125, -6.639404296875, -5.9658203125, -5.292236328125, -4.61865234375, -3.945068359375, -3.271484375, -2.597900390625, -1.92431640625, -1.250732421875, -0.5771484375, 0.096435546875, 0.77001953125, 1.443603515625, 2.1171875, 2.790771484375, 3.46435546875, 4.137939453125, 4.8115234375, 5.485107421875, 6.15869140625, 6.832275390625, 7.505859375, 8.179443359375, 8.85302734375, 9.526611328125, 10.2001953125, 10.873779296875, 11.54736328125, 12.220947265625, 12.89453125, 13.568115234375, 14.24169921875, 14.915283203125, 15.5888671875, 16.262451171875, 16.93603515625, 17.609619140625, 18.283203125, 18.956787109375, 19.63037109375, 20.303955078125, 20.9775390625, 21.651123046875, 22.32470703125, 22.998291015625, 23.671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 20.0, 16.0, 11.0, 14.0, 25.0, 19.0, 35.0, 24.0, 28.0, 31.0, 33.0, 31.0, 36.0, 46.0, 48.0, 39.0, 37.0, 49.0, 38.0, 38.0, 39.0, 38.0, 38.0, 27.0, 27.0, 24.0, 22.0, 17.0, 30.0, 20.0, 11.0, 19.0, 17.0, 10.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-20.984375, -20.398193359375, -19.81201171875, -19.225830078125, -18.6396484375, -18.053466796875, -17.46728515625, -16.881103515625, -16.294921875, -15.708740234375, -15.12255859375, -14.536376953125, -13.9501953125, -13.364013671875, -12.77783203125, -12.191650390625, -11.60546875, -11.019287109375, -10.43310546875, -9.846923828125, -9.2607421875, -8.674560546875, -8.08837890625, -7.502197265625, -6.916015625, -6.329833984375, -5.74365234375, -5.157470703125, -4.5712890625, -3.985107421875, -3.39892578125, -2.812744140625, -2.2265625, -1.640380859375, -1.05419921875, -0.468017578125, 0.1181640625, 0.704345703125, 1.29052734375, 1.876708984375, 2.462890625, 3.049072265625, 3.63525390625, 4.221435546875, 4.8076171875, 5.393798828125, 5.97998046875, 6.566162109375, 7.15234375, 7.738525390625, 8.32470703125, 8.910888671875, 9.4970703125, 10.083251953125, 10.66943359375, 11.255615234375, 11.841796875, 12.427978515625, 13.01416015625, 13.600341796875, 14.1865234375, 14.772705078125, 15.35888671875, 15.945068359375, 16.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 18.0, 31.0, 38.0, 63.0, 85.0, 137.0, 226.0, 391.0, 715.0, 1386.0, 3018.0, 6690.0, 16545.0, 45867.0, 141009.0, 335318.0, 310306.0, 121045.0, 39433.0, 14446.0, 6134.0, 2708.0, 1235.0, 681.0, 432.0, 218.0, 122.0, 84.0, 59.0, 35.0, 16.0, 18.0, 14.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.361083984375, -31.37841796875, -30.395751953125, -29.4130859375, -28.430419921875, -27.44775390625, -26.465087890625, -25.482421875, -24.499755859375, -23.51708984375, -22.534423828125, -21.5517578125, -20.569091796875, -19.58642578125, -18.603759765625, -17.62109375, -16.638427734375, -15.65576171875, -14.673095703125, -13.6904296875, -12.707763671875, -11.72509765625, -10.742431640625, -9.759765625, -8.777099609375, -7.79443359375, -6.811767578125, -5.8291015625, -4.846435546875, -3.86376953125, -2.881103515625, -1.8984375, -0.915771484375, 0.06689453125, 1.049560546875, 2.0322265625, 3.014892578125, 3.99755859375, 4.980224609375, 5.962890625, 6.945556640625, 7.92822265625, 8.910888671875, 9.8935546875, 10.876220703125, 11.85888671875, 12.841552734375, 13.82421875, 14.806884765625, 15.78955078125, 16.772216796875, 17.7548828125, 18.737548828125, 19.72021484375, 20.702880859375, 21.685546875, 22.668212890625, 23.65087890625, 24.633544921875, 25.6162109375, 26.598876953125, 27.58154296875, 28.564208984375, 29.546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 12.0, 22.0, 27.0, 31.0, 45.0, 68.0, 75.0, 64.0, 86.0, 96.0, 107.0, 98.0, 60.0, 58.0, 44.0, 28.0, 21.0, 14.0, 9.0, 9.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00316619873046875, -0.003093242645263672, -0.0030202865600585938, -0.0029473304748535156, -0.0028743743896484375, -0.0028014183044433594, -0.0027284622192382812, -0.002655506134033203, -0.002582550048828125, -0.002509593963623047, -0.0024366378784179688, -0.0023636817932128906, -0.0022907257080078125, -0.0022177696228027344, -0.0021448135375976562, -0.002071857452392578, -0.0019989013671875, -0.0019259452819824219, -0.0018529891967773438, -0.0017800331115722656, -0.0017070770263671875, -0.0016341209411621094, -0.0015611648559570312, -0.0014882087707519531, -0.001415252685546875, -0.0013422966003417969, -0.0012693405151367188, -0.0011963844299316406, -0.0011234283447265625, -0.0010504722595214844, -0.0009775161743164062, -0.0009045600891113281, -0.00083160400390625, -0.0007586479187011719, -0.0006856918334960938, -0.0006127357482910156, -0.0005397796630859375, -0.0004668235778808594, -0.00039386749267578125, -0.0003209114074707031, -0.000247955322265625, -0.00017499923706054688, -0.00010204315185546875, -2.9087066650390625e-05, 4.38690185546875e-05, 0.00011682510375976562, 0.00018978118896484375, 0.0002627372741699219, 0.000335693359375, 0.0004086494445800781, 0.00048160552978515625, 0.0005545616149902344, 0.0006275177001953125, 0.0007004737854003906, 0.0007734298706054688, 0.0008463859558105469, 0.000919342041015625, 0.0009922981262207031, 0.0010652542114257812, 0.0011382102966308594, 0.0012111663818359375, 0.0012841224670410156, 0.0013570785522460938, 0.0014300346374511719, 0.00150299072265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 8.0, 13.0, 8.0, 16.0, 21.0, 34.0, 56.0, 76.0, 92.0, 135.0, 199.0, 293.0, 422.0, 592.0, 827.0, 1331.0, 1941.0, 3199.0, 5232.0, 8563.0, 15148.0, 27463.0, 49963.0, 88290.0, 140126.0, 183069.0, 182509.0, 138982.0, 86878.0, 49005.0, 26804.0, 14622.0, 8400.0, 5029.0, 3104.0, 1964.0, 1319.0, 912.0, 565.0, 392.0, 308.0, 177.0, 141.0, 115.0, 66.0, 50.0, 31.0, 22.0, 13.0, 15.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.734375, -14.273681640625, -13.81298828125, -13.352294921875, -12.8916015625, -12.430908203125, -11.97021484375, -11.509521484375, -11.048828125, -10.588134765625, -10.12744140625, -9.666748046875, -9.2060546875, -8.745361328125, -8.28466796875, -7.823974609375, -7.36328125, -6.902587890625, -6.44189453125, -5.981201171875, -5.5205078125, -5.059814453125, -4.59912109375, -4.138427734375, -3.677734375, -3.217041015625, -2.75634765625, -2.295654296875, -1.8349609375, -1.374267578125, -0.91357421875, -0.452880859375, 0.0078125, 0.468505859375, 0.92919921875, 1.389892578125, 1.8505859375, 2.311279296875, 2.77197265625, 3.232666015625, 3.693359375, 4.154052734375, 4.61474609375, 5.075439453125, 5.5361328125, 5.996826171875, 6.45751953125, 6.918212890625, 7.37890625, 7.839599609375, 8.30029296875, 8.760986328125, 9.2216796875, 9.682373046875, 10.14306640625, 10.603759765625, 11.064453125, 11.525146484375, 11.98583984375, 12.446533203125, 12.9072265625, 13.367919921875, 13.82861328125, 14.289306640625, 14.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 7.0, 5.0, 9.0, 10.0, 14.0, 19.0, 20.0, 43.0, 30.0, 45.0, 62.0, 50.0, 65.0, 74.0, 64.0, 69.0, 72.0, 71.0, 48.0, 48.0, 43.0, 14.0, 30.0, 9.0, 11.0, 18.0, 5.0, 10.0, 5.0, 6.0, 4.0, 0.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.30078125, -7.04510498046875, -6.7894287109375, -6.53375244140625, -6.278076171875, -6.02239990234375, -5.7667236328125, -5.51104736328125, -5.25537109375, -4.99969482421875, -4.7440185546875, -4.48834228515625, -4.232666015625, -3.97698974609375, -3.7213134765625, -3.46563720703125, -3.2099609375, -2.95428466796875, -2.6986083984375, -2.44293212890625, -2.187255859375, -1.93157958984375, -1.6759033203125, -1.42022705078125, -1.16455078125, -0.90887451171875, -0.6531982421875, -0.39752197265625, -0.141845703125, 0.11383056640625, 0.3695068359375, 0.62518310546875, 0.880859375, 1.13653564453125, 1.3922119140625, 1.64788818359375, 1.903564453125, 2.15924072265625, 2.4149169921875, 2.67059326171875, 2.92626953125, 3.18194580078125, 3.4376220703125, 3.69329833984375, 3.948974609375, 4.20465087890625, 4.4603271484375, 4.71600341796875, 4.9716796875, 5.22735595703125, 5.4830322265625, 5.73870849609375, 5.994384765625, 6.25006103515625, 6.5057373046875, 6.76141357421875, 7.01708984375, 7.27276611328125, 7.5284423828125, 7.78411865234375, 8.039794921875, 8.29547119140625, 8.5511474609375, 8.80682373046875, 9.0625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 7.0, 7.0, 14.0, 18.0, 22.0, 29.0, 17.0, 30.0, 32.0, 35.0, 39.0, 36.0, 50.0, 52.0, 47.0, 65.0, 60.0, 50.0, 46.0, 47.0, 51.0, 33.0, 32.0, 29.0, 35.0, 29.0, 20.0, 14.0, 10.0, 13.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.14018440246582, -21.32505989074707, -20.509937286376953, -19.694812774658203, -18.879688262939453, -18.064563751220703, -17.249441146850586, -16.434316635131836, -15.619193077087402, -14.804069519042969, -13.988945007324219, -13.173821449279785, -12.358697891235352, -11.543573379516602, -10.728449821472168, -9.913326263427734, -9.098201751708984, -8.28307819366455, -7.467953681945801, -6.652830123901367, -5.837706089019775, -5.022582054138184, -4.20745849609375, -3.392334461212158, -2.5772104263305664, -1.7620865106582642, -0.9469625949859619, -0.13183879852294922, 0.6832852363586426, 1.4984092712402344, 2.313532829284668, 3.1286568641662598, 3.9437789916992188, 4.7589030265808105, 5.574027061462402, 6.389150619506836, 7.204274654388428, 8.01939868927002, 8.834522247314453, 9.649646759033203, 10.464770317077637, 11.27989387512207, 12.09501838684082, 12.910141944885254, 13.725265502929688, 14.540390014648438, 15.355513572692871, 16.170637130737305, 16.985761642456055, 17.800886154174805, 18.616008758544922, 19.431133270263672, 20.246257781982422, 21.061382293701172, 21.87650489807129, 22.69162940979004, 23.506752014160156, 24.321876525878906, 25.136999130249023, 25.952123641967773, 26.767248153686523, 27.58237075805664, 28.39749526977539, 29.21261978149414, 30.02774429321289]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 5.0, 4.0, 6.0, 7.0, 11.0, 11.0, 16.0, 11.0, 14.0, 20.0, 22.0, 24.0, 33.0, 24.0, 29.0, 42.0, 49.0, 34.0, 40.0, 44.0, 49.0, 36.0, 50.0, 41.0, 33.0, 41.0, 38.0, 34.0, 28.0, 29.0, 16.0, 13.0, 26.0, 17.0, 14.0, 12.0, 13.0, 11.0, 9.0, 18.0, 11.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.98694610595703, -24.161849975585938, -23.336753845214844, -22.51165771484375, -21.686561584472656, -20.861465454101562, -20.03636932373047, -19.211273193359375, -18.38617706298828, -17.561080932617188, -16.735984802246094, -15.910888671875, -15.085792541503906, -14.260696411132812, -13.435600280761719, -12.610504150390625, -11.785408973693848, -10.960312843322754, -10.13521671295166, -9.310120582580566, -8.485024452209473, -7.659928798675537, -6.834832668304443, -6.00973653793335, -5.184640407562256, -4.359544277191162, -3.5344481468200684, -2.7093522548675537, -1.88425612449646, -1.0591602325439453, -0.23406410217285156, 0.5910320281982422, 1.416128158569336, 2.2412242889404297, 3.0663204193115234, 3.891416311264038, 4.716512680053711, 5.5416083335876465, 6.36670446395874, 7.191800594329834, 8.016897201538086, 8.84199333190918, 9.667089462280273, 10.492185592651367, 11.317281723022461, 12.142377853393555, 12.967473983764648, 13.792570114135742, 14.61766529083252, 15.442761421203613, 16.26785659790039, 17.092952728271484, 17.918048858642578, 18.743144989013672, 19.568241119384766, 20.39333724975586, 21.218433380126953, 22.043529510498047, 22.86862564086914, 23.693721771240234, 24.518817901611328, 25.343914031982422, 26.169010162353516, 26.99410629272461, 27.819202423095703]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [6.0, 2.0, 3.0, 11.0, 10.0, 21.0, 25.0, 54.0, 63.0, 118.0, 181.0, 280.0, 398.0, 701.0, 1029.0, 1623.0, 2695.0, 4102.0, 6588.0, 10400.0, 16693.0, 26871.0, 43431.0, 69475.0, 109633.0, 168860.0, 249833.0, 345825.0, 441087.0, 506787.0, 517456.0, 469642.0, 380972.0, 283356.0, 194654.0, 127184.0, 81073.0, 50641.0, 31236.0, 19174.0, 11986.0, 7511.0, 4754.0, 2864.0, 1850.0, 1142.0, 689.0, 467.0, 304.0, 197.0, 121.0, 82.0, 52.0, 41.0, 21.0, 10.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.807861328125, -13.33447265625, -12.861083984375, -12.3876953125, -11.914306640625, -11.44091796875, -10.967529296875, -10.494140625, -10.020751953125, -9.54736328125, -9.073974609375, -8.6005859375, -8.127197265625, -7.65380859375, -7.180419921875, -6.70703125, -6.233642578125, -5.76025390625, -5.286865234375, -4.8134765625, -4.340087890625, -3.86669921875, -3.393310546875, -2.919921875, -2.446533203125, -1.97314453125, -1.499755859375, -1.0263671875, -0.552978515625, -0.07958984375, 0.393798828125, 0.8671875, 1.340576171875, 1.81396484375, 2.287353515625, 2.7607421875, 3.234130859375, 3.70751953125, 4.180908203125, 4.654296875, 5.127685546875, 5.60107421875, 6.074462890625, 6.5478515625, 7.021240234375, 7.49462890625, 7.968017578125, 8.44140625, 8.914794921875, 9.38818359375, 9.861572265625, 10.3349609375, 10.808349609375, 11.28173828125, 11.755126953125, 12.228515625, 12.701904296875, 13.17529296875, 13.648681640625, 14.1220703125, 14.595458984375, 15.06884765625, 15.542236328125, 16.015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 6.0, 9.0, 5.0, 8.0, 17.0, 15.0, 21.0, 12.0, 20.0, 26.0, 31.0, 37.0, 46.0, 33.0, 40.0, 39.0, 37.0, 60.0, 36.0, 36.0, 44.0, 43.0, 49.0, 36.0, 28.0, 36.0, 27.0, 27.0, 19.0, 28.0, 19.0, 13.0, 18.0, 15.0, 13.0, 9.0, 8.0, 8.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.448974609375, -18.75732421875, -18.065673828125, -17.3740234375, -16.682373046875, -15.99072265625, -15.299072265625, -14.607421875, -13.915771484375, -13.22412109375, -12.532470703125, -11.8408203125, -11.149169921875, -10.45751953125, -9.765869140625, -9.07421875, -8.382568359375, -7.69091796875, -6.999267578125, -6.3076171875, -5.615966796875, -4.92431640625, -4.232666015625, -3.541015625, -2.849365234375, -2.15771484375, -1.466064453125, -0.7744140625, -0.082763671875, 0.60888671875, 1.300537109375, 1.9921875, 2.683837890625, 3.37548828125, 4.067138671875, 4.7587890625, 5.450439453125, 6.14208984375, 6.833740234375, 7.525390625, 8.217041015625, 8.90869140625, 9.600341796875, 10.2919921875, 10.983642578125, 11.67529296875, 12.366943359375, 13.05859375, 13.750244140625, 14.44189453125, 15.133544921875, 15.8251953125, 16.516845703125, 17.20849609375, 17.900146484375, 18.591796875, 19.283447265625, 19.97509765625, 20.666748046875, 21.3583984375, 22.050048828125, 22.74169921875, 23.433349609375, 24.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 18.0, 15.0, 28.0, 42.0, 73.0, 121.0, 199.0, 341.0, 547.0, 807.0, 1406.0, 2348.0, 3903.0, 6599.0, 10908.0, 18151.0, 29493.0, 48699.0, 77264.0, 120593.0, 181727.0, 260787.0, 352846.0, 441256.0, 498357.0, 503226.0, 453310.0, 368168.0, 276057.0, 192767.0, 128462.0, 82593.0, 51800.0, 32033.0, 19494.0, 11785.0, 7079.0, 4422.0, 2581.0, 1542.0, 945.0, 546.0, 356.0, 243.0, 137.0, 84.0, 40.0, 34.0, 22.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0], "bins": [-17.5, -16.970947265625, -16.44189453125, -15.912841796875, -15.3837890625, -14.854736328125, -14.32568359375, -13.796630859375, -13.267578125, -12.738525390625, -12.20947265625, -11.680419921875, -11.1513671875, -10.622314453125, -10.09326171875, -9.564208984375, -9.03515625, -8.506103515625, -7.97705078125, -7.447998046875, -6.9189453125, -6.389892578125, -5.86083984375, -5.331787109375, -4.802734375, -4.273681640625, -3.74462890625, -3.215576171875, -2.6865234375, -2.157470703125, -1.62841796875, -1.099365234375, -0.5703125, -0.041259765625, 0.48779296875, 1.016845703125, 1.5458984375, 2.074951171875, 2.60400390625, 3.133056640625, 3.662109375, 4.191162109375, 4.72021484375, 5.249267578125, 5.7783203125, 6.307373046875, 6.83642578125, 7.365478515625, 7.89453125, 8.423583984375, 8.95263671875, 9.481689453125, 10.0107421875, 10.539794921875, 11.06884765625, 11.597900390625, 12.126953125, 12.656005859375, 13.18505859375, 13.714111328125, 14.2431640625, 14.772216796875, 15.30126953125, 15.830322265625, 16.359375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 5.0, 14.0, 7.0, 18.0, 27.0, 36.0, 35.0, 54.0, 49.0, 66.0, 96.0, 103.0, 117.0, 143.0, 123.0, 170.0, 188.0, 201.0, 186.0, 188.0, 221.0, 229.0, 233.0, 190.0, 185.0, 199.0, 152.0, 137.0, 115.0, 104.0, 103.0, 71.0, 62.0, 44.0, 39.0, 28.0, 28.0, 27.0, 15.0, 18.0, 5.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.953125, -8.68115234375, -8.4091796875, -8.13720703125, -7.865234375, -7.59326171875, -7.3212890625, -7.04931640625, -6.77734375, -6.50537109375, -6.2333984375, -5.96142578125, -5.689453125, -5.41748046875, -5.1455078125, -4.87353515625, -4.6015625, -4.32958984375, -4.0576171875, -3.78564453125, -3.513671875, -3.24169921875, -2.9697265625, -2.69775390625, -2.42578125, -2.15380859375, -1.8818359375, -1.60986328125, -1.337890625, -1.06591796875, -0.7939453125, -0.52197265625, -0.25, 0.02197265625, 0.2939453125, 0.56591796875, 0.837890625, 1.10986328125, 1.3818359375, 1.65380859375, 1.92578125, 2.19775390625, 2.4697265625, 2.74169921875, 3.013671875, 3.28564453125, 3.5576171875, 3.82958984375, 4.1015625, 4.37353515625, 4.6455078125, 4.91748046875, 5.189453125, 5.46142578125, 5.7333984375, 6.00537109375, 6.27734375, 6.54931640625, 6.8212890625, 7.09326171875, 7.365234375, 7.63720703125, 7.9091796875, 8.18115234375, 8.453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 9.0, 5.0, 7.0, 15.0, 4.0, 17.0, 34.0, 22.0, 25.0, 31.0, 28.0, 41.0, 38.0, 48.0, 51.0, 39.0, 45.0, 66.0, 51.0, 52.0, 54.0, 45.0, 34.0, 51.0, 34.0, 27.0, 16.0, 21.0, 22.0, 17.0, 15.0, 10.0, 9.0, 8.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.552875518798828, -20.764923095703125, -19.976972579956055, -19.18902015686035, -18.40106964111328, -17.613117218017578, -16.825164794921875, -16.037212371826172, -15.249261856079102, -14.461310386657715, -13.673358917236328, -12.885406494140625, -12.097455024719238, -11.309503555297852, -10.521551132202148, -9.733599662780762, -8.945648193359375, -8.157696723937988, -7.369744777679443, -6.581792831420898, -5.793841361999512, -5.005889892578125, -4.21793794631958, -3.429986000061035, -2.6420345306396484, -1.8540828227996826, -1.0661311149597168, -0.278179407119751, 0.5097723007202148, 1.2977240085601807, 2.0856757164001465, 2.8736276626586914, 3.6615772247314453, 4.449528694152832, 5.237480640411377, 6.025432586669922, 6.813384056091309, 7.601335525512695, 8.389287948608398, 9.177239418029785, 9.965190887451172, 10.753142356872559, 11.541093826293945, 12.329046249389648, 13.116997718811035, 13.904949188232422, 14.692901611328125, 15.480853080749512, 16.2688045501709, 17.0567569732666, 17.844707489013672, 18.632659912109375, 19.420612335205078, 20.20856285095215, 20.99651527404785, 21.784465789794922, 22.572418212890625, 23.360370635986328, 24.1483211517334, 24.9362735748291, 25.724224090576172, 26.512176513671875, 27.300128936767578, 28.08808135986328, 28.87603187561035]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 12.0, 7.0, 17.0, 13.0, 19.0, 19.0, 27.0, 30.0, 28.0, 26.0, 49.0, 38.0, 45.0, 37.0, 25.0, 49.0, 44.0, 47.0, 54.0, 31.0, 28.0, 34.0, 29.0, 36.0, 19.0, 31.0, 30.0, 15.0, 15.0, 13.0, 15.0, 16.0, 12.0, 17.0, 7.0, 9.0, 3.0, 9.0, 8.0, 3.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.072805404663086, -23.315345764160156, -22.557886123657227, -21.80042839050293, -21.04296875, -20.28550910949707, -19.52804946899414, -18.770591735839844, -18.013132095336914, -17.255672454833984, -16.498212814331055, -15.740754127502441, -14.983295440673828, -14.225835800170898, -13.468376159667969, -12.710917472839355, -11.953457832336426, -11.195998191833496, -10.438539505004883, -9.681079864501953, -8.92362117767334, -8.16616153717041, -7.408702373504639, -6.651243209838867, -5.893784046173096, -5.136324882507324, -4.378865718841553, -3.621406316757202, -2.8639471530914307, -2.106487989425659, -1.3490285873413086, -0.5915694236755371, 0.16588973999023438, 0.9233489632606506, 1.680808186531067, 2.438267469406128, 3.1957266330718994, 3.953185796737671, 4.7106451988220215, 5.468104362487793, 6.2255635261535645, 6.983022689819336, 7.740481853485107, 8.497941017150879, 9.255400657653809, 10.012859344482422, 10.770318984985352, 11.527778625488281, 12.285237312316895, 13.042696952819824, 13.800155639648438, 14.557615280151367, 15.31507396697998, 16.072532653808594, 16.829992294311523, 17.587451934814453, 18.344911575317383, 19.102371215820312, 19.859830856323242, 20.61728858947754, 21.37474822998047, 22.1322078704834, 22.889667510986328, 23.647125244140625, 24.404584884643555]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 11.0, 10.0, 16.0, 34.0, 39.0, 63.0, 87.0, 134.0, 186.0, 246.0, 365.0, 530.0, 797.0, 1171.0, 1689.0, 2591.0, 3878.0, 5662.0, 8432.0, 12723.0, 18935.0, 29591.0, 45826.0, 74023.0, 121248.0, 174733.0, 183303.0, 133248.0, 82578.0, 51117.0, 32256.0, 20959.0, 13926.0, 9252.0, 6195.0, 4024.0, 2699.0, 1877.0, 1256.0, 890.0, 619.0, 410.0, 300.0, 190.0, 137.0, 101.0, 78.0, 44.0, 35.0, 16.0, 17.0, 10.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.265625, -23.459716796875, -22.65380859375, -21.847900390625, -21.0419921875, -20.236083984375, -19.43017578125, -18.624267578125, -17.818359375, -17.012451171875, -16.20654296875, -15.400634765625, -14.5947265625, -13.788818359375, -12.98291015625, -12.177001953125, -11.37109375, -10.565185546875, -9.75927734375, -8.953369140625, -8.1474609375, -7.341552734375, -6.53564453125, -5.729736328125, -4.923828125, -4.117919921875, -3.31201171875, -2.506103515625, -1.7001953125, -0.894287109375, -0.08837890625, 0.717529296875, 1.5234375, 2.329345703125, 3.13525390625, 3.941162109375, 4.7470703125, 5.552978515625, 6.35888671875, 7.164794921875, 7.970703125, 8.776611328125, 9.58251953125, 10.388427734375, 11.1943359375, 12.000244140625, 12.80615234375, 13.612060546875, 14.41796875, 15.223876953125, 16.02978515625, 16.835693359375, 17.6416015625, 18.447509765625, 19.25341796875, 20.059326171875, 20.865234375, 21.671142578125, 22.47705078125, 23.282958984375, 24.0888671875, 24.894775390625, 25.70068359375, 26.506591796875, 27.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 2.0, 8.0, 14.0, 17.0, 17.0, 14.0, 15.0, 32.0, 25.0, 27.0, 32.0, 42.0, 32.0, 36.0, 50.0, 54.0, 34.0, 56.0, 38.0, 41.0, 39.0, 39.0, 44.0, 25.0, 34.0, 19.0, 27.0, 30.0, 22.0, 16.0, 18.0, 16.0, 15.0, 14.0, 11.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.515869140625, -23.75048828125, -22.985107421875, -22.2197265625, -21.454345703125, -20.68896484375, -19.923583984375, -19.158203125, -18.392822265625, -17.62744140625, -16.862060546875, -16.0966796875, -15.331298828125, -14.56591796875, -13.800537109375, -13.03515625, -12.269775390625, -11.50439453125, -10.739013671875, -9.9736328125, -9.208251953125, -8.44287109375, -7.677490234375, -6.912109375, -6.146728515625, -5.38134765625, -4.615966796875, -3.8505859375, -3.085205078125, -2.31982421875, -1.554443359375, -0.7890625, -0.023681640625, 0.74169921875, 1.507080078125, 2.2724609375, 3.037841796875, 3.80322265625, 4.568603515625, 5.333984375, 6.099365234375, 6.86474609375, 7.630126953125, 8.3955078125, 9.160888671875, 9.92626953125, 10.691650390625, 11.45703125, 12.222412109375, 12.98779296875, 13.753173828125, 14.5185546875, 15.283935546875, 16.04931640625, 16.814697265625, 17.580078125, 18.345458984375, 19.11083984375, 19.876220703125, 20.6416015625, 21.406982421875, 22.17236328125, 22.937744140625, 23.703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 22.0, 39.0, 33.0, 53.0, 82.0, 114.0, 189.0, 255.0, 349.0, 524.0, 816.0, 1157.0, 1735.0, 2620.0, 4162.0, 6359.0, 10060.0, 15883.0, 25987.0, 44026.0, 77628.0, 145491.0, 234267.0, 204785.0, 114606.0, 61942.0, 35787.0, 21954.0, 13550.0, 8311.0, 5484.0, 3547.0, 2245.0, 1502.0, 971.0, 673.0, 406.0, 281.0, 190.0, 136.0, 106.0, 68.0, 57.0, 24.0, 21.0, 19.0, 11.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.65625, -25.73095703125, -24.8056640625, -23.88037109375, -22.955078125, -22.02978515625, -21.1044921875, -20.17919921875, -19.25390625, -18.32861328125, -17.4033203125, -16.47802734375, -15.552734375, -14.62744140625, -13.7021484375, -12.77685546875, -11.8515625, -10.92626953125, -10.0009765625, -9.07568359375, -8.150390625, -7.22509765625, -6.2998046875, -5.37451171875, -4.44921875, -3.52392578125, -2.5986328125, -1.67333984375, -0.748046875, 0.17724609375, 1.1025390625, 2.02783203125, 2.953125, 3.87841796875, 4.8037109375, 5.72900390625, 6.654296875, 7.57958984375, 8.5048828125, 9.43017578125, 10.35546875, 11.28076171875, 12.2060546875, 13.13134765625, 14.056640625, 14.98193359375, 15.9072265625, 16.83251953125, 17.7578125, 18.68310546875, 19.6083984375, 20.53369140625, 21.458984375, 22.38427734375, 23.3095703125, 24.23486328125, 25.16015625, 26.08544921875, 27.0107421875, 27.93603515625, 28.861328125, 29.78662109375, 30.7119140625, 31.63720703125, 32.5625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 14.0, 22.0, 21.0, 22.0, 19.0, 20.0, 30.0, 38.0, 35.0, 43.0, 36.0, 42.0, 49.0, 38.0, 42.0, 46.0, 39.0, 48.0, 49.0, 44.0, 44.0, 40.0, 34.0, 23.0, 27.0, 14.0, 16.0, 17.0, 14.0, 13.0, 10.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.34375, -21.69140625, -21.0390625, -20.38671875, -19.734375, -19.08203125, -18.4296875, -17.77734375, -17.125, -16.47265625, -15.8203125, -15.16796875, -14.515625, -13.86328125, -13.2109375, -12.55859375, -11.90625, -11.25390625, -10.6015625, -9.94921875, -9.296875, -8.64453125, -7.9921875, -7.33984375, -6.6875, -6.03515625, -5.3828125, -4.73046875, -4.078125, -3.42578125, -2.7734375, -2.12109375, -1.46875, -0.81640625, -0.1640625, 0.48828125, 1.140625, 1.79296875, 2.4453125, 3.09765625, 3.75, 4.40234375, 5.0546875, 5.70703125, 6.359375, 7.01171875, 7.6640625, 8.31640625, 8.96875, 9.62109375, 10.2734375, 10.92578125, 11.578125, 12.23046875, 12.8828125, 13.53515625, 14.1875, 14.83984375, 15.4921875, 16.14453125, 16.796875, 17.44921875, 18.1015625, 18.75390625, 19.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 7.0, 10.0, 15.0, 30.0, 29.0, 41.0, 73.0, 95.0, 144.0, 209.0, 304.0, 444.0, 603.0, 914.0, 1437.0, 2210.0, 3426.0, 5587.0, 9454.0, 16982.0, 39296.0, 209795.0, 617677.0, 81711.0, 25370.0, 12774.0, 7364.0, 4412.0, 2721.0, 1793.0, 1183.0, 765.0, 557.0, 346.0, 211.0, 146.0, 126.0, 76.0, 49.0, 40.0, 35.0, 31.0, 17.0, 14.0, 10.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.6875, -55.89990234375, -54.1123046875, -52.32470703125, -50.537109375, -48.74951171875, -46.9619140625, -45.17431640625, -43.38671875, -41.59912109375, -39.8115234375, -38.02392578125, -36.236328125, -34.44873046875, -32.6611328125, -30.87353515625, -29.0859375, -27.29833984375, -25.5107421875, -23.72314453125, -21.935546875, -20.14794921875, -18.3603515625, -16.57275390625, -14.78515625, -12.99755859375, -11.2099609375, -9.42236328125, -7.634765625, -5.84716796875, -4.0595703125, -2.27197265625, -0.484375, 1.30322265625, 3.0908203125, 4.87841796875, 6.666015625, 8.45361328125, 10.2412109375, 12.02880859375, 13.81640625, 15.60400390625, 17.3916015625, 19.17919921875, 20.966796875, 22.75439453125, 24.5419921875, 26.32958984375, 28.1171875, 29.90478515625, 31.6923828125, 33.47998046875, 35.267578125, 37.05517578125, 38.8427734375, 40.63037109375, 42.41796875, 44.20556640625, 45.9931640625, 47.78076171875, 49.568359375, 51.35595703125, 53.1435546875, 54.93115234375, 56.71875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 14.0, 9.0, 9.0, 16.0, 41.0, 82.0, 267.0, 319.0, 100.0, 30.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00960540771484375, -0.009371817111968994, -0.009138226509094238, -0.008904635906219482, -0.008671045303344727, -0.00843745470046997, -0.008203864097595215, -0.007970273494720459, -0.007736682891845703, -0.007503092288970947, -0.007269501686096191, -0.0070359110832214355, -0.00680232048034668, -0.006568729877471924, -0.006335139274597168, -0.006101548671722412, -0.005867958068847656, -0.0056343674659729, -0.0054007768630981445, -0.005167186260223389, -0.004933595657348633, -0.004700005054473877, -0.004466414451599121, -0.004232823848724365, -0.003999233245849609, -0.0037656426429748535, -0.0035320520401000977, -0.003298461437225342, -0.003064870834350586, -0.00283128023147583, -0.0025976896286010742, -0.0023640990257263184, -0.0021305084228515625, -0.0018969178199768066, -0.0016633272171020508, -0.001429736614227295, -0.001196146011352539, -0.0009625554084777832, -0.0007289648056030273, -0.0004953742027282715, -0.0002617835998535156, -2.8192996978759766e-05, 0.0002053976058959961, 0.00043898820877075195, 0.0006725788116455078, 0.0009061694145202637, 0.0011397600173950195, 0.0013733506202697754, 0.0016069412231445312, 0.0018405318260192871, 0.002074122428894043, 0.002307713031768799, 0.0025413036346435547, 0.0027748942375183105, 0.0030084848403930664, 0.0032420754432678223, 0.003475666046142578, 0.003709256649017334, 0.00394284725189209, 0.004176437854766846, 0.0044100284576416016, 0.004643619060516357, 0.004877209663391113, 0.005110800266265869, 0.005344390869140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 23.0, 24.0, 42.0, 66.0, 92.0, 127.0, 166.0, 259.0, 327.0, 464.0, 643.0, 864.0, 1164.0, 1665.0, 2335.0, 3480.0, 5309.0, 8466.0, 14392.0, 28080.0, 75952.0, 344927.0, 397750.0, 88498.0, 31052.0, 15410.0, 8983.0, 5697.0, 3637.0, 2458.0, 1783.0, 1176.0, 862.0, 659.0, 434.0, 336.0, 269.0, 187.0, 140.0, 101.0, 70.0, 54.0, 30.0, 22.0, 17.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.65625, -34.42919921875, -33.2021484375, -31.97509765625, -30.748046875, -29.52099609375, -28.2939453125, -27.06689453125, -25.83984375, -24.61279296875, -23.3857421875, -22.15869140625, -20.931640625, -19.70458984375, -18.4775390625, -17.25048828125, -16.0234375, -14.79638671875, -13.5693359375, -12.34228515625, -11.115234375, -9.88818359375, -8.6611328125, -7.43408203125, -6.20703125, -4.97998046875, -3.7529296875, -2.52587890625, -1.298828125, -0.07177734375, 1.1552734375, 2.38232421875, 3.609375, 4.83642578125, 6.0634765625, 7.29052734375, 8.517578125, 9.74462890625, 10.9716796875, 12.19873046875, 13.42578125, 14.65283203125, 15.8798828125, 17.10693359375, 18.333984375, 19.56103515625, 20.7880859375, 22.01513671875, 23.2421875, 24.46923828125, 25.6962890625, 26.92333984375, 28.150390625, 29.37744140625, 30.6044921875, 31.83154296875, 33.05859375, 34.28564453125, 35.5126953125, 36.73974609375, 37.966796875, 39.19384765625, 40.4208984375, 41.64794921875, 42.875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 2.0, 6.0, 5.0, 3.0, 7.0, 4.0, 11.0, 21.0, 27.0, 54.0, 69.0, 177.0, 222.0, 164.0, 81.0, 30.0, 28.0, 22.0, 9.0, 6.0, 9.0, 6.0, 9.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.109375, -19.490966796875, -18.87255859375, -18.254150390625, -17.6357421875, -17.017333984375, -16.39892578125, -15.780517578125, -15.162109375, -14.543701171875, -13.92529296875, -13.306884765625, -12.6884765625, -12.070068359375, -11.45166015625, -10.833251953125, -10.21484375, -9.596435546875, -8.97802734375, -8.359619140625, -7.7412109375, -7.122802734375, -6.50439453125, -5.885986328125, -5.267578125, -4.649169921875, -4.03076171875, -3.412353515625, -2.7939453125, -2.175537109375, -1.55712890625, -0.938720703125, -0.3203125, 0.298095703125, 0.91650390625, 1.534912109375, 2.1533203125, 2.771728515625, 3.39013671875, 4.008544921875, 4.626953125, 5.245361328125, 5.86376953125, 6.482177734375, 7.1005859375, 7.718994140625, 8.33740234375, 8.955810546875, 9.57421875, 10.192626953125, 10.81103515625, 11.429443359375, 12.0478515625, 12.666259765625, 13.28466796875, 13.903076171875, 14.521484375, 15.139892578125, 15.75830078125, 16.376708984375, 16.9951171875, 17.613525390625, 18.23193359375, 18.850341796875, 19.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 5.0, 16.0, 14.0, 15.0, 12.0, 33.0, 37.0, 36.0, 39.0, 50.0, 56.0, 54.0, 53.0, 51.0, 55.0, 54.0, 53.0, 57.0, 45.0, 55.0, 28.0, 42.0, 27.0, 18.0, 11.0, 12.0, 18.0, 12.0, 8.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.906810760498047, -28.981761932373047, -28.05671501159668, -27.13166618347168, -26.20661735534668, -25.281570434570312, -24.356521606445312, -23.431472778320312, -22.506423950195312, -21.581375122070312, -20.656328201293945, -19.731279373168945, -18.806230545043945, -17.881183624267578, -16.956134796142578, -16.031085968017578, -15.106039047241211, -14.180991172790527, -13.255942344665527, -12.330894470214844, -11.405845642089844, -10.48079776763916, -9.555749893188477, -8.630701065063477, -7.705653190612793, -6.780604839324951, -5.855556488037109, -4.930508613586426, -4.005460262298584, -3.080411911010742, -2.1553640365600586, -1.2303156852722168, -0.3052692413330078, 0.6197789907455444, 1.5448272228240967, 2.4698753356933594, 3.394923686981201, 4.319972038269043, 5.245019912719727, 6.170068264007568, 7.09511661529541, 8.020164489746094, 8.945213317871094, 9.870261192321777, 10.795309066772461, 11.720357894897461, 12.645405769348145, 13.570453643798828, 14.495502471923828, 15.420550346374512, 16.345598220825195, 17.270647048950195, 18.195695877075195, 19.120742797851562, 20.045791625976562, 20.970840454101562, 21.895889282226562, 22.820938110351562, 23.74598503112793, 24.67103385925293, 25.59608268737793, 26.521129608154297, 27.446178436279297, 28.371227264404297, 29.296274185180664]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 8.0, 12.0, 22.0, 16.0, 17.0, 32.0, 33.0, 32.0, 32.0, 30.0, 28.0, 35.0, 41.0, 49.0, 48.0, 40.0, 39.0, 41.0, 33.0, 35.0, 38.0, 36.0, 32.0, 28.0, 25.0, 24.0, 27.0, 16.0, 16.0, 19.0, 17.0, 11.0, 8.0, 5.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.03859519958496, -27.12749671936035, -26.216400146484375, -25.305301666259766, -24.394203186035156, -23.483104705810547, -22.57200813293457, -21.66090965270996, -20.74981117248535, -19.838712692260742, -18.927616119384766, -18.016517639160156, -17.105419158935547, -16.194320678710938, -15.283224105834961, -14.372125625610352, -13.461028099060059, -12.549930572509766, -11.638832092285156, -10.727734565734863, -9.816636085510254, -8.905538558959961, -7.99444055557251, -7.083342552185059, -6.172244548797607, -5.261146545410156, -4.350048542022705, -3.438950777053833, -2.527852773666382, -1.6167550086975098, -0.7056570053100586, 0.20544099807739258, 1.1165390014648438, 2.027637004852295, 2.938735008239746, 3.849832773208618, 4.760931015014648, 5.672028541564941, 6.583126544952393, 7.494224548339844, 8.405323028564453, 9.316420555114746, 10.227519035339355, 11.138616561889648, 12.049715042114258, 12.96081256866455, 13.871910095214844, 14.783008575439453, 15.694106101989746, 16.60520362854004, 17.51630210876465, 18.427400588989258, 19.338497161865234, 20.249595642089844, 21.160694122314453, 22.071792602539062, 22.98288917541504, 23.89398765563965, 24.805084228515625, 25.716182708740234, 26.627281188964844, 27.538379669189453, 28.44947624206543, 29.36057472229004, 30.27167320251465]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 13.0, 20.0, 25.0, 62.0, 82.0, 117.0, 188.0, 378.0, 668.0, 1090.0, 1892.0, 3111.0, 5125.0, 8646.0, 13874.0, 22580.0, 34533.0, 52325.0, 74060.0, 97966.0, 118796.0, 128630.0, 124204.0, 106852.0, 83298.0, 59956.0, 40780.0, 26470.0, 16970.0, 10322.0, 6260.0, 3667.0, 2317.0, 1360.0, 791.0, 473.0, 255.0, 154.0, 100.0, 65.0, 31.0, 16.0, 12.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.10009765625, -19.4658203125, -18.83154296875, -18.197265625, -17.56298828125, -16.9287109375, -16.29443359375, -15.66015625, -15.02587890625, -14.3916015625, -13.75732421875, -13.123046875, -12.48876953125, -11.8544921875, -11.22021484375, -10.5859375, -9.95166015625, -9.3173828125, -8.68310546875, -8.048828125, -7.41455078125, -6.7802734375, -6.14599609375, -5.51171875, -4.87744140625, -4.2431640625, -3.60888671875, -2.974609375, -2.34033203125, -1.7060546875, -1.07177734375, -0.4375, 0.19677734375, 0.8310546875, 1.46533203125, 2.099609375, 2.73388671875, 3.3681640625, 4.00244140625, 4.63671875, 5.27099609375, 5.9052734375, 6.53955078125, 7.173828125, 7.80810546875, 8.4423828125, 9.07666015625, 9.7109375, 10.34521484375, 10.9794921875, 11.61376953125, 12.248046875, 12.88232421875, 13.5166015625, 14.15087890625, 14.78515625, 15.41943359375, 16.0537109375, 16.68798828125, 17.322265625, 17.95654296875, 18.5908203125, 19.22509765625, 19.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 9.0, 14.0, 11.0, 15.0, 13.0, 19.0, 21.0, 29.0, 25.0, 40.0, 28.0, 34.0, 31.0, 41.0, 40.0, 38.0, 43.0, 41.0, 41.0, 40.0, 26.0, 38.0, 36.0, 32.0, 33.0, 35.0, 31.0, 21.0, 19.0, 24.0, 15.0, 21.0, 14.0, 7.0, 6.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-27.453125, -26.61083984375, -25.7685546875, -24.92626953125, -24.083984375, -23.24169921875, -22.3994140625, -21.55712890625, -20.71484375, -19.87255859375, -19.0302734375, -18.18798828125, -17.345703125, -16.50341796875, -15.6611328125, -14.81884765625, -13.9765625, -13.13427734375, -12.2919921875, -11.44970703125, -10.607421875, -9.76513671875, -8.9228515625, -8.08056640625, -7.23828125, -6.39599609375, -5.5537109375, -4.71142578125, -3.869140625, -3.02685546875, -2.1845703125, -1.34228515625, -0.5, 0.34228515625, 1.1845703125, 2.02685546875, 2.869140625, 3.71142578125, 4.5537109375, 5.39599609375, 6.23828125, 7.08056640625, 7.9228515625, 8.76513671875, 9.607421875, 10.44970703125, 11.2919921875, 12.13427734375, 12.9765625, 13.81884765625, 14.6611328125, 15.50341796875, 16.345703125, 17.18798828125, 18.0302734375, 18.87255859375, 19.71484375, 20.55712890625, 21.3994140625, 22.24169921875, 23.083984375, 23.92626953125, 24.7685546875, 25.61083984375, 26.453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 10.0, 9.0, 21.0, 31.0, 48.0, 78.0, 92.0, 188.0, 274.0, 419.0, 793.0, 1331.0, 2302.0, 4004.0, 7234.0, 12902.0, 22705.0, 39137.0, 65038.0, 100956.0, 139025.0, 162264.0, 155284.0, 123102.0, 85522.0, 53214.0, 31167.0, 17931.0, 10093.0, 5649.0, 3191.0, 1819.0, 1087.0, 643.0, 357.0, 211.0, 165.0, 84.0, 57.0, 32.0, 27.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-28.484375, -27.61572265625, -26.7470703125, -25.87841796875, -25.009765625, -24.14111328125, -23.2724609375, -22.40380859375, -21.53515625, -20.66650390625, -19.7978515625, -18.92919921875, -18.060546875, -17.19189453125, -16.3232421875, -15.45458984375, -14.5859375, -13.71728515625, -12.8486328125, -11.97998046875, -11.111328125, -10.24267578125, -9.3740234375, -8.50537109375, -7.63671875, -6.76806640625, -5.8994140625, -5.03076171875, -4.162109375, -3.29345703125, -2.4248046875, -1.55615234375, -0.6875, 0.18115234375, 1.0498046875, 1.91845703125, 2.787109375, 3.65576171875, 4.5244140625, 5.39306640625, 6.26171875, 7.13037109375, 7.9990234375, 8.86767578125, 9.736328125, 10.60498046875, 11.4736328125, 12.34228515625, 13.2109375, 14.07958984375, 14.9482421875, 15.81689453125, 16.685546875, 17.55419921875, 18.4228515625, 19.29150390625, 20.16015625, 21.02880859375, 21.8974609375, 22.76611328125, 23.634765625, 24.50341796875, 25.3720703125, 26.24072265625, 27.109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 10.0, 13.0, 17.0, 14.0, 17.0, 17.0, 21.0, 44.0, 34.0, 24.0, 37.0, 37.0, 51.0, 45.0, 36.0, 50.0, 35.0, 36.0, 43.0, 40.0, 40.0, 39.0, 29.0, 30.0, 33.0, 35.0, 31.0, 16.0, 15.0, 8.0, 11.0, 16.0, 16.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.890380859375, -15.26513671875, -14.639892578125, -14.0146484375, -13.389404296875, -12.76416015625, -12.138916015625, -11.513671875, -10.888427734375, -10.26318359375, -9.637939453125, -9.0126953125, -8.387451171875, -7.76220703125, -7.136962890625, -6.51171875, -5.886474609375, -5.26123046875, -4.635986328125, -4.0107421875, -3.385498046875, -2.76025390625, -2.135009765625, -1.509765625, -0.884521484375, -0.25927734375, 0.365966796875, 0.9912109375, 1.616455078125, 2.24169921875, 2.866943359375, 3.4921875, 4.117431640625, 4.74267578125, 5.367919921875, 5.9931640625, 6.618408203125, 7.24365234375, 7.868896484375, 8.494140625, 9.119384765625, 9.74462890625, 10.369873046875, 10.9951171875, 11.620361328125, 12.24560546875, 12.870849609375, 13.49609375, 14.121337890625, 14.74658203125, 15.371826171875, 15.9970703125, 16.622314453125, 17.24755859375, 17.872802734375, 18.498046875, 19.123291015625, 19.74853515625, 20.373779296875, 20.9990234375, 21.624267578125, 22.24951171875, 22.874755859375, 23.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 3.0, 11.0, 16.0, 22.0, 40.0, 53.0, 87.0, 135.0, 171.0, 327.0, 484.0, 740.0, 1233.0, 2210.0, 3984.0, 7684.0, 16381.0, 38401.0, 95587.0, 217484.0, 305971.0, 203671.0, 87510.0, 34990.0, 15263.0, 7131.0, 3623.0, 2087.0, 1235.0, 725.0, 460.0, 294.0, 163.0, 134.0, 82.0, 43.0, 37.0, 28.0, 14.0, 12.0, 4.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.94970703125, -24.1025390625, -23.25537109375, -22.408203125, -21.56103515625, -20.7138671875, -19.86669921875, -19.01953125, -18.17236328125, -17.3251953125, -16.47802734375, -15.630859375, -14.78369140625, -13.9365234375, -13.08935546875, -12.2421875, -11.39501953125, -10.5478515625, -9.70068359375, -8.853515625, -8.00634765625, -7.1591796875, -6.31201171875, -5.46484375, -4.61767578125, -3.7705078125, -2.92333984375, -2.076171875, -1.22900390625, -0.3818359375, 0.46533203125, 1.3125, 2.15966796875, 3.0068359375, 3.85400390625, 4.701171875, 5.54833984375, 6.3955078125, 7.24267578125, 8.08984375, 8.93701171875, 9.7841796875, 10.63134765625, 11.478515625, 12.32568359375, 13.1728515625, 14.02001953125, 14.8671875, 15.71435546875, 16.5615234375, 17.40869140625, 18.255859375, 19.10302734375, 19.9501953125, 20.79736328125, 21.64453125, 22.49169921875, 23.3388671875, 24.18603515625, 25.033203125, 25.88037109375, 26.7275390625, 27.57470703125, 28.421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 2.0, 4.0, 13.0, 17.0, 20.0, 19.0, 21.0, 21.0, 33.0, 41.0, 45.0, 51.0, 50.0, 63.0, 72.0, 55.0, 58.0, 70.0, 53.0, 51.0, 38.0, 33.0, 27.0, 30.0, 18.0, 23.0, 7.0, 13.0, 11.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0015687942504882812, -0.0015223771333694458, -0.0014759600162506104, -0.001429542899131775, -0.0013831257820129395, -0.001336708664894104, -0.0012902915477752686, -0.001243874430656433, -0.0011974573135375977, -0.0011510401964187622, -0.0011046230792999268, -0.0010582059621810913, -0.0010117888450622559, -0.0009653717279434204, -0.000918954610824585, -0.0008725374937057495, -0.0008261203765869141, -0.0007797032594680786, -0.0007332861423492432, -0.0006868690252304077, -0.0006404519081115723, -0.0005940347909927368, -0.0005476176738739014, -0.0005012005567550659, -0.00045478343963623047, -0.000408366322517395, -0.00036194920539855957, -0.0003155320882797241, -0.00026911497116088867, -0.00022269785404205322, -0.00017628073692321777, -0.00012986361980438232, -8.344650268554688e-05, -3.7029385566711426e-05, 9.387731552124023e-06, 5.580484867095947e-05, 0.00010222196578979492, 0.00014863908290863037, 0.00019505620002746582, 0.00024147331714630127, 0.0002878904342651367, 0.00033430755138397217, 0.0003807246685028076, 0.00042714178562164307, 0.0004735589027404785, 0.000519976019859314, 0.0005663931369781494, 0.0006128102540969849, 0.0006592273712158203, 0.0007056444883346558, 0.0007520616054534912, 0.0007984787225723267, 0.0008448958396911621, 0.0008913129568099976, 0.000937730073928833, 0.0009841471910476685, 0.001030564308166504, 0.0010769814252853394, 0.0011233985424041748, 0.0011698156595230103, 0.0012162327766418457, 0.0012626498937606812, 0.0013090670108795166, 0.001355484127998352, 0.0014019012451171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 16.0, 20.0, 29.0, 45.0, 61.0, 59.0, 129.0, 171.0, 269.0, 368.0, 539.0, 841.0, 1248.0, 2020.0, 3439.0, 5662.0, 10170.0, 18962.0, 36229.0, 68600.0, 120417.0, 178480.0, 201469.0, 165387.0, 106195.0, 58878.0, 30555.0, 16105.0, 8911.0, 4963.0, 2982.0, 1834.0, 1181.0, 715.0, 515.0, 324.0, 243.0, 166.0, 108.0, 79.0, 40.0, 38.0, 28.0, 20.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0], "bins": [-18.296875, -17.7796630859375, -17.262451171875, -16.7452392578125, -16.22802734375, -15.7108154296875, -15.193603515625, -14.6763916015625, -14.1591796875, -13.6419677734375, -13.124755859375, -12.6075439453125, -12.09033203125, -11.5731201171875, -11.055908203125, -10.5386962890625, -10.021484375, -9.5042724609375, -8.987060546875, -8.4698486328125, -7.95263671875, -7.4354248046875, -6.918212890625, -6.4010009765625, -5.8837890625, -5.3665771484375, -4.849365234375, -4.3321533203125, -3.81494140625, -3.2977294921875, -2.780517578125, -2.2633056640625, -1.74609375, -1.2288818359375, -0.711669921875, -0.1944580078125, 0.32275390625, 0.8399658203125, 1.357177734375, 1.8743896484375, 2.3916015625, 2.9088134765625, 3.426025390625, 3.9432373046875, 4.46044921875, 4.9776611328125, 5.494873046875, 6.0120849609375, 6.529296875, 7.0465087890625, 7.563720703125, 8.0809326171875, 8.59814453125, 9.1153564453125, 9.632568359375, 10.1497802734375, 10.6669921875, 11.1842041015625, 11.701416015625, 12.2186279296875, 12.73583984375, 13.2530517578125, 13.770263671875, 14.2874755859375, 14.8046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 2.0, 3.0, 1.0, 11.0, 13.0, 12.0, 14.0, 23.0, 27.0, 46.0, 45.0, 63.0, 59.0, 73.0, 80.0, 99.0, 92.0, 58.0, 63.0, 47.0, 37.0, 26.0, 22.0, 22.0, 15.0, 11.0, 6.0, 4.0, 4.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6875, -10.3619384765625, -10.036376953125, -9.7108154296875, -9.38525390625, -9.0596923828125, -8.734130859375, -8.4085693359375, -8.0830078125, -7.7574462890625, -7.431884765625, -7.1063232421875, -6.78076171875, -6.4552001953125, -6.129638671875, -5.8040771484375, -5.478515625, -5.1529541015625, -4.827392578125, -4.5018310546875, -4.17626953125, -3.8507080078125, -3.525146484375, -3.1995849609375, -2.8740234375, -2.5484619140625, -2.222900390625, -1.8973388671875, -1.57177734375, -1.2462158203125, -0.920654296875, -0.5950927734375, -0.26953125, 0.0560302734375, 0.381591796875, 0.7071533203125, 1.03271484375, 1.3582763671875, 1.683837890625, 2.0093994140625, 2.3349609375, 2.6605224609375, 2.986083984375, 3.3116455078125, 3.63720703125, 3.9627685546875, 4.288330078125, 4.6138916015625, 4.939453125, 5.2650146484375, 5.590576171875, 5.9161376953125, 6.24169921875, 6.5672607421875, 6.892822265625, 7.2183837890625, 7.5439453125, 7.8695068359375, 8.195068359375, 8.5206298828125, 8.84619140625, 9.1717529296875, 9.497314453125, 9.8228759765625, 10.1484375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 6.0, 5.0, 5.0, 10.0, 25.0, 28.0, 38.0, 35.0, 37.0, 49.0, 40.0, 40.0, 54.0, 57.0, 57.0, 40.0, 91.0, 52.0, 51.0, 46.0, 47.0, 35.0, 29.0, 17.0, 15.0, 18.0, 18.0, 13.0, 12.0, 11.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.04381561279297, -36.105934143066406, -35.168052673339844, -34.230167388916016, -33.29228591918945, -32.35440444946289, -31.416521072387695, -30.478639602661133, -29.540756225585938, -28.602874755859375, -27.66499137878418, -26.727109909057617, -25.789226531982422, -24.85134506225586, -23.913461685180664, -22.9755802154541, -22.037696838378906, -21.099815368652344, -20.16193199157715, -19.224050521850586, -18.28616714477539, -17.348285675048828, -16.410402297973633, -15.47252082824707, -14.534639358520508, -13.596756935119629, -12.65887451171875, -11.720992088317871, -10.783109664916992, -9.84522819519043, -8.907344818115234, -7.969462871551514, -7.031579971313477, -6.093697547912598, -5.155815124511719, -4.21793270111084, -3.28005051612854, -2.3421683311462402, -1.4042859077453613, -0.4664034843444824, 0.4714789390563965, 1.4093613624572754, 2.3472437858581543, 3.285125970840454, 4.223008155822754, 5.160890579223633, 6.098773002624512, 7.036655426025391, 7.9745378494262695, 8.912420272827148, 9.850302696228027, 10.788185119628906, 11.726067543029785, 12.663949966430664, 13.601831436157227, 14.539714813232422, 15.477596282958984, 16.415477752685547, 17.353361129760742, 18.291242599487305, 19.2291259765625, 20.167007446289062, 21.104890823364258, 22.04277229309082, 22.980655670166016]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 14.0, 3.0, 6.0, 5.0, 11.0, 14.0, 15.0, 19.0, 24.0, 19.0, 26.0, 38.0, 45.0, 32.0, 40.0, 31.0, 46.0, 44.0, 38.0, 41.0, 36.0, 36.0, 31.0, 53.0, 30.0, 34.0, 25.0, 34.0, 29.0, 30.0, 17.0, 24.0, 18.0, 13.0, 9.0, 5.0, 9.0, 13.0, 13.0, 1.0, 2.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.39780616760254, -28.473628997802734, -27.549453735351562, -26.62527847290039, -25.701101303100586, -24.77692413330078, -23.85274887084961, -22.928573608398438, -22.004396438598633, -21.080219268798828, -20.156044006347656, -19.231868743896484, -18.30769157409668, -17.383514404296875, -16.459339141845703, -15.535162925720215, -14.610986709594727, -13.686810493469238, -12.76263427734375, -11.838458061218262, -10.914281845092773, -9.990105628967285, -9.065929412841797, -8.141753196716309, -7.21757698059082, -6.293400764465332, -5.369224548339844, -4.4450483322143555, -3.520872116088867, -2.596695899963379, -1.6725196838378906, -0.7483434677124023, 0.17583084106445312, 1.1000070571899414, 2.0241832733154297, 2.948359489440918, 3.8725357055664062, 4.7967119216918945, 5.720888137817383, 6.645064353942871, 7.569240570068359, 8.493416786193848, 9.417593002319336, 10.341769218444824, 11.265945434570312, 12.1901216506958, 13.114297866821289, 14.038474082946777, 14.962650299072266, 15.886826515197754, 16.811002731323242, 17.735179901123047, 18.65935516357422, 19.58353042602539, 20.507707595825195, 21.431884765625, 22.356060028076172, 23.280235290527344, 24.20441246032715, 25.128589630126953, 26.052764892578125, 26.976940155029297, 27.9011173248291, 28.825294494628906, 29.749469757080078]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 9.0, 8.0, 14.0, 15.0, 35.0, 53.0, 86.0, 126.0, 212.0, 342.0, 486.0, 812.0, 1183.0, 2031.0, 3205.0, 5177.0, 8132.0, 13815.0, 22271.0, 37912.0, 63093.0, 107131.0, 178316.0, 284551.0, 418990.0, 548678.0, 612573.0, 578651.0, 462897.0, 324516.0, 206970.0, 125897.0, 74844.0, 44112.0, 26256.0, 15563.0, 9643.0, 5953.0, 3629.0, 2247.0, 1459.0, 894.0, 548.0, 371.0, 228.0, 130.0, 77.0, 66.0, 38.0, 26.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.502197265625, -15.92626953125, -15.350341796875, -14.7744140625, -14.198486328125, -13.62255859375, -13.046630859375, -12.470703125, -11.894775390625, -11.31884765625, -10.742919921875, -10.1669921875, -9.591064453125, -9.01513671875, -8.439208984375, -7.86328125, -7.287353515625, -6.71142578125, -6.135498046875, -5.5595703125, -4.983642578125, -4.40771484375, -3.831787109375, -3.255859375, -2.679931640625, -2.10400390625, -1.528076171875, -0.9521484375, -0.376220703125, 0.19970703125, 0.775634765625, 1.3515625, 1.927490234375, 2.50341796875, 3.079345703125, 3.6552734375, 4.231201171875, 4.80712890625, 5.383056640625, 5.958984375, 6.534912109375, 7.11083984375, 7.686767578125, 8.2626953125, 8.838623046875, 9.41455078125, 9.990478515625, 10.56640625, 11.142333984375, 11.71826171875, 12.294189453125, 12.8701171875, 13.446044921875, 14.02197265625, 14.597900390625, 15.173828125, 15.749755859375, 16.32568359375, 16.901611328125, 17.4775390625, 18.053466796875, 18.62939453125, 19.205322265625, 19.78125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 9.0, 6.0, 19.0, 19.0, 24.0, 20.0, 28.0, 36.0, 31.0, 37.0, 35.0, 40.0, 46.0, 46.0, 44.0, 41.0, 38.0, 58.0, 39.0, 34.0, 49.0, 34.0, 33.0, 32.0, 20.0, 30.0, 16.0, 19.0, 15.0, 23.0, 12.0, 5.0, 5.0, 8.0, 8.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.216064453125, -22.41650390625, -21.616943359375, -20.8173828125, -20.017822265625, -19.21826171875, -18.418701171875, -17.619140625, -16.819580078125, -16.02001953125, -15.220458984375, -14.4208984375, -13.621337890625, -12.82177734375, -12.022216796875, -11.22265625, -10.423095703125, -9.62353515625, -8.823974609375, -8.0244140625, -7.224853515625, -6.42529296875, -5.625732421875, -4.826171875, -4.026611328125, -3.22705078125, -2.427490234375, -1.6279296875, -0.828369140625, -0.02880859375, 0.770751953125, 1.5703125, 2.369873046875, 3.16943359375, 3.968994140625, 4.7685546875, 5.568115234375, 6.36767578125, 7.167236328125, 7.966796875, 8.766357421875, 9.56591796875, 10.365478515625, 11.1650390625, 11.964599609375, 12.76416015625, 13.563720703125, 14.36328125, 15.162841796875, 15.96240234375, 16.761962890625, 17.5615234375, 18.361083984375, 19.16064453125, 19.960205078125, 20.759765625, 21.559326171875, 22.35888671875, 23.158447265625, 23.9580078125, 24.757568359375, 25.55712890625, 26.356689453125, 27.15625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 9.0, 7.0, 18.0, 41.0, 49.0, 80.0, 129.0, 219.0, 339.0, 590.0, 967.0, 1547.0, 2501.0, 3932.0, 6447.0, 10495.0, 17044.0, 28087.0, 45789.0, 74113.0, 117548.0, 180703.0, 266869.0, 370853.0, 470259.0, 532574.0, 529425.0, 460563.0, 356364.0, 254627.0, 171708.0, 110665.0, 68892.0, 42783.0, 26430.0, 15954.0, 9862.0, 6072.0, 3743.0, 2318.0, 1472.0, 850.0, 517.0, 309.0, 217.0, 134.0, 71.0, 52.0, 24.0, 11.0, 9.0, 4.0, 4.0, 2.0, 4.0], "bins": [-20.0, -19.427490234375, -18.85498046875, -18.282470703125, -17.7099609375, -17.137451171875, -16.56494140625, -15.992431640625, -15.419921875, -14.847412109375, -14.27490234375, -13.702392578125, -13.1298828125, -12.557373046875, -11.98486328125, -11.412353515625, -10.83984375, -10.267333984375, -9.69482421875, -9.122314453125, -8.5498046875, -7.977294921875, -7.40478515625, -6.832275390625, -6.259765625, -5.687255859375, -5.11474609375, -4.542236328125, -3.9697265625, -3.397216796875, -2.82470703125, -2.252197265625, -1.6796875, -1.107177734375, -0.53466796875, 0.037841796875, 0.6103515625, 1.182861328125, 1.75537109375, 2.327880859375, 2.900390625, 3.472900390625, 4.04541015625, 4.617919921875, 5.1904296875, 5.762939453125, 6.33544921875, 6.907958984375, 7.48046875, 8.052978515625, 8.62548828125, 9.197998046875, 9.7705078125, 10.343017578125, 10.91552734375, 11.488037109375, 12.060546875, 12.633056640625, 13.20556640625, 13.778076171875, 14.3505859375, 14.923095703125, 15.49560546875, 16.068115234375, 16.640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 9.0, 17.0, 17.0, 34.0, 22.0, 45.0, 52.0, 62.0, 70.0, 87.0, 103.0, 124.0, 133.0, 151.0, 179.0, 185.0, 196.0, 226.0, 234.0, 206.0, 222.0, 219.0, 206.0, 173.0, 187.0, 152.0, 119.0, 108.0, 93.0, 79.0, 65.0, 72.0, 46.0, 32.0, 28.0, 25.0, 16.0, 17.0, 13.0, 14.0, 5.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.28125, -9.97265625, -9.6640625, -9.35546875, -9.046875, -8.73828125, -8.4296875, -8.12109375, -7.8125, -7.50390625, -7.1953125, -6.88671875, -6.578125, -6.26953125, -5.9609375, -5.65234375, -5.34375, -5.03515625, -4.7265625, -4.41796875, -4.109375, -3.80078125, -3.4921875, -3.18359375, -2.875, -2.56640625, -2.2578125, -1.94921875, -1.640625, -1.33203125, -1.0234375, -0.71484375, -0.40625, -0.09765625, 0.2109375, 0.51953125, 0.828125, 1.13671875, 1.4453125, 1.75390625, 2.0625, 2.37109375, 2.6796875, 2.98828125, 3.296875, 3.60546875, 3.9140625, 4.22265625, 4.53125, 4.83984375, 5.1484375, 5.45703125, 5.765625, 6.07421875, 6.3828125, 6.69140625, 7.0, 7.30859375, 7.6171875, 7.92578125, 8.234375, 8.54296875, 8.8515625, 9.16015625, 9.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 12.0, 12.0, 17.0, 26.0, 21.0, 39.0, 42.0, 41.0, 37.0, 41.0, 39.0, 44.0, 64.0, 49.0, 47.0, 50.0, 41.0, 45.0, 51.0, 38.0, 28.0, 29.0, 23.0, 18.0, 25.0, 10.0, 13.0, 12.0, 10.0, 7.0, 5.0, 9.0, 6.0, 11.0, 0.0, 2.0, 2.0, 2.0], "bins": [-30.46190643310547, -29.689592361450195, -28.917280197143555, -28.14496612548828, -27.372652053833008, -26.600337982177734, -25.828025817871094, -25.05571174621582, -24.283397674560547, -23.511083602905273, -22.738771438598633, -21.96645736694336, -21.194143295288086, -20.421829223632812, -19.649517059326172, -18.8772029876709, -18.104890823364258, -17.332576751708984, -16.560264587402344, -15.78795051574707, -15.015636444091797, -14.24332332611084, -13.471010208129883, -12.69869613647461, -11.926383018493652, -11.154069900512695, -10.381755828857422, -9.609442710876465, -8.837129592895508, -8.064815521240234, -7.292502403259277, -6.520188808441162, -5.747875213623047, -4.975561618804932, -4.203248023986816, -3.4309349060058594, -2.658621311187744, -1.886307716369629, -1.1139945983886719, -0.34168100357055664, 0.4306325912475586, 1.2029460668563843, 1.97525954246521, 2.747572898864746, 3.5198864936828613, 4.292200088500977, 5.064513206481934, 5.836826801300049, 6.609140396118164, 7.381453990936279, 8.153767585754395, 8.926080703735352, 9.698394775390625, 10.470707893371582, 11.243021011352539, 12.015335083007812, 12.78764820098877, 13.559961318969727, 14.332275390625, 15.104588508605957, 15.876901626586914, 16.649215698242188, 17.421527862548828, 18.1938419342041, 18.966156005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 5.0, 17.0, 19.0, 18.0, 14.0, 21.0, 16.0, 31.0, 28.0, 26.0, 42.0, 27.0, 32.0, 27.0, 27.0, 40.0, 43.0, 47.0, 50.0, 39.0, 39.0, 35.0, 34.0, 35.0, 32.0, 33.0, 22.0, 25.0, 27.0, 18.0, 16.0, 13.0, 18.0, 13.0, 12.0, 5.0, 3.0, 6.0, 8.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-27.46792984008789, -26.59942054748535, -25.730911254882812, -24.862403869628906, -23.993894577026367, -23.125385284423828, -22.25687599182129, -21.38836669921875, -20.51985740661621, -19.651348114013672, -18.782838821411133, -17.914329528808594, -17.045822143554688, -16.17731285095215, -15.30880355834961, -14.44029426574707, -13.571785926818848, -12.703276634216309, -11.834768295288086, -10.966259002685547, -10.097749710083008, -9.229240417480469, -8.360732078552246, -7.492222785949707, -6.623713970184326, -5.755205154418945, -4.886695861816406, -4.018187046051025, -3.1496779918670654, -2.2811689376831055, -1.4126601219177246, -0.5441508293151855, 0.3243579864501953, 1.1928670406341553, 2.0613760948181152, 2.929884910583496, 3.798393964767456, 4.666903018951416, 5.535411834716797, 6.403921127319336, 7.272429943084717, 8.140938758850098, 9.009448051452637, 9.87795639038086, 10.746465682983398, 11.614974975585938, 12.483484268188477, 13.351993560791016, 14.220501899719238, 15.089011192321777, 15.95751953125, 16.82602882385254, 17.694538116455078, 18.563047409057617, 19.431556701660156, 20.300064086914062, 21.1685733795166, 22.03708267211914, 22.90559196472168, 23.77410125732422, 24.642608642578125, 25.511117935180664, 26.379627227783203, 27.248136520385742, 28.11664581298828]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 5.0, 12.0, 16.0, 14.0, 36.0, 41.0, 62.0, 83.0, 147.0, 233.0, 357.0, 526.0, 822.0, 1231.0, 2091.0, 3234.0, 5211.0, 8612.0, 14099.0, 23630.0, 39871.0, 68061.0, 115028.0, 176568.0, 199777.0, 154617.0, 95531.0, 55358.0, 33178.0, 19696.0, 11610.0, 6913.0, 4353.0, 2756.0, 1662.0, 1126.0, 708.0, 451.0, 295.0, 187.0, 122.0, 75.0, 51.0, 30.0, 26.0, 16.0, 10.0, 12.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.7255859375, -19.966796875, -19.2080078125, -18.44921875, -17.6904296875, -16.931640625, -16.1728515625, -15.4140625, -14.6552734375, -13.896484375, -13.1376953125, -12.37890625, -11.6201171875, -10.861328125, -10.1025390625, -9.34375, -8.5849609375, -7.826171875, -7.0673828125, -6.30859375, -5.5498046875, -4.791015625, -4.0322265625, -3.2734375, -2.5146484375, -1.755859375, -0.9970703125, -0.23828125, 0.5205078125, 1.279296875, 2.0380859375, 2.796875, 3.5556640625, 4.314453125, 5.0732421875, 5.83203125, 6.5908203125, 7.349609375, 8.1083984375, 8.8671875, 9.6259765625, 10.384765625, 11.1435546875, 11.90234375, 12.6611328125, 13.419921875, 14.1787109375, 14.9375, 15.6962890625, 16.455078125, 17.2138671875, 17.97265625, 18.7314453125, 19.490234375, 20.2490234375, 21.0078125, 21.7666015625, 22.525390625, 23.2841796875, 24.04296875, 24.8017578125, 25.560546875, 26.3193359375, 27.078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 19.0, 9.0, 22.0, 11.0, 23.0, 18.0, 21.0, 24.0, 22.0, 32.0, 45.0, 37.0, 36.0, 38.0, 35.0, 45.0, 44.0, 42.0, 46.0, 39.0, 49.0, 35.0, 40.0, 26.0, 43.0, 22.0, 22.0, 27.0, 17.0, 19.0, 9.0, 15.0, 17.0, 9.0, 7.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-30.421875, -29.4990234375, -28.576171875, -27.6533203125, -26.73046875, -25.8076171875, -24.884765625, -23.9619140625, -23.0390625, -22.1162109375, -21.193359375, -20.2705078125, -19.34765625, -18.4248046875, -17.501953125, -16.5791015625, -15.65625, -14.7333984375, -13.810546875, -12.8876953125, -11.96484375, -11.0419921875, -10.119140625, -9.1962890625, -8.2734375, -7.3505859375, -6.427734375, -5.5048828125, -4.58203125, -3.6591796875, -2.736328125, -1.8134765625, -0.890625, 0.0322265625, 0.955078125, 1.8779296875, 2.80078125, 3.7236328125, 4.646484375, 5.5693359375, 6.4921875, 7.4150390625, 8.337890625, 9.2607421875, 10.18359375, 11.1064453125, 12.029296875, 12.9521484375, 13.875, 14.7978515625, 15.720703125, 16.6435546875, 17.56640625, 18.4892578125, 19.412109375, 20.3349609375, 21.2578125, 22.1806640625, 23.103515625, 24.0263671875, 24.94921875, 25.8720703125, 26.794921875, 27.7177734375, 28.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 12.0, 18.0, 11.0, 25.0, 38.0, 60.0, 89.0, 125.0, 224.0, 299.0, 502.0, 647.0, 1098.0, 1756.0, 2900.0, 4798.0, 7793.0, 12652.0, 21210.0, 36438.0, 64239.0, 112443.0, 184520.0, 218662.0, 157421.0, 92484.0, 52455.0, 30268.0, 17873.0, 10527.0, 6429.0, 3960.0, 2394.0, 1511.0, 990.0, 599.0, 377.0, 242.0, 154.0, 90.0, 77.0, 47.0, 33.0, 23.0, 12.0, 11.0, 6.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.984375, -23.193359375, -22.40234375, -21.611328125, -20.8203125, -20.029296875, -19.23828125, -18.447265625, -17.65625, -16.865234375, -16.07421875, -15.283203125, -14.4921875, -13.701171875, -12.91015625, -12.119140625, -11.328125, -10.537109375, -9.74609375, -8.955078125, -8.1640625, -7.373046875, -6.58203125, -5.791015625, -5.0, -4.208984375, -3.41796875, -2.626953125, -1.8359375, -1.044921875, -0.25390625, 0.537109375, 1.328125, 2.119140625, 2.91015625, 3.701171875, 4.4921875, 5.283203125, 6.07421875, 6.865234375, 7.65625, 8.447265625, 9.23828125, 10.029296875, 10.8203125, 11.611328125, 12.40234375, 13.193359375, 13.984375, 14.775390625, 15.56640625, 16.357421875, 17.1484375, 17.939453125, 18.73046875, 19.521484375, 20.3125, 21.103515625, 21.89453125, 22.685546875, 23.4765625, 24.267578125, 25.05859375, 25.849609375, 26.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 3.0, 8.0, 10.0, 16.0, 13.0, 13.0, 16.0, 18.0, 24.0, 25.0, 28.0, 31.0, 27.0, 34.0, 50.0, 27.0, 32.0, 38.0, 33.0, 43.0, 42.0, 35.0, 37.0, 31.0, 27.0, 35.0, 28.0, 30.0, 29.0, 23.0, 15.0, 20.0, 25.0, 21.0, 13.0, 14.0, 9.0, 18.0, 11.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.8125, -18.263671875, -17.71484375, -17.166015625, -16.6171875, -16.068359375, -15.51953125, -14.970703125, -14.421875, -13.873046875, -13.32421875, -12.775390625, -12.2265625, -11.677734375, -11.12890625, -10.580078125, -10.03125, -9.482421875, -8.93359375, -8.384765625, -7.8359375, -7.287109375, -6.73828125, -6.189453125, -5.640625, -5.091796875, -4.54296875, -3.994140625, -3.4453125, -2.896484375, -2.34765625, -1.798828125, -1.25, -0.701171875, -0.15234375, 0.396484375, 0.9453125, 1.494140625, 2.04296875, 2.591796875, 3.140625, 3.689453125, 4.23828125, 4.787109375, 5.3359375, 5.884765625, 6.43359375, 6.982421875, 7.53125, 8.080078125, 8.62890625, 9.177734375, 9.7265625, 10.275390625, 10.82421875, 11.373046875, 11.921875, 12.470703125, 13.01953125, 13.568359375, 14.1171875, 14.666015625, 15.21484375, 15.763671875, 16.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 10.0, 9.0, 19.0, 27.0, 40.0, 40.0, 99.0, 131.0, 180.0, 274.0, 406.0, 681.0, 1085.0, 1730.0, 2827.0, 4655.0, 7939.0, 14225.0, 26487.0, 53924.0, 127161.0, 300149.0, 282857.0, 115765.0, 50220.0, 24978.0, 13309.0, 7630.0, 4518.0, 2562.0, 1668.0, 1066.0, 668.0, 411.0, 263.0, 179.0, 118.0, 75.0, 57.0, 29.0, 27.0, 15.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.314697265625, -15.77001953125, -15.225341796875, -14.6806640625, -14.135986328125, -13.59130859375, -13.046630859375, -12.501953125, -11.957275390625, -11.41259765625, -10.867919921875, -10.3232421875, -9.778564453125, -9.23388671875, -8.689208984375, -8.14453125, -7.599853515625, -7.05517578125, -6.510498046875, -5.9658203125, -5.421142578125, -4.87646484375, -4.331787109375, -3.787109375, -3.242431640625, -2.69775390625, -2.153076171875, -1.6083984375, -1.063720703125, -0.51904296875, 0.025634765625, 0.5703125, 1.114990234375, 1.65966796875, 2.204345703125, 2.7490234375, 3.293701171875, 3.83837890625, 4.383056640625, 4.927734375, 5.472412109375, 6.01708984375, 6.561767578125, 7.1064453125, 7.651123046875, 8.19580078125, 8.740478515625, 9.28515625, 9.829833984375, 10.37451171875, 10.919189453125, 11.4638671875, 12.008544921875, 12.55322265625, 13.097900390625, 13.642578125, 14.187255859375, 14.73193359375, 15.276611328125, 15.8212890625, 16.365966796875, 16.91064453125, 17.455322265625, 18.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 2.0, 3.0, 4.0, 13.0, 4.0, 14.0, 8.0, 21.0, 22.0, 22.0, 35.0, 49.0, 53.0, 86.0, 102.0, 87.0, 102.0, 70.0, 68.0, 49.0, 35.0, 33.0, 24.0, 20.0, 10.0, 8.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001346588134765625, -0.0013026893138885498, -0.0012587904930114746, -0.0012148916721343994, -0.0011709928512573242, -0.001127094030380249, -0.0010831952095031738, -0.0010392963886260986, -0.0009953975677490234, -0.0009514987468719482, -0.000907599925994873, -0.0008637011051177979, -0.0008198022842407227, -0.0007759034633636475, -0.0007320046424865723, -0.0006881058216094971, -0.0006442070007324219, -0.0006003081798553467, -0.0005564093589782715, -0.0005125105381011963, -0.0004686117172241211, -0.0004247128963470459, -0.0003808140754699707, -0.0003369152545928955, -0.0002930164337158203, -0.0002491176128387451, -0.00020521879196166992, -0.00016131997108459473, -0.00011742115020751953, -7.352232933044434e-05, -2.962350845336914e-05, 1.4275312423706055e-05, 5.817413330078125e-05, 0.00010207295417785645, 0.00014597177505493164, 0.00018987059593200684, 0.00023376941680908203, 0.0002776682376861572, 0.0003215670585632324, 0.0003654658794403076, 0.0004093647003173828, 0.000453263521194458, 0.0004971623420715332, 0.0005410611629486084, 0.0005849599838256836, 0.0006288588047027588, 0.000672757625579834, 0.0007166564464569092, 0.0007605552673339844, 0.0008044540882110596, 0.0008483529090881348, 0.00089225172996521, 0.0009361505508422852, 0.0009800493717193604, 0.0010239481925964355, 0.0010678470134735107, 0.001111745834350586, 0.0011556446552276611, 0.0011995434761047363, 0.0012434422969818115, 0.0012873411178588867, 0.001331239938735962, 0.0013751387596130371, 0.0014190375804901123, 0.0014629364013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 12.0, 14.0, 31.0, 35.0, 66.0, 105.0, 140.0, 198.0, 327.0, 433.0, 737.0, 1175.0, 1821.0, 3004.0, 4657.0, 7477.0, 12552.0, 20635.0, 36148.0, 67724.0, 129813.0, 215107.0, 226433.0, 144811.0, 76204.0, 40712.0, 22791.0, 13306.0, 8379.0, 4958.0, 3090.0, 2035.0, 1288.0, 834.0, 532.0, 341.0, 207.0, 141.0, 108.0, 64.0, 39.0, 28.0, 22.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.828125, -14.3800048828125, -13.931884765625, -13.4837646484375, -13.03564453125, -12.5875244140625, -12.139404296875, -11.6912841796875, -11.2431640625, -10.7950439453125, -10.346923828125, -9.8988037109375, -9.45068359375, -9.0025634765625, -8.554443359375, -8.1063232421875, -7.658203125, -7.2100830078125, -6.761962890625, -6.3138427734375, -5.86572265625, -5.4176025390625, -4.969482421875, -4.5213623046875, -4.0732421875, -3.6251220703125, -3.177001953125, -2.7288818359375, -2.28076171875, -1.8326416015625, -1.384521484375, -0.9364013671875, -0.48828125, -0.0401611328125, 0.407958984375, 0.8560791015625, 1.30419921875, 1.7523193359375, 2.200439453125, 2.6485595703125, 3.0966796875, 3.5447998046875, 3.992919921875, 4.4410400390625, 4.88916015625, 5.3372802734375, 5.785400390625, 6.2335205078125, 6.681640625, 7.1297607421875, 7.577880859375, 8.0260009765625, 8.47412109375, 8.9222412109375, 9.370361328125, 9.8184814453125, 10.2666015625, 10.7147216796875, 11.162841796875, 11.6109619140625, 12.05908203125, 12.5072021484375, 12.955322265625, 13.4034423828125, 13.8515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 9.0, 6.0, 13.0, 11.0, 11.0, 18.0, 24.0, 31.0, 26.0, 33.0, 30.0, 37.0, 50.0, 50.0, 56.0, 50.0, 51.0, 68.0, 56.0, 61.0, 43.0, 43.0, 31.0, 23.0, 21.0, 15.0, 9.0, 17.0, 15.0, 8.0, 13.0, 6.0, 6.0, 5.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.59814453125, -4.4541015625, -4.31005859375, -4.166015625, -4.02197265625, -3.8779296875, -3.73388671875, -3.58984375, -3.44580078125, -3.3017578125, -3.15771484375, -3.013671875, -2.86962890625, -2.7255859375, -2.58154296875, -2.4375, -2.29345703125, -2.1494140625, -2.00537109375, -1.861328125, -1.71728515625, -1.5732421875, -1.42919921875, -1.28515625, -1.14111328125, -0.9970703125, -0.85302734375, -0.708984375, -0.56494140625, -0.4208984375, -0.27685546875, -0.1328125, 0.01123046875, 0.1552734375, 0.29931640625, 0.443359375, 0.58740234375, 0.7314453125, 0.87548828125, 1.01953125, 1.16357421875, 1.3076171875, 1.45166015625, 1.595703125, 1.73974609375, 1.8837890625, 2.02783203125, 2.171875, 2.31591796875, 2.4599609375, 2.60400390625, 2.748046875, 2.89208984375, 3.0361328125, 3.18017578125, 3.32421875, 3.46826171875, 3.6123046875, 3.75634765625, 3.900390625, 4.04443359375, 4.1884765625, 4.33251953125, 4.4765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 17.0, 20.0, 13.0, 24.0, 27.0, 35.0, 45.0, 34.0, 49.0, 47.0, 49.0, 45.0, 58.0, 49.0, 56.0, 54.0, 41.0, 45.0, 44.0, 26.0, 37.0, 33.0, 19.0, 16.0, 17.0, 13.0, 16.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.077295303344727, -28.300304412841797, -27.523313522338867, -26.746322631835938, -25.969331741333008, -25.192340850830078, -24.41535186767578, -23.63836097717285, -22.861370086669922, -22.084379196166992, -21.307388305664062, -20.530397415161133, -19.753406524658203, -18.976417541503906, -18.199424743652344, -17.422435760498047, -16.645442962646484, -15.868452072143555, -15.091461181640625, -14.314470291137695, -13.537480354309082, -12.760489463806152, -11.983498573303223, -11.20650863647461, -10.42951774597168, -9.65252685546875, -8.87553596496582, -8.09854507446289, -7.321555137634277, -6.544564247131348, -5.767573356628418, -4.9905829429626465, -4.213592529296875, -3.4366018772125244, -2.659611225128174, -1.8826203346252441, -1.1056296825408936, -0.32863903045654297, 0.4483518600463867, 1.2253422737121582, 2.002333164215088, 2.7793238162994385, 3.556314468383789, 4.333305358886719, 5.110296249389648, 5.88728666305542, 6.66427755355835, 7.441267967224121, 8.21825885772705, 8.99524974822998, 9.77224063873291, 10.549230575561523, 11.326221466064453, 12.103212356567383, 12.880203247070312, 13.657194137573242, 14.434185028076172, 15.211175918579102, 15.988166809082031, 16.76515769958496, 17.54214859008789, 18.319137573242188, 19.09613037109375, 19.873119354248047, 20.650110244750977]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 15.0, 17.0, 15.0, 21.0, 22.0, 13.0, 21.0, 26.0, 30.0, 40.0, 30.0, 33.0, 31.0, 40.0, 32.0, 47.0, 43.0, 35.0, 50.0, 43.0, 45.0, 31.0, 30.0, 32.0, 25.0, 33.0, 24.0, 33.0, 20.0, 18.0, 14.0, 13.0, 11.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-29.650087356567383, -28.74713897705078, -27.844188690185547, -26.941240310668945, -26.038291931152344, -25.13534164428711, -24.232393264770508, -23.329444885253906, -22.426494598388672, -21.52354621887207, -20.620595932006836, -19.717647552490234, -18.814699172973633, -17.91175079345703, -17.008800506591797, -16.105852127075195, -15.202903747558594, -14.299954414367676, -13.397006034851074, -12.494056701660156, -11.591108322143555, -10.688158988952637, -9.785209655761719, -8.882261276245117, -7.979311943054199, -7.0763630867004395, -6.17341423034668, -5.270464897155762, -4.367516040802002, -3.464567184448242, -2.561617851257324, -1.6586689949035645, -0.7557220458984375, 0.14722692966461182, 1.0501759052276611, 1.953125, 2.8560738563537598, 3.7590227127075195, 4.6619720458984375, 5.564920902252197, 6.467869758605957, 7.370818614959717, 8.273767471313477, 9.176716804504395, 10.079666137695312, 10.982614517211914, 11.885563850402832, 12.78851318359375, 13.691461563110352, 14.59441089630127, 15.497359275817871, 16.40030860900879, 17.30325698852539, 18.206207275390625, 19.109155654907227, 20.012104034423828, 20.915054321289062, 21.818002700805664, 22.7209529876709, 23.6239013671875, 24.5268497467041, 25.429798126220703, 26.332748413085938, 27.23569679260254, 28.13864517211914]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 20.0, 27.0, 52.0, 71.0, 116.0, 176.0, 261.0, 461.0, 719.0, 1175.0, 1820.0, 2860.0, 4497.0, 6986.0, 10645.0, 16204.0, 23990.0, 35134.0, 49318.0, 66577.0, 84676.0, 101040.0, 110917.0, 111948.0, 102304.0, 87356.0, 68859.0, 50960.0, 36099.0, 25222.0, 17078.0, 11144.0, 7207.0, 4627.0, 2906.0, 1916.0, 1169.0, 727.0, 498.0, 294.0, 169.0, 123.0, 67.0, 57.0, 27.0, 21.0, 14.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.512939453125, -14.97900390625, -14.445068359375, -13.9111328125, -13.377197265625, -12.84326171875, -12.309326171875, -11.775390625, -11.241455078125, -10.70751953125, -10.173583984375, -9.6396484375, -9.105712890625, -8.57177734375, -8.037841796875, -7.50390625, -6.969970703125, -6.43603515625, -5.902099609375, -5.3681640625, -4.834228515625, -4.30029296875, -3.766357421875, -3.232421875, -2.698486328125, -2.16455078125, -1.630615234375, -1.0966796875, -0.562744140625, -0.02880859375, 0.505126953125, 1.0390625, 1.572998046875, 2.10693359375, 2.640869140625, 3.1748046875, 3.708740234375, 4.24267578125, 4.776611328125, 5.310546875, 5.844482421875, 6.37841796875, 6.912353515625, 7.4462890625, 7.980224609375, 8.51416015625, 9.048095703125, 9.58203125, 10.115966796875, 10.64990234375, 11.183837890625, 11.7177734375, 12.251708984375, 12.78564453125, 13.319580078125, 13.853515625, 14.387451171875, 14.92138671875, 15.455322265625, 15.9892578125, 16.523193359375, 17.05712890625, 17.591064453125, 18.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 9.0, 16.0, 12.0, 13.0, 14.0, 30.0, 16.0, 29.0, 39.0, 26.0, 32.0, 34.0, 27.0, 40.0, 45.0, 41.0, 51.0, 45.0, 57.0, 49.0, 36.0, 38.0, 27.0, 40.0, 29.0, 31.0, 29.0, 20.0, 25.0, 14.0, 12.0, 10.0, 15.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-31.921875, -30.98388671875, -30.0458984375, -29.10791015625, -28.169921875, -27.23193359375, -26.2939453125, -25.35595703125, -24.41796875, -23.47998046875, -22.5419921875, -21.60400390625, -20.666015625, -19.72802734375, -18.7900390625, -17.85205078125, -16.9140625, -15.97607421875, -15.0380859375, -14.10009765625, -13.162109375, -12.22412109375, -11.2861328125, -10.34814453125, -9.41015625, -8.47216796875, -7.5341796875, -6.59619140625, -5.658203125, -4.72021484375, -3.7822265625, -2.84423828125, -1.90625, -0.96826171875, -0.0302734375, 0.90771484375, 1.845703125, 2.78369140625, 3.7216796875, 4.65966796875, 5.59765625, 6.53564453125, 7.4736328125, 8.41162109375, 9.349609375, 10.28759765625, 11.2255859375, 12.16357421875, 13.1015625, 14.03955078125, 14.9775390625, 15.91552734375, 16.853515625, 17.79150390625, 18.7294921875, 19.66748046875, 20.60546875, 21.54345703125, 22.4814453125, 23.41943359375, 24.357421875, 25.29541015625, 26.2333984375, 27.17138671875, 28.109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 12.0, 12.0, 27.0, 32.0, 60.0, 87.0, 119.0, 179.0, 311.0, 481.0, 722.0, 1204.0, 1903.0, 2913.0, 4747.0, 7543.0, 11935.0, 18863.0, 28877.0, 44647.0, 65898.0, 91225.0, 116578.0, 132425.0, 132051.0, 114951.0, 88453.0, 62950.0, 42750.0, 27841.0, 17803.0, 11297.0, 7224.0, 4650.0, 2826.0, 1783.0, 1082.0, 729.0, 446.0, 302.0, 222.0, 130.0, 81.0, 59.0, 40.0, 28.0, 17.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-22.78125, -22.08984375, -21.3984375, -20.70703125, -20.015625, -19.32421875, -18.6328125, -17.94140625, -17.25, -16.55859375, -15.8671875, -15.17578125, -14.484375, -13.79296875, -13.1015625, -12.41015625, -11.71875, -11.02734375, -10.3359375, -9.64453125, -8.953125, -8.26171875, -7.5703125, -6.87890625, -6.1875, -5.49609375, -4.8046875, -4.11328125, -3.421875, -2.73046875, -2.0390625, -1.34765625, -0.65625, 0.03515625, 0.7265625, 1.41796875, 2.109375, 2.80078125, 3.4921875, 4.18359375, 4.875, 5.56640625, 6.2578125, 6.94921875, 7.640625, 8.33203125, 9.0234375, 9.71484375, 10.40625, 11.09765625, 11.7890625, 12.48046875, 13.171875, 13.86328125, 14.5546875, 15.24609375, 15.9375, 16.62890625, 17.3203125, 18.01171875, 18.703125, 19.39453125, 20.0859375, 20.77734375, 21.46875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 9.0, 8.0, 6.0, 9.0, 15.0, 12.0, 23.0, 15.0, 21.0, 21.0, 21.0, 22.0, 23.0, 36.0, 30.0, 44.0, 35.0, 47.0, 50.0, 46.0, 44.0, 56.0, 42.0, 34.0, 41.0, 44.0, 35.0, 28.0, 25.0, 26.0, 27.0, 28.0, 20.0, 10.0, 13.0, 7.0, 5.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.3408203125, -19.666015625, -18.9912109375, -18.31640625, -17.6416015625, -16.966796875, -16.2919921875, -15.6171875, -14.9423828125, -14.267578125, -13.5927734375, -12.91796875, -12.2431640625, -11.568359375, -10.8935546875, -10.21875, -9.5439453125, -8.869140625, -8.1943359375, -7.51953125, -6.8447265625, -6.169921875, -5.4951171875, -4.8203125, -4.1455078125, -3.470703125, -2.7958984375, -2.12109375, -1.4462890625, -0.771484375, -0.0966796875, 0.578125, 1.2529296875, 1.927734375, 2.6025390625, 3.27734375, 3.9521484375, 4.626953125, 5.3017578125, 5.9765625, 6.6513671875, 7.326171875, 8.0009765625, 8.67578125, 9.3505859375, 10.025390625, 10.7001953125, 11.375, 12.0498046875, 12.724609375, 13.3994140625, 14.07421875, 14.7490234375, 15.423828125, 16.0986328125, 16.7734375, 17.4482421875, 18.123046875, 18.7978515625, 19.47265625, 20.1474609375, 20.822265625, 21.4970703125, 22.171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 13.0, 15.0, 25.0, 23.0, 37.0, 56.0, 67.0, 93.0, 142.0, 203.0, 287.0, 398.0, 551.0, 904.0, 1423.0, 2437.0, 4274.0, 7844.0, 14821.0, 29334.0, 58372.0, 115865.0, 200701.0, 239413.0, 174626.0, 96168.0, 48052.0, 24173.0, 12247.0, 6557.0, 3614.0, 1996.0, 1298.0, 773.0, 521.0, 362.0, 251.0, 175.0, 104.0, 79.0, 60.0, 48.0, 41.0, 27.0, 19.0, 11.0, 16.0, 6.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.125, -19.439453125, -18.75390625, -18.068359375, -17.3828125, -16.697265625, -16.01171875, -15.326171875, -14.640625, -13.955078125, -13.26953125, -12.583984375, -11.8984375, -11.212890625, -10.52734375, -9.841796875, -9.15625, -8.470703125, -7.78515625, -7.099609375, -6.4140625, -5.728515625, -5.04296875, -4.357421875, -3.671875, -2.986328125, -2.30078125, -1.615234375, -0.9296875, -0.244140625, 0.44140625, 1.126953125, 1.8125, 2.498046875, 3.18359375, 3.869140625, 4.5546875, 5.240234375, 5.92578125, 6.611328125, 7.296875, 7.982421875, 8.66796875, 9.353515625, 10.0390625, 10.724609375, 11.41015625, 12.095703125, 12.78125, 13.466796875, 14.15234375, 14.837890625, 15.5234375, 16.208984375, 16.89453125, 17.580078125, 18.265625, 18.951171875, 19.63671875, 20.322265625, 21.0078125, 21.693359375, 22.37890625, 23.064453125, 23.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 8.0, 4.0, 5.0, 10.0, 14.0, 23.0, 32.0, 33.0, 44.0, 57.0, 69.0, 74.0, 85.0, 96.0, 102.0, 74.0, 56.0, 53.0, 35.0, 39.0, 21.0, 20.0, 11.0, 13.0, 9.0, 6.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00250244140625, -0.002427995204925537, -0.0023535490036010742, -0.0022791028022766113, -0.0022046566009521484, -0.0021302103996276855, -0.0020557641983032227, -0.0019813179969787598, -0.0019068717956542969, -0.001832425594329834, -0.001757979393005371, -0.0016835331916809082, -0.0016090869903564453, -0.0015346407890319824, -0.0014601945877075195, -0.0013857483863830566, -0.0013113021850585938, -0.0012368559837341309, -0.001162409782409668, -0.001087963581085205, -0.0010135173797607422, -0.0009390711784362793, -0.0008646249771118164, -0.0007901787757873535, -0.0007157325744628906, -0.0006412863731384277, -0.0005668401718139648, -0.000492393970489502, -0.00041794776916503906, -0.00034350156784057617, -0.0002690553665161133, -0.0001946091651916504, -0.0001201629638671875, -4.571676254272461e-05, 2.872943878173828e-05, 0.00010317564010620117, 0.00017762184143066406, 0.00025206804275512695, 0.00032651424407958984, 0.00040096044540405273, 0.0004754066467285156, 0.0005498528480529785, 0.0006242990493774414, 0.0006987452507019043, 0.0007731914520263672, 0.0008476376533508301, 0.000922083854675293, 0.0009965300559997559, 0.0010709762573242188, 0.0011454224586486816, 0.0012198686599731445, 0.0012943148612976074, 0.0013687610626220703, 0.0014432072639465332, 0.001517653465270996, 0.001592099666595459, 0.0016665458679199219, 0.0017409920692443848, 0.0018154382705688477, 0.0018898844718933105, 0.0019643306732177734, 0.0020387768745422363, 0.0021132230758666992, 0.002187669277191162, 0.002262115478515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 14.0, 19.0, 28.0, 46.0, 65.0, 84.0, 113.0, 174.0, 287.0, 430.0, 605.0, 1073.0, 1685.0, 2829.0, 4808.0, 8253.0, 14270.0, 24852.0, 43785.0, 74731.0, 118791.0, 162882.0, 178708.0, 151719.0, 105307.0, 64421.0, 37140.0, 21447.0, 12185.0, 7008.0, 4104.0, 2490.0, 1458.0, 950.0, 602.0, 423.0, 242.0, 171.0, 120.0, 72.0, 53.0, 27.0, 21.0, 14.0, 9.0, 12.0, 3.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.546875, -15.06640625, -14.5859375, -14.10546875, -13.625, -13.14453125, -12.6640625, -12.18359375, -11.703125, -11.22265625, -10.7421875, -10.26171875, -9.78125, -9.30078125, -8.8203125, -8.33984375, -7.859375, -7.37890625, -6.8984375, -6.41796875, -5.9375, -5.45703125, -4.9765625, -4.49609375, -4.015625, -3.53515625, -3.0546875, -2.57421875, -2.09375, -1.61328125, -1.1328125, -0.65234375, -0.171875, 0.30859375, 0.7890625, 1.26953125, 1.75, 2.23046875, 2.7109375, 3.19140625, 3.671875, 4.15234375, 4.6328125, 5.11328125, 5.59375, 6.07421875, 6.5546875, 7.03515625, 7.515625, 7.99609375, 8.4765625, 8.95703125, 9.4375, 9.91796875, 10.3984375, 10.87890625, 11.359375, 11.83984375, 12.3203125, 12.80078125, 13.28125, 13.76171875, 14.2421875, 14.72265625, 15.203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 6.0, 11.0, 9.0, 20.0, 28.0, 38.0, 43.0, 55.0, 78.0, 61.0, 88.0, 85.0, 68.0, 83.0, 76.0, 61.0, 42.0, 30.0, 29.0, 22.0, 17.0, 9.0, 8.0, 2.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.280517578125, -8.94384765625, -8.607177734375, -8.2705078125, -7.933837890625, -7.59716796875, -7.260498046875, -6.923828125, -6.587158203125, -6.25048828125, -5.913818359375, -5.5771484375, -5.240478515625, -4.90380859375, -4.567138671875, -4.23046875, -3.893798828125, -3.55712890625, -3.220458984375, -2.8837890625, -2.547119140625, -2.21044921875, -1.873779296875, -1.537109375, -1.200439453125, -0.86376953125, -0.527099609375, -0.1904296875, 0.146240234375, 0.48291015625, 0.819580078125, 1.15625, 1.492919921875, 1.82958984375, 2.166259765625, 2.5029296875, 2.839599609375, 3.17626953125, 3.512939453125, 3.849609375, 4.186279296875, 4.52294921875, 4.859619140625, 5.1962890625, 5.532958984375, 5.86962890625, 6.206298828125, 6.54296875, 6.879638671875, 7.21630859375, 7.552978515625, 7.8896484375, 8.226318359375, 8.56298828125, 8.899658203125, 9.236328125, 9.572998046875, 9.90966796875, 10.246337890625, 10.5830078125, 10.919677734375, 11.25634765625, 11.593017578125, 11.9296875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 2.0, 12.0, 14.0, 17.0, 18.0, 32.0, 20.0, 35.0, 37.0, 39.0, 42.0, 59.0, 50.0, 40.0, 53.0, 44.0, 48.0, 59.0, 39.0, 52.0, 46.0, 42.0, 29.0, 31.0, 26.0, 12.0, 19.0, 14.0, 11.0, 8.0, 6.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 5.0], "bins": [-32.30500793457031, -31.516483306884766, -30.727956771850586, -29.93943214416504, -29.150907516479492, -28.362380981445312, -27.573856353759766, -26.78533172607422, -25.996807098388672, -25.208282470703125, -24.419755935668945, -23.6312313079834, -22.84270668029785, -22.054180145263672, -21.265655517578125, -20.477130889892578, -19.6886043548584, -18.90007972717285, -18.111553192138672, -17.323028564453125, -16.534503936767578, -15.745978355407715, -14.957452774047852, -14.168928146362305, -13.380402565002441, -12.591876983642578, -11.803352355957031, -11.014826774597168, -10.226301193237305, -9.437776565551758, -8.649250984191895, -7.8607258796691895, -7.072198867797852, -6.2836737632751465, -5.495148658752441, -4.706623077392578, -3.918097972869873, -3.129572868347168, -2.3410472869873047, -1.5525221824645996, -0.7639970779418945, 0.024528145790100098, 0.8130533695220947, 1.601578712463379, 2.390103816986084, 3.178628921508789, 3.9671545028686523, 4.755679607391357, 5.5442047119140625, 6.332729816436768, 7.121254920959473, 7.909780502319336, 8.698305130004883, 9.486830711364746, 10.27535629272461, 11.063880920410156, 11.85240650177002, 12.640932083129883, 13.42945671081543, 14.217982292175293, 15.006507873535156, 15.795032501220703, 16.58355712890625, 17.37208366394043, 18.160608291625977]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 2.0, 7.0, 4.0, 5.0, 4.0, 12.0, 10.0, 7.0, 14.0, 24.0, 19.0, 20.0, 31.0, 36.0, 30.0, 33.0, 23.0, 29.0, 37.0, 33.0, 40.0, 34.0, 38.0, 33.0, 45.0, 38.0, 43.0, 28.0, 42.0, 34.0, 23.0, 40.0, 28.0, 27.0, 28.0, 18.0, 15.0, 7.0, 13.0, 9.0, 6.0, 7.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.205394744873047, -24.30290985107422, -23.40042495727539, -22.49793815612793, -21.5954532623291, -20.692968368530273, -19.790481567382812, -18.887996673583984, -17.985511779785156, -17.083026885986328, -16.1805419921875, -15.278055191040039, -14.375570297241211, -13.473085403442383, -12.570599555969238, -11.668113708496094, -10.765628814697266, -9.863143920898438, -8.960658073425293, -8.058172225952148, -7.15568733215332, -6.253201961517334, -5.350716590881348, -4.448231220245361, -3.545745849609375, -2.6432604789733887, -1.7407751083374023, -0.838289737701416, 0.06419563293457031, 0.9666810035705566, 1.869166374206543, 2.7716517448425293, 3.6741371154785156, 4.576622486114502, 5.479107856750488, 6.381593227386475, 7.284078598022461, 8.186563491821289, 9.089049339294434, 9.991535186767578, 10.894020080566406, 11.796504974365234, 12.698990821838379, 13.601476669311523, 14.503961563110352, 15.40644645690918, 16.30893325805664, 17.21141815185547, 18.113903045654297, 19.016387939453125, 19.918872833251953, 20.821359634399414, 21.723844528198242, 22.62632942199707, 23.52881622314453, 24.43130111694336, 25.333786010742188, 26.236270904541016, 27.138755798339844, 28.041242599487305, 28.943727493286133, 29.84621238708496, 30.748699188232422, 31.65118408203125, 32.55366897583008]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 14.0, 34.0, 47.0, 57.0, 103.0, 164.0, 238.0, 368.0, 601.0, 1012.0, 1526.0, 2387.0, 3973.0, 6604.0, 10788.0, 18430.0, 31089.0, 53124.0, 90123.0, 150711.0, 244683.0, 369966.0, 506163.0, 598654.0, 598541.0, 507836.0, 374785.0, 248451.0, 152631.0, 91274.0, 53119.0, 31002.0, 18114.0, 10943.0, 6392.0, 4002.0, 2356.0, 1415.0, 879.0, 618.0, 338.0, 243.0, 172.0, 106.0, 62.0, 51.0, 30.0, 17.0, 12.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-17.6875, -17.1171875, -16.546875, -15.9765625, -15.40625, -14.8359375, -14.265625, -13.6953125, -13.125, -12.5546875, -11.984375, -11.4140625, -10.84375, -10.2734375, -9.703125, -9.1328125, -8.5625, -7.9921875, -7.421875, -6.8515625, -6.28125, -5.7109375, -5.140625, -4.5703125, -4.0, -3.4296875, -2.859375, -2.2890625, -1.71875, -1.1484375, -0.578125, -0.0078125, 0.5625, 1.1328125, 1.703125, 2.2734375, 2.84375, 3.4140625, 3.984375, 4.5546875, 5.125, 5.6953125, 6.265625, 6.8359375, 7.40625, 7.9765625, 8.546875, 9.1171875, 9.6875, 10.2578125, 10.828125, 11.3984375, 11.96875, 12.5390625, 13.109375, 13.6796875, 14.25, 14.8203125, 15.390625, 15.9609375, 16.53125, 17.1015625, 17.671875, 18.2421875, 18.8125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 4.0, 9.0, 5.0, 6.0, 9.0, 12.0, 9.0, 12.0, 19.0, 23.0, 29.0, 21.0, 34.0, 32.0, 24.0, 24.0, 38.0, 28.0, 37.0, 34.0, 32.0, 39.0, 39.0, 34.0, 38.0, 38.0, 40.0, 42.0, 23.0, 28.0, 34.0, 33.0, 33.0, 26.0, 18.0, 18.0, 12.0, 7.0, 8.0, 4.0, 7.0, 10.0, 4.0, 8.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.46875, -18.78173828125, -18.0947265625, -17.40771484375, -16.720703125, -16.03369140625, -15.3466796875, -14.65966796875, -13.97265625, -13.28564453125, -12.5986328125, -11.91162109375, -11.224609375, -10.53759765625, -9.8505859375, -9.16357421875, -8.4765625, -7.78955078125, -7.1025390625, -6.41552734375, -5.728515625, -5.04150390625, -4.3544921875, -3.66748046875, -2.98046875, -2.29345703125, -1.6064453125, -0.91943359375, -0.232421875, 0.45458984375, 1.1416015625, 1.82861328125, 2.515625, 3.20263671875, 3.8896484375, 4.57666015625, 5.263671875, 5.95068359375, 6.6376953125, 7.32470703125, 8.01171875, 8.69873046875, 9.3857421875, 10.07275390625, 10.759765625, 11.44677734375, 12.1337890625, 12.82080078125, 13.5078125, 14.19482421875, 14.8818359375, 15.56884765625, 16.255859375, 16.94287109375, 17.6298828125, 18.31689453125, 19.00390625, 19.69091796875, 20.3779296875, 21.06494140625, 21.751953125, 22.43896484375, 23.1259765625, 23.81298828125, 24.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 5.0, 6.0, 14.0, 14.0, 37.0, 47.0, 61.0, 89.0, 159.0, 188.0, 324.0, 523.0, 852.0, 1225.0, 2020.0, 3090.0, 4594.0, 7431.0, 11670.0, 18027.0, 28873.0, 44529.0, 68998.0, 105704.0, 157994.0, 226122.0, 308528.0, 395126.0, 463484.0, 490183.0, 462684.0, 396481.0, 309245.0, 226935.0, 159234.0, 105779.0, 69526.0, 45354.0, 28496.0, 18504.0, 11735.0, 7391.0, 4671.0, 2971.0, 1887.0, 1248.0, 813.0, 510.0, 329.0, 195.0, 146.0, 83.0, 62.0, 38.0, 22.0, 10.0, 12.0, 5.0, 8.0, 1.0, 4.0], "bins": [-16.59375, -16.083251953125, -15.57275390625, -15.062255859375, -14.5517578125, -14.041259765625, -13.53076171875, -13.020263671875, -12.509765625, -11.999267578125, -11.48876953125, -10.978271484375, -10.4677734375, -9.957275390625, -9.44677734375, -8.936279296875, -8.42578125, -7.915283203125, -7.40478515625, -6.894287109375, -6.3837890625, -5.873291015625, -5.36279296875, -4.852294921875, -4.341796875, -3.831298828125, -3.32080078125, -2.810302734375, -2.2998046875, -1.789306640625, -1.27880859375, -0.768310546875, -0.2578125, 0.252685546875, 0.76318359375, 1.273681640625, 1.7841796875, 2.294677734375, 2.80517578125, 3.315673828125, 3.826171875, 4.336669921875, 4.84716796875, 5.357666015625, 5.8681640625, 6.378662109375, 6.88916015625, 7.399658203125, 7.91015625, 8.420654296875, 8.93115234375, 9.441650390625, 9.9521484375, 10.462646484375, 10.97314453125, 11.483642578125, 11.994140625, 12.504638671875, 13.01513671875, 13.525634765625, 14.0361328125, 14.546630859375, 15.05712890625, 15.567626953125, 16.078125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 11.0, 14.0, 20.0, 19.0, 22.0, 35.0, 48.0, 28.0, 64.0, 89.0, 106.0, 123.0, 132.0, 135.0, 163.0, 197.0, 182.0, 227.0, 175.0, 217.0, 245.0, 237.0, 208.0, 207.0, 170.0, 146.0, 145.0, 127.0, 92.0, 85.0, 77.0, 64.0, 53.0, 45.0, 35.0, 31.0, 21.0, 23.0, 13.0, 15.0, 12.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.2093505859375, -8.903076171875, -8.5968017578125, -8.29052734375, -7.9842529296875, -7.677978515625, -7.3717041015625, -7.0654296875, -6.7591552734375, -6.452880859375, -6.1466064453125, -5.84033203125, -5.5340576171875, -5.227783203125, -4.9215087890625, -4.615234375, -4.3089599609375, -4.002685546875, -3.6964111328125, -3.39013671875, -3.0838623046875, -2.777587890625, -2.4713134765625, -2.1650390625, -1.8587646484375, -1.552490234375, -1.2462158203125, -0.93994140625, -0.6336669921875, -0.327392578125, -0.0211181640625, 0.28515625, 0.5914306640625, 0.897705078125, 1.2039794921875, 1.51025390625, 1.8165283203125, 2.122802734375, 2.4290771484375, 2.7353515625, 3.0416259765625, 3.347900390625, 3.6541748046875, 3.96044921875, 4.2667236328125, 4.572998046875, 4.8792724609375, 5.185546875, 5.4918212890625, 5.798095703125, 6.1043701171875, 6.41064453125, 6.7169189453125, 7.023193359375, 7.3294677734375, 7.6357421875, 7.9420166015625, 8.248291015625, 8.5545654296875, 8.86083984375, 9.1671142578125, 9.473388671875, 9.7796630859375, 10.0859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 15.0, 9.0, 15.0, 19.0, 17.0, 27.0, 25.0, 35.0, 36.0, 31.0, 37.0, 43.0, 47.0, 39.0, 43.0, 54.0, 48.0, 48.0, 55.0, 51.0, 45.0, 34.0, 23.0, 29.0, 25.0, 20.0, 26.0, 10.0, 10.0, 12.0, 7.0, 9.0, 7.0, 8.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.60715103149414, -23.904407501220703, -23.201663970947266, -22.498920440673828, -21.79617691040039, -21.093433380126953, -20.390689849853516, -19.687946319580078, -18.98520278930664, -18.282459259033203, -17.579715728759766, -16.876972198486328, -16.17422866821289, -15.471485137939453, -14.768741607666016, -14.065998077392578, -13.36325454711914, -12.660511016845703, -11.957767486572266, -11.255023956298828, -10.55228042602539, -9.849536895751953, -9.146793365478516, -8.444049835205078, -7.741306304931641, -7.038562774658203, -6.335819244384766, -5.633075714111328, -4.930332183837891, -4.227588653564453, -3.5248451232910156, -2.822101593017578, -2.119356155395508, -1.4166126251220703, -0.7138690948486328, -0.011125564575195312, 0.6916179656982422, 1.3943614959716797, 2.097105026245117, 2.7998485565185547, 3.502592086791992, 4.20533561706543, 4.908079147338867, 5.610822677612305, 6.313566207885742, 7.01630973815918, 7.719053268432617, 8.421796798706055, 9.124540328979492, 9.82728385925293, 10.530027389526367, 11.232770919799805, 11.935514450073242, 12.63825798034668, 13.341001510620117, 14.043745040893555, 14.746488571166992, 15.44923210144043, 16.151975631713867, 16.854719161987305, 17.557462692260742, 18.26020622253418, 18.962949752807617, 19.665693283081055, 20.368436813354492]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 10.0, 16.0, 10.0, 13.0, 15.0, 28.0, 23.0, 18.0, 27.0, 29.0, 29.0, 29.0, 34.0, 27.0, 37.0, 34.0, 31.0, 40.0, 51.0, 44.0, 48.0, 39.0, 39.0, 30.0, 38.0, 40.0, 31.0, 25.0, 11.0, 22.0, 19.0, 20.0, 17.0, 11.0, 8.0, 6.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.19291114807129, -25.311534881591797, -24.430158615112305, -23.54878044128418, -22.667404174804688, -21.786027908325195, -20.904651641845703, -20.023273468017578, -19.141897201538086, -18.260520935058594, -17.3791446685791, -16.497766494750977, -15.616390228271484, -14.735013961791992, -13.8536376953125, -12.972260475158691, -12.0908842086792, -11.209507942199707, -10.328130722045898, -9.446754455566406, -8.565377235412598, -7.6840009689331055, -6.802624225616455, -5.921247482299805, -5.039870738983154, -4.158493995666504, -3.2771172523498535, -2.3957407474517822, -1.5143640041351318, -0.6329874992370605, 0.24838924407958984, 1.1297659873962402, 2.0111427307128906, 2.892519474029541, 3.7738962173461914, 4.655272483825684, 5.536649703979492, 6.418025970458984, 7.299402713775635, 8.180779457092285, 9.062156677246094, 9.943532943725586, 10.824910163879395, 11.706286430358887, 12.587663650512695, 13.469039916992188, 14.35041618347168, 15.231793403625488, 16.113170623779297, 16.99454689025879, 17.87592315673828, 18.757301330566406, 19.6386775970459, 20.52005386352539, 21.401430130004883, 22.282806396484375, 23.164182662963867, 24.04555892944336, 24.92693519592285, 25.808313369750977, 26.68968963623047, 27.57106590270996, 28.452442169189453, 29.333820343017578, 30.21519660949707]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 16.0, 25.0, 35.0, 60.0, 81.0, 114.0, 149.0, 222.0, 331.0, 513.0, 732.0, 1132.0, 1706.0, 2603.0, 4090.0, 6378.0, 10305.0, 16526.0, 26816.0, 42939.0, 70304.0, 108693.0, 153279.0, 174713.0, 148326.0, 103687.0, 65836.0, 40887.0, 25210.0, 15629.0, 9957.0, 6150.0, 3779.0, 2472.0, 1629.0, 1018.0, 692.0, 483.0, 328.0, 210.0, 154.0, 96.0, 76.0, 57.0, 28.0, 22.0, 19.0, 23.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-17.828125, -17.278564453125, -16.72900390625, -16.179443359375, -15.6298828125, -15.080322265625, -14.53076171875, -13.981201171875, -13.431640625, -12.882080078125, -12.33251953125, -11.782958984375, -11.2333984375, -10.683837890625, -10.13427734375, -9.584716796875, -9.03515625, -8.485595703125, -7.93603515625, -7.386474609375, -6.8369140625, -6.287353515625, -5.73779296875, -5.188232421875, -4.638671875, -4.089111328125, -3.53955078125, -2.989990234375, -2.4404296875, -1.890869140625, -1.34130859375, -0.791748046875, -0.2421875, 0.307373046875, 0.85693359375, 1.406494140625, 1.9560546875, 2.505615234375, 3.05517578125, 3.604736328125, 4.154296875, 4.703857421875, 5.25341796875, 5.802978515625, 6.3525390625, 6.902099609375, 7.45166015625, 8.001220703125, 8.55078125, 9.100341796875, 9.64990234375, 10.199462890625, 10.7490234375, 11.298583984375, 11.84814453125, 12.397705078125, 12.947265625, 13.496826171875, 14.04638671875, 14.595947265625, 15.1455078125, 15.695068359375, 16.24462890625, 16.794189453125, 17.34375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 10.0, 14.0, 6.0, 17.0, 13.0, 21.0, 25.0, 27.0, 32.0, 22.0, 29.0, 31.0, 36.0, 39.0, 33.0, 35.0, 46.0, 48.0, 50.0, 51.0, 34.0, 32.0, 41.0, 32.0, 36.0, 36.0, 31.0, 21.0, 20.0, 23.0, 14.0, 18.0, 9.0, 9.0, 11.0, 3.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.875, -25.9609375, -25.046875, -24.1328125, -23.21875, -22.3046875, -21.390625, -20.4765625, -19.5625, -18.6484375, -17.734375, -16.8203125, -15.90625, -14.9921875, -14.078125, -13.1640625, -12.25, -11.3359375, -10.421875, -9.5078125, -8.59375, -7.6796875, -6.765625, -5.8515625, -4.9375, -4.0234375, -3.109375, -2.1953125, -1.28125, -0.3671875, 0.546875, 1.4609375, 2.375, 3.2890625, 4.203125, 5.1171875, 6.03125, 6.9453125, 7.859375, 8.7734375, 9.6875, 10.6015625, 11.515625, 12.4296875, 13.34375, 14.2578125, 15.171875, 16.0859375, 17.0, 17.9140625, 18.828125, 19.7421875, 20.65625, 21.5703125, 22.484375, 23.3984375, 24.3125, 25.2265625, 26.140625, 27.0546875, 27.96875, 28.8828125, 29.796875, 30.7109375, 31.625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 19.0, 30.0, 47.0, 67.0, 93.0, 106.0, 194.0, 262.0, 387.0, 610.0, 946.0, 1503.0, 2228.0, 3578.0, 5673.0, 9014.0, 14482.0, 24076.0, 39938.0, 68235.0, 114405.0, 174177.0, 198581.0, 152698.0, 94766.0, 56307.0, 33066.0, 19813.0, 12109.0, 7640.0, 4704.0, 3082.0, 1951.0, 1293.0, 827.0, 534.0, 404.0, 242.0, 147.0, 106.0, 68.0, 38.0, 31.0, 17.0, 18.0, 7.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-20.25, -19.64208984375, -19.0341796875, -18.42626953125, -17.818359375, -17.21044921875, -16.6025390625, -15.99462890625, -15.38671875, -14.77880859375, -14.1708984375, -13.56298828125, -12.955078125, -12.34716796875, -11.7392578125, -11.13134765625, -10.5234375, -9.91552734375, -9.3076171875, -8.69970703125, -8.091796875, -7.48388671875, -6.8759765625, -6.26806640625, -5.66015625, -5.05224609375, -4.4443359375, -3.83642578125, -3.228515625, -2.62060546875, -2.0126953125, -1.40478515625, -0.796875, -0.18896484375, 0.4189453125, 1.02685546875, 1.634765625, 2.24267578125, 2.8505859375, 3.45849609375, 4.06640625, 4.67431640625, 5.2822265625, 5.89013671875, 6.498046875, 7.10595703125, 7.7138671875, 8.32177734375, 8.9296875, 9.53759765625, 10.1455078125, 10.75341796875, 11.361328125, 11.96923828125, 12.5771484375, 13.18505859375, 13.79296875, 14.40087890625, 15.0087890625, 15.61669921875, 16.224609375, 16.83251953125, 17.4404296875, 18.04833984375, 18.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 3.0, 2.0, 5.0, 13.0, 15.0, 15.0, 19.0, 23.0, 22.0, 20.0, 22.0, 26.0, 22.0, 22.0, 39.0, 39.0, 27.0, 42.0, 44.0, 30.0, 50.0, 38.0, 36.0, 30.0, 30.0, 33.0, 31.0, 28.0, 19.0, 26.0, 24.0, 28.0, 27.0, 20.0, 18.0, 21.0, 12.0, 19.0, 10.0, 5.0, 9.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-17.65625, -17.11669921875, -16.5771484375, -16.03759765625, -15.498046875, -14.95849609375, -14.4189453125, -13.87939453125, -13.33984375, -12.80029296875, -12.2607421875, -11.72119140625, -11.181640625, -10.64208984375, -10.1025390625, -9.56298828125, -9.0234375, -8.48388671875, -7.9443359375, -7.40478515625, -6.865234375, -6.32568359375, -5.7861328125, -5.24658203125, -4.70703125, -4.16748046875, -3.6279296875, -3.08837890625, -2.548828125, -2.00927734375, -1.4697265625, -0.93017578125, -0.390625, 0.14892578125, 0.6884765625, 1.22802734375, 1.767578125, 2.30712890625, 2.8466796875, 3.38623046875, 3.92578125, 4.46533203125, 5.0048828125, 5.54443359375, 6.083984375, 6.62353515625, 7.1630859375, 7.70263671875, 8.2421875, 8.78173828125, 9.3212890625, 9.86083984375, 10.400390625, 10.93994140625, 11.4794921875, 12.01904296875, 12.55859375, 13.09814453125, 13.6376953125, 14.17724609375, 14.716796875, 15.25634765625, 15.7958984375, 16.33544921875, 16.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 18.0, 13.0, 16.0, 37.0, 46.0, 70.0, 95.0, 118.0, 166.0, 246.0, 340.0, 485.0, 736.0, 1118.0, 1760.0, 2606.0, 4044.0, 6386.0, 10644.0, 17462.0, 30885.0, 56423.0, 108053.0, 199440.0, 248642.0, 163915.0, 85484.0, 45168.0, 25309.0, 14582.0, 8749.0, 5399.0, 3414.0, 2205.0, 1508.0, 920.0, 611.0, 444.0, 308.0, 189.0, 142.0, 101.0, 75.0, 54.0, 36.0, 22.0, 17.0, 19.0, 9.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.5703125, -9.2647705078125, -8.959228515625, -8.6536865234375, -8.34814453125, -8.0426025390625, -7.737060546875, -7.4315185546875, -7.1259765625, -6.8204345703125, -6.514892578125, -6.2093505859375, -5.90380859375, -5.5982666015625, -5.292724609375, -4.9871826171875, -4.681640625, -4.3760986328125, -4.070556640625, -3.7650146484375, -3.45947265625, -3.1539306640625, -2.848388671875, -2.5428466796875, -2.2373046875, -1.9317626953125, -1.626220703125, -1.3206787109375, -1.01513671875, -0.7095947265625, -0.404052734375, -0.0985107421875, 0.20703125, 0.5125732421875, 0.818115234375, 1.1236572265625, 1.42919921875, 1.7347412109375, 2.040283203125, 2.3458251953125, 2.6513671875, 2.9569091796875, 3.262451171875, 3.5679931640625, 3.87353515625, 4.1790771484375, 4.484619140625, 4.7901611328125, 5.095703125, 5.4012451171875, 5.706787109375, 6.0123291015625, 6.31787109375, 6.6234130859375, 6.928955078125, 7.2344970703125, 7.5400390625, 7.8455810546875, 8.151123046875, 8.4566650390625, 8.76220703125, 9.0677490234375, 9.373291015625, 9.6788330078125, 9.984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 7.0, 21.0, 20.0, 24.0, 31.0, 72.0, 109.0, 135.0, 182.0, 131.0, 96.0, 58.0, 28.0, 19.0, 10.0, 11.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014295578002929688, -0.0013772249221801758, -0.0013248920440673828, -0.0012725591659545898, -0.0012202262878417969, -0.001167893409729004, -0.001115560531616211, -0.001063227653503418, -0.001010894775390625, -0.000958561897277832, -0.0009062290191650391, -0.0008538961410522461, -0.0008015632629394531, -0.0007492303848266602, -0.0006968975067138672, -0.0006445646286010742, -0.0005922317504882812, -0.0005398988723754883, -0.0004875659942626953, -0.00043523311614990234, -0.0003829002380371094, -0.0003305673599243164, -0.00027823448181152344, -0.00022590160369873047, -0.0001735687255859375, -0.00012123584747314453, -6.890296936035156e-05, -1.6570091247558594e-05, 3.5762786865234375e-05, 8.809566497802734e-05, 0.0001404285430908203, 0.00019276142120361328, 0.00024509429931640625, 0.0002974271774291992, 0.0003497600555419922, 0.00040209293365478516, 0.0004544258117675781, 0.0005067586898803711, 0.0005590915679931641, 0.000611424446105957, 0.00066375732421875, 0.000716090202331543, 0.0007684230804443359, 0.0008207559585571289, 0.0008730888366699219, 0.0009254217147827148, 0.0009777545928955078, 0.0010300874710083008, 0.0010824203491210938, 0.0011347532272338867, 0.0011870861053466797, 0.0012394189834594727, 0.0012917518615722656, 0.0013440847396850586, 0.0013964176177978516, 0.0014487504959106445, 0.0015010833740234375, 0.0015534162521362305, 0.0016057491302490234, 0.0016580820083618164, 0.0017104148864746094, 0.0017627477645874023, 0.0018150806427001953, 0.0018674135208129883, 0.0019197463989257812]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 12.0, 9.0, 14.0, 32.0, 43.0, 60.0, 90.0, 205.0, 287.0, 436.0, 690.0, 996.0, 1615.0, 2496.0, 3930.0, 6003.0, 9401.0, 14683.0, 23275.0, 36741.0, 57589.0, 89971.0, 133555.0, 167673.0, 160394.0, 120435.0, 79594.0, 50605.0, 31585.0, 20230.0, 12859.0, 8162.0, 5274.0, 3448.0, 2172.0, 1419.0, 906.0, 649.0, 386.0, 238.0, 134.0, 99.0, 60.0, 39.0, 31.0, 11.0, 7.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.91455078125, -7.6494140625, -7.38427734375, -7.119140625, -6.85400390625, -6.5888671875, -6.32373046875, -6.05859375, -5.79345703125, -5.5283203125, -5.26318359375, -4.998046875, -4.73291015625, -4.4677734375, -4.20263671875, -3.9375, -3.67236328125, -3.4072265625, -3.14208984375, -2.876953125, -2.61181640625, -2.3466796875, -2.08154296875, -1.81640625, -1.55126953125, -1.2861328125, -1.02099609375, -0.755859375, -0.49072265625, -0.2255859375, 0.03955078125, 0.3046875, 0.56982421875, 0.8349609375, 1.10009765625, 1.365234375, 1.63037109375, 1.8955078125, 2.16064453125, 2.42578125, 2.69091796875, 2.9560546875, 3.22119140625, 3.486328125, 3.75146484375, 4.0166015625, 4.28173828125, 4.546875, 4.81201171875, 5.0771484375, 5.34228515625, 5.607421875, 5.87255859375, 6.1376953125, 6.40283203125, 6.66796875, 6.93310546875, 7.1982421875, 7.46337890625, 7.728515625, 7.99365234375, 8.2587890625, 8.52392578125, 8.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 3.0, 3.0, 5.0, 9.0, 5.0, 15.0, 12.0, 10.0, 16.0, 20.0, 25.0, 21.0, 33.0, 43.0, 59.0, 49.0, 59.0, 71.0, 54.0, 61.0, 65.0, 45.0, 62.0, 41.0, 35.0, 21.0, 29.0, 17.0, 21.0, 14.0, 7.0, 13.0, 10.0, 16.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.74609375, -3.628570556640625, -3.51104736328125, -3.393524169921875, -3.2760009765625, -3.158477783203125, -3.04095458984375, -2.923431396484375, -2.805908203125, -2.688385009765625, -2.57086181640625, -2.453338623046875, -2.3358154296875, -2.218292236328125, -2.10076904296875, -1.983245849609375, -1.86572265625, -1.748199462890625, -1.63067626953125, -1.513153076171875, -1.3956298828125, -1.278106689453125, -1.16058349609375, -1.043060302734375, -0.925537109375, -0.808013916015625, -0.69049072265625, -0.572967529296875, -0.4554443359375, -0.337921142578125, -0.22039794921875, -0.102874755859375, 0.0146484375, 0.132171630859375, 0.24969482421875, 0.367218017578125, 0.4847412109375, 0.602264404296875, 0.71978759765625, 0.837310791015625, 0.954833984375, 1.072357177734375, 1.18988037109375, 1.307403564453125, 1.4249267578125, 1.542449951171875, 1.65997314453125, 1.777496337890625, 1.89501953125, 2.012542724609375, 2.13006591796875, 2.247589111328125, 2.3651123046875, 2.482635498046875, 2.60015869140625, 2.717681884765625, 2.835205078125, 2.952728271484375, 3.07025146484375, 3.187774658203125, 3.3052978515625, 3.422821044921875, 3.54034423828125, 3.657867431640625, 3.775390625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 7.0, 8.0, 11.0, 14.0, 19.0, 22.0, 24.0, 17.0, 27.0, 31.0, 22.0, 30.0, 40.0, 47.0, 46.0, 58.0, 46.0, 34.0, 55.0, 55.0, 49.0, 47.0, 43.0, 31.0, 26.0, 41.0, 23.0, 27.0, 14.0, 8.0, 15.0, 5.0, 7.0, 9.0, 10.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.748291015625, -23.056793212890625, -22.365293502807617, -21.67379379272461, -20.982295989990234, -20.29079818725586, -19.59929847717285, -18.907798767089844, -18.21630096435547, -17.524803161621094, -16.833303451538086, -16.141803741455078, -15.450305938720703, -14.758807182312012, -14.06730842590332, -13.375809669494629, -12.684310913085938, -11.992812156677246, -11.301313400268555, -10.609814643859863, -9.918315887451172, -9.22681713104248, -8.535318374633789, -7.843819618225098, -7.152320861816406, -6.460822105407715, -5.769323348999023, -5.077824592590332, -4.386325836181641, -3.694827079772949, -3.003328323364258, -2.3118295669555664, -1.620330810546875, -0.9288320541381836, -0.2373332977294922, 0.4541654586791992, 1.1456642150878906, 1.837162971496582, 2.5286617279052734, 3.220160484313965, 3.9116592407226562, 4.603157997131348, 5.294656753540039, 5.9861555099487305, 6.677654266357422, 7.369153022766113, 8.060651779174805, 8.752150535583496, 9.443649291992188, 10.135148048400879, 10.82664680480957, 11.518145561218262, 12.209644317626953, 12.901143074035645, 13.592641830444336, 14.284140586853027, 14.975639343261719, 15.66713809967041, 16.3586368560791, 17.05013656616211, 17.741634368896484, 18.43313217163086, 19.124631881713867, 19.816131591796875, 20.50762939453125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 14.0, 17.0, 13.0, 18.0, 12.0, 32.0, 23.0, 26.0, 21.0, 31.0, 26.0, 29.0, 43.0, 28.0, 38.0, 27.0, 36.0, 62.0, 39.0, 47.0, 45.0, 34.0, 35.0, 33.0, 43.0, 30.0, 22.0, 25.0, 17.0, 20.0, 23.0, 10.0, 12.0, 9.0, 8.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.028541564941406, -25.133867263793945, -24.239192962646484, -23.34451675415039, -22.44984245300293, -21.55516815185547, -20.660493850708008, -19.765819549560547, -18.871143341064453, -17.976469039916992, -17.08179473876953, -16.187118530273438, -15.292444229125977, -14.397769927978516, -13.503095626831055, -12.608420372009277, -11.713746070861816, -10.819071769714355, -9.924396514892578, -9.029722213745117, -8.13504695892334, -7.240372657775879, -6.34569787979126, -5.451023101806641, -4.5563483238220215, -3.6616735458374023, -2.766998767852783, -1.8723242282867432, -0.977649450302124, -0.08297491073608398, 0.8116998672485352, 1.7063746452331543, 2.6010494232177734, 3.4957242012023926, 4.390398979187012, 5.285073280334473, 6.17974853515625, 7.074422836303711, 7.96909761428833, 8.86377239227295, 9.758447647094727, 10.653121948242188, 11.547797203063965, 12.442471504211426, 13.337146759033203, 14.231821060180664, 15.126495361328125, 16.02117156982422, 16.915843963623047, 17.810518264770508, 18.70519256591797, 19.599868774414062, 20.494543075561523, 21.389217376708984, 22.283891677856445, 23.178565979003906, 24.0732421875, 24.96791648864746, 25.862590789794922, 26.757266998291016, 27.651941299438477, 28.546615600585938, 29.4412899017334, 30.33596420288086, 31.230640411376953]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 11.0, 25.0, 41.0, 52.0, 95.0, 132.0, 200.0, 316.0, 492.0, 756.0, 1158.0, 1733.0, 2616.0, 3991.0, 6040.0, 8907.0, 13242.0, 19252.0, 27370.0, 38099.0, 51118.0, 66181.0, 81243.0, 92243.0, 100360.0, 101183.0, 94545.0, 82923.0, 68301.0, 53250.0, 40316.0, 28949.0, 20423.0, 14267.0, 9785.0, 6430.0, 4270.0, 2787.0, 1905.0, 1199.0, 808.0, 497.0, 332.0, 251.0, 147.0, 101.0, 86.0, 49.0, 25.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-13.78125, -13.337890625, -12.89453125, -12.451171875, -12.0078125, -11.564453125, -11.12109375, -10.677734375, -10.234375, -9.791015625, -9.34765625, -8.904296875, -8.4609375, -8.017578125, -7.57421875, -7.130859375, -6.6875, -6.244140625, -5.80078125, -5.357421875, -4.9140625, -4.470703125, -4.02734375, -3.583984375, -3.140625, -2.697265625, -2.25390625, -1.810546875, -1.3671875, -0.923828125, -0.48046875, -0.037109375, 0.40625, 0.849609375, 1.29296875, 1.736328125, 2.1796875, 2.623046875, 3.06640625, 3.509765625, 3.953125, 4.396484375, 4.83984375, 5.283203125, 5.7265625, 6.169921875, 6.61328125, 7.056640625, 7.5, 7.943359375, 8.38671875, 8.830078125, 9.2734375, 9.716796875, 10.16015625, 10.603515625, 11.046875, 11.490234375, 11.93359375, 12.376953125, 12.8203125, 13.263671875, 13.70703125, 14.150390625, 14.59375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 23.0, 16.0, 23.0, 21.0, 18.0, 29.0, 32.0, 25.0, 27.0, 28.0, 31.0, 44.0, 34.0, 36.0, 38.0, 32.0, 46.0, 35.0, 51.0, 50.0, 35.0, 34.0, 33.0, 28.0, 27.0, 23.0, 23.0, 18.0, 15.0, 21.0, 16.0, 13.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.23681640625, -23.3486328125, -22.46044921875, -21.572265625, -20.68408203125, -19.7958984375, -18.90771484375, -18.01953125, -17.13134765625, -16.2431640625, -15.35498046875, -14.466796875, -13.57861328125, -12.6904296875, -11.80224609375, -10.9140625, -10.02587890625, -9.1376953125, -8.24951171875, -7.361328125, -6.47314453125, -5.5849609375, -4.69677734375, -3.80859375, -2.92041015625, -2.0322265625, -1.14404296875, -0.255859375, 0.63232421875, 1.5205078125, 2.40869140625, 3.296875, 4.18505859375, 5.0732421875, 5.96142578125, 6.849609375, 7.73779296875, 8.6259765625, 9.51416015625, 10.40234375, 11.29052734375, 12.1787109375, 13.06689453125, 13.955078125, 14.84326171875, 15.7314453125, 16.61962890625, 17.5078125, 18.39599609375, 19.2841796875, 20.17236328125, 21.060546875, 21.94873046875, 22.8369140625, 23.72509765625, 24.61328125, 25.50146484375, 26.3896484375, 27.27783203125, 28.166015625, 29.05419921875, 29.9423828125, 30.83056640625, 31.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 7.0, 7.0, 10.0, 21.0, 23.0, 43.0, 64.0, 84.0, 135.0, 242.0, 337.0, 561.0, 843.0, 1372.0, 2183.0, 3543.0, 5776.0, 9352.0, 14953.0, 24029.0, 37038.0, 56241.0, 80864.0, 105945.0, 126433.0, 133264.0, 122356.0, 101699.0, 75787.0, 52377.0, 34616.0, 22066.0, 13883.0, 8425.0, 5257.0, 3183.0, 2055.0, 1303.0, 817.0, 459.0, 322.0, 182.0, 124.0, 98.0, 62.0, 38.0, 36.0, 12.0, 15.0, 10.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.41162109375, -16.7763671875, -16.14111328125, -15.505859375, -14.87060546875, -14.2353515625, -13.60009765625, -12.96484375, -12.32958984375, -11.6943359375, -11.05908203125, -10.423828125, -9.78857421875, -9.1533203125, -8.51806640625, -7.8828125, -7.24755859375, -6.6123046875, -5.97705078125, -5.341796875, -4.70654296875, -4.0712890625, -3.43603515625, -2.80078125, -2.16552734375, -1.5302734375, -0.89501953125, -0.259765625, 0.37548828125, 1.0107421875, 1.64599609375, 2.28125, 2.91650390625, 3.5517578125, 4.18701171875, 4.822265625, 5.45751953125, 6.0927734375, 6.72802734375, 7.36328125, 7.99853515625, 8.6337890625, 9.26904296875, 9.904296875, 10.53955078125, 11.1748046875, 11.81005859375, 12.4453125, 13.08056640625, 13.7158203125, 14.35107421875, 14.986328125, 15.62158203125, 16.2568359375, 16.89208984375, 17.52734375, 18.16259765625, 18.7978515625, 19.43310546875, 20.068359375, 20.70361328125, 21.3388671875, 21.97412109375, 22.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 1.0, 8.0, 9.0, 9.0, 5.0, 17.0, 21.0, 22.0, 25.0, 29.0, 28.0, 21.0, 29.0, 33.0, 29.0, 41.0, 39.0, 39.0, 36.0, 54.0, 41.0, 44.0, 49.0, 31.0, 31.0, 36.0, 32.0, 30.0, 41.0, 23.0, 19.0, 17.0, 18.0, 24.0, 14.0, 15.0, 9.0, 7.0, 5.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.093994140625, -16.43798828125, -15.781982421875, -15.1259765625, -14.469970703125, -13.81396484375, -13.157958984375, -12.501953125, -11.845947265625, -11.18994140625, -10.533935546875, -9.8779296875, -9.221923828125, -8.56591796875, -7.909912109375, -7.25390625, -6.597900390625, -5.94189453125, -5.285888671875, -4.6298828125, -3.973876953125, -3.31787109375, -2.661865234375, -2.005859375, -1.349853515625, -0.69384765625, -0.037841796875, 0.6181640625, 1.274169921875, 1.93017578125, 2.586181640625, 3.2421875, 3.898193359375, 4.55419921875, 5.210205078125, 5.8662109375, 6.522216796875, 7.17822265625, 7.834228515625, 8.490234375, 9.146240234375, 9.80224609375, 10.458251953125, 11.1142578125, 11.770263671875, 12.42626953125, 13.082275390625, 13.73828125, 14.394287109375, 15.05029296875, 15.706298828125, 16.3623046875, 17.018310546875, 17.67431640625, 18.330322265625, 18.986328125, 19.642333984375, 20.29833984375, 20.954345703125, 21.6103515625, 22.266357421875, 22.92236328125, 23.578369140625, 24.234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 9.0, 6.0, 15.0, 13.0, 29.0, 36.0, 47.0, 69.0, 99.0, 159.0, 214.0, 349.0, 500.0, 779.0, 1380.0, 2047.0, 3404.0, 5782.0, 9679.0, 17402.0, 30250.0, 54933.0, 92629.0, 138973.0, 174858.0, 171150.0, 134679.0, 87971.0, 52099.0, 29230.0, 16318.0, 9385.0, 5471.0, 3169.0, 1934.0, 1232.0, 730.0, 530.0, 323.0, 212.0, 148.0, 90.0, 63.0, 42.0, 29.0, 33.0, 18.0, 12.0, 11.0, 4.0, 11.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.9375, -12.5325927734375, -12.127685546875, -11.7227783203125, -11.31787109375, -10.9129638671875, -10.508056640625, -10.1031494140625, -9.6982421875, -9.2933349609375, -8.888427734375, -8.4835205078125, -8.07861328125, -7.6737060546875, -7.268798828125, -6.8638916015625, -6.458984375, -6.0540771484375, -5.649169921875, -5.2442626953125, -4.83935546875, -4.4344482421875, -4.029541015625, -3.6246337890625, -3.2197265625, -2.8148193359375, -2.409912109375, -2.0050048828125, -1.60009765625, -1.1951904296875, -0.790283203125, -0.3853759765625, 0.01953125, 0.4244384765625, 0.829345703125, 1.2342529296875, 1.63916015625, 2.0440673828125, 2.448974609375, 2.8538818359375, 3.2587890625, 3.6636962890625, 4.068603515625, 4.4735107421875, 4.87841796875, 5.2833251953125, 5.688232421875, 6.0931396484375, 6.498046875, 6.9029541015625, 7.307861328125, 7.7127685546875, 8.11767578125, 8.5225830078125, 8.927490234375, 9.3323974609375, 9.7373046875, 10.1422119140625, 10.547119140625, 10.9520263671875, 11.35693359375, 11.7618408203125, 12.166748046875, 12.5716552734375, 12.9765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 7.0, 5.0, 8.0, 10.0, 10.0, 14.0, 12.0, 16.0, 13.0, 23.0, 22.0, 25.0, 27.0, 25.0, 38.0, 39.0, 45.0, 45.0, 33.0, 43.0, 53.0, 50.0, 42.0, 42.0, 47.0, 41.0, 28.0, 24.0, 23.0, 28.0, 30.0, 18.0, 15.0, 17.0, 13.0, 11.0, 9.0, 10.0, 5.0, 9.0, 1.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009455680847167969, -0.0009164810180664062, -0.0008873939514160156, -0.000858306884765625, -0.0008292198181152344, -0.0008001327514648438, -0.0007710456848144531, -0.0007419586181640625, -0.0007128715515136719, -0.0006837844848632812, -0.0006546974182128906, -0.0006256103515625, -0.0005965232849121094, -0.0005674362182617188, -0.0005383491516113281, -0.0005092620849609375, -0.0004801750183105469, -0.00045108795166015625, -0.0004220008850097656, -0.000392913818359375, -0.0003638267517089844, -0.00033473968505859375, -0.0003056526184082031, -0.0002765655517578125, -0.0002474784851074219, -0.00021839141845703125, -0.00018930435180664062, -0.00016021728515625, -0.00013113021850585938, -0.00010204315185546875, -7.295608520507812e-05, -4.38690185546875e-05, -1.4781951904296875e-05, 1.430511474609375e-05, 4.3392181396484375e-05, 7.2479248046875e-05, 0.00010156631469726562, 0.00013065338134765625, 0.00015974044799804688, 0.0001888275146484375, 0.00021791458129882812, 0.00024700164794921875, 0.0002760887145996094, 0.00030517578125, 0.0003342628479003906, 0.00036334991455078125, 0.0003924369812011719, 0.0004215240478515625, 0.0004506111145019531, 0.00047969818115234375, 0.0005087852478027344, 0.000537872314453125, 0.0005669593811035156, 0.0005960464477539062, 0.0006251335144042969, 0.0006542205810546875, 0.0006833076477050781, 0.0007123947143554688, 0.0007414817810058594, 0.00077056884765625, 0.0007996559143066406, 0.0008287429809570312, 0.0008578300476074219, 0.0008869171142578125, 0.0009160041809082031]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 9.0, 22.0, 25.0, 34.0, 44.0, 60.0, 98.0, 144.0, 187.0, 304.0, 491.0, 818.0, 1401.0, 2300.0, 4005.0, 7179.0, 12819.0, 23420.0, 41784.0, 70599.0, 110234.0, 149547.0, 169817.0, 155494.0, 117234.0, 76027.0, 45561.0, 25891.0, 14112.0, 7963.0, 4427.0, 2547.0, 1520.0, 895.0, 552.0, 346.0, 223.0, 131.0, 89.0, 59.0, 34.0, 27.0, 27.0, 14.0, 22.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.015625, -11.6468505859375, -11.278076171875, -10.9093017578125, -10.54052734375, -10.1717529296875, -9.802978515625, -9.4342041015625, -9.0654296875, -8.6966552734375, -8.327880859375, -7.9591064453125, -7.59033203125, -7.2215576171875, -6.852783203125, -6.4840087890625, -6.115234375, -5.7464599609375, -5.377685546875, -5.0089111328125, -4.64013671875, -4.2713623046875, -3.902587890625, -3.5338134765625, -3.1650390625, -2.7962646484375, -2.427490234375, -2.0587158203125, -1.68994140625, -1.3211669921875, -0.952392578125, -0.5836181640625, -0.21484375, 0.1539306640625, 0.522705078125, 0.8914794921875, 1.26025390625, 1.6290283203125, 1.997802734375, 2.3665771484375, 2.7353515625, 3.1041259765625, 3.472900390625, 3.8416748046875, 4.21044921875, 4.5792236328125, 4.947998046875, 5.3167724609375, 5.685546875, 6.0543212890625, 6.423095703125, 6.7918701171875, 7.16064453125, 7.5294189453125, 7.898193359375, 8.2669677734375, 8.6357421875, 9.0045166015625, 9.373291015625, 9.7420654296875, 10.11083984375, 10.4796142578125, 10.848388671875, 11.2171630859375, 11.5859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 4.0, 14.0, 10.0, 20.0, 28.0, 35.0, 46.0, 35.0, 38.0, 81.0, 68.0, 66.0, 88.0, 79.0, 63.0, 56.0, 57.0, 34.0, 36.0, 28.0, 19.0, 16.0, 15.0, 10.0, 14.0, 8.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.21484375, -5.95672607421875, -5.6986083984375, -5.44049072265625, -5.182373046875, -4.92425537109375, -4.6661376953125, -4.40802001953125, -4.14990234375, -3.89178466796875, -3.6336669921875, -3.37554931640625, -3.117431640625, -2.85931396484375, -2.6011962890625, -2.34307861328125, -2.0849609375, -1.82684326171875, -1.5687255859375, -1.31060791015625, -1.052490234375, -0.79437255859375, -0.5362548828125, -0.27813720703125, -0.02001953125, 0.23809814453125, 0.4962158203125, 0.75433349609375, 1.012451171875, 1.27056884765625, 1.5286865234375, 1.78680419921875, 2.044921875, 2.30303955078125, 2.5611572265625, 2.81927490234375, 3.077392578125, 3.33551025390625, 3.5936279296875, 3.85174560546875, 4.10986328125, 4.36798095703125, 4.6260986328125, 4.88421630859375, 5.142333984375, 5.40045166015625, 5.6585693359375, 5.91668701171875, 6.1748046875, 6.43292236328125, 6.6910400390625, 6.94915771484375, 7.207275390625, 7.46539306640625, 7.7235107421875, 7.98162841796875, 8.23974609375, 8.49786376953125, 8.7559814453125, 9.01409912109375, 9.272216796875, 9.53033447265625, 9.7884521484375, 10.04656982421875, 10.3046875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 16.0, 7.0, 15.0, 18.0, 17.0, 14.0, 16.0, 28.0, 24.0, 29.0, 42.0, 23.0, 48.0, 55.0, 56.0, 36.0, 61.0, 40.0, 53.0, 58.0, 47.0, 47.0, 36.0, 28.0, 33.0, 26.0, 20.0, 14.0, 17.0, 14.0, 14.0, 11.0, 2.0, 10.0, 6.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.085845947265625, -21.354745864868164, -20.623647689819336, -19.892547607421875, -19.161447525024414, -18.430347442626953, -17.699249267578125, -16.968149185180664, -16.237049102783203, -15.505949974060059, -14.774849891662598, -14.043750762939453, -13.312650680541992, -12.581551551818848, -11.850452423095703, -11.119352340698242, -10.388254165649414, -9.65715503692627, -8.926054954528809, -8.194955825805664, -7.463856220245361, -6.732756614685059, -6.001657485961914, -5.270557880401611, -4.539458274841309, -3.808358669281006, -3.0772593021392822, -2.3461599349975586, -1.6150603294372559, -0.8839607238769531, -0.1528615951538086, 0.5782380104064941, 1.3093376159667969, 2.0404372215270996, 2.7715365886688232, 3.502635955810547, 4.23373556137085, 4.964835166931152, 5.695934295654297, 6.4270339012146, 7.158133506774902, 7.889233112335205, 8.620332717895508, 9.351431846618652, 10.082530975341797, 10.813631057739258, 11.544730186462402, 12.275829315185547, 13.006929397583008, 13.738028526306152, 14.469128608703613, 15.200227737426758, 15.931327819824219, 16.662425994873047, 17.393526077270508, 18.12462615966797, 18.855724334716797, 19.586824417114258, 20.317922592163086, 21.049022674560547, 21.780122756958008, 22.51122283935547, 23.242321014404297, 23.973421096801758, 24.70452117919922]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 7.0, 3.0, 11.0, 15.0, 13.0, 18.0, 22.0, 15.0, 21.0, 23.0, 29.0, 35.0, 24.0, 32.0, 37.0, 23.0, 35.0, 40.0, 36.0, 44.0, 33.0, 43.0, 44.0, 36.0, 28.0, 30.0, 32.0, 39.0, 31.0, 29.0, 30.0, 15.0, 21.0, 15.0, 19.0, 12.0, 9.0, 7.0, 10.0, 8.0, 3.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.8968505859375, -27.958961486816406, -27.021072387695312, -26.08318328857422, -25.145292282104492, -24.2074031829834, -23.269514083862305, -22.33162498474121, -21.393733978271484, -20.45584487915039, -19.517955780029297, -18.580066680908203, -17.642175674438477, -16.704286575317383, -15.766397476196289, -14.828508377075195, -13.890619277954102, -12.952730178833008, -12.014840126037598, -11.076951026916504, -10.139060974121094, -9.201171875, -8.263282775878906, -7.325393199920654, -6.387503623962402, -5.44961404800415, -4.511724472045898, -3.5738353729248047, -2.6359457969665527, -1.6980562210083008, -0.760167121887207, 0.17772245407104492, 1.115610122680664, 2.053499698638916, 2.991389036178589, 3.9292783737182617, 4.867167949676514, 5.805057525634766, 6.742946624755859, 7.680836200714111, 8.618725776672363, 9.556614875793457, 10.494504928588867, 11.432394027709961, 12.370283126831055, 13.308173179626465, 14.246062278747559, 15.183952331542969, 16.121841430664062, 17.059730529785156, 17.99761962890625, 18.935508728027344, 19.87339973449707, 20.811288833618164, 21.749177932739258, 22.68706703186035, 23.624958038330078, 24.562847137451172, 25.500736236572266, 26.43862533569336, 27.376516342163086, 28.31440544128418, 29.252294540405273, 30.190183639526367, 31.12807273864746]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 13.0, 30.0, 45.0, 70.0, 132.0, 223.0, 342.0, 546.0, 915.0, 1531.0, 2601.0, 4367.0, 7348.0, 12868.0, 22292.0, 38971.0, 67808.0, 117602.0, 201687.0, 324878.0, 478329.0, 610866.0, 649698.0, 568915.0, 419756.0, 273884.0, 165495.0, 95840.0, 54649.0, 30515.0, 17409.0, 10023.0, 5873.0, 3388.0, 2081.0, 1192.0, 804.0, 480.0, 308.0, 170.0, 104.0, 87.0, 68.0, 28.0, 25.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.46875, -18.865966796875, -18.26318359375, -17.660400390625, -17.0576171875, -16.454833984375, -15.85205078125, -15.249267578125, -14.646484375, -14.043701171875, -13.44091796875, -12.838134765625, -12.2353515625, -11.632568359375, -11.02978515625, -10.427001953125, -9.82421875, -9.221435546875, -8.61865234375, -8.015869140625, -7.4130859375, -6.810302734375, -6.20751953125, -5.604736328125, -5.001953125, -4.399169921875, -3.79638671875, -3.193603515625, -2.5908203125, -1.988037109375, -1.38525390625, -0.782470703125, -0.1796875, 0.423095703125, 1.02587890625, 1.628662109375, 2.2314453125, 2.834228515625, 3.43701171875, 4.039794921875, 4.642578125, 5.245361328125, 5.84814453125, 6.450927734375, 7.0537109375, 7.656494140625, 8.25927734375, 8.862060546875, 9.46484375, 10.067626953125, 10.67041015625, 11.273193359375, 11.8759765625, 12.478759765625, 13.08154296875, 13.684326171875, 14.287109375, 14.889892578125, 15.49267578125, 16.095458984375, 16.6982421875, 17.301025390625, 17.90380859375, 18.506591796875, 19.109375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 9.0, 12.0, 17.0, 17.0, 16.0, 18.0, 19.0, 25.0, 28.0, 36.0, 31.0, 34.0, 32.0, 22.0, 36.0, 38.0, 55.0, 40.0, 37.0, 36.0, 38.0, 32.0, 33.0, 43.0, 33.0, 34.0, 36.0, 22.0, 29.0, 23.0, 24.0, 10.0, 9.0, 18.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.44091796875, -19.6787109375, -18.91650390625, -18.154296875, -17.39208984375, -16.6298828125, -15.86767578125, -15.10546875, -14.34326171875, -13.5810546875, -12.81884765625, -12.056640625, -11.29443359375, -10.5322265625, -9.77001953125, -9.0078125, -8.24560546875, -7.4833984375, -6.72119140625, -5.958984375, -5.19677734375, -4.4345703125, -3.67236328125, -2.91015625, -2.14794921875, -1.3857421875, -0.62353515625, 0.138671875, 0.90087890625, 1.6630859375, 2.42529296875, 3.1875, 3.94970703125, 4.7119140625, 5.47412109375, 6.236328125, 6.99853515625, 7.7607421875, 8.52294921875, 9.28515625, 10.04736328125, 10.8095703125, 11.57177734375, 12.333984375, 13.09619140625, 13.8583984375, 14.62060546875, 15.3828125, 16.14501953125, 16.9072265625, 17.66943359375, 18.431640625, 19.19384765625, 19.9560546875, 20.71826171875, 21.48046875, 22.24267578125, 23.0048828125, 23.76708984375, 24.529296875, 25.29150390625, 26.0537109375, 26.81591796875, 27.578125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 10.0, 17.0, 37.0, 46.0, 93.0, 128.0, 215.0, 387.0, 639.0, 1052.0, 1916.0, 3113.0, 5409.0, 9453.0, 16877.0, 29537.0, 52510.0, 89866.0, 151007.0, 244282.0, 364686.0, 496457.0, 590157.0, 594229.0, 511619.0, 383884.0, 257991.0, 161654.0, 96707.0, 55908.0, 32303.0, 17876.0, 10228.0, 5812.0, 3404.0, 2011.0, 1138.0, 636.0, 381.0, 212.0, 161.0, 81.0, 55.0, 36.0, 27.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.859375, -20.228515625, -19.59765625, -18.966796875, -18.3359375, -17.705078125, -17.07421875, -16.443359375, -15.8125, -15.181640625, -14.55078125, -13.919921875, -13.2890625, -12.658203125, -12.02734375, -11.396484375, -10.765625, -10.134765625, -9.50390625, -8.873046875, -8.2421875, -7.611328125, -6.98046875, -6.349609375, -5.71875, -5.087890625, -4.45703125, -3.826171875, -3.1953125, -2.564453125, -1.93359375, -1.302734375, -0.671875, -0.041015625, 0.58984375, 1.220703125, 1.8515625, 2.482421875, 3.11328125, 3.744140625, 4.375, 5.005859375, 5.63671875, 6.267578125, 6.8984375, 7.529296875, 8.16015625, 8.791015625, 9.421875, 10.052734375, 10.68359375, 11.314453125, 11.9453125, 12.576171875, 13.20703125, 13.837890625, 14.46875, 15.099609375, 15.73046875, 16.361328125, 16.9921875, 17.623046875, 18.25390625, 18.884765625, 19.515625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 28.0, 30.0, 33.0, 44.0, 54.0, 74.0, 101.0, 102.0, 116.0, 165.0, 170.0, 192.0, 201.0, 220.0, 229.0, 238.0, 242.0, 234.0, 217.0, 225.0, 208.0, 167.0, 137.0, 108.0, 119.0, 95.0, 71.0, 44.0, 33.0, 31.0, 14.0, 20.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.8980712890625, -10.546142578125, -10.1942138671875, -9.84228515625, -9.4903564453125, -9.138427734375, -8.7864990234375, -8.4345703125, -8.0826416015625, -7.730712890625, -7.3787841796875, -7.02685546875, -6.6749267578125, -6.322998046875, -5.9710693359375, -5.619140625, -5.2672119140625, -4.915283203125, -4.5633544921875, -4.21142578125, -3.8594970703125, -3.507568359375, -3.1556396484375, -2.8037109375, -2.4517822265625, -2.099853515625, -1.7479248046875, -1.39599609375, -1.0440673828125, -0.692138671875, -0.3402099609375, 0.01171875, 0.3636474609375, 0.715576171875, 1.0675048828125, 1.41943359375, 1.7713623046875, 2.123291015625, 2.4752197265625, 2.8271484375, 3.1790771484375, 3.531005859375, 3.8829345703125, 4.23486328125, 4.5867919921875, 4.938720703125, 5.2906494140625, 5.642578125, 5.9945068359375, 6.346435546875, 6.6983642578125, 7.05029296875, 7.4022216796875, 7.754150390625, 8.1060791015625, 8.4580078125, 8.8099365234375, 9.161865234375, 9.5137939453125, 9.86572265625, 10.2176513671875, 10.569580078125, 10.9215087890625, 11.2734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 5.0, 4.0, 7.0, 10.0, 5.0, 5.0, 12.0, 19.0, 17.0, 22.0, 25.0, 24.0, 33.0, 37.0, 42.0, 39.0, 61.0, 47.0, 50.0, 36.0, 45.0, 39.0, 50.0, 43.0, 34.0, 38.0, 39.0, 35.0, 28.0, 19.0, 18.0, 21.0, 17.0, 21.0, 13.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.41901206970215, -19.735322952270508, -19.051633834838867, -18.367944717407227, -17.684255599975586, -17.000566482543945, -16.316879272460938, -15.63318920135498, -14.94950008392334, -14.2658109664917, -13.582121849060059, -12.898433685302734, -12.214744567871094, -11.531055450439453, -10.847366333007812, -10.163677215576172, -9.479988098144531, -8.79629898071289, -8.11260986328125, -7.428921222686768, -6.745232105255127, -6.061542987823486, -5.377854347229004, -4.694165229797363, -4.010476112365723, -3.326786994934082, -2.6430981159210205, -1.959409236907959, -1.2757201194763184, -0.5920310020446777, 0.09165763854980469, 0.7753467559814453, 1.4590339660644531, 2.1427230834960938, 2.8264119625091553, 3.510100841522217, 4.193789958953857, 4.877479076385498, 5.5611677169799805, 6.244856834411621, 6.928545951843262, 7.612235069274902, 8.295924186706543, 8.979612350463867, 9.663301467895508, 10.346990585327148, 11.030679702758789, 11.71436882019043, 12.39805793762207, 13.081747055053711, 13.765436172485352, 14.449125289916992, 15.132814407348633, 15.816503524780273, 16.50019073486328, 17.183879852294922, 17.867568969726562, 18.551258087158203, 19.234947204589844, 19.918636322021484, 20.602325439453125, 21.286014556884766, 21.969703674316406, 22.653392791748047, 23.337081909179688]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 7.0, 5.0, 4.0, 13.0, 10.0, 11.0, 12.0, 12.0, 14.0, 17.0, 16.0, 22.0, 28.0, 33.0, 35.0, 19.0, 29.0, 27.0, 37.0, 44.0, 29.0, 34.0, 41.0, 41.0, 44.0, 44.0, 32.0, 22.0, 35.0, 38.0, 29.0, 21.0, 30.0, 33.0, 18.0, 15.0, 18.0, 10.0, 15.0, 6.0, 13.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.08544158935547, -24.21485710144043, -23.344270706176758, -22.47368621826172, -21.60310173034668, -20.73251724243164, -19.86193084716797, -18.99134635925293, -18.12076187133789, -17.25017738342285, -16.37959098815918, -15.50900650024414, -14.638422012329102, -13.767836570739746, -12.89725112915039, -12.026666641235352, -11.15608024597168, -10.285494804382324, -9.414910316467285, -8.54432487487793, -7.673739910125732, -6.803154945373535, -5.93256950378418, -5.061984539031982, -4.191399574279785, -3.320814609527588, -2.4502294063568115, -1.5796442031860352, -0.7090592384338379, 0.16152572631835938, 1.0321111679077148, 1.902696132659912, 2.7732791900634766, 3.643864154815674, 4.514449119567871, 5.385034561157227, 6.255619525909424, 7.126204490661621, 7.996789932250977, 8.867374420166016, 9.737959861755371, 10.608545303344727, 11.479129791259766, 12.349715232849121, 13.220300674438477, 14.090885162353516, 14.961470603942871, 15.832056045532227, 16.702640533447266, 17.573225021362305, 18.443811416625977, 19.314395904541016, 20.184980392456055, 21.055564880371094, 21.926151275634766, 22.796735763549805, 23.667320251464844, 24.537904739379883, 25.408491134643555, 26.279075622558594, 27.149660110473633, 28.020244598388672, 28.890830993652344, 29.761415481567383, 30.632001876831055]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 13.0, 20.0, 40.0, 42.0, 65.0, 105.0, 152.0, 231.0, 342.0, 573.0, 891.0, 1498.0, 2663.0, 4792.0, 8801.0, 16295.0, 30236.0, 55988.0, 98297.0, 155512.0, 198151.0, 181405.0, 127048.0, 74736.0, 41039.0, 22240.0, 12140.0, 6608.0, 3510.0, 2024.0, 1190.0, 664.0, 425.0, 271.0, 148.0, 134.0, 70.0, 53.0, 38.0, 25.0, 20.0, 8.0, 5.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.390625, -14.9058837890625, -14.421142578125, -13.9364013671875, -13.45166015625, -12.9669189453125, -12.482177734375, -11.9974365234375, -11.5126953125, -11.0279541015625, -10.543212890625, -10.0584716796875, -9.57373046875, -9.0889892578125, -8.604248046875, -8.1195068359375, -7.634765625, -7.1500244140625, -6.665283203125, -6.1805419921875, -5.69580078125, -5.2110595703125, -4.726318359375, -4.2415771484375, -3.7568359375, -3.2720947265625, -2.787353515625, -2.3026123046875, -1.81787109375, -1.3331298828125, -0.848388671875, -0.3636474609375, 0.12109375, 0.6058349609375, 1.090576171875, 1.5753173828125, 2.06005859375, 2.5447998046875, 3.029541015625, 3.5142822265625, 3.9990234375, 4.4837646484375, 4.968505859375, 5.4532470703125, 5.93798828125, 6.4227294921875, 6.907470703125, 7.3922119140625, 7.876953125, 8.3616943359375, 8.846435546875, 9.3311767578125, 9.81591796875, 10.3006591796875, 10.785400390625, 11.2701416015625, 11.7548828125, 12.2396240234375, 12.724365234375, 13.2091064453125, 13.69384765625, 14.1785888671875, 14.663330078125, 15.1480712890625, 15.6328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 3.0, 10.0, 12.0, 14.0, 16.0, 19.0, 8.0, 18.0, 24.0, 34.0, 30.0, 25.0, 21.0, 27.0, 34.0, 38.0, 39.0, 46.0, 38.0, 33.0, 40.0, 49.0, 42.0, 32.0, 29.0, 34.0, 29.0, 31.0, 37.0, 33.0, 17.0, 14.0, 12.0, 24.0, 12.0, 14.0, 10.0, 7.0, 9.0, 8.0, 3.0, 5.0, 3.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.27783203125, -23.3681640625, -22.45849609375, -21.548828125, -20.63916015625, -19.7294921875, -18.81982421875, -17.91015625, -17.00048828125, -16.0908203125, -15.18115234375, -14.271484375, -13.36181640625, -12.4521484375, -11.54248046875, -10.6328125, -9.72314453125, -8.8134765625, -7.90380859375, -6.994140625, -6.08447265625, -5.1748046875, -4.26513671875, -3.35546875, -2.44580078125, -1.5361328125, -0.62646484375, 0.283203125, 1.19287109375, 2.1025390625, 3.01220703125, 3.921875, 4.83154296875, 5.7412109375, 6.65087890625, 7.560546875, 8.47021484375, 9.3798828125, 10.28955078125, 11.19921875, 12.10888671875, 13.0185546875, 13.92822265625, 14.837890625, 15.74755859375, 16.6572265625, 17.56689453125, 18.4765625, 19.38623046875, 20.2958984375, 21.20556640625, 22.115234375, 23.02490234375, 23.9345703125, 24.84423828125, 25.75390625, 26.66357421875, 27.5732421875, 28.48291015625, 29.392578125, 30.30224609375, 31.2119140625, 32.12158203125, 33.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 17.0, 22.0, 24.0, 59.0, 65.0, 104.0, 177.0, 281.0, 457.0, 718.0, 1243.0, 2073.0, 3562.0, 6700.0, 12326.0, 23997.0, 47400.0, 93701.0, 170788.0, 237589.0, 202225.0, 118432.0, 61075.0, 30727.0, 15773.0, 8257.0, 4417.0, 2591.0, 1460.0, 813.0, 557.0, 312.0, 215.0, 127.0, 95.0, 52.0, 40.0, 27.0, 24.0, 13.0, 6.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-20.78125, -20.2147216796875, -19.648193359375, -19.0816650390625, -18.51513671875, -17.9486083984375, -17.382080078125, -16.8155517578125, -16.2490234375, -15.6824951171875, -15.115966796875, -14.5494384765625, -13.98291015625, -13.4163818359375, -12.849853515625, -12.2833251953125, -11.716796875, -11.1502685546875, -10.583740234375, -10.0172119140625, -9.45068359375, -8.8841552734375, -8.317626953125, -7.7510986328125, -7.1845703125, -6.6180419921875, -6.051513671875, -5.4849853515625, -4.91845703125, -4.3519287109375, -3.785400390625, -3.2188720703125, -2.65234375, -2.0858154296875, -1.519287109375, -0.9527587890625, -0.38623046875, 0.1802978515625, 0.746826171875, 1.3133544921875, 1.8798828125, 2.4464111328125, 3.012939453125, 3.5794677734375, 4.14599609375, 4.7125244140625, 5.279052734375, 5.8455810546875, 6.412109375, 6.9786376953125, 7.545166015625, 8.1116943359375, 8.67822265625, 9.2447509765625, 9.811279296875, 10.3778076171875, 10.9443359375, 11.5108642578125, 12.077392578125, 12.6439208984375, 13.21044921875, 13.7769775390625, 14.343505859375, 14.9100341796875, 15.4765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 6.0, 13.0, 12.0, 12.0, 13.0, 16.0, 20.0, 25.0, 38.0, 25.0, 29.0, 26.0, 36.0, 23.0, 30.0, 25.0, 39.0, 43.0, 44.0, 38.0, 38.0, 46.0, 36.0, 30.0, 26.0, 20.0, 30.0, 23.0, 35.0, 30.0, 23.0, 16.0, 18.0, 16.0, 20.0, 14.0, 9.0, 11.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.609375, -17.038818359375, -16.46826171875, -15.897705078125, -15.3271484375, -14.756591796875, -14.18603515625, -13.615478515625, -13.044921875, -12.474365234375, -11.90380859375, -11.333251953125, -10.7626953125, -10.192138671875, -9.62158203125, -9.051025390625, -8.48046875, -7.909912109375, -7.33935546875, -6.768798828125, -6.1982421875, -5.627685546875, -5.05712890625, -4.486572265625, -3.916015625, -3.345458984375, -2.77490234375, -2.204345703125, -1.6337890625, -1.063232421875, -0.49267578125, 0.077880859375, 0.6484375, 1.218994140625, 1.78955078125, 2.360107421875, 2.9306640625, 3.501220703125, 4.07177734375, 4.642333984375, 5.212890625, 5.783447265625, 6.35400390625, 6.924560546875, 7.4951171875, 8.065673828125, 8.63623046875, 9.206787109375, 9.77734375, 10.347900390625, 10.91845703125, 11.489013671875, 12.0595703125, 12.630126953125, 13.20068359375, 13.771240234375, 14.341796875, 14.912353515625, 15.48291015625, 16.053466796875, 16.6240234375, 17.194580078125, 17.76513671875, 18.335693359375, 18.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 17.0, 22.0, 27.0, 24.0, 35.0, 54.0, 71.0, 95.0, 129.0, 200.0, 323.0, 472.0, 710.0, 1241.0, 2101.0, 3974.0, 7976.0, 19279.0, 57207.0, 204214.0, 443411.0, 210458.0, 58911.0, 19775.0, 8249.0, 3956.0, 2095.0, 1223.0, 759.0, 488.0, 305.0, 215.0, 146.0, 113.0, 94.0, 50.0, 42.0, 19.0, 18.0, 11.0, 6.0, 10.0, 5.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.8885498046875, -13.433349609375, -12.9781494140625, -12.52294921875, -12.0677490234375, -11.612548828125, -11.1573486328125, -10.7021484375, -10.2469482421875, -9.791748046875, -9.3365478515625, -8.88134765625, -8.4261474609375, -7.970947265625, -7.5157470703125, -7.060546875, -6.6053466796875, -6.150146484375, -5.6949462890625, -5.23974609375, -4.7845458984375, -4.329345703125, -3.8741455078125, -3.4189453125, -2.9637451171875, -2.508544921875, -2.0533447265625, -1.59814453125, -1.1429443359375, -0.687744140625, -0.2325439453125, 0.22265625, 0.6778564453125, 1.133056640625, 1.5882568359375, 2.04345703125, 2.4986572265625, 2.953857421875, 3.4090576171875, 3.8642578125, 4.3194580078125, 4.774658203125, 5.2298583984375, 5.68505859375, 6.1402587890625, 6.595458984375, 7.0506591796875, 7.505859375, 7.9610595703125, 8.416259765625, 8.8714599609375, 9.32666015625, 9.7818603515625, 10.237060546875, 10.6922607421875, 11.1474609375, 11.6026611328125, 12.057861328125, 12.5130615234375, 12.96826171875, 13.4234619140625, 13.878662109375, 14.3338623046875, 14.7890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 13.0, 16.0, 30.0, 26.0, 57.0, 68.0, 98.0, 133.0, 149.0, 114.0, 87.0, 67.0, 49.0, 24.0, 15.0, 11.0, 7.0, 4.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008373260498046875, -0.0008054673671722412, -0.0007736086845397949, -0.0007417500019073486, -0.0007098913192749023, -0.0006780326366424561, -0.0006461739540100098, -0.0006143152713775635, -0.0005824565887451172, -0.0005505979061126709, -0.0005187392234802246, -0.0004868805408477783, -0.00045502185821533203, -0.00042316317558288574, -0.00039130449295043945, -0.00035944581031799316, -0.0003275871276855469, -0.0002957284450531006, -0.0002638697624206543, -0.000232011079788208, -0.00020015239715576172, -0.00016829371452331543, -0.00013643503189086914, -0.00010457634925842285, -7.271766662597656e-05, -4.0858983993530273e-05, -9.000301361083984e-06, 2.2858381271362305e-05, 5.4717063903808594e-05, 8.657574653625488e-05, 0.00011843442916870117, 0.00015029311180114746, 0.00018215179443359375, 0.00021401047706604004, 0.00024586915969848633, 0.0002777278423309326, 0.0003095865249633789, 0.0003414452075958252, 0.0003733038902282715, 0.0004051625728607178, 0.00043702125549316406, 0.00046887993812561035, 0.0005007386207580566, 0.0005325973033905029, 0.0005644559860229492, 0.0005963146686553955, 0.0006281733512878418, 0.0006600320339202881, 0.0006918907165527344, 0.0007237493991851807, 0.000755608081817627, 0.0007874667644500732, 0.0008193254470825195, 0.0008511841297149658, 0.0008830428123474121, 0.0009149014949798584, 0.0009467601776123047, 0.000978618860244751, 0.0010104775428771973, 0.0010423362255096436, 0.0010741949081420898, 0.0011060535907745361, 0.0011379122734069824, 0.0011697709560394287, 0.001201629638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 9.0, 2.0, 8.0, 5.0, 11.0, 10.0, 27.0, 21.0, 29.0, 48.0, 70.0, 110.0, 147.0, 218.0, 320.0, 452.0, 724.0, 1110.0, 1728.0, 2769.0, 5178.0, 10748.0, 25532.0, 67579.0, 180000.0, 325048.0, 252202.0, 104374.0, 38303.0, 15316.0, 6892.0, 3529.0, 2055.0, 1291.0, 839.0, 527.0, 388.0, 271.0, 179.0, 146.0, 107.0, 72.0, 44.0, 37.0, 25.0, 19.0, 17.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.1875, -11.77734375, -11.3671875, -10.95703125, -10.546875, -10.13671875, -9.7265625, -9.31640625, -8.90625, -8.49609375, -8.0859375, -7.67578125, -7.265625, -6.85546875, -6.4453125, -6.03515625, -5.625, -5.21484375, -4.8046875, -4.39453125, -3.984375, -3.57421875, -3.1640625, -2.75390625, -2.34375, -1.93359375, -1.5234375, -1.11328125, -0.703125, -0.29296875, 0.1171875, 0.52734375, 0.9375, 1.34765625, 1.7578125, 2.16796875, 2.578125, 2.98828125, 3.3984375, 3.80859375, 4.21875, 4.62890625, 5.0390625, 5.44921875, 5.859375, 6.26953125, 6.6796875, 7.08984375, 7.5, 7.91015625, 8.3203125, 8.73046875, 9.140625, 9.55078125, 9.9609375, 10.37109375, 10.78125, 11.19140625, 11.6015625, 12.01171875, 12.421875, 12.83203125, 13.2421875, 13.65234375, 14.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 10.0, 19.0, 16.0, 20.0, 24.0, 40.0, 47.0, 58.0, 86.0, 98.0, 77.0, 101.0, 100.0, 79.0, 49.0, 40.0, 33.0, 24.0, 18.0, 9.0, 9.0, 7.0, 8.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.45361328125, -5.2626953125, -5.07177734375, -4.880859375, -4.68994140625, -4.4990234375, -4.30810546875, -4.1171875, -3.92626953125, -3.7353515625, -3.54443359375, -3.353515625, -3.16259765625, -2.9716796875, -2.78076171875, -2.58984375, -2.39892578125, -2.2080078125, -2.01708984375, -1.826171875, -1.63525390625, -1.4443359375, -1.25341796875, -1.0625, -0.87158203125, -0.6806640625, -0.48974609375, -0.298828125, -0.10791015625, 0.0830078125, 0.27392578125, 0.46484375, 0.65576171875, 0.8466796875, 1.03759765625, 1.228515625, 1.41943359375, 1.6103515625, 1.80126953125, 1.9921875, 2.18310546875, 2.3740234375, 2.56494140625, 2.755859375, 2.94677734375, 3.1376953125, 3.32861328125, 3.51953125, 3.71044921875, 3.9013671875, 4.09228515625, 4.283203125, 4.47412109375, 4.6650390625, 4.85595703125, 5.046875, 5.23779296875, 5.4287109375, 5.61962890625, 5.810546875, 6.00146484375, 6.1923828125, 6.38330078125, 6.57421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 11.0, 7.0, 8.0, 18.0, 15.0, 23.0, 26.0, 25.0, 29.0, 37.0, 43.0, 44.0, 61.0, 39.0, 53.0, 45.0, 45.0, 51.0, 42.0, 45.0, 36.0, 31.0, 46.0, 28.0, 22.0, 17.0, 24.0, 26.0, 20.0, 13.0, 9.0, 8.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.514890670776367, -19.821317672729492, -19.127744674682617, -18.434171676635742, -17.740598678588867, -17.047025680541992, -16.35345458984375, -15.659880638122559, -14.966307640075684, -14.272734642028809, -13.579161643981934, -12.885589599609375, -12.1920166015625, -11.498443603515625, -10.80487060546875, -10.111297607421875, -9.417724609375, -8.724151611328125, -8.03057861328125, -7.337006092071533, -6.643433094024658, -5.949860095977783, -5.256287574768066, -4.562714576721191, -3.8691415786743164, -3.1755685806274414, -2.4819958209991455, -1.7884230613708496, -1.0948500633239746, -0.4012770652770996, 0.2922954559326172, 0.9858684539794922, 1.6794414520263672, 2.373014450073242, 3.066587209701538, 3.760159969329834, 4.453732967376709, 5.147305965423584, 5.840878486633301, 6.534451484680176, 7.228024482727051, 7.921597480773926, 8.6151704788208, 9.30874252319336, 10.002315521240234, 10.69588851928711, 11.389461517333984, 12.08303451538086, 12.776607513427734, 13.47018051147461, 14.163753509521484, 14.85732650756836, 15.550899505615234, 16.24447250366211, 16.938045501708984, 17.63161849975586, 18.325191497802734, 19.01876449584961, 19.712337493896484, 20.40591049194336, 21.099483489990234, 21.79305648803711, 22.486629486083984, 23.18020248413086, 23.8737735748291]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 7.0, 9.0, 4.0, 10.0, 8.0, 14.0, 14.0, 15.0, 16.0, 21.0, 25.0, 26.0, 22.0, 28.0, 30.0, 35.0, 32.0, 39.0, 24.0, 35.0, 43.0, 35.0, 38.0, 51.0, 36.0, 38.0, 25.0, 29.0, 25.0, 37.0, 27.0, 26.0, 37.0, 23.0, 12.0, 16.0, 16.0, 8.0, 11.0, 8.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.788162231445312, -22.935501098632812, -22.08283805847168, -21.23017692565918, -20.377513885498047, -19.524852752685547, -18.672191619873047, -17.819528579711914, -16.96686553955078, -16.11420440673828, -15.261541366577148, -14.408880233764648, -13.556217193603516, -12.703556060791016, -11.8508939743042, -10.998231887817383, -10.145570755004883, -9.292908668518066, -8.44024658203125, -7.587584972381592, -6.734922885894775, -5.882260799407959, -5.029599189758301, -4.176937103271484, -3.324275016784668, -2.4716129302978516, -1.6189510822296143, -0.766289234161377, 0.08637285232543945, 0.9390349388122559, 1.791696548461914, 2.6443586349487305, 3.497018814086914, 4.3496809005737305, 5.202342987060547, 6.055004596710205, 6.9076666831970215, 7.760328769683838, 8.612990379333496, 9.465652465820312, 10.318314552307129, 11.170976638793945, 12.023638725280762, 12.876300811767578, 13.728961944580078, 14.581624984741211, 15.434286117553711, 16.286949157714844, 17.139610290527344, 17.992271423339844, 18.844934463500977, 19.697595596313477, 20.55025863647461, 21.40291976928711, 22.25558090209961, 23.108243942260742, 23.960906982421875, 24.813568115234375, 25.666231155395508, 26.518892288208008, 27.37155532836914, 28.22421646118164, 29.07687759399414, 29.929540634155273, 30.782201766967773]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 11.0, 17.0, 26.0, 38.0, 61.0, 94.0, 165.0, 213.0, 343.0, 486.0, 709.0, 1130.0, 1800.0, 2560.0, 3778.0, 5619.0, 8248.0, 12354.0, 18316.0, 25882.0, 35867.0, 48735.0, 62570.0, 77795.0, 90969.0, 100383.0, 101916.0, 96898.0, 84785.0, 70993.0, 55524.0, 41841.0, 30540.0, 21524.0, 15077.0, 10355.0, 7023.0, 4672.0, 3000.0, 2116.0, 1351.0, 920.0, 594.0, 425.0, 287.0, 177.0, 121.0, 94.0, 53.0, 34.0, 21.0, 14.0, 12.0, 2.0, 4.0, 3.0, 4.0, 2.0], "bins": [-13.34375, -12.9300537109375, -12.516357421875, -12.1026611328125, -11.68896484375, -11.2752685546875, -10.861572265625, -10.4478759765625, -10.0341796875, -9.6204833984375, -9.206787109375, -8.7930908203125, -8.37939453125, -7.9656982421875, -7.552001953125, -7.1383056640625, -6.724609375, -6.3109130859375, -5.897216796875, -5.4835205078125, -5.06982421875, -4.6561279296875, -4.242431640625, -3.8287353515625, -3.4150390625, -3.0013427734375, -2.587646484375, -2.1739501953125, -1.76025390625, -1.3465576171875, -0.932861328125, -0.5191650390625, -0.10546875, 0.3082275390625, 0.721923828125, 1.1356201171875, 1.54931640625, 1.9630126953125, 2.376708984375, 2.7904052734375, 3.2041015625, 3.6177978515625, 4.031494140625, 4.4451904296875, 4.85888671875, 5.2725830078125, 5.686279296875, 6.0999755859375, 6.513671875, 6.9273681640625, 7.341064453125, 7.7547607421875, 8.16845703125, 8.5821533203125, 8.995849609375, 9.4095458984375, 9.8232421875, 10.2369384765625, 10.650634765625, 11.0643310546875, 11.47802734375, 11.8917236328125, 12.305419921875, 12.7191162109375, 13.1328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 14.0, 11.0, 14.0, 13.0, 22.0, 14.0, 17.0, 31.0, 22.0, 39.0, 36.0, 33.0, 51.0, 25.0, 34.0, 43.0, 41.0, 42.0, 42.0, 41.0, 39.0, 29.0, 32.0, 34.0, 37.0, 29.0, 26.0, 22.0, 20.0, 21.0, 17.0, 17.0, 13.0, 13.0, 7.0, 3.0, 11.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.35498046875, -22.4599609375, -21.56494140625, -20.669921875, -19.77490234375, -18.8798828125, -17.98486328125, -17.08984375, -16.19482421875, -15.2998046875, -14.40478515625, -13.509765625, -12.61474609375, -11.7197265625, -10.82470703125, -9.9296875, -9.03466796875, -8.1396484375, -7.24462890625, -6.349609375, -5.45458984375, -4.5595703125, -3.66455078125, -2.76953125, -1.87451171875, -0.9794921875, -0.08447265625, 0.810546875, 1.70556640625, 2.6005859375, 3.49560546875, 4.390625, 5.28564453125, 6.1806640625, 7.07568359375, 7.970703125, 8.86572265625, 9.7607421875, 10.65576171875, 11.55078125, 12.44580078125, 13.3408203125, 14.23583984375, 15.130859375, 16.02587890625, 16.9208984375, 17.81591796875, 18.7109375, 19.60595703125, 20.5009765625, 21.39599609375, 22.291015625, 23.18603515625, 24.0810546875, 24.97607421875, 25.87109375, 26.76611328125, 27.6611328125, 28.55615234375, 29.451171875, 30.34619140625, 31.2412109375, 32.13623046875, 33.03125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 16.0, 12.0, 14.0, 39.0, 64.0, 61.0, 129.0, 168.0, 255.0, 404.0, 649.0, 1000.0, 1608.0, 2315.0, 3792.0, 5891.0, 9508.0, 14962.0, 23894.0, 37023.0, 56072.0, 79311.0, 104538.0, 124001.0, 131275.0, 122341.0, 101451.0, 76123.0, 53740.0, 35692.0, 22972.0, 14313.0, 9213.0, 5635.0, 3698.0, 2346.0, 1495.0, 885.0, 573.0, 393.0, 232.0, 165.0, 102.0, 61.0, 46.0, 31.0, 20.0, 11.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.109375, -17.55126953125, -16.9931640625, -16.43505859375, -15.876953125, -15.31884765625, -14.7607421875, -14.20263671875, -13.64453125, -13.08642578125, -12.5283203125, -11.97021484375, -11.412109375, -10.85400390625, -10.2958984375, -9.73779296875, -9.1796875, -8.62158203125, -8.0634765625, -7.50537109375, -6.947265625, -6.38916015625, -5.8310546875, -5.27294921875, -4.71484375, -4.15673828125, -3.5986328125, -3.04052734375, -2.482421875, -1.92431640625, -1.3662109375, -0.80810546875, -0.25, 0.30810546875, 0.8662109375, 1.42431640625, 1.982421875, 2.54052734375, 3.0986328125, 3.65673828125, 4.21484375, 4.77294921875, 5.3310546875, 5.88916015625, 6.447265625, 7.00537109375, 7.5634765625, 8.12158203125, 8.6796875, 9.23779296875, 9.7958984375, 10.35400390625, 10.912109375, 11.47021484375, 12.0283203125, 12.58642578125, 13.14453125, 13.70263671875, 14.2607421875, 14.81884765625, 15.376953125, 15.93505859375, 16.4931640625, 17.05126953125, 17.609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 7.0, 5.0, 13.0, 9.0, 14.0, 18.0, 15.0, 22.0, 23.0, 20.0, 26.0, 33.0, 25.0, 40.0, 46.0, 46.0, 45.0, 41.0, 52.0, 37.0, 30.0, 46.0, 52.0, 35.0, 32.0, 44.0, 35.0, 22.0, 30.0, 19.0, 21.0, 15.0, 16.0, 16.0, 13.0, 9.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.890625, -20.190673828125, -19.49072265625, -18.790771484375, -18.0908203125, -17.390869140625, -16.69091796875, -15.990966796875, -15.291015625, -14.591064453125, -13.89111328125, -13.191162109375, -12.4912109375, -11.791259765625, -11.09130859375, -10.391357421875, -9.69140625, -8.991455078125, -8.29150390625, -7.591552734375, -6.8916015625, -6.191650390625, -5.49169921875, -4.791748046875, -4.091796875, -3.391845703125, -2.69189453125, -1.991943359375, -1.2919921875, -0.592041015625, 0.10791015625, 0.807861328125, 1.5078125, 2.207763671875, 2.90771484375, 3.607666015625, 4.3076171875, 5.007568359375, 5.70751953125, 6.407470703125, 7.107421875, 7.807373046875, 8.50732421875, 9.207275390625, 9.9072265625, 10.607177734375, 11.30712890625, 12.007080078125, 12.70703125, 13.406982421875, 14.10693359375, 14.806884765625, 15.5068359375, 16.206787109375, 16.90673828125, 17.606689453125, 18.306640625, 19.006591796875, 19.70654296875, 20.406494140625, 21.1064453125, 21.806396484375, 22.50634765625, 23.206298828125, 23.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 7.0, 18.0, 37.0, 41.0, 65.0, 86.0, 131.0, 185.0, 258.0, 365.0, 534.0, 765.0, 1167.0, 1828.0, 2735.0, 4373.0, 7157.0, 11825.0, 20262.0, 36076.0, 64387.0, 111295.0, 168394.0, 197070.0, 165200.0, 107450.0, 61794.0, 34710.0, 19657.0, 11558.0, 6774.0, 4297.0, 2668.0, 1770.0, 1117.0, 789.0, 542.0, 349.0, 257.0, 152.0, 110.0, 88.0, 62.0, 42.0, 29.0, 21.0, 15.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-14.921875, -14.4622802734375, -14.002685546875, -13.5430908203125, -13.08349609375, -12.6239013671875, -12.164306640625, -11.7047119140625, -11.2451171875, -10.7855224609375, -10.325927734375, -9.8663330078125, -9.40673828125, -8.9471435546875, -8.487548828125, -8.0279541015625, -7.568359375, -7.1087646484375, -6.649169921875, -6.1895751953125, -5.72998046875, -5.2703857421875, -4.810791015625, -4.3511962890625, -3.8916015625, -3.4320068359375, -2.972412109375, -2.5128173828125, -2.05322265625, -1.5936279296875, -1.134033203125, -0.6744384765625, -0.21484375, 0.2447509765625, 0.704345703125, 1.1639404296875, 1.62353515625, 2.0831298828125, 2.542724609375, 3.0023193359375, 3.4619140625, 3.9215087890625, 4.381103515625, 4.8406982421875, 5.30029296875, 5.7598876953125, 6.219482421875, 6.6790771484375, 7.138671875, 7.5982666015625, 8.057861328125, 8.5174560546875, 8.97705078125, 9.4366455078125, 9.896240234375, 10.3558349609375, 10.8154296875, 11.2750244140625, 11.734619140625, 12.1942138671875, 12.65380859375, 13.1134033203125, 13.572998046875, 14.0325927734375, 14.4921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 12.0, 11.0, 14.0, 11.0, 14.0, 29.0, 30.0, 26.0, 48.0, 36.0, 51.0, 46.0, 57.0, 72.0, 64.0, 65.0, 67.0, 66.0, 45.0, 45.0, 34.0, 28.0, 26.0, 22.0, 20.0, 16.0, 12.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013151168823242188, -0.0012736916542053223, -0.0012322664260864258, -0.0011908411979675293, -0.0011494159698486328, -0.0011079907417297363, -0.0010665655136108398, -0.0010251402854919434, -0.0009837150573730469, -0.0009422898292541504, -0.0009008646011352539, -0.0008594393730163574, -0.0008180141448974609, -0.0007765889167785645, -0.000735163688659668, -0.0006937384605407715, -0.000652313232421875, -0.0006108880043029785, -0.000569462776184082, -0.0005280375480651855, -0.00048661231994628906, -0.0004451870918273926, -0.0004037618637084961, -0.0003623366355895996, -0.0003209114074707031, -0.00027948617935180664, -0.00023806095123291016, -0.00019663572311401367, -0.0001552104949951172, -0.0001137852668762207, -7.236003875732422e-05, -3.0934810638427734e-05, 1.049041748046875e-05, 5.1915645599365234e-05, 9.334087371826172e-05, 0.0001347661018371582, 0.0001761913299560547, 0.00021761655807495117, 0.00025904178619384766, 0.00030046701431274414, 0.0003418922424316406, 0.0003833174705505371, 0.0004247426986694336, 0.0004661679267883301, 0.0005075931549072266, 0.000549018383026123, 0.0005904436111450195, 0.000631868839263916, 0.0006732940673828125, 0.000714719295501709, 0.0007561445236206055, 0.000797569751739502, 0.0008389949798583984, 0.0008804202079772949, 0.0009218454360961914, 0.0009632706642150879, 0.0010046958923339844, 0.0010461211204528809, 0.0010875463485717773, 0.0011289715766906738, 0.0011703968048095703, 0.0012118220329284668, 0.0012532472610473633, 0.0012946724891662598, 0.0013360977172851562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 16.0, 33.0, 41.0, 56.0, 92.0, 102.0, 159.0, 196.0, 325.0, 429.0, 638.0, 895.0, 1312.0, 1910.0, 2837.0, 4295.0, 6555.0, 10085.0, 15931.0, 24733.0, 38872.0, 60328.0, 88548.0, 118603.0, 139950.0, 141830.0, 121807.0, 90883.0, 62703.0, 40676.0, 25714.0, 16529.0, 10623.0, 6929.0, 4388.0, 3064.0, 2007.0, 1415.0, 894.0, 644.0, 419.0, 341.0, 212.0, 170.0, 97.0, 87.0, 48.0, 30.0, 25.0, 25.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-10.578125, -10.248046875, -9.91796875, -9.587890625, -9.2578125, -8.927734375, -8.59765625, -8.267578125, -7.9375, -7.607421875, -7.27734375, -6.947265625, -6.6171875, -6.287109375, -5.95703125, -5.626953125, -5.296875, -4.966796875, -4.63671875, -4.306640625, -3.9765625, -3.646484375, -3.31640625, -2.986328125, -2.65625, -2.326171875, -1.99609375, -1.666015625, -1.3359375, -1.005859375, -0.67578125, -0.345703125, -0.015625, 0.314453125, 0.64453125, 0.974609375, 1.3046875, 1.634765625, 1.96484375, 2.294921875, 2.625, 2.955078125, 3.28515625, 3.615234375, 3.9453125, 4.275390625, 4.60546875, 4.935546875, 5.265625, 5.595703125, 5.92578125, 6.255859375, 6.5859375, 6.916015625, 7.24609375, 7.576171875, 7.90625, 8.236328125, 8.56640625, 8.896484375, 9.2265625, 9.556640625, 9.88671875, 10.216796875, 10.546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 4.0, 7.0, 7.0, 21.0, 15.0, 24.0, 18.0, 23.0, 30.0, 28.0, 34.0, 43.0, 57.0, 68.0, 61.0, 58.0, 64.0, 52.0, 56.0, 40.0, 47.0, 23.0, 32.0, 19.0, 24.0, 19.0, 16.0, 11.0, 14.0, 10.0, 9.0, 6.0, 6.0, 13.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7109375, -8.426025390625, -8.14111328125, -7.856201171875, -7.5712890625, -7.286376953125, -7.00146484375, -6.716552734375, -6.431640625, -6.146728515625, -5.86181640625, -5.576904296875, -5.2919921875, -5.007080078125, -4.72216796875, -4.437255859375, -4.15234375, -3.867431640625, -3.58251953125, -3.297607421875, -3.0126953125, -2.727783203125, -2.44287109375, -2.157958984375, -1.873046875, -1.588134765625, -1.30322265625, -1.018310546875, -0.7333984375, -0.448486328125, -0.16357421875, 0.121337890625, 0.40625, 0.691162109375, 0.97607421875, 1.260986328125, 1.5458984375, 1.830810546875, 2.11572265625, 2.400634765625, 2.685546875, 2.970458984375, 3.25537109375, 3.540283203125, 3.8251953125, 4.110107421875, 4.39501953125, 4.679931640625, 4.96484375, 5.249755859375, 5.53466796875, 5.819580078125, 6.1044921875, 6.389404296875, 6.67431640625, 6.959228515625, 7.244140625, 7.529052734375, 7.81396484375, 8.098876953125, 8.3837890625, 8.668701171875, 8.95361328125, 9.238525390625, 9.5234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 8.0, 5.0, 11.0, 15.0, 12.0, 13.0, 15.0, 20.0, 26.0, 34.0, 20.0, 34.0, 45.0, 52.0, 42.0, 57.0, 58.0, 38.0, 44.0, 58.0, 48.0, 43.0, 46.0, 37.0, 29.0, 40.0, 25.0, 28.0, 21.0, 13.0, 14.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.716594696044922, -20.99232292175293, -20.26805305480957, -19.543781280517578, -18.819509506225586, -18.095237731933594, -17.370967864990234, -16.646696090698242, -15.92242431640625, -15.198153495788574, -14.473881721496582, -13.749610900878906, -13.025339126586914, -12.301068305969238, -11.576797485351562, -10.85252571105957, -10.128254890441895, -9.403984069824219, -8.679712295532227, -7.955441474914551, -7.231169700622559, -6.506898880004883, -5.782627582550049, -5.058356285095215, -4.334084987640381, -3.609813690185547, -2.885542392730713, -2.161271333694458, -1.437000036239624, -0.71272873878479, 0.011542320251464844, 0.7358136177062988, 1.4600849151611328, 2.184356212615967, 2.908627510070801, 3.6328985691070557, 4.357170104980469, 5.0814409255981445, 5.8057122230529785, 6.5299835205078125, 7.2542548179626465, 7.9785261154174805, 8.702796936035156, 9.427068710327148, 10.151339530944824, 10.875611305236816, 11.599882125854492, 12.324153900146484, 13.04842472076416, 13.772695541381836, 14.496967315673828, 15.221238136291504, 15.945509910583496, 16.669780731201172, 17.394052505493164, 18.118324279785156, 18.842594146728516, 19.566865921020508, 20.291135787963867, 21.01540756225586, 21.73967933654785, 22.463951110839844, 23.188220977783203, 23.912492752075195, 24.636764526367188]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 0.0, 2.0, 6.0, 11.0, 9.0, 8.0, 12.0, 13.0, 10.0, 20.0, 10.0, 18.0, 27.0, 32.0, 21.0, 24.0, 27.0, 34.0, 31.0, 36.0, 38.0, 34.0, 47.0, 31.0, 45.0, 46.0, 40.0, 33.0, 34.0, 37.0, 25.0, 29.0, 28.0, 24.0, 19.0, 23.0, 15.0, 14.0, 12.0, 22.0, 10.0, 12.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.908458709716797, -25.028287887573242, -24.148115158081055, -23.2679443359375, -22.387773513793945, -21.50760269165039, -20.627429962158203, -19.74725914001465, -18.867088317871094, -17.98691749572754, -17.10674476623535, -16.226573944091797, -15.346403121948242, -14.466231346130371, -13.5860595703125, -12.705888748168945, -11.825716018676758, -10.945544242858887, -10.065373420715332, -9.185201644897461, -8.305030822753906, -7.424859046936035, -6.544687271118164, -5.664515972137451, -4.784344673156738, -3.9041733741760254, -3.0240018367767334, -2.1438302993774414, -1.2636590003967285, -0.3834877014160156, 0.49668407440185547, 1.3768553733825684, 2.257028579711914, 3.137199878692627, 4.01737117767334, 4.897542953491211, 5.777714252471924, 6.657885551452637, 7.538057327270508, 8.418228149414062, 9.298399925231934, 10.178571701049805, 11.05874252319336, 11.93891429901123, 12.819086074829102, 13.699256896972656, 14.579428672790527, 15.459600448608398, 16.339771270751953, 17.219942092895508, 18.100114822387695, 18.98028564453125, 19.860456466674805, 20.74062728881836, 21.620800018310547, 22.5009708404541, 23.381141662597656, 24.26131248474121, 25.1414852142334, 26.021656036376953, 26.901826858520508, 27.781997680664062, 28.66217041015625, 29.542341232299805, 30.422513961791992]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 14.0, 9.0, 13.0, 32.0, 68.0, 106.0, 133.0, 256.0, 397.0, 606.0, 1002.0, 1590.0, 2689.0, 4293.0, 7156.0, 11924.0, 19874.0, 33091.0, 55862.0, 93614.0, 153926.0, 245272.0, 367213.0, 493260.0, 585574.0, 587684.0, 501184.0, 374239.0, 251873.0, 158468.0, 96087.0, 57850.0, 35116.0, 20906.0, 12635.0, 7747.0, 4693.0, 2878.0, 1844.0, 1108.0, 732.0, 441.0, 288.0, 219.0, 114.0, 68.0, 51.0, 32.0, 14.0, 15.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0], "bins": [-18.1875, -17.636962890625, -17.08642578125, -16.535888671875, -15.9853515625, -15.434814453125, -14.88427734375, -14.333740234375, -13.783203125, -13.232666015625, -12.68212890625, -12.131591796875, -11.5810546875, -11.030517578125, -10.47998046875, -9.929443359375, -9.37890625, -8.828369140625, -8.27783203125, -7.727294921875, -7.1767578125, -6.626220703125, -6.07568359375, -5.525146484375, -4.974609375, -4.424072265625, -3.87353515625, -3.322998046875, -2.7724609375, -2.221923828125, -1.67138671875, -1.120849609375, -0.5703125, -0.019775390625, 0.53076171875, 1.081298828125, 1.6318359375, 2.182373046875, 2.73291015625, 3.283447265625, 3.833984375, 4.384521484375, 4.93505859375, 5.485595703125, 6.0361328125, 6.586669921875, 7.13720703125, 7.687744140625, 8.23828125, 8.788818359375, 9.33935546875, 9.889892578125, 10.4404296875, 10.990966796875, 11.54150390625, 12.092041015625, 12.642578125, 13.193115234375, 13.74365234375, 14.294189453125, 14.8447265625, 15.395263671875, 15.94580078125, 16.496337890625, 17.046875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 3.0, 4.0, 6.0, 4.0, 1.0, 9.0, 10.0, 15.0, 10.0, 12.0, 15.0, 12.0, 12.0, 21.0, 27.0, 24.0, 28.0, 24.0, 41.0, 30.0, 27.0, 44.0, 34.0, 35.0, 41.0, 40.0, 37.0, 33.0, 39.0, 46.0, 35.0, 40.0, 28.0, 25.0, 20.0, 27.0, 23.0, 24.0, 18.0, 12.0, 9.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.765625, -21.066650390625, -20.36767578125, -19.668701171875, -18.9697265625, -18.270751953125, -17.57177734375, -16.872802734375, -16.173828125, -15.474853515625, -14.77587890625, -14.076904296875, -13.3779296875, -12.678955078125, -11.97998046875, -11.281005859375, -10.58203125, -9.883056640625, -9.18408203125, -8.485107421875, -7.7861328125, -7.087158203125, -6.38818359375, -5.689208984375, -4.990234375, -4.291259765625, -3.59228515625, -2.893310546875, -2.1943359375, -1.495361328125, -0.79638671875, -0.097412109375, 0.6015625, 1.300537109375, 1.99951171875, 2.698486328125, 3.3974609375, 4.096435546875, 4.79541015625, 5.494384765625, 6.193359375, 6.892333984375, 7.59130859375, 8.290283203125, 8.9892578125, 9.688232421875, 10.38720703125, 11.086181640625, 11.78515625, 12.484130859375, 13.18310546875, 13.882080078125, 14.5810546875, 15.280029296875, 15.97900390625, 16.677978515625, 17.376953125, 18.075927734375, 18.77490234375, 19.473876953125, 20.1728515625, 20.871826171875, 21.57080078125, 22.269775390625, 22.96875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 15.0, 32.0, 54.0, 83.0, 134.0, 205.0, 330.0, 563.0, 883.0, 1509.0, 2640.0, 4270.0, 7450.0, 12624.0, 21815.0, 37343.0, 63004.0, 105131.0, 168205.0, 258851.0, 370394.0, 484327.0, 556448.0, 558196.0, 482242.0, 371631.0, 259091.0, 168812.0, 104830.0, 62965.0, 37506.0, 21710.0, 12858.0, 7402.0, 4326.0, 2583.0, 1455.0, 879.0, 567.0, 334.0, 204.0, 126.0, 77.0, 59.0, 35.0, 27.0, 24.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.1640625, -17.578125, -16.9921875, -16.40625, -15.8203125, -15.234375, -14.6484375, -14.0625, -13.4765625, -12.890625, -12.3046875, -11.71875, -11.1328125, -10.546875, -9.9609375, -9.375, -8.7890625, -8.203125, -7.6171875, -7.03125, -6.4453125, -5.859375, -5.2734375, -4.6875, -4.1015625, -3.515625, -2.9296875, -2.34375, -1.7578125, -1.171875, -0.5859375, 0.0, 0.5859375, 1.171875, 1.7578125, 2.34375, 2.9296875, 3.515625, 4.1015625, 4.6875, 5.2734375, 5.859375, 6.4453125, 7.03125, 7.6171875, 8.203125, 8.7890625, 9.375, 9.9609375, 10.546875, 11.1328125, 11.71875, 12.3046875, 12.890625, 13.4765625, 14.0625, 14.6484375, 15.234375, 15.8203125, 16.40625, 16.9921875, 17.578125, 18.1640625, 18.75]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 12.0, 10.0, 27.0, 20.0, 36.0, 33.0, 48.0, 68.0, 87.0, 88.0, 110.0, 156.0, 172.0, 191.0, 208.0, 235.0, 283.0, 231.0, 242.0, 267.0, 230.0, 222.0, 208.0, 182.0, 149.0, 136.0, 91.0, 73.0, 61.0, 54.0, 45.0, 21.0, 26.0, 19.0, 11.0, 12.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1014404296875, -9.734130859375, -9.3668212890625, -8.99951171875, -8.6322021484375, -8.264892578125, -7.8975830078125, -7.5302734375, -7.1629638671875, -6.795654296875, -6.4283447265625, -6.06103515625, -5.6937255859375, -5.326416015625, -4.9591064453125, -4.591796875, -4.2244873046875, -3.857177734375, -3.4898681640625, -3.12255859375, -2.7552490234375, -2.387939453125, -2.0206298828125, -1.6533203125, -1.2860107421875, -0.918701171875, -0.5513916015625, -0.18408203125, 0.1832275390625, 0.550537109375, 0.9178466796875, 1.28515625, 1.6524658203125, 2.019775390625, 2.3870849609375, 2.75439453125, 3.1217041015625, 3.489013671875, 3.8563232421875, 4.2236328125, 4.5909423828125, 4.958251953125, 5.3255615234375, 5.69287109375, 6.0601806640625, 6.427490234375, 6.7947998046875, 7.162109375, 7.5294189453125, 7.896728515625, 8.2640380859375, 8.63134765625, 8.9986572265625, 9.365966796875, 9.7332763671875, 10.1005859375, 10.4678955078125, 10.835205078125, 11.2025146484375, 11.56982421875, 11.9371337890625, 12.304443359375, 12.6717529296875, 13.0390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 7.0, 3.0, 2.0, 5.0, 7.0, 6.0, 10.0, 13.0, 17.0, 21.0, 16.0, 22.0, 21.0, 28.0, 35.0, 41.0, 40.0, 29.0, 39.0, 60.0, 33.0, 42.0, 48.0, 41.0, 38.0, 40.0, 55.0, 48.0, 38.0, 30.0, 26.0, 25.0, 16.0, 15.0, 18.0, 14.0, 11.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.928218841552734, -20.271717071533203, -19.615217208862305, -18.958715438842773, -18.302215576171875, -17.645713806152344, -16.989213943481445, -16.332712173461914, -15.676212310791016, -15.0197114944458, -14.363210678100586, -13.706709861755371, -13.050209045410156, -12.393708229064941, -11.737207412719727, -11.080705642700195, -10.42420482635498, -9.767704010009766, -9.11120319366455, -8.454702377319336, -7.798201560974121, -7.141700744628906, -6.485199451446533, -5.828698635101318, -5.1721978187561035, -4.515697002410889, -3.859196186065674, -3.20269513130188, -2.546194314956665, -1.8896934986114502, -1.2331924438476562, -0.5766916275024414, 0.07980918884277344, 0.7363100647926331, 1.3928109407424927, 2.049311876296997, 2.705812692642212, 3.3623135089874268, 4.018814563751221, 4.6753153800964355, 5.33181619644165, 5.988317012786865, 6.64481782913208, 7.301319122314453, 7.957819938659668, 8.614320755004883, 9.270821571350098, 9.927322387695312, 10.583823204040527, 11.240324020385742, 11.896824836730957, 12.553325653076172, 13.209826469421387, 13.866327285766602, 14.522829055786133, 15.179328918457031, 15.835830688476562, 16.492332458496094, 17.148832321166992, 17.805334091186523, 18.461833953857422, 19.118335723876953, 19.77483558654785, 20.431337356567383, 21.08783721923828]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 10.0, 9.0, 7.0, 12.0, 11.0, 12.0, 17.0, 16.0, 20.0, 38.0, 20.0, 20.0, 46.0, 30.0, 23.0, 38.0, 43.0, 34.0, 44.0, 45.0, 47.0, 38.0, 46.0, 45.0, 44.0, 33.0, 30.0, 23.0, 21.0, 31.0, 21.0, 17.0, 14.0, 23.0, 13.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.027969360351562, -27.137474060058594, -26.246976852416992, -25.356481552124023, -24.465984344482422, -23.575489044189453, -22.684993743896484, -21.794496536254883, -20.90399932861328, -20.013504028320312, -19.12300682067871, -18.232511520385742, -17.34201431274414, -16.451519012451172, -15.561022758483887, -14.670526504516602, -13.780031204223633, -12.889534950256348, -11.999038696289062, -11.108543395996094, -10.218046188354492, -9.327550888061523, -8.437054634094238, -7.546558380126953, -6.656062126159668, -5.765565872192383, -4.875069618225098, -3.9845738410949707, -3.0940775871276855, -2.2035813331604004, -1.3130855560302734, -0.4225893020629883, 0.4679069519042969, 1.3584030866622925, 2.248899221420288, 3.139395236968994, 4.029891490936279, 4.9203877449035645, 5.810883522033691, 6.701379776000977, 7.591876029968262, 8.482372283935547, 9.372868537902832, 10.263364791870117, 11.153860092163086, 12.044357299804688, 12.934852600097656, 13.825348854064941, 14.715845108032227, 15.606341361999512, 16.496837615966797, 17.387332916259766, 18.277830123901367, 19.168325424194336, 20.058822631835938, 20.949317932128906, 21.839813232421875, 22.730308532714844, 23.620805740356445, 24.511301040649414, 25.401798248291016, 26.292293548583984, 27.182788848876953, 28.073286056518555, 28.963783264160156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 14.0, 13.0, 19.0, 33.0, 36.0, 54.0, 87.0, 131.0, 195.0, 345.0, 543.0, 910.0, 1550.0, 2620.0, 4623.0, 8368.0, 15604.0, 29452.0, 54777.0, 98866.0, 157047.0, 198076.0, 183305.0, 128012.0, 74735.0, 40940.0, 21668.0, 11630.0, 6371.0, 3523.0, 2039.0, 1162.0, 646.0, 411.0, 261.0, 156.0, 107.0, 73.0, 59.0, 35.0, 20.0, 15.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-14.7890625, -14.38671875, -13.984375, -13.58203125, -13.1796875, -12.77734375, -12.375, -11.97265625, -11.5703125, -11.16796875, -10.765625, -10.36328125, -9.9609375, -9.55859375, -9.15625, -8.75390625, -8.3515625, -7.94921875, -7.546875, -7.14453125, -6.7421875, -6.33984375, -5.9375, -5.53515625, -5.1328125, -4.73046875, -4.328125, -3.92578125, -3.5234375, -3.12109375, -2.71875, -2.31640625, -1.9140625, -1.51171875, -1.109375, -0.70703125, -0.3046875, 0.09765625, 0.5, 0.90234375, 1.3046875, 1.70703125, 2.109375, 2.51171875, 2.9140625, 3.31640625, 3.71875, 4.12109375, 4.5234375, 4.92578125, 5.328125, 5.73046875, 6.1328125, 6.53515625, 6.9375, 7.33984375, 7.7421875, 8.14453125, 8.546875, 8.94921875, 9.3515625, 9.75390625, 10.15625, 10.55859375, 10.9609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 5.0, 7.0, 10.0, 12.0, 15.0, 14.0, 15.0, 21.0, 17.0, 27.0, 27.0, 33.0, 34.0, 24.0, 35.0, 29.0, 39.0, 51.0, 43.0, 47.0, 48.0, 43.0, 50.0, 32.0, 48.0, 40.0, 28.0, 18.0, 22.0, 23.0, 18.0, 20.0, 20.0, 15.0, 20.0, 5.0, 13.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.609375, -28.697998046875, -27.78662109375, -26.875244140625, -25.9638671875, -25.052490234375, -24.14111328125, -23.229736328125, -22.318359375, -21.406982421875, -20.49560546875, -19.584228515625, -18.6728515625, -17.761474609375, -16.85009765625, -15.938720703125, -15.02734375, -14.115966796875, -13.20458984375, -12.293212890625, -11.3818359375, -10.470458984375, -9.55908203125, -8.647705078125, -7.736328125, -6.824951171875, -5.91357421875, -5.002197265625, -4.0908203125, -3.179443359375, -2.26806640625, -1.356689453125, -0.4453125, 0.466064453125, 1.37744140625, 2.288818359375, 3.2001953125, 4.111572265625, 5.02294921875, 5.934326171875, 6.845703125, 7.757080078125, 8.66845703125, 9.579833984375, 10.4912109375, 11.402587890625, 12.31396484375, 13.225341796875, 14.13671875, 15.048095703125, 15.95947265625, 16.870849609375, 17.7822265625, 18.693603515625, 19.60498046875, 20.516357421875, 21.427734375, 22.339111328125, 23.25048828125, 24.161865234375, 25.0732421875, 25.984619140625, 26.89599609375, 27.807373046875, 28.71875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 3.0, 4.0, 9.0, 20.0, 23.0, 20.0, 44.0, 46.0, 74.0, 89.0, 137.0, 192.0, 305.0, 490.0, 789.0, 1316.0, 2218.0, 3967.0, 7546.0, 15483.0, 32233.0, 70520.0, 147388.0, 244725.0, 241860.0, 145581.0, 69412.0, 31929.0, 15017.0, 7399.0, 3964.0, 2231.0, 1274.0, 781.0, 488.0, 307.0, 190.0, 139.0, 98.0, 69.0, 43.0, 37.0, 21.0, 18.0, 15.0, 10.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-16.640625, -16.13623046875, -15.6318359375, -15.12744140625, -14.623046875, -14.11865234375, -13.6142578125, -13.10986328125, -12.60546875, -12.10107421875, -11.5966796875, -11.09228515625, -10.587890625, -10.08349609375, -9.5791015625, -9.07470703125, -8.5703125, -8.06591796875, -7.5615234375, -7.05712890625, -6.552734375, -6.04833984375, -5.5439453125, -5.03955078125, -4.53515625, -4.03076171875, -3.5263671875, -3.02197265625, -2.517578125, -2.01318359375, -1.5087890625, -1.00439453125, -0.5, 0.00439453125, 0.5087890625, 1.01318359375, 1.517578125, 2.02197265625, 2.5263671875, 3.03076171875, 3.53515625, 4.03955078125, 4.5439453125, 5.04833984375, 5.552734375, 6.05712890625, 6.5615234375, 7.06591796875, 7.5703125, 8.07470703125, 8.5791015625, 9.08349609375, 9.587890625, 10.09228515625, 10.5966796875, 11.10107421875, 11.60546875, 12.10986328125, 12.6142578125, 13.11865234375, 13.623046875, 14.12744140625, 14.6318359375, 15.13623046875, 15.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 8.0, 7.0, 14.0, 14.0, 14.0, 20.0, 18.0, 22.0, 37.0, 28.0, 32.0, 36.0, 39.0, 51.0, 49.0, 61.0, 29.0, 41.0, 45.0, 39.0, 52.0, 44.0, 45.0, 26.0, 37.0, 27.0, 27.0, 27.0, 16.0, 16.0, 15.0, 7.0, 13.0, 5.0, 8.0, 9.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.0625, -20.44580078125, -19.8291015625, -19.21240234375, -18.595703125, -17.97900390625, -17.3623046875, -16.74560546875, -16.12890625, -15.51220703125, -14.8955078125, -14.27880859375, -13.662109375, -13.04541015625, -12.4287109375, -11.81201171875, -11.1953125, -10.57861328125, -9.9619140625, -9.34521484375, -8.728515625, -8.11181640625, -7.4951171875, -6.87841796875, -6.26171875, -5.64501953125, -5.0283203125, -4.41162109375, -3.794921875, -3.17822265625, -2.5615234375, -1.94482421875, -1.328125, -0.71142578125, -0.0947265625, 0.52197265625, 1.138671875, 1.75537109375, 2.3720703125, 2.98876953125, 3.60546875, 4.22216796875, 4.8388671875, 5.45556640625, 6.072265625, 6.68896484375, 7.3056640625, 7.92236328125, 8.5390625, 9.15576171875, 9.7724609375, 10.38916015625, 11.005859375, 11.62255859375, 12.2392578125, 12.85595703125, 13.47265625, 14.08935546875, 14.7060546875, 15.32275390625, 15.939453125, 16.55615234375, 17.1728515625, 17.78955078125, 18.40625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 8.0, 14.0, 15.0, 18.0, 27.0, 43.0, 41.0, 67.0, 83.0, 124.0, 167.0, 205.0, 289.0, 389.0, 544.0, 785.0, 1302.0, 1985.0, 3493.0, 6739.0, 14613.0, 39866.0, 125817.0, 346296.0, 326816.0, 113359.0, 36112.0, 13690.0, 6307.0, 3370.0, 1955.0, 1275.0, 755.0, 576.0, 369.0, 291.0, 207.0, 129.0, 126.0, 80.0, 46.0, 35.0, 36.0, 25.0, 23.0, 14.0, 10.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.8828125, -11.510986328125, -11.13916015625, -10.767333984375, -10.3955078125, -10.023681640625, -9.65185546875, -9.280029296875, -8.908203125, -8.536376953125, -8.16455078125, -7.792724609375, -7.4208984375, -7.049072265625, -6.67724609375, -6.305419921875, -5.93359375, -5.561767578125, -5.18994140625, -4.818115234375, -4.4462890625, -4.074462890625, -3.70263671875, -3.330810546875, -2.958984375, -2.587158203125, -2.21533203125, -1.843505859375, -1.4716796875, -1.099853515625, -0.72802734375, -0.356201171875, 0.015625, 0.387451171875, 0.75927734375, 1.131103515625, 1.5029296875, 1.874755859375, 2.24658203125, 2.618408203125, 2.990234375, 3.362060546875, 3.73388671875, 4.105712890625, 4.4775390625, 4.849365234375, 5.22119140625, 5.593017578125, 5.96484375, 6.336669921875, 6.70849609375, 7.080322265625, 7.4521484375, 7.823974609375, 8.19580078125, 8.567626953125, 8.939453125, 9.311279296875, 9.68310546875, 10.054931640625, 10.4267578125, 10.798583984375, 11.17041015625, 11.542236328125, 11.9140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 15.0, 13.0, 42.0, 65.0, 102.0, 142.0, 143.0, 126.0, 115.0, 73.0, 47.0, 30.0, 26.0, 8.0, 9.0, 2.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010738372802734375, -0.0010475069284439087, -0.0010211765766143799, -0.000994846224784851, -0.0009685158729553223, -0.0009421855211257935, -0.0009158551692962646, -0.0008895248174667358, -0.000863194465637207, -0.0008368641138076782, -0.0008105337619781494, -0.0007842034101486206, -0.0007578730583190918, -0.000731542706489563, -0.0007052123546600342, -0.0006788820028305054, -0.0006525516510009766, -0.0006262212991714478, -0.0005998909473419189, -0.0005735605955123901, -0.0005472302436828613, -0.0005208998918533325, -0.0004945695400238037, -0.0004682391881942749, -0.0004419088363647461, -0.0004155784845352173, -0.0003892481327056885, -0.00036291778087615967, -0.00033658742904663086, -0.00031025707721710205, -0.00028392672538757324, -0.00025759637355804443, -0.00023126602172851562, -0.00020493566989898682, -0.000178605318069458, -0.0001522749662399292, -0.0001259446144104004, -9.961426258087158e-05, -7.328391075134277e-05, -4.6953558921813965e-05, -2.0623207092285156e-05, 5.707144737243652e-06, 3.203749656677246e-05, 5.836784839630127e-05, 8.469820022583008e-05, 0.00011102855205535889, 0.0001373589038848877, 0.0001636892557144165, 0.0001900196075439453, 0.00021634995937347412, 0.00024268031120300293, 0.00026901066303253174, 0.00029534101486206055, 0.00032167136669158936, 0.00034800171852111816, 0.00037433207035064697, 0.0004006624221801758, 0.0004269927740097046, 0.0004533231258392334, 0.0004796534776687622, 0.000505983829498291, 0.0005323141813278198, 0.0005586445331573486, 0.0005849748849868774, 0.0006113052368164062]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 9.0, 15.0, 17.0, 22.0, 26.0, 46.0, 52.0, 76.0, 96.0, 122.0, 182.0, 228.0, 314.0, 450.0, 673.0, 889.0, 1623.0, 2655.0, 4725.0, 8830.0, 18347.0, 40157.0, 91352.0, 190694.0, 273334.0, 213520.0, 107824.0, 47309.0, 21172.0, 10131.0, 5203.0, 3052.0, 1763.0, 1087.0, 721.0, 503.0, 338.0, 270.0, 165.0, 135.0, 119.0, 75.0, 68.0, 45.0, 25.0, 28.0, 20.0, 13.0, 8.0, 8.0, 8.0, 0.0, 1.0, 5.0, 2.0, 1.0], "bins": [-9.953125, -9.6478271484375, -9.342529296875, -9.0372314453125, -8.73193359375, -8.4266357421875, -8.121337890625, -7.8160400390625, -7.5107421875, -7.2054443359375, -6.900146484375, -6.5948486328125, -6.28955078125, -5.9842529296875, -5.678955078125, -5.3736572265625, -5.068359375, -4.7630615234375, -4.457763671875, -4.1524658203125, -3.84716796875, -3.5418701171875, -3.236572265625, -2.9312744140625, -2.6259765625, -2.3206787109375, -2.015380859375, -1.7100830078125, -1.40478515625, -1.0994873046875, -0.794189453125, -0.4888916015625, -0.18359375, 0.1217041015625, 0.427001953125, 0.7322998046875, 1.03759765625, 1.3428955078125, 1.648193359375, 1.9534912109375, 2.2587890625, 2.5640869140625, 2.869384765625, 3.1746826171875, 3.47998046875, 3.7852783203125, 4.090576171875, 4.3958740234375, 4.701171875, 5.0064697265625, 5.311767578125, 5.6170654296875, 5.92236328125, 6.2276611328125, 6.532958984375, 6.8382568359375, 7.1435546875, 7.4488525390625, 7.754150390625, 8.0594482421875, 8.36474609375, 8.6700439453125, 8.975341796875, 9.2806396484375, 9.5859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 6.0, 8.0, 15.0, 18.0, 27.0, 28.0, 44.0, 54.0, 63.0, 80.0, 94.0, 81.0, 77.0, 66.0, 80.0, 57.0, 34.0, 33.0, 28.0, 23.0, 15.0, 10.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.689453125, -3.564910888671875, -3.44036865234375, -3.315826416015625, -3.1912841796875, -3.066741943359375, -2.94219970703125, -2.817657470703125, -2.693115234375, -2.568572998046875, -2.44403076171875, -2.319488525390625, -2.1949462890625, -2.070404052734375, -1.94586181640625, -1.821319580078125, -1.69677734375, -1.572235107421875, -1.44769287109375, -1.323150634765625, -1.1986083984375, -1.074066162109375, -0.94952392578125, -0.824981689453125, -0.700439453125, -0.575897216796875, -0.45135498046875, -0.326812744140625, -0.2022705078125, -0.077728271484375, 0.04681396484375, 0.171356201171875, 0.2958984375, 0.420440673828125, 0.54498291015625, 0.669525146484375, 0.7940673828125, 0.918609619140625, 1.04315185546875, 1.167694091796875, 1.292236328125, 1.416778564453125, 1.54132080078125, 1.665863037109375, 1.7904052734375, 1.914947509765625, 2.03948974609375, 2.164031982421875, 2.28857421875, 2.413116455078125, 2.53765869140625, 2.662200927734375, 2.7867431640625, 2.911285400390625, 3.03582763671875, 3.160369873046875, 3.284912109375, 3.409454345703125, 3.53399658203125, 3.658538818359375, 3.7830810546875, 3.907623291015625, 4.03216552734375, 4.156707763671875, 4.28125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 6.0, 9.0, 17.0, 20.0, 17.0, 19.0, 24.0, 29.0, 38.0, 36.0, 32.0, 36.0, 48.0, 47.0, 44.0, 40.0, 40.0, 46.0, 35.0, 41.0, 52.0, 47.0, 37.0, 42.0, 28.0, 23.0, 20.0, 18.0, 12.0, 14.0, 9.0, 13.0, 5.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.23821258544922, -20.594074249267578, -19.949934005737305, -19.305795669555664, -18.66165542602539, -18.01751708984375, -17.373376846313477, -16.729238510131836, -16.085098266601562, -15.440958976745605, -14.796819686889648, -14.152680397033691, -13.508541107177734, -12.864402770996094, -12.220263481140137, -11.57612419128418, -10.931985855102539, -10.287846565246582, -9.643707275390625, -8.999567985534668, -8.355428695678711, -7.711289882659912, -7.067151069641113, -6.423011779785156, -5.778872489929199, -5.134733200073242, -4.490593910217285, -3.8464550971984863, -3.2023158073425293, -2.5581765174865723, -1.9140374660491943, -1.2698984146118164, -0.6257610321044922, 0.018378138542175293, 0.6625173091888428, 1.3066564798355103, 1.9507956504821777, 2.5949349403381348, 3.2390739917755127, 3.8832130432128906, 4.527352333068848, 5.171491622924805, 5.815630912780762, 6.4597697257995605, 7.103909015655518, 7.748048305511475, 8.392187118530273, 9.03632640838623, 9.680465698242188, 10.324604988098145, 10.968744277954102, 11.612883567810059, 12.257022857666016, 12.901161193847656, 13.545300483703613, 14.18943977355957, 14.833579063415527, 15.477718353271484, 16.121856689453125, 16.7659969329834, 17.41013526916504, 18.054275512695312, 18.698413848876953, 19.342552185058594, 19.986692428588867]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 8.0, 8.0, 7.0, 8.0, 10.0, 10.0, 11.0, 12.0, 21.0, 18.0, 24.0, 31.0, 23.0, 20.0, 34.0, 34.0, 39.0, 37.0, 35.0, 34.0, 39.0, 52.0, 38.0, 50.0, 37.0, 46.0, 44.0, 32.0, 30.0, 20.0, 23.0, 34.0, 15.0, 19.0, 17.0, 18.0, 18.0, 10.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.404603958129883, -26.529218673706055, -25.65383529663086, -24.77845001220703, -23.903064727783203, -23.027681350708008, -22.15229606628418, -21.276912689208984, -20.401527404785156, -19.526142120361328, -18.650758743286133, -17.775373458862305, -16.89999008178711, -16.02460479736328, -15.149219512939453, -14.273835182189941, -13.39845085144043, -12.523066520690918, -11.647682189941406, -10.772296905517578, -9.896912574768066, -9.021528244018555, -8.146142959594727, -7.270758628845215, -6.395374298095703, -5.519989967346191, -4.6446051597595215, -3.7692205905914307, -2.89383602142334, -2.018451690673828, -1.1430668830871582, -0.2676820755004883, 0.6077003479003906, 1.4830849170684814, 2.3584694862365723, 3.233854055404663, 4.109238624572754, 4.984622955322266, 5.8600077629089355, 6.7353925704956055, 7.610776901245117, 8.486161231994629, 9.36154556274414, 10.236930847167969, 11.11231517791748, 11.987699508666992, 12.86308479309082, 13.738469123840332, 14.613853454589844, 15.489237785339355, 16.364622116088867, 17.240007400512695, 18.11539077758789, 18.99077606201172, 19.866161346435547, 20.741546630859375, 21.61693000793457, 22.4923152923584, 23.367698669433594, 24.243083953857422, 25.11846923828125, 25.993852615356445, 26.869237899780273, 27.74462127685547, 28.620006561279297]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 18.0, 19.0, 19.0, 34.0, 58.0, 85.0, 109.0, 206.0, 282.0, 461.0, 722.0, 1118.0, 1880.0, 2878.0, 4797.0, 7349.0, 11760.0, 18167.0, 27663.0, 40532.0, 57383.0, 76599.0, 96650.0, 111412.0, 117517.0, 112854.0, 98105.0, 78388.0, 58858.0, 42275.0, 28251.0, 18853.0, 12102.0, 7895.0, 4886.0, 3088.0, 1957.0, 1233.0, 745.0, 492.0, 306.0, 214.0, 123.0, 75.0, 45.0, 32.0, 17.0, 15.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-14.0703125, -13.624267578125, -13.17822265625, -12.732177734375, -12.2861328125, -11.840087890625, -11.39404296875, -10.947998046875, -10.501953125, -10.055908203125, -9.60986328125, -9.163818359375, -8.7177734375, -8.271728515625, -7.82568359375, -7.379638671875, -6.93359375, -6.487548828125, -6.04150390625, -5.595458984375, -5.1494140625, -4.703369140625, -4.25732421875, -3.811279296875, -3.365234375, -2.919189453125, -2.47314453125, -2.027099609375, -1.5810546875, -1.135009765625, -0.68896484375, -0.242919921875, 0.203125, 0.649169921875, 1.09521484375, 1.541259765625, 1.9873046875, 2.433349609375, 2.87939453125, 3.325439453125, 3.771484375, 4.217529296875, 4.66357421875, 5.109619140625, 5.5556640625, 6.001708984375, 6.44775390625, 6.893798828125, 7.33984375, 7.785888671875, 8.23193359375, 8.677978515625, 9.1240234375, 9.570068359375, 10.01611328125, 10.462158203125, 10.908203125, 11.354248046875, 11.80029296875, 12.246337890625, 12.6923828125, 13.138427734375, 13.58447265625, 14.030517578125, 14.4765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 3.0, 7.0, 15.0, 17.0, 17.0, 20.0, 15.0, 24.0, 19.0, 29.0, 34.0, 34.0, 45.0, 41.0, 35.0, 38.0, 46.0, 47.0, 55.0, 46.0, 43.0, 39.0, 41.0, 35.0, 25.0, 36.0, 32.0, 19.0, 21.0, 21.0, 14.0, 18.0, 9.0, 14.0, 8.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.762939453125, -27.82275390625, -26.882568359375, -25.9423828125, -25.002197265625, -24.06201171875, -23.121826171875, -22.181640625, -21.241455078125, -20.30126953125, -19.361083984375, -18.4208984375, -17.480712890625, -16.54052734375, -15.600341796875, -14.66015625, -13.719970703125, -12.77978515625, -11.839599609375, -10.8994140625, -9.959228515625, -9.01904296875, -8.078857421875, -7.138671875, -6.198486328125, -5.25830078125, -4.318115234375, -3.3779296875, -2.437744140625, -1.49755859375, -0.557373046875, 0.3828125, 1.322998046875, 2.26318359375, 3.203369140625, 4.1435546875, 5.083740234375, 6.02392578125, 6.964111328125, 7.904296875, 8.844482421875, 9.78466796875, 10.724853515625, 11.6650390625, 12.605224609375, 13.54541015625, 14.485595703125, 15.42578125, 16.365966796875, 17.30615234375, 18.246337890625, 19.1865234375, 20.126708984375, 21.06689453125, 22.007080078125, 22.947265625, 23.887451171875, 24.82763671875, 25.767822265625, 26.7080078125, 27.648193359375, 28.58837890625, 29.528564453125, 30.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 9.0, 13.0, 23.0, 42.0, 50.0, 91.0, 149.0, 195.0, 328.0, 489.0, 789.0, 1137.0, 1891.0, 2830.0, 4401.0, 6748.0, 10666.0, 15783.0, 24648.0, 35923.0, 50947.0, 69355.0, 88619.0, 104791.0, 114673.0, 113436.0, 102240.0, 85558.0, 65564.0, 48116.0, 33788.0, 22530.0, 14995.0, 9838.0, 6307.0, 4122.0, 2649.0, 1738.0, 1031.0, 737.0, 461.0, 303.0, 209.0, 122.0, 84.0, 56.0, 26.0, 17.0, 14.0, 9.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.531982421875, -13.07958984375, -12.627197265625, -12.1748046875, -11.722412109375, -11.27001953125, -10.817626953125, -10.365234375, -9.912841796875, -9.46044921875, -9.008056640625, -8.5556640625, -8.103271484375, -7.65087890625, -7.198486328125, -6.74609375, -6.293701171875, -5.84130859375, -5.388916015625, -4.9365234375, -4.484130859375, -4.03173828125, -3.579345703125, -3.126953125, -2.674560546875, -2.22216796875, -1.769775390625, -1.3173828125, -0.864990234375, -0.41259765625, 0.039794921875, 0.4921875, 0.944580078125, 1.39697265625, 1.849365234375, 2.3017578125, 2.754150390625, 3.20654296875, 3.658935546875, 4.111328125, 4.563720703125, 5.01611328125, 5.468505859375, 5.9208984375, 6.373291015625, 6.82568359375, 7.278076171875, 7.73046875, 8.182861328125, 8.63525390625, 9.087646484375, 9.5400390625, 9.992431640625, 10.44482421875, 10.897216796875, 11.349609375, 11.802001953125, 12.25439453125, 12.706787109375, 13.1591796875, 13.611572265625, 14.06396484375, 14.516357421875, 14.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 7.0, 4.0, 2.0, 13.0, 15.0, 23.0, 19.0, 17.0, 12.0, 25.0, 21.0, 29.0, 28.0, 33.0, 32.0, 51.0, 42.0, 37.0, 46.0, 51.0, 46.0, 39.0, 40.0, 36.0, 36.0, 37.0, 38.0, 39.0, 23.0, 27.0, 24.0, 18.0, 14.0, 9.0, 9.0, 8.0, 11.0, 9.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.392822265625, -18.78564453125, -18.178466796875, -17.5712890625, -16.964111328125, -16.35693359375, -15.749755859375, -15.142578125, -14.535400390625, -13.92822265625, -13.321044921875, -12.7138671875, -12.106689453125, -11.49951171875, -10.892333984375, -10.28515625, -9.677978515625, -9.07080078125, -8.463623046875, -7.8564453125, -7.249267578125, -6.64208984375, -6.034912109375, -5.427734375, -4.820556640625, -4.21337890625, -3.606201171875, -2.9990234375, -2.391845703125, -1.78466796875, -1.177490234375, -0.5703125, 0.036865234375, 0.64404296875, 1.251220703125, 1.8583984375, 2.465576171875, 3.07275390625, 3.679931640625, 4.287109375, 4.894287109375, 5.50146484375, 6.108642578125, 6.7158203125, 7.322998046875, 7.93017578125, 8.537353515625, 9.14453125, 9.751708984375, 10.35888671875, 10.966064453125, 11.5732421875, 12.180419921875, 12.78759765625, 13.394775390625, 14.001953125, 14.609130859375, 15.21630859375, 15.823486328125, 16.4306640625, 17.037841796875, 17.64501953125, 18.252197265625, 18.859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 12.0, 14.0, 18.0, 23.0, 41.0, 43.0, 71.0, 114.0, 141.0, 256.0, 414.0, 540.0, 839.0, 1228.0, 2045.0, 3113.0, 5008.0, 8136.0, 13416.0, 22039.0, 36236.0, 57430.0, 87597.0, 120727.0, 144884.0, 148262.0, 128859.0, 95936.0, 65112.0, 40674.0, 25328.0, 15135.0, 9169.0, 5749.0, 3551.0, 2197.0, 1444.0, 926.0, 571.0, 396.0, 298.0, 168.0, 122.0, 68.0, 77.0, 36.0, 30.0, 17.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-8.8203125, -8.5540771484375, -8.287841796875, -8.0216064453125, -7.75537109375, -7.4891357421875, -7.222900390625, -6.9566650390625, -6.6904296875, -6.4241943359375, -6.157958984375, -5.8917236328125, -5.62548828125, -5.3592529296875, -5.093017578125, -4.8267822265625, -4.560546875, -4.2943115234375, -4.028076171875, -3.7618408203125, -3.49560546875, -3.2293701171875, -2.963134765625, -2.6968994140625, -2.4306640625, -2.1644287109375, -1.898193359375, -1.6319580078125, -1.36572265625, -1.0994873046875, -0.833251953125, -0.5670166015625, -0.30078125, -0.0345458984375, 0.231689453125, 0.4979248046875, 0.76416015625, 1.0303955078125, 1.296630859375, 1.5628662109375, 1.8291015625, 2.0953369140625, 2.361572265625, 2.6278076171875, 2.89404296875, 3.1602783203125, 3.426513671875, 3.6927490234375, 3.958984375, 4.2252197265625, 4.491455078125, 4.7576904296875, 5.02392578125, 5.2901611328125, 5.556396484375, 5.8226318359375, 6.0888671875, 6.3551025390625, 6.621337890625, 6.8875732421875, 7.15380859375, 7.4200439453125, 7.686279296875, 7.9525146484375, 8.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 12.0, 10.0, 12.0, 16.0, 20.0, 36.0, 33.0, 40.0, 59.0, 60.0, 54.0, 53.0, 56.0, 45.0, 47.0, 48.0, 60.0, 50.0, 44.0, 36.0, 30.0, 26.0, 23.0, 17.0, 25.0, 16.0, 11.0, 7.0, 12.0, 6.0, 3.0, 10.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007410049438476562, -0.0007145777344703674, -0.0006881505250930786, -0.0006617233157157898, -0.000635296106338501, -0.0006088688969612122, -0.0005824416875839233, -0.0005560144782066345, -0.0005295872688293457, -0.0005031600594520569, -0.00047673285007476807, -0.00045030564069747925, -0.00042387843132019043, -0.0003974512219429016, -0.0003710240125656128, -0.000344596803188324, -0.00031816959381103516, -0.00029174238443374634, -0.0002653151750564575, -0.0002388879656791687, -0.00021246075630187988, -0.00018603354692459106, -0.00015960633754730225, -0.00013317912817001343, -0.00010675191879272461, -8.032470941543579e-05, -5.389750003814697e-05, -2.7470290660858154e-05, -1.043081283569336e-06, 2.5384128093719482e-05, 5.18113374710083e-05, 7.823854684829712e-05, 0.00010466575622558594, 0.00013109296560287476, 0.00015752017498016357, 0.0001839473843574524, 0.0002103745937347412, 0.00023680180311203003, 0.00026322901248931885, 0.00028965622186660767, 0.0003160834312438965, 0.0003425106406211853, 0.0003689378499984741, 0.00039536505937576294, 0.00042179226875305176, 0.0004482194781303406, 0.0004746466875076294, 0.0005010738968849182, 0.000527501106262207, 0.0005539283156394958, 0.0005803555250167847, 0.0006067827343940735, 0.0006332099437713623, 0.0006596371531486511, 0.0006860643625259399, 0.0007124915719032288, 0.0007389187812805176, 0.0007653459906578064, 0.0007917732000350952, 0.000818200409412384, 0.0008446276187896729, 0.0008710548281669617, 0.0008974820375442505, 0.0009239092469215393, 0.0009503364562988281]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 7.0, 16.0, 18.0, 41.0, 37.0, 60.0, 87.0, 148.0, 210.0, 281.0, 474.0, 794.0, 1342.0, 2312.0, 3756.0, 6462.0, 10975.0, 18740.0, 31723.0, 52731.0, 81288.0, 114916.0, 143562.0, 152299.0, 137047.0, 105337.0, 71854.0, 45022.0, 27652.0, 16344.0, 9437.0, 5376.0, 3127.0, 1937.0, 1221.0, 697.0, 428.0, 281.0, 180.0, 113.0, 59.0, 46.0, 37.0, 20.0, 18.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.953125, -8.6763916015625, -8.399658203125, -8.1229248046875, -7.84619140625, -7.5694580078125, -7.292724609375, -7.0159912109375, -6.7392578125, -6.4625244140625, -6.185791015625, -5.9090576171875, -5.63232421875, -5.3555908203125, -5.078857421875, -4.8021240234375, -4.525390625, -4.2486572265625, -3.971923828125, -3.6951904296875, -3.41845703125, -3.1417236328125, -2.864990234375, -2.5882568359375, -2.3115234375, -2.0347900390625, -1.758056640625, -1.4813232421875, -1.20458984375, -0.9278564453125, -0.651123046875, -0.3743896484375, -0.09765625, 0.1790771484375, 0.455810546875, 0.7325439453125, 1.00927734375, 1.2860107421875, 1.562744140625, 1.8394775390625, 2.1162109375, 2.3929443359375, 2.669677734375, 2.9464111328125, 3.22314453125, 3.4998779296875, 3.776611328125, 4.0533447265625, 4.330078125, 4.6068115234375, 4.883544921875, 5.1602783203125, 5.43701171875, 5.7137451171875, 5.990478515625, 6.2672119140625, 6.5439453125, 6.8206787109375, 7.097412109375, 7.3741455078125, 7.65087890625, 7.9276123046875, 8.204345703125, 8.4810791015625, 8.7578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 1.0, 6.0, 7.0, 9.0, 16.0, 21.0, 10.0, 16.0, 33.0, 23.0, 30.0, 42.0, 37.0, 49.0, 55.0, 52.0, 69.0, 58.0, 54.0, 59.0, 59.0, 46.0, 43.0, 38.0, 44.0, 24.0, 17.0, 15.0, 13.0, 8.0, 8.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-8.1796875, -7.96417236328125, -7.7486572265625, -7.53314208984375, -7.317626953125, -7.10211181640625, -6.8865966796875, -6.67108154296875, -6.45556640625, -6.24005126953125, -6.0245361328125, -5.80902099609375, -5.593505859375, -5.37799072265625, -5.1624755859375, -4.94696044921875, -4.7314453125, -4.51593017578125, -4.3004150390625, -4.08489990234375, -3.869384765625, -3.65386962890625, -3.4383544921875, -3.22283935546875, -3.00732421875, -2.79180908203125, -2.5762939453125, -2.36077880859375, -2.145263671875, -1.92974853515625, -1.7142333984375, -1.49871826171875, -1.283203125, -1.06768798828125, -0.8521728515625, -0.63665771484375, -0.421142578125, -0.20562744140625, 0.0098876953125, 0.22540283203125, 0.44091796875, 0.65643310546875, 0.8719482421875, 1.08746337890625, 1.302978515625, 1.51849365234375, 1.7340087890625, 1.94952392578125, 2.1650390625, 2.38055419921875, 2.5960693359375, 2.81158447265625, 3.027099609375, 3.24261474609375, 3.4581298828125, 3.67364501953125, 3.88916015625, 4.10467529296875, 4.3201904296875, 4.53570556640625, 4.751220703125, 4.96673583984375, 5.1822509765625, 5.39776611328125, 5.61328125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 2.0, 6.0, 15.0, 22.0, 10.0, 13.0, 18.0, 21.0, 29.0, 42.0, 35.0, 36.0, 46.0, 36.0, 32.0, 45.0, 61.0, 72.0, 51.0, 44.0, 43.0, 48.0, 43.0, 47.0, 26.0, 28.0, 18.0, 25.0, 20.0, 11.0, 12.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.688817977905273, -21.973594665527344, -21.25836944580078, -20.54314613342285, -19.82792091369629, -19.11269760131836, -18.397472381591797, -17.682249069213867, -16.967023849487305, -16.251800537109375, -15.536575317382812, -14.821351051330566, -14.10612678527832, -13.390902519226074, -12.675678253173828, -11.960454940795898, -11.245230674743652, -10.530006408691406, -9.81478214263916, -9.099557876586914, -8.384333610534668, -7.669109344482422, -6.953885555267334, -6.238661289215088, -5.523437023162842, -4.808212757110596, -4.09298849105835, -3.3777644634246826, -2.6625401973724365, -1.9473159313201904, -1.2320919036865234, -0.5168676376342773, 0.19835662841796875, 0.9135808348655701, 1.6288050413131714, 2.344029188156128, 3.059253454208374, 3.77447772026062, 4.489701747894287, 5.204926013946533, 5.920150279998779, 6.635374546051025, 7.3505988121032715, 8.06582260131836, 8.781046867370605, 9.496271133422852, 10.211495399475098, 10.926719665527344, 11.64194393157959, 12.357168197631836, 13.072392463684082, 13.787616729736328, 14.502840995788574, 15.21806526184082, 15.93328857421875, 16.648513793945312, 17.363737106323242, 18.078960418701172, 18.794185638427734, 19.509408950805664, 20.224634170532227, 20.939857482910156, 21.65508270263672, 22.37030601501465, 23.08553123474121]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 6.0, 11.0, 8.0, 12.0, 13.0, 14.0, 13.0, 31.0, 23.0, 33.0, 22.0, 29.0, 40.0, 49.0, 23.0, 40.0, 46.0, 52.0, 45.0, 35.0, 40.0, 42.0, 28.0, 30.0, 37.0, 38.0, 30.0, 34.0, 24.0, 20.0, 23.0, 19.0, 16.0, 8.0, 9.0, 12.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.70754051208496, -24.83597755432129, -23.964412689208984, -23.092849731445312, -22.22128677368164, -21.34972381591797, -20.478158950805664, -19.606595993041992, -18.735031127929688, -17.863468170166016, -16.99190330505371, -16.12034034729004, -15.248777389526367, -14.377213478088379, -13.50564956665039, -12.634086608886719, -11.762523651123047, -10.890959739685059, -10.019396781921387, -9.147832870483398, -8.276269912719727, -7.404706001281738, -6.53314208984375, -5.66157865524292, -4.79001522064209, -3.9184517860412598, -3.0468881130218506, -2.1753244400024414, -1.3037610054016113, -0.43219757080078125, 0.43936634063720703, 1.310929775238037, 2.182493209838867, 3.0540566444396973, 3.9256203174591064, 4.797183990478516, 5.668747425079346, 6.540310859680176, 7.411874771118164, 8.283437728881836, 9.155001640319824, 10.026565551757812, 10.898128509521484, 11.769692420959473, 12.641256332397461, 13.512819290161133, 14.384383201599121, 15.25594711303711, 16.12751007080078, 16.999073028564453, 17.870637893676758, 18.74220085144043, 19.6137638092041, 20.485328674316406, 21.356891632080078, 22.22845458984375, 23.100017547607422, 23.971580505371094, 24.8431453704834, 25.71470832824707, 26.586271286010742, 27.457836151123047, 28.32939910888672, 29.20096206665039, 30.072526931762695]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 9.0, 15.0, 18.0, 28.0, 37.0, 71.0, 95.0, 165.0, 217.0, 344.0, 524.0, 733.0, 1157.0, 1699.0, 2614.0, 3939.0, 5976.0, 9204.0, 14587.0, 22455.0, 34937.0, 54133.0, 84059.0, 128716.0, 192566.0, 276622.0, 371909.0, 459375.0, 509053.0, 499611.0, 438015.0, 341931.0, 249285.0, 169977.0, 113674.0, 73487.0, 47401.0, 30724.0, 19276.0, 12560.0, 8177.0, 5100.0, 3315.0, 2196.0, 1448.0, 987.0, 668.0, 407.0, 273.0, 181.0, 109.0, 76.0, 57.0, 42.0, 29.0, 15.0, 8.0, 3.0, 1.0, 1.0], "bins": [-15.8203125, -15.338623046875, -14.85693359375, -14.375244140625, -13.8935546875, -13.411865234375, -12.93017578125, -12.448486328125, -11.966796875, -11.485107421875, -11.00341796875, -10.521728515625, -10.0400390625, -9.558349609375, -9.07666015625, -8.594970703125, -8.11328125, -7.631591796875, -7.14990234375, -6.668212890625, -6.1865234375, -5.704833984375, -5.22314453125, -4.741455078125, -4.259765625, -3.778076171875, -3.29638671875, -2.814697265625, -2.3330078125, -1.851318359375, -1.36962890625, -0.887939453125, -0.40625, 0.075439453125, 0.55712890625, 1.038818359375, 1.5205078125, 2.002197265625, 2.48388671875, 2.965576171875, 3.447265625, 3.928955078125, 4.41064453125, 4.892333984375, 5.3740234375, 5.855712890625, 6.33740234375, 6.819091796875, 7.30078125, 7.782470703125, 8.26416015625, 8.745849609375, 9.2275390625, 9.709228515625, 10.19091796875, 10.672607421875, 11.154296875, 11.635986328125, 12.11767578125, 12.599365234375, 13.0810546875, 13.562744140625, 14.04443359375, 14.526123046875, 15.0078125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 6.0, 8.0, 16.0, 17.0, 14.0, 24.0, 17.0, 18.0, 30.0, 29.0, 24.0, 46.0, 44.0, 39.0, 38.0, 44.0, 28.0, 44.0, 44.0, 40.0, 35.0, 41.0, 27.0, 37.0, 33.0, 39.0, 22.0, 34.0, 26.0, 18.0, 21.0, 11.0, 13.0, 10.0, 7.0, 11.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -20.3583984375, -19.669921875, -18.9814453125, -18.29296875, -17.6044921875, -16.916015625, -16.2275390625, -15.5390625, -14.8505859375, -14.162109375, -13.4736328125, -12.78515625, -12.0966796875, -11.408203125, -10.7197265625, -10.03125, -9.3427734375, -8.654296875, -7.9658203125, -7.27734375, -6.5888671875, -5.900390625, -5.2119140625, -4.5234375, -3.8349609375, -3.146484375, -2.4580078125, -1.76953125, -1.0810546875, -0.392578125, 0.2958984375, 0.984375, 1.6728515625, 2.361328125, 3.0498046875, 3.73828125, 4.4267578125, 5.115234375, 5.8037109375, 6.4921875, 7.1806640625, 7.869140625, 8.5576171875, 9.24609375, 9.9345703125, 10.623046875, 11.3115234375, 12.0, 12.6884765625, 13.376953125, 14.0654296875, 14.75390625, 15.4423828125, 16.130859375, 16.8193359375, 17.5078125, 18.1962890625, 18.884765625, 19.5732421875, 20.26171875, 20.9501953125, 21.638671875, 22.3271484375, 23.015625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 18.0, 24.0, 44.0, 61.0, 99.0, 169.0, 265.0, 425.0, 703.0, 1219.0, 2021.0, 3275.0, 5557.0, 9196.0, 15272.0, 25905.0, 42696.0, 68875.0, 110974.0, 171648.0, 254881.0, 352463.0, 453136.0, 518332.0, 524795.0, 470715.0, 376972.0, 275848.0, 189614.0, 123356.0, 76990.0, 47241.0, 28371.0, 17201.0, 10370.0, 6153.0, 3697.0, 2249.0, 1338.0, 852.0, 445.0, 322.0, 204.0, 102.0, 78.0, 41.0, 30.0, 14.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.078125, -16.510986328125, -15.94384765625, -15.376708984375, -14.8095703125, -14.242431640625, -13.67529296875, -13.108154296875, -12.541015625, -11.973876953125, -11.40673828125, -10.839599609375, -10.2724609375, -9.705322265625, -9.13818359375, -8.571044921875, -8.00390625, -7.436767578125, -6.86962890625, -6.302490234375, -5.7353515625, -5.168212890625, -4.60107421875, -4.033935546875, -3.466796875, -2.899658203125, -2.33251953125, -1.765380859375, -1.1982421875, -0.631103515625, -0.06396484375, 0.503173828125, 1.0703125, 1.637451171875, 2.20458984375, 2.771728515625, 3.3388671875, 3.906005859375, 4.47314453125, 5.040283203125, 5.607421875, 6.174560546875, 6.74169921875, 7.308837890625, 7.8759765625, 8.443115234375, 9.01025390625, 9.577392578125, 10.14453125, 10.711669921875, 11.27880859375, 11.845947265625, 12.4130859375, 12.980224609375, 13.54736328125, 14.114501953125, 14.681640625, 15.248779296875, 15.81591796875, 16.383056640625, 16.9501953125, 17.517333984375, 18.08447265625, 18.651611328125, 19.21875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 15.0, 12.0, 25.0, 31.0, 38.0, 41.0, 47.0, 70.0, 82.0, 122.0, 116.0, 131.0, 168.0, 171.0, 180.0, 206.0, 230.0, 222.0, 228.0, 232.0, 202.0, 221.0, 212.0, 160.0, 136.0, 141.0, 123.0, 96.0, 86.0, 61.0, 56.0, 36.0, 44.0, 24.0, 16.0, 21.0, 12.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.265625, -10.949462890625, -10.63330078125, -10.317138671875, -10.0009765625, -9.684814453125, -9.36865234375, -9.052490234375, -8.736328125, -8.420166015625, -8.10400390625, -7.787841796875, -7.4716796875, -7.155517578125, -6.83935546875, -6.523193359375, -6.20703125, -5.890869140625, -5.57470703125, -5.258544921875, -4.9423828125, -4.626220703125, -4.31005859375, -3.993896484375, -3.677734375, -3.361572265625, -3.04541015625, -2.729248046875, -2.4130859375, -2.096923828125, -1.78076171875, -1.464599609375, -1.1484375, -0.832275390625, -0.51611328125, -0.199951171875, 0.1162109375, 0.432373046875, 0.74853515625, 1.064697265625, 1.380859375, 1.697021484375, 2.01318359375, 2.329345703125, 2.6455078125, 2.961669921875, 3.27783203125, 3.593994140625, 3.91015625, 4.226318359375, 4.54248046875, 4.858642578125, 5.1748046875, 5.490966796875, 5.80712890625, 6.123291015625, 6.439453125, 6.755615234375, 7.07177734375, 7.387939453125, 7.7041015625, 8.020263671875, 8.33642578125, 8.652587890625, 8.96875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 6.0, 8.0, 9.0, 20.0, 18.0, 19.0, 25.0, 29.0, 42.0, 33.0, 44.0, 48.0, 57.0, 63.0, 44.0, 57.0, 75.0, 59.0, 38.0, 51.0, 48.0, 42.0, 36.0, 23.0, 26.0, 22.0, 12.0, 18.0, 6.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.37006950378418, -26.518503189086914, -25.66693687438965, -24.815372467041016, -23.96380615234375, -23.112239837646484, -22.26067352294922, -21.409107208251953, -20.557540893554688, -19.705974578857422, -18.854408264160156, -18.00284194946289, -17.151277542114258, -16.299711227416992, -15.448144912719727, -14.596578598022461, -13.745014190673828, -12.893447875976562, -12.041882514953613, -11.190316200256348, -10.338750839233398, -9.487184524536133, -8.635618209838867, -7.78405237197876, -6.932486534118652, -6.080920696258545, -5.2293548583984375, -4.377788543701172, -3.5262227058410645, -2.674656867980957, -1.8230905532836914, -0.971524715423584, -0.11995697021484375, 0.7316089868545532, 1.5831749439239502, 2.4347410202026367, 3.286306858062744, 4.137872695922852, 4.989439010620117, 5.841004848480225, 6.692570686340332, 7.5441365242004395, 8.395702362060547, 9.247268676757812, 10.098834991455078, 10.950400352478027, 11.801966667175293, 12.653532028198242, 13.505098342895508, 14.356664657592773, 15.208230018615723, 16.059795379638672, 16.911361694335938, 17.762928009033203, 18.61449432373047, 19.466060638427734, 20.317626953125, 21.169193267822266, 22.02075958251953, 22.872325897216797, 23.72389030456543, 24.575456619262695, 25.42702293395996, 26.278589248657227, 27.13015365600586]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 10.0, 7.0, 10.0, 15.0, 12.0, 20.0, 24.0, 17.0, 23.0, 24.0, 35.0, 44.0, 39.0, 36.0, 49.0, 39.0, 49.0, 36.0, 51.0, 37.0, 45.0, 31.0, 33.0, 46.0, 30.0, 35.0, 35.0, 30.0, 17.0, 26.0, 21.0, 13.0, 9.0, 9.0, 7.0, 6.0, 6.0, 9.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.633066177368164, -26.737417221069336, -25.841766357421875, -24.946117401123047, -24.050466537475586, -23.154817581176758, -22.259166717529297, -21.36351776123047, -20.46786880493164, -19.572219848632812, -18.67656898498535, -17.780920028686523, -16.885269165039062, -15.989620208740234, -15.09397029876709, -14.198320388793945, -13.302669525146484, -12.40701961517334, -11.511369705200195, -10.615720748901367, -9.720069885253906, -8.824420928955078, -7.928771018981934, -7.033121109008789, -6.1374711990356445, -5.2418212890625, -4.3461713790893555, -3.450521945953369, -2.5548720359802246, -1.65922212600708, -0.7635726928710938, 0.13207721710205078, 1.0277271270751953, 1.9233769178390503, 2.8190267086029053, 3.7146763801574707, 4.610326290130615, 5.50597620010376, 6.401625633239746, 7.297275543212891, 8.192925453186035, 9.08857536315918, 9.984225273132324, 10.879875183105469, 11.775524139404297, 12.671175003051758, 13.566823959350586, 14.46247386932373, 15.358123779296875, 16.253772735595703, 17.149423599243164, 18.045072555541992, 18.940723419189453, 19.83637237548828, 20.73202133178711, 21.62767219543457, 22.52332305908203, 23.41897201538086, 24.31462287902832, 25.21027183532715, 26.10592269897461, 27.001571655273438, 27.897220611572266, 28.792871475219727, 29.688520431518555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 7.0, 10.0, 16.0, 25.0, 38.0, 54.0, 91.0, 134.0, 222.0, 311.0, 523.0, 893.0, 1448.0, 2490.0, 4140.0, 7341.0, 13552.0, 24793.0, 45578.0, 81096.0, 129538.0, 175944.0, 185125.0, 149756.0, 98136.0, 57032.0, 31259.0, 16916.0, 9204.0, 5197.0, 3033.0, 1754.0, 1122.0, 635.0, 407.0, 295.0, 141.0, 89.0, 61.0, 53.0, 36.0, 23.0, 15.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1669921875, -8.841796875, -8.5166015625, -8.19140625, -7.8662109375, -7.541015625, -7.2158203125, -6.890625, -6.5654296875, -6.240234375, -5.9150390625, -5.58984375, -5.2646484375, -4.939453125, -4.6142578125, -4.2890625, -3.9638671875, -3.638671875, -3.3134765625, -2.98828125, -2.6630859375, -2.337890625, -2.0126953125, -1.6875, -1.3623046875, -1.037109375, -0.7119140625, -0.38671875, -0.0615234375, 0.263671875, 0.5888671875, 0.9140625, 1.2392578125, 1.564453125, 1.8896484375, 2.21484375, 2.5400390625, 2.865234375, 3.1904296875, 3.515625, 3.8408203125, 4.166015625, 4.4912109375, 4.81640625, 5.1416015625, 5.466796875, 5.7919921875, 6.1171875, 6.4423828125, 6.767578125, 7.0927734375, 7.41796875, 7.7431640625, 8.068359375, 8.3935546875, 8.71875, 9.0439453125, 9.369140625, 9.6943359375, 10.01953125, 10.3447265625, 10.669921875, 10.9951171875, 11.3203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 7.0, 9.0, 9.0, 9.0, 12.0, 13.0, 14.0, 21.0, 23.0, 28.0, 33.0, 35.0, 40.0, 40.0, 45.0, 40.0, 36.0, 50.0, 47.0, 43.0, 46.0, 41.0, 43.0, 54.0, 37.0, 31.0, 38.0, 25.0, 18.0, 24.0, 22.0, 17.0, 9.0, 5.0, 9.0, 8.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.242919921875, -28.28271484375, -27.322509765625, -26.3623046875, -25.402099609375, -24.44189453125, -23.481689453125, -22.521484375, -21.561279296875, -20.60107421875, -19.640869140625, -18.6806640625, -17.720458984375, -16.76025390625, -15.800048828125, -14.83984375, -13.879638671875, -12.91943359375, -11.959228515625, -10.9990234375, -10.038818359375, -9.07861328125, -8.118408203125, -7.158203125, -6.197998046875, -5.23779296875, -4.277587890625, -3.3173828125, -2.357177734375, -1.39697265625, -0.436767578125, 0.5234375, 1.483642578125, 2.44384765625, 3.404052734375, 4.3642578125, 5.324462890625, 6.28466796875, 7.244873046875, 8.205078125, 9.165283203125, 10.12548828125, 11.085693359375, 12.0458984375, 13.006103515625, 13.96630859375, 14.926513671875, 15.88671875, 16.846923828125, 17.80712890625, 18.767333984375, 19.7275390625, 20.687744140625, 21.64794921875, 22.608154296875, 23.568359375, 24.528564453125, 25.48876953125, 26.448974609375, 27.4091796875, 28.369384765625, 29.32958984375, 30.289794921875, 31.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 9.0, 11.0, 20.0, 14.0, 21.0, 44.0, 59.0, 97.0, 120.0, 187.0, 266.0, 464.0, 782.0, 1297.0, 2332.0, 4314.0, 8182.0, 16938.0, 34467.0, 70952.0, 134677.0, 211436.0, 227438.0, 160098.0, 86996.0, 43723.0, 20868.0, 10523.0, 5397.0, 2874.0, 1541.0, 919.0, 498.0, 370.0, 204.0, 129.0, 90.0, 66.0, 40.0, 34.0, 27.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.9581298828125, -11.533447265625, -11.1087646484375, -10.68408203125, -10.2593994140625, -9.834716796875, -9.4100341796875, -8.9853515625, -8.5606689453125, -8.135986328125, -7.7113037109375, -7.28662109375, -6.8619384765625, -6.437255859375, -6.0125732421875, -5.587890625, -5.1632080078125, -4.738525390625, -4.3138427734375, -3.88916015625, -3.4644775390625, -3.039794921875, -2.6151123046875, -2.1904296875, -1.7657470703125, -1.341064453125, -0.9163818359375, -0.49169921875, -0.0670166015625, 0.357666015625, 0.7823486328125, 1.20703125, 1.6317138671875, 2.056396484375, 2.4810791015625, 2.90576171875, 3.3304443359375, 3.755126953125, 4.1798095703125, 4.6044921875, 5.0291748046875, 5.453857421875, 5.8785400390625, 6.30322265625, 6.7279052734375, 7.152587890625, 7.5772705078125, 8.001953125, 8.4266357421875, 8.851318359375, 9.2760009765625, 9.70068359375, 10.1253662109375, 10.550048828125, 10.9747314453125, 11.3994140625, 11.8240966796875, 12.248779296875, 12.6734619140625, 13.09814453125, 13.5228271484375, 13.947509765625, 14.3721923828125, 14.796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 10.0, 7.0, 12.0, 11.0, 6.0, 12.0, 20.0, 14.0, 14.0, 26.0, 22.0, 24.0, 32.0, 37.0, 27.0, 35.0, 29.0, 38.0, 30.0, 32.0, 38.0, 35.0, 49.0, 29.0, 38.0, 27.0, 34.0, 28.0, 32.0, 23.0, 17.0, 17.0, 22.0, 23.0, 19.0, 22.0, 16.0, 13.0, 10.0, 8.0, 11.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-14.4453125, -13.98779296875, -13.5302734375, -13.07275390625, -12.615234375, -12.15771484375, -11.7001953125, -11.24267578125, -10.78515625, -10.32763671875, -9.8701171875, -9.41259765625, -8.955078125, -8.49755859375, -8.0400390625, -7.58251953125, -7.125, -6.66748046875, -6.2099609375, -5.75244140625, -5.294921875, -4.83740234375, -4.3798828125, -3.92236328125, -3.46484375, -3.00732421875, -2.5498046875, -2.09228515625, -1.634765625, -1.17724609375, -0.7197265625, -0.26220703125, 0.1953125, 0.65283203125, 1.1103515625, 1.56787109375, 2.025390625, 2.48291015625, 2.9404296875, 3.39794921875, 3.85546875, 4.31298828125, 4.7705078125, 5.22802734375, 5.685546875, 6.14306640625, 6.6005859375, 7.05810546875, 7.515625, 7.97314453125, 8.4306640625, 8.88818359375, 9.345703125, 9.80322265625, 10.2607421875, 10.71826171875, 11.17578125, 11.63330078125, 12.0908203125, 12.54833984375, 13.005859375, 13.46337890625, 13.9208984375, 14.37841796875, 14.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 12.0, 39.0, 41.0, 75.0, 114.0, 160.0, 248.0, 414.0, 610.0, 1119.0, 2096.0, 4241.0, 9490.0, 23514.0, 65261.0, 180533.0, 345773.0, 255161.0, 98798.0, 35099.0, 13480.0, 5876.0, 2738.0, 1431.0, 813.0, 475.0, 302.0, 196.0, 139.0, 83.0, 47.0, 47.0, 38.0, 18.0, 13.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.09747314453125, -6.8316650390625, -6.56585693359375, -6.300048828125, -6.03424072265625, -5.7684326171875, -5.50262451171875, -5.23681640625, -4.97100830078125, -4.7052001953125, -4.43939208984375, -4.173583984375, -3.90777587890625, -3.6419677734375, -3.37615966796875, -3.1103515625, -2.84454345703125, -2.5787353515625, -2.31292724609375, -2.047119140625, -1.78131103515625, -1.5155029296875, -1.24969482421875, -0.98388671875, -0.71807861328125, -0.4522705078125, -0.18646240234375, 0.079345703125, 0.34515380859375, 0.6109619140625, 0.87677001953125, 1.142578125, 1.40838623046875, 1.6741943359375, 1.94000244140625, 2.205810546875, 2.47161865234375, 2.7374267578125, 3.00323486328125, 3.26904296875, 3.53485107421875, 3.8006591796875, 4.06646728515625, 4.332275390625, 4.59808349609375, 4.8638916015625, 5.12969970703125, 5.3955078125, 5.66131591796875, 5.9271240234375, 6.19293212890625, 6.458740234375, 6.72454833984375, 6.9903564453125, 7.25616455078125, 7.52197265625, 7.78778076171875, 8.0535888671875, 8.31939697265625, 8.585205078125, 8.85101318359375, 9.1168212890625, 9.38262939453125, 9.6484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 23.0, 27.0, 56.0, 51.0, 79.0, 97.0, 133.0, 117.0, 110.0, 86.0, 68.0, 48.0, 35.0, 25.0, 12.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005540847778320312, -0.0005336850881576538, -0.0005132853984832764, -0.0004928857088088989, -0.0004724860191345215, -0.00045208632946014404, -0.0004316866397857666, -0.00041128695011138916, -0.0003908872604370117, -0.0003704875707626343, -0.00035008788108825684, -0.0003296881914138794, -0.00030928850173950195, -0.0002888888120651245, -0.00026848912239074707, -0.00024808943271636963, -0.0002276897430419922, -0.00020729005336761475, -0.0001868903636932373, -0.00016649067401885986, -0.00014609098434448242, -0.00012569129467010498, -0.00010529160499572754, -8.48919153213501e-05, -6.449222564697266e-05, -4.4092535972595215e-05, -2.3692846298217773e-05, -3.293156623840332e-06, 1.710653305053711e-05, 3.750622272491455e-05, 5.790591239929199e-05, 7.830560207366943e-05, 9.870529174804688e-05, 0.00011910498142242432, 0.00013950467109680176, 0.0001599043607711792, 0.00018030405044555664, 0.00020070374011993408, 0.00022110342979431152, 0.00024150311946868896, 0.0002619028091430664, 0.00028230249881744385, 0.0003027021884918213, 0.00032310187816619873, 0.00034350156784057617, 0.0003639012575149536, 0.00038430094718933105, 0.0004047006368637085, 0.00042510032653808594, 0.0004455000162124634, 0.0004658997058868408, 0.00048629939556121826, 0.0005066990852355957, 0.0005270987749099731, 0.0005474984645843506, 0.000567898154258728, 0.0005882978439331055, 0.0006086975336074829, 0.0006290972232818604, 0.0006494969129562378, 0.0006698966026306152, 0.0006902962923049927, 0.0007106959819793701, 0.0007310956716537476, 0.000751495361328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 9.0, 13.0, 17.0, 27.0, 24.0, 56.0, 79.0, 102.0, 152.0, 236.0, 341.0, 502.0, 712.0, 1120.0, 1767.0, 2736.0, 4410.0, 7496.0, 13014.0, 22576.0, 40265.0, 68789.0, 110885.0, 155887.0, 177900.0, 157872.0, 113513.0, 70501.0, 40869.0, 23352.0, 13168.0, 7556.0, 4597.0, 2887.0, 1656.0, 1143.0, 734.0, 479.0, 328.0, 214.0, 187.0, 127.0, 81.0, 60.0, 34.0, 30.0, 18.0, 11.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.14453125, -4.9813232421875, -4.818115234375, -4.6549072265625, -4.49169921875, -4.3284912109375, -4.165283203125, -4.0020751953125, -3.8388671875, -3.6756591796875, -3.512451171875, -3.3492431640625, -3.18603515625, -3.0228271484375, -2.859619140625, -2.6964111328125, -2.533203125, -2.3699951171875, -2.206787109375, -2.0435791015625, -1.88037109375, -1.7171630859375, -1.553955078125, -1.3907470703125, -1.2275390625, -1.0643310546875, -0.901123046875, -0.7379150390625, -0.57470703125, -0.4114990234375, -0.248291015625, -0.0850830078125, 0.078125, 0.2413330078125, 0.404541015625, 0.5677490234375, 0.73095703125, 0.8941650390625, 1.057373046875, 1.2205810546875, 1.3837890625, 1.5469970703125, 1.710205078125, 1.8734130859375, 2.03662109375, 2.1998291015625, 2.363037109375, 2.5262451171875, 2.689453125, 2.8526611328125, 3.015869140625, 3.1790771484375, 3.34228515625, 3.5054931640625, 3.668701171875, 3.8319091796875, 3.9951171875, 4.1583251953125, 4.321533203125, 4.4847412109375, 4.64794921875, 4.8111572265625, 4.974365234375, 5.1375732421875, 5.30078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 22.0, 30.0, 40.0, 55.0, 51.0, 51.0, 50.0, 57.0, 82.0, 58.0, 76.0, 87.0, 44.0, 59.0, 39.0, 42.0, 26.0, 27.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.874847412109375, -2.79071044921875, -2.706573486328125, -2.6224365234375, -2.538299560546875, -2.45416259765625, -2.370025634765625, -2.285888671875, -2.201751708984375, -2.11761474609375, -2.033477783203125, -1.9493408203125, -1.865203857421875, -1.78106689453125, -1.696929931640625, -1.61279296875, -1.528656005859375, -1.44451904296875, -1.360382080078125, -1.2762451171875, -1.192108154296875, -1.10797119140625, -1.023834228515625, -0.939697265625, -0.855560302734375, -0.77142333984375, -0.687286376953125, -0.6031494140625, -0.519012451171875, -0.43487548828125, -0.350738525390625, -0.2666015625, -0.182464599609375, -0.09832763671875, -0.014190673828125, 0.0699462890625, 0.154083251953125, 0.23822021484375, 0.322357177734375, 0.406494140625, 0.490631103515625, 0.57476806640625, 0.658905029296875, 0.7430419921875, 0.827178955078125, 0.91131591796875, 0.995452880859375, 1.07958984375, 1.163726806640625, 1.24786376953125, 1.332000732421875, 1.4161376953125, 1.500274658203125, 1.58441162109375, 1.668548583984375, 1.752685546875, 1.836822509765625, 1.92095947265625, 2.005096435546875, 2.0892333984375, 2.173370361328125, 2.25750732421875, 2.341644287109375, 2.42578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 12.0, 12.0, 13.0, 18.0, 20.0, 22.0, 24.0, 40.0, 41.0, 40.0, 43.0, 48.0, 66.0, 51.0, 60.0, 60.0, 66.0, 48.0, 45.0, 44.0, 50.0, 31.0, 24.0, 24.0, 23.0, 16.0, 15.0, 12.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.589956283569336, -26.762981414794922, -25.936006546020508, -25.109031677246094, -24.28205680847168, -23.455081939697266, -22.62810707092285, -21.801132202148438, -20.974157333374023, -20.14718246459961, -19.320207595825195, -18.49323272705078, -17.666257858276367, -16.839282989501953, -16.01230812072754, -15.185333251953125, -14.358358383178711, -13.531383514404297, -12.704408645629883, -11.877433776855469, -11.050458908081055, -10.22348403930664, -9.396509170532227, -8.569534301757812, -7.742559432983398, -6.915584564208984, -6.08860969543457, -5.261634826660156, -4.434659957885742, -3.607685089111328, -2.780710220336914, -1.9537353515625, -1.1267585754394531, -0.29978370666503906, 0.527191162109375, 1.354166030883789, 2.181140899658203, 3.008115768432617, 3.8350906372070312, 4.662065505981445, 5.489040374755859, 6.316015243530273, 7.1429901123046875, 7.969964981079102, 8.796939849853516, 9.62391471862793, 10.450889587402344, 11.277864456176758, 12.104839324951172, 12.931814193725586, 13.7587890625, 14.585763931274414, 15.412738800048828, 16.239713668823242, 17.066688537597656, 17.89366340637207, 18.720638275146484, 19.5476131439209, 20.374588012695312, 21.201562881469727, 22.02853775024414, 22.855512619018555, 23.68248748779297, 24.509462356567383, 25.336437225341797]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 8.0, 14.0, 16.0, 21.0, 21.0, 22.0, 19.0, 34.0, 28.0, 43.0, 42.0, 45.0, 43.0, 43.0, 40.0, 47.0, 35.0, 47.0, 45.0, 32.0, 31.0, 42.0, 30.0, 39.0, 30.0, 24.0, 29.0, 19.0, 22.0, 8.0, 11.0, 9.0, 7.0, 6.0, 4.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.389484405517578, -26.497068405151367, -25.604652404785156, -24.712234497070312, -23.8198184967041, -22.92740249633789, -22.03498649597168, -21.14257049560547, -20.250152587890625, -19.357736587524414, -18.465320587158203, -17.57290267944336, -16.68048667907715, -15.788070678710938, -14.895654678344727, -14.003238677978516, -13.110822677612305, -12.218406677246094, -11.325989723205566, -10.433573722839355, -9.541156768798828, -8.648740768432617, -7.756324768066406, -6.863908290863037, -5.971491813659668, -5.079075336456299, -4.18665885925293, -3.2942428588867188, -2.4018263816833496, -1.5094099044799805, -0.6169939041137695, 0.2754225730895996, 1.167837142944336, 2.060253620147705, 2.952669858932495, 3.845086097717285, 4.737502574920654, 5.629919052124023, 6.522335052490234, 7.4147515296936035, 8.307168006896973, 9.199584007263184, 10.092000961303711, 10.984416961669922, 11.876832962036133, 12.76924991607666, 13.661665916442871, 14.554082870483398, 15.44649887084961, 16.33891487121582, 17.23133087158203, 18.123748779296875, 19.016164779663086, 19.908580780029297, 20.800996780395508, 21.69341278076172, 22.585830688476562, 23.478246688842773, 24.370662689208984, 25.263080596923828, 26.15549659729004, 27.04791259765625, 27.94032859802246, 28.832744598388672, 29.725160598754883]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 18.0, 15.0, 35.0, 50.0, 91.0, 145.0, 211.0, 298.0, 467.0, 754.0, 1206.0, 1795.0, 2944.0, 4648.0, 7411.0, 11607.0, 18106.0, 27342.0, 39803.0, 56225.0, 75072.0, 93928.0, 108251.0, 114222.0, 110976.0, 98767.0, 80435.0, 62008.0, 44558.0, 30204.0, 20233.0, 13252.0, 8549.0, 5500.0, 3399.0, 2204.0, 1389.0, 904.0, 555.0, 367.0, 209.0, 149.0, 106.0, 44.0, 43.0, 19.0, 19.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-14.171875, -13.750732421875, -13.32958984375, -12.908447265625, -12.4873046875, -12.066162109375, -11.64501953125, -11.223876953125, -10.802734375, -10.381591796875, -9.96044921875, -9.539306640625, -9.1181640625, -8.697021484375, -8.27587890625, -7.854736328125, -7.43359375, -7.012451171875, -6.59130859375, -6.170166015625, -5.7490234375, -5.327880859375, -4.90673828125, -4.485595703125, -4.064453125, -3.643310546875, -3.22216796875, -2.801025390625, -2.3798828125, -1.958740234375, -1.53759765625, -1.116455078125, -0.6953125, -0.274169921875, 0.14697265625, 0.568115234375, 0.9892578125, 1.410400390625, 1.83154296875, 2.252685546875, 2.673828125, 3.094970703125, 3.51611328125, 3.937255859375, 4.3583984375, 4.779541015625, 5.20068359375, 5.621826171875, 6.04296875, 6.464111328125, 6.88525390625, 7.306396484375, 7.7275390625, 8.148681640625, 8.56982421875, 8.990966796875, 9.412109375, 9.833251953125, 10.25439453125, 10.675537109375, 11.0966796875, 11.517822265625, 11.93896484375, 12.360107421875, 12.78125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 9.0, 23.0, 20.0, 19.0, 14.0, 25.0, 29.0, 38.0, 43.0, 43.0, 41.0, 32.0, 42.0, 40.0, 45.0, 34.0, 32.0, 38.0, 29.0, 39.0, 37.0, 29.0, 41.0, 25.0, 37.0, 23.0, 22.0, 18.0, 16.0, 16.0, 7.0, 8.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.46875, -27.6279296875, -26.787109375, -25.9462890625, -25.10546875, -24.2646484375, -23.423828125, -22.5830078125, -21.7421875, -20.9013671875, -20.060546875, -19.2197265625, -18.37890625, -17.5380859375, -16.697265625, -15.8564453125, -15.015625, -14.1748046875, -13.333984375, -12.4931640625, -11.65234375, -10.8115234375, -9.970703125, -9.1298828125, -8.2890625, -7.4482421875, -6.607421875, -5.7666015625, -4.92578125, -4.0849609375, -3.244140625, -2.4033203125, -1.5625, -0.7216796875, 0.119140625, 0.9599609375, 1.80078125, 2.6416015625, 3.482421875, 4.3232421875, 5.1640625, 6.0048828125, 6.845703125, 7.6865234375, 8.52734375, 9.3681640625, 10.208984375, 11.0498046875, 11.890625, 12.7314453125, 13.572265625, 14.4130859375, 15.25390625, 16.0947265625, 16.935546875, 17.7763671875, 18.6171875, 19.4580078125, 20.298828125, 21.1396484375, 21.98046875, 22.8212890625, 23.662109375, 24.5029296875, 25.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 15.0, 30.0, 41.0, 87.0, 148.0, 248.0, 398.0, 666.0, 1114.0, 1877.0, 3122.0, 5228.0, 8603.0, 14106.0, 22449.0, 35812.0, 52911.0, 75404.0, 98076.0, 118563.0, 127004.0, 122036.0, 106114.0, 83835.0, 60379.0, 41133.0, 26722.0, 16744.0, 10234.0, 6217.0, 3681.0, 2201.0, 1385.0, 790.0, 452.0, 289.0, 158.0, 90.0, 79.0, 44.0, 23.0, 15.0, 6.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4140625, -13.9283447265625, -13.442626953125, -12.9569091796875, -12.47119140625, -11.9854736328125, -11.499755859375, -11.0140380859375, -10.5283203125, -10.0426025390625, -9.556884765625, -9.0711669921875, -8.58544921875, -8.0997314453125, -7.614013671875, -7.1282958984375, -6.642578125, -6.1568603515625, -5.671142578125, -5.1854248046875, -4.69970703125, -4.2139892578125, -3.728271484375, -3.2425537109375, -2.7568359375, -2.2711181640625, -1.785400390625, -1.2996826171875, -0.81396484375, -0.3282470703125, 0.157470703125, 0.6431884765625, 1.12890625, 1.6146240234375, 2.100341796875, 2.5860595703125, 3.07177734375, 3.5574951171875, 4.043212890625, 4.5289306640625, 5.0146484375, 5.5003662109375, 5.986083984375, 6.4718017578125, 6.95751953125, 7.4432373046875, 7.928955078125, 8.4146728515625, 8.900390625, 9.3861083984375, 9.871826171875, 10.3575439453125, 10.84326171875, 11.3289794921875, 11.814697265625, 12.3004150390625, 12.7861328125, 13.2718505859375, 13.757568359375, 14.2432861328125, 14.72900390625, 15.2147216796875, 15.700439453125, 16.1861572265625, 16.671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 8.0, 5.0, 9.0, 11.0, 17.0, 14.0, 18.0, 22.0, 28.0, 21.0, 35.0, 43.0, 32.0, 31.0, 37.0, 28.0, 42.0, 48.0, 40.0, 31.0, 47.0, 37.0, 41.0, 38.0, 41.0, 33.0, 23.0, 28.0, 20.0, 34.0, 25.0, 18.0, 15.0, 17.0, 8.0, 12.0, 10.0, 3.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-17.90625, -17.364501953125, -16.82275390625, -16.281005859375, -15.7392578125, -15.197509765625, -14.65576171875, -14.114013671875, -13.572265625, -13.030517578125, -12.48876953125, -11.947021484375, -11.4052734375, -10.863525390625, -10.32177734375, -9.780029296875, -9.23828125, -8.696533203125, -8.15478515625, -7.613037109375, -7.0712890625, -6.529541015625, -5.98779296875, -5.446044921875, -4.904296875, -4.362548828125, -3.82080078125, -3.279052734375, -2.7373046875, -2.195556640625, -1.65380859375, -1.112060546875, -0.5703125, -0.028564453125, 0.51318359375, 1.054931640625, 1.5966796875, 2.138427734375, 2.68017578125, 3.221923828125, 3.763671875, 4.305419921875, 4.84716796875, 5.388916015625, 5.9306640625, 6.472412109375, 7.01416015625, 7.555908203125, 8.09765625, 8.639404296875, 9.18115234375, 9.722900390625, 10.2646484375, 10.806396484375, 11.34814453125, 11.889892578125, 12.431640625, 12.973388671875, 13.51513671875, 14.056884765625, 14.5986328125, 15.140380859375, 15.68212890625, 16.223876953125, 16.765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 11.0, 19.0, 31.0, 50.0, 72.0, 122.0, 193.0, 297.0, 459.0, 765.0, 1280.0, 2060.0, 3409.0, 6001.0, 10317.0, 16993.0, 29336.0, 48318.0, 75482.0, 109108.0, 138282.0, 150624.0, 140251.0, 111744.0, 78081.0, 50517.0, 30600.0, 18101.0, 10592.0, 6255.0, 3685.0, 2152.0, 1284.0, 751.0, 485.0, 299.0, 197.0, 123.0, 71.0, 48.0, 22.0, 18.0, 18.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.94921875, -7.69720458984375, -7.4451904296875, -7.19317626953125, -6.941162109375, -6.68914794921875, -6.4371337890625, -6.18511962890625, -5.93310546875, -5.68109130859375, -5.4290771484375, -5.17706298828125, -4.925048828125, -4.67303466796875, -4.4210205078125, -4.16900634765625, -3.9169921875, -3.66497802734375, -3.4129638671875, -3.16094970703125, -2.908935546875, -2.65692138671875, -2.4049072265625, -2.15289306640625, -1.90087890625, -1.64886474609375, -1.3968505859375, -1.14483642578125, -0.892822265625, -0.64080810546875, -0.3887939453125, -0.13677978515625, 0.115234375, 0.36724853515625, 0.6192626953125, 0.87127685546875, 1.123291015625, 1.37530517578125, 1.6273193359375, 1.87933349609375, 2.13134765625, 2.38336181640625, 2.6353759765625, 2.88739013671875, 3.139404296875, 3.39141845703125, 3.6434326171875, 3.89544677734375, 4.1474609375, 4.39947509765625, 4.6514892578125, 4.90350341796875, 5.155517578125, 5.40753173828125, 5.6595458984375, 5.91156005859375, 6.16357421875, 6.41558837890625, 6.6676025390625, 6.91961669921875, 7.171630859375, 7.42364501953125, 7.6756591796875, 7.92767333984375, 8.1796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 7.0, 7.0, 8.0, 10.0, 9.0, 17.0, 17.0, 22.0, 30.0, 44.0, 37.0, 33.0, 41.0, 38.0, 54.0, 54.0, 54.0, 60.0, 51.0, 50.0, 43.0, 36.0, 38.0, 29.0, 42.0, 36.0, 21.0, 25.0, 17.0, 15.0, 11.0, 8.0, 7.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006213188171386719, -0.0005975440144538879, -0.000573769211769104, -0.0005499944090843201, -0.0005262196063995361, -0.0005024448037147522, -0.00047867000102996826, -0.0004548951983451843, -0.0004311203956604004, -0.00040734559297561646, -0.0003835707902908325, -0.0003597959876060486, -0.00033602118492126465, -0.0003122463822364807, -0.0002884715795516968, -0.00026469677686691284, -0.0002409219741821289, -0.00021714717149734497, -0.00019337236881256104, -0.0001695975661277771, -0.00014582276344299316, -0.00012204796075820923, -9.827315807342529e-05, -7.449835538864136e-05, -5.072355270385742e-05, -2.6948750019073486e-05, -3.1739473342895508e-06, 2.0600855350494385e-05, 4.437565803527832e-05, 6.815046072006226e-05, 9.192526340484619e-05, 0.00011570006608963013, 0.00013947486877441406, 0.000163249671459198, 0.00018702447414398193, 0.00021079927682876587, 0.0002345740795135498, 0.00025834888219833374, 0.0002821236848831177, 0.0003058984875679016, 0.00032967329025268555, 0.0003534480929374695, 0.0003772228956222534, 0.00040099769830703735, 0.0004247725009918213, 0.0004485473036766052, 0.00047232210636138916, 0.0004960969090461731, 0.000519871711730957, 0.000543646514415741, 0.0005674213171005249, 0.0005911961197853088, 0.0006149709224700928, 0.0006387457251548767, 0.0006625205278396606, 0.0006862953305244446, 0.0007100701332092285, 0.0007338449358940125, 0.0007576197385787964, 0.0007813945412635803, 0.0008051693439483643, 0.0008289441466331482, 0.0008527189493179321, 0.0008764937520027161, 0.0009002685546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 7.0, 7.0, 20.0, 27.0, 32.0, 77.0, 92.0, 174.0, 312.0, 481.0, 873.0, 1470.0, 2512.0, 4097.0, 7118.0, 12032.0, 20158.0, 32855.0, 52319.0, 77329.0, 106317.0, 130790.0, 140676.0, 132279.0, 108470.0, 79052.0, 53330.0, 34188.0, 21103.0, 12685.0, 7328.0, 4177.0, 2526.0, 1499.0, 841.0, 493.0, 315.0, 196.0, 102.0, 77.0, 49.0, 31.0, 17.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.860107421875, -7.61083984375, -7.361572265625, -7.1123046875, -6.863037109375, -6.61376953125, -6.364501953125, -6.115234375, -5.865966796875, -5.61669921875, -5.367431640625, -5.1181640625, -4.868896484375, -4.61962890625, -4.370361328125, -4.12109375, -3.871826171875, -3.62255859375, -3.373291015625, -3.1240234375, -2.874755859375, -2.62548828125, -2.376220703125, -2.126953125, -1.877685546875, -1.62841796875, -1.379150390625, -1.1298828125, -0.880615234375, -0.63134765625, -0.382080078125, -0.1328125, 0.116455078125, 0.36572265625, 0.614990234375, 0.8642578125, 1.113525390625, 1.36279296875, 1.612060546875, 1.861328125, 2.110595703125, 2.35986328125, 2.609130859375, 2.8583984375, 3.107666015625, 3.35693359375, 3.606201171875, 3.85546875, 4.104736328125, 4.35400390625, 4.603271484375, 4.8525390625, 5.101806640625, 5.35107421875, 5.600341796875, 5.849609375, 6.098876953125, 6.34814453125, 6.597412109375, 6.8466796875, 7.095947265625, 7.34521484375, 7.594482421875, 7.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 4.0, 5.0, 10.0, 14.0, 12.0, 20.0, 24.0, 28.0, 38.0, 38.0, 50.0, 34.0, 63.0, 56.0, 62.0, 65.0, 55.0, 59.0, 53.0, 59.0, 44.0, 41.0, 33.0, 23.0, 25.0, 15.0, 10.0, 9.0, 8.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.78515625, -6.59808349609375, -6.4110107421875, -6.22393798828125, -6.036865234375, -5.84979248046875, -5.6627197265625, -5.47564697265625, -5.28857421875, -5.10150146484375, -4.9144287109375, -4.72735595703125, -4.540283203125, -4.35321044921875, -4.1661376953125, -3.97906494140625, -3.7919921875, -3.60491943359375, -3.4178466796875, -3.23077392578125, -3.043701171875, -2.85662841796875, -2.6695556640625, -2.48248291015625, -2.29541015625, -2.10833740234375, -1.9212646484375, -1.73419189453125, -1.547119140625, -1.36004638671875, -1.1729736328125, -0.98590087890625, -0.798828125, -0.61175537109375, -0.4246826171875, -0.23760986328125, -0.050537109375, 0.13653564453125, 0.3236083984375, 0.51068115234375, 0.69775390625, 0.88482666015625, 1.0718994140625, 1.25897216796875, 1.446044921875, 1.63311767578125, 1.8201904296875, 2.00726318359375, 2.1943359375, 2.38140869140625, 2.5684814453125, 2.75555419921875, 2.942626953125, 3.12969970703125, 3.3167724609375, 3.50384521484375, 3.69091796875, 3.87799072265625, 4.0650634765625, 4.25213623046875, 4.439208984375, 4.62628173828125, 4.8133544921875, 5.00042724609375, 5.1875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 17.0, 15.0, 16.0, 25.0, 22.0, 33.0, 26.0, 39.0, 39.0, 36.0, 43.0, 47.0, 48.0, 47.0, 58.0, 50.0, 44.0, 45.0, 41.0, 51.0, 45.0, 38.0, 27.0, 30.0, 25.0, 15.0, 7.0, 14.0, 8.0, 9.0, 4.0, 2.0, 4.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.082735061645508, -24.34210777282715, -23.601478576660156, -22.860851287841797, -22.120223999023438, -21.379596710205078, -20.638967514038086, -19.898340225219727, -19.157711029052734, -18.417083740234375, -17.676454544067383, -16.935827255249023, -16.195199966430664, -15.454571723937988, -14.713943481445312, -13.973316192626953, -13.232688903808594, -12.492060661315918, -11.751433372497559, -11.010805130004883, -10.270177841186523, -9.529549598693848, -8.788921356201172, -8.048294067382812, -7.307665824890137, -6.567038059234619, -5.826410293579102, -5.085782051086426, -4.345154285430908, -3.6045265197753906, -2.863898277282715, -2.1232705116271973, -1.3826427459716797, -0.6420148611068726, 0.09861302375793457, 0.8392410278320312, 1.5798687934875488, 2.3204965591430664, 3.061124801635742, 3.8017525672912598, 4.542380332946777, 5.283008098602295, 6.0236358642578125, 6.764264106750488, 7.504891872406006, 8.245519638061523, 8.9861478805542, 9.726776123046875, 10.467403411865234, 11.20803165435791, 11.94865894317627, 12.689287185668945, 13.429914474487305, 14.17054271697998, 14.911170959472656, 15.651798248291016, 16.392425537109375, 17.133052825927734, 17.873682022094727, 18.614309310913086, 19.354936599731445, 20.095565795898438, 20.836193084716797, 21.576820373535156, 22.31744956970215]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 14.0, 10.0, 10.0, 10.0, 22.0, 28.0, 28.0, 34.0, 29.0, 47.0, 40.0, 52.0, 49.0, 50.0, 49.0, 62.0, 43.0, 55.0, 52.0, 29.0, 39.0, 25.0, 34.0, 34.0, 34.0, 23.0, 17.0, 12.0, 11.0, 8.0, 12.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.29084587097168, -30.28542137145996, -29.279996871948242, -28.274572372436523, -27.269145965576172, -26.263721466064453, -25.258296966552734, -24.252872467041016, -23.247447967529297, -22.242023468017578, -21.23659896850586, -20.23117446899414, -19.225749969482422, -18.220325469970703, -17.21489906311035, -16.209474563598633, -15.204050064086914, -14.198625564575195, -13.193201065063477, -12.187775611877441, -11.182351112365723, -10.176926612854004, -9.171501159667969, -8.16607666015625, -7.160652160644531, -6.1552276611328125, -5.1498026847839355, -4.144377708435059, -3.13895320892334, -2.133528709411621, -1.1281037330627441, -0.12267875671386719, 0.8827438354492188, 1.8881685733795166, 2.8935933113098145, 3.8990180492401123, 4.90444278717041, 5.909867286682129, 6.915292263031006, 7.920717239379883, 8.926141738891602, 9.93156623840332, 10.936990737915039, 11.942416191101074, 12.947840690612793, 13.953265190124512, 14.958690643310547, 15.964115142822266, 16.969539642333984, 17.974964141845703, 18.980388641357422, 19.98581314086914, 20.99123764038086, 21.996662139892578, 23.00208854675293, 24.00751304626465, 25.012937545776367, 26.018362045288086, 27.023786544799805, 28.029211044311523, 29.034637451171875, 30.040061950683594, 31.045486450195312, 32.05091094970703, 33.05633544921875]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 15.0, 14.0, 13.0, 25.0, 58.0, 91.0, 147.0, 202.0, 351.0, 551.0, 937.0, 1466.0, 2518.0, 3955.0, 6564.0, 10963.0, 18473.0, 31939.0, 54351.0, 91820.0, 153668.0, 244579.0, 368679.0, 501541.0, 592878.0, 594663.0, 503892.0, 373500.0, 249029.0, 155709.0, 94419.0, 56068.0, 32989.0, 19146.0, 11726.0, 6949.0, 4114.0, 2356.0, 1480.0, 936.0, 553.0, 377.0, 227.0, 133.0, 78.0, 53.0, 28.0, 19.0, 19.0, 16.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.8583984375, -17.263671875, -16.6689453125, -16.07421875, -15.4794921875, -14.884765625, -14.2900390625, -13.6953125, -13.1005859375, -12.505859375, -11.9111328125, -11.31640625, -10.7216796875, -10.126953125, -9.5322265625, -8.9375, -8.3427734375, -7.748046875, -7.1533203125, -6.55859375, -5.9638671875, -5.369140625, -4.7744140625, -4.1796875, -3.5849609375, -2.990234375, -2.3955078125, -1.80078125, -1.2060546875, -0.611328125, -0.0166015625, 0.578125, 1.1728515625, 1.767578125, 2.3623046875, 2.95703125, 3.5517578125, 4.146484375, 4.7412109375, 5.3359375, 5.9306640625, 6.525390625, 7.1201171875, 7.71484375, 8.3095703125, 8.904296875, 9.4990234375, 10.09375, 10.6884765625, 11.283203125, 11.8779296875, 12.47265625, 13.0673828125, 13.662109375, 14.2568359375, 14.8515625, 15.4462890625, 16.041015625, 16.6357421875, 17.23046875, 17.8251953125, 18.419921875, 19.0146484375, 19.609375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 11.0, 12.0, 15.0, 19.0, 23.0, 36.0, 29.0, 36.0, 23.0, 24.0, 49.0, 46.0, 41.0, 37.0, 54.0, 38.0, 50.0, 44.0, 43.0, 41.0, 41.0, 23.0, 41.0, 27.0, 20.0, 30.0, 30.0, 15.0, 19.0, 11.0, 9.0, 4.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.27978515625, -21.5439453125, -20.80810546875, -20.072265625, -19.33642578125, -18.6005859375, -17.86474609375, -17.12890625, -16.39306640625, -15.6572265625, -14.92138671875, -14.185546875, -13.44970703125, -12.7138671875, -11.97802734375, -11.2421875, -10.50634765625, -9.7705078125, -9.03466796875, -8.298828125, -7.56298828125, -6.8271484375, -6.09130859375, -5.35546875, -4.61962890625, -3.8837890625, -3.14794921875, -2.412109375, -1.67626953125, -0.9404296875, -0.20458984375, 0.53125, 1.26708984375, 2.0029296875, 2.73876953125, 3.474609375, 4.21044921875, 4.9462890625, 5.68212890625, 6.41796875, 7.15380859375, 7.8896484375, 8.62548828125, 9.361328125, 10.09716796875, 10.8330078125, 11.56884765625, 12.3046875, 13.04052734375, 13.7763671875, 14.51220703125, 15.248046875, 15.98388671875, 16.7197265625, 17.45556640625, 18.19140625, 18.92724609375, 19.6630859375, 20.39892578125, 21.134765625, 21.87060546875, 22.6064453125, 23.34228515625, 24.078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 5.0, 7.0, 12.0, 22.0, 45.0, 80.0, 124.0, 195.0, 353.0, 557.0, 985.0, 1743.0, 3055.0, 5370.0, 9488.0, 17128.0, 30564.0, 53513.0, 92709.0, 156123.0, 247826.0, 367750.0, 489325.0, 572564.0, 583194.0, 506518.0, 386383.0, 264951.0, 168008.0, 101211.0, 58450.0, 32954.0, 18550.0, 10577.0, 5920.0, 3315.0, 1951.0, 1112.0, 664.0, 393.0, 236.0, 141.0, 96.0, 47.0, 27.0, 18.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.425537109375, -16.75732421875, -16.089111328125, -15.4208984375, -14.752685546875, -14.08447265625, -13.416259765625, -12.748046875, -12.079833984375, -11.41162109375, -10.743408203125, -10.0751953125, -9.406982421875, -8.73876953125, -8.070556640625, -7.40234375, -6.734130859375, -6.06591796875, -5.397705078125, -4.7294921875, -4.061279296875, -3.39306640625, -2.724853515625, -2.056640625, -1.388427734375, -0.72021484375, -0.052001953125, 0.6162109375, 1.284423828125, 1.95263671875, 2.620849609375, 3.2890625, 3.957275390625, 4.62548828125, 5.293701171875, 5.9619140625, 6.630126953125, 7.29833984375, 7.966552734375, 8.634765625, 9.302978515625, 9.97119140625, 10.639404296875, 11.3076171875, 11.975830078125, 12.64404296875, 13.312255859375, 13.98046875, 14.648681640625, 15.31689453125, 15.985107421875, 16.6533203125, 17.321533203125, 17.98974609375, 18.657958984375, 19.326171875, 19.994384765625, 20.66259765625, 21.330810546875, 21.9990234375, 22.667236328125, 23.33544921875, 24.003662109375, 24.671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 3.0, 5.0, 12.0, 11.0, 9.0, 17.0, 17.0, 31.0, 35.0, 41.0, 43.0, 86.0, 73.0, 81.0, 72.0, 117.0, 129.0, 145.0, 153.0, 155.0, 189.0, 211.0, 200.0, 214.0, 190.0, 223.0, 185.0, 218.0, 181.0, 135.0, 135.0, 122.0, 106.0, 92.0, 71.0, 63.0, 72.0, 51.0, 33.0, 33.0, 28.0, 26.0, 13.0, 16.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.875, -9.5758056640625, -9.276611328125, -8.9774169921875, -8.67822265625, -8.3790283203125, -8.079833984375, -7.7806396484375, -7.4814453125, -7.1822509765625, -6.883056640625, -6.5838623046875, -6.28466796875, -5.9854736328125, -5.686279296875, -5.3870849609375, -5.087890625, -4.7886962890625, -4.489501953125, -4.1903076171875, -3.89111328125, -3.5919189453125, -3.292724609375, -2.9935302734375, -2.6943359375, -2.3951416015625, -2.095947265625, -1.7967529296875, -1.49755859375, -1.1983642578125, -0.899169921875, -0.5999755859375, -0.30078125, -0.0015869140625, 0.297607421875, 0.5968017578125, 0.89599609375, 1.1951904296875, 1.494384765625, 1.7935791015625, 2.0927734375, 2.3919677734375, 2.691162109375, 2.9903564453125, 3.28955078125, 3.5887451171875, 3.887939453125, 4.1871337890625, 4.486328125, 4.7855224609375, 5.084716796875, 5.3839111328125, 5.68310546875, 5.9822998046875, 6.281494140625, 6.5806884765625, 6.8798828125, 7.1790771484375, 7.478271484375, 7.7774658203125, 8.07666015625, 8.3758544921875, 8.675048828125, 8.9742431640625, 9.2734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 19.0, 10.0, 4.0, 19.0, 12.0, 13.0, 24.0, 25.0, 19.0, 23.0, 25.0, 42.0, 37.0, 47.0, 34.0, 53.0, 39.0, 53.0, 41.0, 50.0, 45.0, 37.0, 39.0, 39.0, 34.0, 29.0, 37.0, 27.0, 19.0, 20.0, 12.0, 18.0, 6.0, 8.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.151472091674805, -22.441726684570312, -21.731979370117188, -21.022233963012695, -20.312488555908203, -19.602741241455078, -18.892995834350586, -18.183250427246094, -17.47350311279297, -16.763757705688477, -16.05401039123535, -15.34426498413086, -14.63451862335205, -13.924772262573242, -13.21502685546875, -12.505280494689941, -11.795534133911133, -11.085787773132324, -10.376041412353516, -9.666296005249023, -8.956549644470215, -8.246803283691406, -7.537057399749756, -6.8273115158081055, -6.117565155029297, -5.407818794250488, -4.698072910308838, -3.9883267879486084, -3.278580665588379, -2.5688345432281494, -1.85908842086792, -1.1493425369262695, -0.43959617614746094, 0.27014994621276855, 0.979896068572998, 1.6896421909332275, 2.399388313293457, 3.1091344356536865, 3.818880558013916, 4.528626441955566, 5.238372802734375, 5.948119163513184, 6.657865047454834, 7.367610931396484, 8.077357292175293, 8.787103652954102, 9.496849060058594, 10.206595420837402, 10.916341781616211, 11.62608814239502, 12.335834503173828, 13.04557991027832, 13.755326271057129, 14.465072631835938, 15.17481803894043, 15.884564399719238, 16.594310760498047, 17.30405616760254, 18.013803482055664, 18.723548889160156, 19.43329620361328, 20.143041610717773, 20.852787017822266, 21.56253433227539, 22.272279739379883]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 7.0, 3.0, 11.0, 12.0, 16.0, 27.0, 18.0, 21.0, 27.0, 30.0, 41.0, 43.0, 42.0, 59.0, 42.0, 45.0, 48.0, 42.0, 44.0, 44.0, 52.0, 45.0, 41.0, 32.0, 38.0, 29.0, 29.0, 9.0, 23.0, 15.0, 16.0, 10.0, 9.0, 10.0, 1.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.966981887817383, -26.00594711303711, -25.044912338256836, -24.083877563476562, -23.122844696044922, -22.16180992126465, -21.200775146484375, -20.2397403717041, -19.278705596923828, -18.317670822143555, -17.35663604736328, -16.39560317993164, -15.434568405151367, -14.473533630371094, -13.51249885559082, -12.551464080810547, -11.590431213378906, -10.629396438598633, -9.668362617492676, -8.707327842712402, -7.746293544769287, -6.785259246826172, -5.824224472045898, -4.863190174102783, -3.902155876159668, -2.9411215782165527, -1.9800870418548584, -1.019052505493164, -0.05801820755004883, 0.9030160903930664, 1.8640508651733398, 2.825085163116455, 3.7861175537109375, 4.747151851654053, 5.708186149597168, 6.669220924377441, 7.630255222320557, 8.591289520263672, 9.552324295043945, 10.513359069824219, 11.474392890930176, 12.43542766571045, 13.396461486816406, 14.35749626159668, 15.318531036376953, 16.279563903808594, 17.2406005859375, 18.20163345336914, 19.162668228149414, 20.123703002929688, 21.08473777770996, 22.045772552490234, 23.006805419921875, 23.96784019470215, 24.928874969482422, 25.889909744262695, 26.85094451904297, 27.811979293823242, 28.773014068603516, 29.734046936035156, 30.69508171081543, 31.656116485595703, 32.617149353027344, 33.57818603515625, 34.53921890258789]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 16.0, 33.0, 29.0, 68.0, 97.0, 163.0, 283.0, 571.0, 957.0, 1495.0, 2560.0, 4450.0, 7462.0, 12392.0, 20088.0, 32623.0, 50866.0, 73886.0, 101904.0, 126931.0, 137394.0, 131140.0, 109072.0, 82383.0, 56784.0, 36888.0, 23118.0, 14190.0, 8470.0, 5061.0, 2948.0, 1738.0, 977.0, 605.0, 358.0, 216.0, 122.0, 76.0, 52.0, 34.0, 16.0, 13.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.640625, -7.4200439453125, -7.199462890625, -6.9788818359375, -6.75830078125, -6.5377197265625, -6.317138671875, -6.0965576171875, -5.8759765625, -5.6553955078125, -5.434814453125, -5.2142333984375, -4.99365234375, -4.7730712890625, -4.552490234375, -4.3319091796875, -4.111328125, -3.8907470703125, -3.670166015625, -3.4495849609375, -3.22900390625, -3.0084228515625, -2.787841796875, -2.5672607421875, -2.3466796875, -2.1260986328125, -1.905517578125, -1.6849365234375, -1.46435546875, -1.2437744140625, -1.023193359375, -0.8026123046875, -0.58203125, -0.3614501953125, -0.140869140625, 0.0797119140625, 0.30029296875, 0.5208740234375, 0.741455078125, 0.9620361328125, 1.1826171875, 1.4031982421875, 1.623779296875, 1.8443603515625, 2.06494140625, 2.2855224609375, 2.506103515625, 2.7266845703125, 2.947265625, 3.1678466796875, 3.388427734375, 3.6090087890625, 3.82958984375, 4.0501708984375, 4.270751953125, 4.4913330078125, 4.7119140625, 4.9324951171875, 5.153076171875, 5.3736572265625, 5.59423828125, 5.8148193359375, 6.035400390625, 6.2559814453125, 6.4765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 11.0, 8.0, 6.0, 8.0, 22.0, 17.0, 26.0, 31.0, 45.0, 29.0, 37.0, 49.0, 49.0, 36.0, 45.0, 41.0, 43.0, 50.0, 54.0, 50.0, 50.0, 35.0, 45.0, 31.0, 24.0, 27.0, 21.0, 13.0, 25.0, 10.0, 10.0, 10.0, 6.0, 10.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.7451171875, -24.771484375, -23.7978515625, -22.82421875, -21.8505859375, -20.876953125, -19.9033203125, -18.9296875, -17.9560546875, -16.982421875, -16.0087890625, -15.03515625, -14.0615234375, -13.087890625, -12.1142578125, -11.140625, -10.1669921875, -9.193359375, -8.2197265625, -7.24609375, -6.2724609375, -5.298828125, -4.3251953125, -3.3515625, -2.3779296875, -1.404296875, -0.4306640625, 0.54296875, 1.5166015625, 2.490234375, 3.4638671875, 4.4375, 5.4111328125, 6.384765625, 7.3583984375, 8.33203125, 9.3056640625, 10.279296875, 11.2529296875, 12.2265625, 13.2001953125, 14.173828125, 15.1474609375, 16.12109375, 17.0947265625, 18.068359375, 19.0419921875, 20.015625, 20.9892578125, 21.962890625, 22.9365234375, 23.91015625, 24.8837890625, 25.857421875, 26.8310546875, 27.8046875, 28.7783203125, 29.751953125, 30.7255859375, 31.69921875, 32.6728515625, 33.646484375, 34.6201171875, 35.59375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 11.0, 8.0, 11.0, 22.0, 38.0, 65.0, 108.0, 136.0, 265.0, 387.0, 573.0, 965.0, 1521.0, 2711.0, 4231.0, 7183.0, 12311.0, 20577.0, 33977.0, 55466.0, 86708.0, 124093.0, 156150.0, 159181.0, 132382.0, 94374.0, 61289.0, 37458.0, 22752.0, 13335.0, 8051.0, 4667.0, 2887.0, 1784.0, 1065.0, 666.0, 393.0, 282.0, 172.0, 105.0, 78.0, 44.0, 25.0, 16.0, 7.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.79296875, -7.52520751953125, -7.2574462890625, -6.98968505859375, -6.721923828125, -6.45416259765625, -6.1864013671875, -5.91864013671875, -5.65087890625, -5.38311767578125, -5.1153564453125, -4.84759521484375, -4.579833984375, -4.31207275390625, -4.0443115234375, -3.77655029296875, -3.5087890625, -3.24102783203125, -2.9732666015625, -2.70550537109375, -2.437744140625, -2.16998291015625, -1.9022216796875, -1.63446044921875, -1.36669921875, -1.09893798828125, -0.8311767578125, -0.56341552734375, -0.295654296875, -0.02789306640625, 0.2398681640625, 0.50762939453125, 0.775390625, 1.04315185546875, 1.3109130859375, 1.57867431640625, 1.846435546875, 2.11419677734375, 2.3819580078125, 2.64971923828125, 2.91748046875, 3.18524169921875, 3.4530029296875, 3.72076416015625, 3.988525390625, 4.25628662109375, 4.5240478515625, 4.79180908203125, 5.0595703125, 5.32733154296875, 5.5950927734375, 5.86285400390625, 6.130615234375, 6.39837646484375, 6.6661376953125, 6.93389892578125, 7.20166015625, 7.46942138671875, 7.7371826171875, 8.00494384765625, 8.272705078125, 8.54046630859375, 8.8082275390625, 9.07598876953125, 9.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 7.0, 7.0, 9.0, 6.0, 10.0, 8.0, 18.0, 17.0, 18.0, 19.0, 27.0, 27.0, 27.0, 27.0, 27.0, 39.0, 37.0, 42.0, 36.0, 47.0, 43.0, 33.0, 41.0, 34.0, 38.0, 35.0, 37.0, 31.0, 40.0, 27.0, 25.0, 17.0, 22.0, 24.0, 19.0, 14.0, 12.0, 8.0, 10.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.78125, -13.29833984375, -12.8154296875, -12.33251953125, -11.849609375, -11.36669921875, -10.8837890625, -10.40087890625, -9.91796875, -9.43505859375, -8.9521484375, -8.46923828125, -7.986328125, -7.50341796875, -7.0205078125, -6.53759765625, -6.0546875, -5.57177734375, -5.0888671875, -4.60595703125, -4.123046875, -3.64013671875, -3.1572265625, -2.67431640625, -2.19140625, -1.70849609375, -1.2255859375, -0.74267578125, -0.259765625, 0.22314453125, 0.7060546875, 1.18896484375, 1.671875, 2.15478515625, 2.6376953125, 3.12060546875, 3.603515625, 4.08642578125, 4.5693359375, 5.05224609375, 5.53515625, 6.01806640625, 6.5009765625, 6.98388671875, 7.466796875, 7.94970703125, 8.4326171875, 8.91552734375, 9.3984375, 9.88134765625, 10.3642578125, 10.84716796875, 11.330078125, 11.81298828125, 12.2958984375, 12.77880859375, 13.26171875, 13.74462890625, 14.2275390625, 14.71044921875, 15.193359375, 15.67626953125, 16.1591796875, 16.64208984375, 17.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 14.0, 14.0, 22.0, 30.0, 45.0, 76.0, 128.0, 200.0, 334.0, 545.0, 1071.0, 1894.0, 3431.0, 6557.0, 12711.0, 24846.0, 46924.0, 86830.0, 147134.0, 201806.0, 197692.0, 140575.0, 82643.0, 44066.0, 23063.0, 12046.0, 6270.0, 3365.0, 1714.0, 1022.0, 572.0, 350.0, 213.0, 131.0, 62.0, 52.0, 32.0, 18.0, 19.0, 8.0, 10.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1484375, -4.014404296875, -3.88037109375, -3.746337890625, -3.6123046875, -3.478271484375, -3.34423828125, -3.210205078125, -3.076171875, -2.942138671875, -2.80810546875, -2.674072265625, -2.5400390625, -2.406005859375, -2.27197265625, -2.137939453125, -2.00390625, -1.869873046875, -1.73583984375, -1.601806640625, -1.4677734375, -1.333740234375, -1.19970703125, -1.065673828125, -0.931640625, -0.797607421875, -0.66357421875, -0.529541015625, -0.3955078125, -0.261474609375, -0.12744140625, 0.006591796875, 0.140625, 0.274658203125, 0.40869140625, 0.542724609375, 0.6767578125, 0.810791015625, 0.94482421875, 1.078857421875, 1.212890625, 1.346923828125, 1.48095703125, 1.614990234375, 1.7490234375, 1.883056640625, 2.01708984375, 2.151123046875, 2.28515625, 2.419189453125, 2.55322265625, 2.687255859375, 2.8212890625, 2.955322265625, 3.08935546875, 3.223388671875, 3.357421875, 3.491455078125, 3.62548828125, 3.759521484375, 3.8935546875, 4.027587890625, 4.16162109375, 4.295654296875, 4.4296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 9.0, 17.0, 19.0, 18.0, 30.0, 29.0, 37.0, 28.0, 39.0, 51.0, 51.0, 52.0, 40.0, 53.0, 54.0, 46.0, 44.0, 50.0, 55.0, 27.0, 39.0, 25.0, 30.0, 34.0, 19.0, 19.0, 19.0, 15.0, 7.0, 10.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002307891845703125, -0.00022307410836219788, -0.00021535903215408325, -0.00020764395594596863, -0.000199928879737854, -0.00019221380352973938, -0.00018449872732162476, -0.00017678365111351013, -0.0001690685749053955, -0.00016135349869728088, -0.00015363842248916626, -0.00014592334628105164, -0.000138208270072937, -0.0001304931938648224, -0.00012277811765670776, -0.00011506304144859314, -0.00010734796524047852, -9.963288903236389e-05, -9.191781282424927e-05, -8.420273661613464e-05, -7.648766040802002e-05, -6.87725841999054e-05, -6.105750799179077e-05, -5.334243178367615e-05, -4.5627355575561523e-05, -3.79122793674469e-05, -3.0197203159332275e-05, -2.248212695121765e-05, -1.4767050743103027e-05, -7.051974534988403e-06, 6.631016731262207e-07, 8.378177881240845e-06, 1.609325408935547e-05, 2.3808330297470093e-05, 3.152340650558472e-05, 3.923848271369934e-05, 4.6953558921813965e-05, 5.466863512992859e-05, 6.238371133804321e-05, 7.009878754615784e-05, 7.781386375427246e-05, 8.552893996238708e-05, 9.324401617050171e-05, 0.00010095909237861633, 0.00010867416858673096, 0.00011638924479484558, 0.0001241043210029602, 0.00013181939721107483, 0.00013953447341918945, 0.00014724954962730408, 0.0001549646258354187, 0.00016267970204353333, 0.00017039477825164795, 0.00017810985445976257, 0.0001858249306678772, 0.00019354000687599182, 0.00020125508308410645, 0.00020897015929222107, 0.0002166852355003357, 0.00022440031170845032, 0.00023211538791656494, 0.00023983046412467957, 0.0002475455403327942, 0.0002552606165409088, 0.00026297569274902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 11.0, 6.0, 11.0, 25.0, 50.0, 70.0, 106.0, 154.0, 238.0, 374.0, 565.0, 873.0, 1396.0, 2268.0, 3654.0, 5886.0, 9103.0, 14484.0, 22537.0, 33938.0, 49313.0, 69154.0, 91677.0, 111717.0, 122613.0, 121597.0, 107181.0, 86031.0, 63819.0, 44615.0, 30382.0, 20017.0, 12760.0, 8167.0, 5096.0, 3240.0, 2031.0, 1238.0, 774.0, 509.0, 322.0, 207.0, 131.0, 85.0, 47.0, 33.0, 22.0, 14.0, 8.0, 5.0, 0.0, 3.0, 3.0], "bins": [-3.642578125, -3.541015625, -3.439453125, -3.337890625, -3.236328125, -3.134765625, -3.033203125, -2.931640625, -2.830078125, -2.728515625, -2.626953125, -2.525390625, -2.423828125, -2.322265625, -2.220703125, -2.119140625, -2.017578125, -1.916015625, -1.814453125, -1.712890625, -1.611328125, -1.509765625, -1.408203125, -1.306640625, -1.205078125, -1.103515625, -1.001953125, -0.900390625, -0.798828125, -0.697265625, -0.595703125, -0.494140625, -0.392578125, -0.291015625, -0.189453125, -0.087890625, 0.013671875, 0.115234375, 0.216796875, 0.318359375, 0.419921875, 0.521484375, 0.623046875, 0.724609375, 0.826171875, 0.927734375, 1.029296875, 1.130859375, 1.232421875, 1.333984375, 1.435546875, 1.537109375, 1.638671875, 1.740234375, 1.841796875, 1.943359375, 2.044921875, 2.146484375, 2.248046875, 2.349609375, 2.451171875, 2.552734375, 2.654296875, 2.755859375, 2.857421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 5.0, 7.0, 20.0, 9.0, 12.0, 19.0, 15.0, 18.0, 24.0, 22.0, 39.0, 35.0, 34.0, 43.0, 46.0, 46.0, 58.0, 45.0, 48.0, 48.0, 45.0, 52.0, 37.0, 45.0, 30.0, 31.0, 25.0, 23.0, 13.0, 15.0, 13.0, 8.0, 12.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.64453125, -1.5956573486328125, -1.546783447265625, -1.4979095458984375, -1.44903564453125, -1.4001617431640625, -1.351287841796875, -1.3024139404296875, -1.2535400390625, -1.2046661376953125, -1.155792236328125, -1.1069183349609375, -1.05804443359375, -1.0091705322265625, -0.960296630859375, -0.9114227294921875, -0.862548828125, -0.8136749267578125, -0.764801025390625, -0.7159271240234375, -0.66705322265625, -0.6181793212890625, -0.569305419921875, -0.5204315185546875, -0.4715576171875, -0.4226837158203125, -0.373809814453125, -0.3249359130859375, -0.27606201171875, -0.2271881103515625, -0.178314208984375, -0.1294403076171875, -0.08056640625, -0.0316925048828125, 0.017181396484375, 0.0660552978515625, 0.11492919921875, 0.1638031005859375, 0.212677001953125, 0.2615509033203125, 0.3104248046875, 0.3592987060546875, 0.408172607421875, 0.4570465087890625, 0.50592041015625, 0.5547943115234375, 0.603668212890625, 0.6525421142578125, 0.701416015625, 0.7502899169921875, 0.799163818359375, 0.8480377197265625, 0.89691162109375, 0.9457855224609375, 0.994659423828125, 1.0435333251953125, 1.0924072265625, 1.1412811279296875, 1.190155029296875, 1.2390289306640625, 1.28790283203125, 1.3367767333984375, 1.385650634765625, 1.4345245361328125, 1.4833984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 5.0, 7.0, 4.0, 10.0, 10.0, 12.0, 12.0, 15.0, 20.0, 16.0, 24.0, 26.0, 21.0, 28.0, 39.0, 41.0, 44.0, 37.0, 47.0, 49.0, 54.0, 46.0, 47.0, 38.0, 37.0, 43.0, 37.0, 44.0, 26.0, 32.0, 28.0, 21.0, 19.0, 9.0, 14.0, 5.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.872983932495117, -22.14501190185547, -21.417041778564453, -20.689069747924805, -19.961097717285156, -19.23312759399414, -18.505155563354492, -17.777183532714844, -17.049213409423828, -16.32124137878418, -15.593271255493164, -14.865299224853516, -14.137328147888184, -13.409357070922852, -12.681385040283203, -11.953413963317871, -11.225442886352539, -10.497471809387207, -9.769500732421875, -9.041528701782227, -8.313557624816895, -7.5855865478515625, -6.857614994049072, -6.129643440246582, -5.40167236328125, -4.673701286315918, -3.9457297325134277, -3.2177584171295166, -2.4897871017456055, -1.7618157863616943, -1.0338444709777832, -0.30587291717529297, 0.42209815979003906, 1.1500694751739502, 1.8780407905578613, 2.6060121059417725, 3.3339834213256836, 4.061954498291016, 4.789926052093506, 5.517897605895996, 6.245868682861328, 6.97383975982666, 7.70181131362915, 8.42978286743164, 9.157753944396973, 9.885725021362305, 10.613697052001953, 11.341668128967285, 12.069639205932617, 12.79761028289795, 13.525581359863281, 14.25355339050293, 14.981524467468262, 15.709495544433594, 16.437467575073242, 17.16543960571289, 17.893409729003906, 18.621381759643555, 19.34935188293457, 20.07732391357422, 20.805294036865234, 21.533266067504883, 22.26123809814453, 22.989208221435547, 23.717180252075195]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 10.0, 15.0, 29.0, 23.0, 15.0, 25.0, 32.0, 43.0, 46.0, 39.0, 54.0, 44.0, 42.0, 45.0, 46.0, 42.0, 48.0, 54.0, 44.0, 40.0, 29.0, 38.0, 29.0, 31.0, 12.0, 20.0, 17.0, 18.0, 6.0, 9.0, 8.0, 5.0, 2.0, 9.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.685579299926758, -25.737878799438477, -24.790176391601562, -23.84247589111328, -22.894775390625, -21.94707489013672, -20.999372482299805, -20.051671981811523, -19.10396957397461, -18.156269073486328, -17.208566665649414, -16.260866165161133, -15.313165664672852, -14.365464210510254, -13.417762756347656, -12.470062255859375, -11.522361755371094, -10.574660301208496, -9.626959800720215, -8.679258346557617, -7.731557369232178, -6.783856391906738, -5.836154937744141, -4.888453960418701, -3.9407529830932617, -2.9930520057678223, -2.0453507900238037, -1.0976495742797852, -0.1499485969543457, 0.7977523803710938, 1.7454538345336914, 2.693154811859131, 3.6408538818359375, 4.588554859161377, 5.536255836486816, 6.483957290649414, 7.4316582679748535, 8.379359245300293, 9.32706069946289, 10.274761199951172, 11.22246265411377, 12.170164108276367, 13.117864608764648, 14.065566062927246, 15.013267517089844, 15.960968017578125, 16.908668518066406, 17.85637092590332, 18.8040714263916, 19.751771926879883, 20.699474334716797, 21.647174835205078, 22.59487533569336, 23.54257583618164, 24.490278244018555, 25.437978744506836, 26.38568115234375, 27.33338165283203, 28.281084060668945, 29.228784561157227, 30.176485061645508, 31.124187469482422, 32.0718879699707, 33.019588470458984, 33.967288970947266]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 10.0, 12.0, 17.0, 25.0, 34.0, 73.0, 101.0, 167.0, 306.0, 423.0, 700.0, 1196.0, 1996.0, 3206.0, 5312.0, 8491.0, 13106.0, 20585.0, 31275.0, 45661.0, 64154.0, 83577.0, 101952.0, 113541.0, 116144.0, 108388.0, 93170.0, 73441.0, 54149.0, 37720.0, 25530.0, 16605.0, 10516.0, 6542.0, 4092.0, 2529.0, 1508.0, 859.0, 541.0, 340.0, 203.0, 149.0, 76.0, 54.0, 29.0, 19.0, 21.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.203125, -13.788330078125, -13.37353515625, -12.958740234375, -12.5439453125, -12.129150390625, -11.71435546875, -11.299560546875, -10.884765625, -10.469970703125, -10.05517578125, -9.640380859375, -9.2255859375, -8.810791015625, -8.39599609375, -7.981201171875, -7.56640625, -7.151611328125, -6.73681640625, -6.322021484375, -5.9072265625, -5.492431640625, -5.07763671875, -4.662841796875, -4.248046875, -3.833251953125, -3.41845703125, -3.003662109375, -2.5888671875, -2.174072265625, -1.75927734375, -1.344482421875, -0.9296875, -0.514892578125, -0.10009765625, 0.314697265625, 0.7294921875, 1.144287109375, 1.55908203125, 1.973876953125, 2.388671875, 2.803466796875, 3.21826171875, 3.633056640625, 4.0478515625, 4.462646484375, 4.87744140625, 5.292236328125, 5.70703125, 6.121826171875, 6.53662109375, 6.951416015625, 7.3662109375, 7.781005859375, 8.19580078125, 8.610595703125, 9.025390625, 9.440185546875, 9.85498046875, 10.269775390625, 10.6845703125, 11.099365234375, 11.51416015625, 11.928955078125, 12.34375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 6.0, 15.0, 15.0, 12.0, 25.0, 21.0, 24.0, 29.0, 31.0, 40.0, 33.0, 35.0, 47.0, 59.0, 55.0, 48.0, 45.0, 43.0, 38.0, 42.0, 35.0, 39.0, 40.0, 24.0, 29.0, 25.0, 18.0, 24.0, 21.0, 15.0, 14.0, 9.0, 5.0, 8.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.49853515625, -23.5595703125, -22.62060546875, -21.681640625, -20.74267578125, -19.8037109375, -18.86474609375, -17.92578125, -16.98681640625, -16.0478515625, -15.10888671875, -14.169921875, -13.23095703125, -12.2919921875, -11.35302734375, -10.4140625, -9.47509765625, -8.5361328125, -7.59716796875, -6.658203125, -5.71923828125, -4.7802734375, -3.84130859375, -2.90234375, -1.96337890625, -1.0244140625, -0.08544921875, 0.853515625, 1.79248046875, 2.7314453125, 3.67041015625, 4.609375, 5.54833984375, 6.4873046875, 7.42626953125, 8.365234375, 9.30419921875, 10.2431640625, 11.18212890625, 12.12109375, 13.06005859375, 13.9990234375, 14.93798828125, 15.876953125, 16.81591796875, 17.7548828125, 18.69384765625, 19.6328125, 20.57177734375, 21.5107421875, 22.44970703125, 23.388671875, 24.32763671875, 25.2666015625, 26.20556640625, 27.14453125, 28.08349609375, 29.0224609375, 29.96142578125, 30.900390625, 31.83935546875, 32.7783203125, 33.71728515625, 34.65625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 14.0, 20.0, 24.0, 54.0, 88.0, 129.0, 237.0, 389.0, 628.0, 1041.0, 1640.0, 2748.0, 4458.0, 7211.0, 11252.0, 17899.0, 27174.0, 40687.0, 58428.0, 78284.0, 98578.0, 113732.0, 119428.0, 113699.0, 98946.0, 78077.0, 58165.0, 40329.0, 27351.0, 17833.0, 11345.0, 7074.0, 4429.0, 2732.0, 1758.0, 1021.0, 646.0, 369.0, 282.0, 140.0, 96.0, 59.0, 28.0, 13.0, 10.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.35205078125, -12.8994140625, -12.44677734375, -11.994140625, -11.54150390625, -11.0888671875, -10.63623046875, -10.18359375, -9.73095703125, -9.2783203125, -8.82568359375, -8.373046875, -7.92041015625, -7.4677734375, -7.01513671875, -6.5625, -6.10986328125, -5.6572265625, -5.20458984375, -4.751953125, -4.29931640625, -3.8466796875, -3.39404296875, -2.94140625, -2.48876953125, -2.0361328125, -1.58349609375, -1.130859375, -0.67822265625, -0.2255859375, 0.22705078125, 0.6796875, 1.13232421875, 1.5849609375, 2.03759765625, 2.490234375, 2.94287109375, 3.3955078125, 3.84814453125, 4.30078125, 4.75341796875, 5.2060546875, 5.65869140625, 6.111328125, 6.56396484375, 7.0166015625, 7.46923828125, 7.921875, 8.37451171875, 8.8271484375, 9.27978515625, 9.732421875, 10.18505859375, 10.6376953125, 11.09033203125, 11.54296875, 11.99560546875, 12.4482421875, 12.90087890625, 13.353515625, 13.80615234375, 14.2587890625, 14.71142578125, 15.1640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 6.0, 8.0, 10.0, 10.0, 14.0, 14.0, 29.0, 24.0, 24.0, 24.0, 33.0, 37.0, 25.0, 33.0, 48.0, 47.0, 37.0, 38.0, 63.0, 43.0, 54.0, 38.0, 46.0, 38.0, 37.0, 34.0, 30.0, 23.0, 19.0, 19.0, 16.0, 14.0, 12.0, 11.0, 10.0, 8.0, 4.0, 6.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.8125, -20.226806640625, -19.64111328125, -19.055419921875, -18.4697265625, -17.884033203125, -17.29833984375, -16.712646484375, -16.126953125, -15.541259765625, -14.95556640625, -14.369873046875, -13.7841796875, -13.198486328125, -12.61279296875, -12.027099609375, -11.44140625, -10.855712890625, -10.27001953125, -9.684326171875, -9.0986328125, -8.512939453125, -7.92724609375, -7.341552734375, -6.755859375, -6.170166015625, -5.58447265625, -4.998779296875, -4.4130859375, -3.827392578125, -3.24169921875, -2.656005859375, -2.0703125, -1.484619140625, -0.89892578125, -0.313232421875, 0.2724609375, 0.858154296875, 1.44384765625, 2.029541015625, 2.615234375, 3.200927734375, 3.78662109375, 4.372314453125, 4.9580078125, 5.543701171875, 6.12939453125, 6.715087890625, 7.30078125, 7.886474609375, 8.47216796875, 9.057861328125, 9.6435546875, 10.229248046875, 10.81494140625, 11.400634765625, 11.986328125, 12.572021484375, 13.15771484375, 13.743408203125, 14.3291015625, 14.914794921875, 15.50048828125, 16.086181640625, 16.671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 14.0, 20.0, 40.0, 60.0, 65.0, 111.0, 199.0, 284.0, 495.0, 785.0, 1211.0, 2048.0, 3259.0, 5473.0, 9106.0, 14647.0, 23569.0, 36873.0, 55731.0, 78292.0, 102348.0, 120377.0, 128137.0, 122007.0, 103921.0, 80405.0, 57138.0, 38045.0, 24498.0, 15347.0, 9426.0, 5675.0, 3506.0, 2065.0, 1268.0, 759.0, 475.0, 293.0, 222.0, 129.0, 75.0, 51.0, 32.0, 21.0, 17.0, 13.0, 12.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.015625, -5.82489013671875, -5.6341552734375, -5.44342041015625, -5.252685546875, -5.06195068359375, -4.8712158203125, -4.68048095703125, -4.48974609375, -4.29901123046875, -4.1082763671875, -3.91754150390625, -3.726806640625, -3.53607177734375, -3.3453369140625, -3.15460205078125, -2.9638671875, -2.77313232421875, -2.5823974609375, -2.39166259765625, -2.200927734375, -2.01019287109375, -1.8194580078125, -1.62872314453125, -1.43798828125, -1.24725341796875, -1.0565185546875, -0.86578369140625, -0.675048828125, -0.48431396484375, -0.2935791015625, -0.10284423828125, 0.087890625, 0.27862548828125, 0.4693603515625, 0.66009521484375, 0.850830078125, 1.04156494140625, 1.2322998046875, 1.42303466796875, 1.61376953125, 1.80450439453125, 1.9952392578125, 2.18597412109375, 2.376708984375, 2.56744384765625, 2.7581787109375, 2.94891357421875, 3.1396484375, 3.33038330078125, 3.5211181640625, 3.71185302734375, 3.902587890625, 4.09332275390625, 4.2840576171875, 4.47479248046875, 4.66552734375, 4.85626220703125, 5.0469970703125, 5.23773193359375, 5.428466796875, 5.61920166015625, 5.8099365234375, 6.00067138671875, 6.19140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 11.0, 3.0, 13.0, 14.0, 14.0, 20.0, 15.0, 21.0, 28.0, 26.0, 44.0, 35.0, 37.0, 38.0, 43.0, 56.0, 46.0, 47.0, 56.0, 46.0, 45.0, 51.0, 38.0, 37.0, 42.0, 24.0, 24.0, 24.0, 27.0, 13.0, 15.0, 10.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005846023559570312, -0.0005632787942886353, -0.0005419552326202393, -0.0005206316709518433, -0.0004993081092834473, -0.00047798454761505127, -0.0004566609859466553, -0.0004353374242782593, -0.0004140138626098633, -0.0003926903009414673, -0.0003713667392730713, -0.0003500431776046753, -0.0003287196159362793, -0.0003073960542678833, -0.0002860724925994873, -0.0002647489309310913, -0.0002434253692626953, -0.00022210180759429932, -0.00020077824592590332, -0.00017945468425750732, -0.00015813112258911133, -0.00013680756092071533, -0.00011548399925231934, -9.416043758392334e-05, -7.283687591552734e-05, -5.151331424713135e-05, -3.018975257873535e-05, -8.866190910339355e-06, 1.245737075805664e-05, 3.378093242645264e-05, 5.510449409484863e-05, 7.642805576324463e-05, 9.775161743164062e-05, 0.00011907517910003662, 0.00014039874076843262, 0.0001617223024368286, 0.0001830458641052246, 0.0002043694257736206, 0.0002256929874420166, 0.0002470165491104126, 0.0002683401107788086, 0.0002896636724472046, 0.0003109872341156006, 0.0003323107957839966, 0.0003536343574523926, 0.0003749579191207886, 0.00039628148078918457, 0.00041760504245758057, 0.00043892860412597656, 0.00046025216579437256, 0.00048157572746276855, 0.0005028992891311646, 0.0005242228507995605, 0.0005455464124679565, 0.0005668699741363525, 0.0005881935358047485, 0.0006095170974731445, 0.0006308406591415405, 0.0006521642208099365, 0.0006734877824783325, 0.0006948113441467285, 0.0007161349058151245, 0.0007374584674835205, 0.0007587820291519165, 0.0007801055908203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 13.0, 17.0, 25.0, 35.0, 55.0, 96.0, 192.0, 321.0, 529.0, 911.0, 1629.0, 2899.0, 5312.0, 9341.0, 16789.0, 29576.0, 50279.0, 79843.0, 114661.0, 144631.0, 155530.0, 142119.0, 109460.0, 74734.0, 46749.0, 27477.0, 15770.0, 8523.0, 4843.0, 2636.0, 1435.0, 895.0, 522.0, 287.0, 165.0, 89.0, 50.0, 40.0, 21.0, 20.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.8984375, -8.64727783203125, -8.3961181640625, -8.14495849609375, -7.893798828125, -7.64263916015625, -7.3914794921875, -7.14031982421875, -6.88916015625, -6.63800048828125, -6.3868408203125, -6.13568115234375, -5.884521484375, -5.63336181640625, -5.3822021484375, -5.13104248046875, -4.8798828125, -4.62872314453125, -4.3775634765625, -4.12640380859375, -3.875244140625, -3.62408447265625, -3.3729248046875, -3.12176513671875, -2.87060546875, -2.61944580078125, -2.3682861328125, -2.11712646484375, -1.865966796875, -1.61480712890625, -1.3636474609375, -1.11248779296875, -0.861328125, -0.61016845703125, -0.3590087890625, -0.10784912109375, 0.143310546875, 0.39447021484375, 0.6456298828125, 0.89678955078125, 1.14794921875, 1.39910888671875, 1.6502685546875, 1.90142822265625, 2.152587890625, 2.40374755859375, 2.6549072265625, 2.90606689453125, 3.1572265625, 3.40838623046875, 3.6595458984375, 3.91070556640625, 4.161865234375, 4.41302490234375, 4.6641845703125, 4.91534423828125, 5.16650390625, 5.41766357421875, 5.6688232421875, 5.91998291015625, 6.171142578125, 6.42230224609375, 6.6734619140625, 6.92462158203125, 7.17578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 8.0, 11.0, 15.0, 30.0, 25.0, 34.0, 54.0, 48.0, 48.0, 67.0, 72.0, 65.0, 66.0, 71.0, 65.0, 52.0, 53.0, 39.0, 29.0, 29.0, 35.0, 21.0, 12.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.611114501953125, -3.46246337890625, -3.313812255859375, -3.1651611328125, -3.016510009765625, -2.86785888671875, -2.719207763671875, -2.570556640625, -2.421905517578125, -2.27325439453125, -2.124603271484375, -1.9759521484375, -1.827301025390625, -1.67864990234375, -1.529998779296875, -1.38134765625, -1.232696533203125, -1.08404541015625, -0.935394287109375, -0.7867431640625, -0.638092041015625, -0.48944091796875, -0.340789794921875, -0.192138671875, -0.043487548828125, 0.10516357421875, 0.253814697265625, 0.4024658203125, 0.551116943359375, 0.69976806640625, 0.848419189453125, 0.9970703125, 1.145721435546875, 1.29437255859375, 1.443023681640625, 1.5916748046875, 1.740325927734375, 1.88897705078125, 2.037628173828125, 2.186279296875, 2.334930419921875, 2.48358154296875, 2.632232666015625, 2.7808837890625, 2.929534912109375, 3.07818603515625, 3.226837158203125, 3.37548828125, 3.524139404296875, 3.67279052734375, 3.821441650390625, 3.9700927734375, 4.118743896484375, 4.26739501953125, 4.416046142578125, 4.564697265625, 4.713348388671875, 4.86199951171875, 5.010650634765625, 5.1593017578125, 5.307952880859375, 5.45660400390625, 5.605255126953125, 5.75390625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 2.0, 8.0, 9.0, 6.0, 13.0, 18.0, 10.0, 12.0, 27.0, 28.0, 24.0, 31.0, 24.0, 35.0, 42.0, 36.0, 44.0, 47.0, 61.0, 42.0, 55.0, 53.0, 32.0, 31.0, 27.0, 36.0, 45.0, 36.0, 30.0, 25.0, 25.0, 16.0, 4.0, 10.0, 12.0, 6.0, 4.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.660484313964844, -20.9451904296875, -20.229896545410156, -19.514602661132812, -18.79930877685547, -18.084012985229492, -17.36871910095215, -16.653425216674805, -15.938131332397461, -15.222837448120117, -14.507543563842773, -13.792248725891113, -13.07695484161377, -12.361660957336426, -11.646366119384766, -10.931072235107422, -10.215778350830078, -9.500484466552734, -8.78519058227539, -8.06989574432373, -7.354601860046387, -6.639307975769043, -5.924013614654541, -5.208719253540039, -4.493425369262695, -3.7781312465667725, -3.0628371238708496, -2.3475430011749268, -1.632248878479004, -0.916954755783081, -0.2016606330871582, 0.5136337280273438, 1.2289276123046875, 1.9442217350006104, 2.659515857696533, 3.374809980392456, 4.090104103088379, 4.805397987365723, 5.520692348480225, 6.235986709594727, 6.95128059387207, 7.666574478149414, 8.381868362426758, 9.097163200378418, 9.812457084655762, 10.527750968933105, 11.243045806884766, 11.95833969116211, 12.673633575439453, 13.388927459716797, 14.10422134399414, 14.8195161819458, 15.534810066223145, 16.250104904174805, 16.96539878845215, 17.680692672729492, 18.395986557006836, 19.11128044128418, 19.826574325561523, 20.541868209838867, 21.257164001464844, 21.972457885742188, 22.68775177001953, 23.403045654296875, 24.11833953857422]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 20.0, 15.0, 13.0, 23.0, 26.0, 18.0, 35.0, 41.0, 36.0, 41.0, 31.0, 39.0, 49.0, 44.0, 47.0, 42.0, 36.0, 48.0, 43.0, 43.0, 38.0, 36.0, 40.0, 32.0, 20.0, 29.0, 16.0, 7.0, 8.0, 10.0, 9.0, 14.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.38828468322754, -25.47492218017578, -24.561559677124023, -23.648197174072266, -22.734834671020508, -21.82147216796875, -20.90810775756836, -19.994747161865234, -19.081382751464844, -18.168020248413086, -17.254657745361328, -16.34129524230957, -15.427932739257812, -14.514570236206055, -13.60120677947998, -12.687844276428223, -11.774482727050781, -10.861120223999023, -9.947757720947266, -9.034395217895508, -8.12103271484375, -7.207669734954834, -6.294306755065918, -5.38094425201416, -4.467581748962402, -3.5542192459106445, -2.6408565044403076, -1.7274937629699707, -0.8141312599182129, 0.09923124313354492, 1.012594223022461, 1.9259567260742188, 2.8393211364746094, 3.752683639526367, 4.666046142578125, 5.579409122467041, 6.492771625518799, 7.406134128570557, 8.319497108459473, 9.23285961151123, 10.146222114562988, 11.059584617614746, 11.972947120666504, 12.886310577392578, 13.799673080444336, 14.713035583496094, 15.626398086547852, 16.53976058959961, 17.453123092651367, 18.366485595703125, 19.279848098754883, 20.19321060180664, 21.1065731048584, 22.019935607910156, 22.933300018310547, 23.846660614013672, 24.760025024414062, 25.67338752746582, 26.586750030517578, 27.500112533569336, 28.413475036621094, 29.32683753967285, 30.24020004272461, 31.153564453125, 32.066925048828125]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 9.0, 13.0, 20.0, 37.0, 55.0, 75.0, 138.0, 221.0, 327.0, 504.0, 739.0, 1208.0, 1901.0, 3185.0, 4977.0, 7956.0, 12512.0, 20084.0, 32295.0, 50975.0, 80436.0, 125071.0, 187987.0, 270363.0, 364289.0, 453687.0, 506530.0, 502247.0, 444551.0, 353818.0, 260263.0, 178946.0, 118859.0, 76602.0, 48968.0, 30746.0, 19460.0, 12565.0, 7685.0, 5007.0, 3202.0, 2023.0, 1318.0, 843.0, 527.0, 357.0, 228.0, 161.0, 118.0, 68.0, 51.0, 34.0, 21.0, 10.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-16.78125, -16.22119140625, -15.6611328125, -15.10107421875, -14.541015625, -13.98095703125, -13.4208984375, -12.86083984375, -12.30078125, -11.74072265625, -11.1806640625, -10.62060546875, -10.060546875, -9.50048828125, -8.9404296875, -8.38037109375, -7.8203125, -7.26025390625, -6.7001953125, -6.14013671875, -5.580078125, -5.02001953125, -4.4599609375, -3.89990234375, -3.33984375, -2.77978515625, -2.2197265625, -1.65966796875, -1.099609375, -0.53955078125, 0.0205078125, 0.58056640625, 1.140625, 1.70068359375, 2.2607421875, 2.82080078125, 3.380859375, 3.94091796875, 4.5009765625, 5.06103515625, 5.62109375, 6.18115234375, 6.7412109375, 7.30126953125, 7.861328125, 8.42138671875, 8.9814453125, 9.54150390625, 10.1015625, 10.66162109375, 11.2216796875, 11.78173828125, 12.341796875, 12.90185546875, 13.4619140625, 14.02197265625, 14.58203125, 15.14208984375, 15.7021484375, 16.26220703125, 16.822265625, 17.38232421875, 17.9423828125, 18.50244140625, 19.0625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 13.0, 16.0, 19.0, 23.0, 18.0, 27.0, 32.0, 42.0, 29.0, 46.0, 39.0, 36.0, 49.0, 44.0, 41.0, 41.0, 41.0, 46.0, 54.0, 40.0, 45.0, 46.0, 28.0, 22.0, 24.0, 18.0, 11.0, 13.0, 12.0, 8.0, 9.0, 14.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.1875, -22.40625, -21.625, -20.84375, -20.0625, -19.28125, -18.5, -17.71875, -16.9375, -16.15625, -15.375, -14.59375, -13.8125, -13.03125, -12.25, -11.46875, -10.6875, -9.90625, -9.125, -8.34375, -7.5625, -6.78125, -6.0, -5.21875, -4.4375, -3.65625, -2.875, -2.09375, -1.3125, -0.53125, 0.25, 1.03125, 1.8125, 2.59375, 3.375, 4.15625, 4.9375, 5.71875, 6.5, 7.28125, 8.0625, 8.84375, 9.625, 10.40625, 11.1875, 11.96875, 12.75, 13.53125, 14.3125, 15.09375, 15.875, 16.65625, 17.4375, 18.21875, 19.0, 19.78125, 20.5625, 21.34375, 22.125, 22.90625, 23.6875, 24.46875, 25.25, 26.03125, 26.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 11.0, 10.0, 20.0, 27.0, 66.0, 153.0, 249.0, 530.0, 1002.0, 2075.0, 3899.0, 8097.0, 15554.0, 31349.0, 60761.0, 112074.0, 201254.0, 332023.0, 486460.0, 617962.0, 658885.0, 582438.0, 435032.0, 283770.0, 168319.0, 92230.0, 49027.0, 25244.0, 12747.0, 6360.0, 3286.0, 1605.0, 840.0, 436.0, 241.0, 118.0, 60.0, 28.0, 17.0, 11.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65625, -26.82666015625, -25.9970703125, -25.16748046875, -24.337890625, -23.50830078125, -22.6787109375, -21.84912109375, -21.01953125, -20.18994140625, -19.3603515625, -18.53076171875, -17.701171875, -16.87158203125, -16.0419921875, -15.21240234375, -14.3828125, -13.55322265625, -12.7236328125, -11.89404296875, -11.064453125, -10.23486328125, -9.4052734375, -8.57568359375, -7.74609375, -6.91650390625, -6.0869140625, -5.25732421875, -4.427734375, -3.59814453125, -2.7685546875, -1.93896484375, -1.109375, -0.27978515625, 0.5498046875, 1.37939453125, 2.208984375, 3.03857421875, 3.8681640625, 4.69775390625, 5.52734375, 6.35693359375, 7.1865234375, 8.01611328125, 8.845703125, 9.67529296875, 10.5048828125, 11.33447265625, 12.1640625, 12.99365234375, 13.8232421875, 14.65283203125, 15.482421875, 16.31201171875, 17.1416015625, 17.97119140625, 18.80078125, 19.63037109375, 20.4599609375, 21.28955078125, 22.119140625, 22.94873046875, 23.7783203125, 24.60791015625, 25.4375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 13.0, 5.0, 18.0, 16.0, 25.0, 34.0, 43.0, 55.0, 50.0, 78.0, 81.0, 107.0, 103.0, 132.0, 149.0, 177.0, 190.0, 197.0, 219.0, 203.0, 199.0, 224.0, 202.0, 197.0, 179.0, 171.0, 175.0, 153.0, 139.0, 115.0, 88.0, 72.0, 63.0, 42.0, 43.0, 39.0, 28.0, 16.0, 12.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.1741943359375, -9.832763671875, -9.4913330078125, -9.14990234375, -8.8084716796875, -8.467041015625, -8.1256103515625, -7.7841796875, -7.4427490234375, -7.101318359375, -6.7598876953125, -6.41845703125, -6.0770263671875, -5.735595703125, -5.3941650390625, -5.052734375, -4.7113037109375, -4.369873046875, -4.0284423828125, -3.68701171875, -3.3455810546875, -3.004150390625, -2.6627197265625, -2.3212890625, -1.9798583984375, -1.638427734375, -1.2969970703125, -0.95556640625, -0.6141357421875, -0.272705078125, 0.0687255859375, 0.41015625, 0.7515869140625, 1.093017578125, 1.4344482421875, 1.77587890625, 2.1173095703125, 2.458740234375, 2.8001708984375, 3.1416015625, 3.4830322265625, 3.824462890625, 4.1658935546875, 4.50732421875, 4.8487548828125, 5.190185546875, 5.5316162109375, 5.873046875, 6.2144775390625, 6.555908203125, 6.8973388671875, 7.23876953125, 7.5802001953125, 7.921630859375, 8.2630615234375, 8.6044921875, 8.9459228515625, 9.287353515625, 9.6287841796875, 9.97021484375, 10.3116455078125, 10.653076171875, 10.9945068359375, 11.3359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 14.0, 10.0, 9.0, 12.0, 15.0, 16.0, 20.0, 24.0, 25.0, 32.0, 41.0, 41.0, 39.0, 40.0, 39.0, 39.0, 44.0, 50.0, 45.0, 57.0, 38.0, 38.0, 27.0, 45.0, 38.0, 29.0, 27.0, 27.0, 22.0, 11.0, 15.0, 11.0, 13.0, 12.0, 7.0, 4.0, 1.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.768598556518555, -22.987808227539062, -22.20701789855957, -21.426227569580078, -20.645435333251953, -19.86464500427246, -19.08385467529297, -18.303064346313477, -17.522274017333984, -16.741483688354492, -15.960693359375, -15.179902076721191, -14.3991117477417, -13.618321418762207, -12.837530136108398, -12.056739807128906, -11.275949478149414, -10.495159149169922, -9.71436882019043, -8.933577537536621, -8.152787208557129, -7.371996879577637, -6.591206073760986, -5.810415267944336, -5.029624938964844, -4.248834609985352, -3.468043804168701, -2.68725323677063, -1.9064626693725586, -1.1256721019744873, -0.344881534576416, 0.4359092712402344, 1.2166996002197266, 1.9974901676177979, 2.778280735015869, 3.5590713024139404, 4.339861869812012, 5.120652198791504, 5.901443004608154, 6.682233810424805, 7.463024139404297, 8.243814468383789, 9.024604797363281, 9.80539608001709, 10.586186408996582, 11.366976737976074, 12.147768020629883, 12.928558349609375, 13.709348678588867, 14.49013900756836, 15.270929336547852, 16.051719665527344, 16.83251190185547, 17.61330223083496, 18.394092559814453, 19.174882888793945, 19.955673217773438, 20.73646354675293, 21.517253875732422, 22.298044204711914, 23.078834533691406, 23.85962677001953, 24.640417098999023, 25.421207427978516, 26.201997756958008]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 2.0, 4.0, 5.0, 4.0, 12.0, 13.0, 8.0, 19.0, 21.0, 21.0, 28.0, 29.0, 34.0, 28.0, 34.0, 39.0, 31.0, 53.0, 38.0, 42.0, 46.0, 48.0, 39.0, 42.0, 35.0, 27.0, 33.0, 42.0, 22.0, 22.0, 24.0, 26.0, 20.0, 14.0, 18.0, 15.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.339447021484375, -26.476778030395508, -25.61410903930664, -24.751441955566406, -23.88877296447754, -23.026103973388672, -22.163434982299805, -21.300765991210938, -20.438098907470703, -19.575429916381836, -18.71276092529297, -17.850093841552734, -16.987424850463867, -16.124755859375, -15.262086868286133, -14.399417877197266, -13.536748886108398, -12.674079895019531, -11.81141185760498, -10.948742866516113, -10.086074829101562, -9.223405838012695, -8.360736846923828, -7.498068332672119, -6.63539981842041, -5.772731304168701, -4.910062789916992, -4.047393798828125, -3.184725284576416, -2.322056770324707, -1.4593877792358398, -0.5967192649841309, 0.2659473419189453, 1.1286159753799438, 1.9912846088409424, 2.8539533615112305, 3.7166218757629395, 4.579290390014648, 5.441959381103516, 6.304627895355225, 7.167296409606934, 8.0299654006958, 8.892633438110352, 9.755302429199219, 10.617971420288086, 11.480639457702637, 12.343308448791504, 13.205976486206055, 14.068645477294922, 14.931314468383789, 15.79398250579834, 16.65665054321289, 17.519319534301758, 18.381988525390625, 19.244657516479492, 20.10732650756836, 20.969993591308594, 21.83266258239746, 22.695331573486328, 23.557998657226562, 24.42066764831543, 25.283336639404297, 26.146005630493164, 27.00867462158203, 27.8713436126709]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 13.0, 23.0, 38.0, 52.0, 107.0, 120.0, 199.0, 353.0, 457.0, 757.0, 1188.0, 1831.0, 2973.0, 4617.0, 7242.0, 10834.0, 16851.0, 25317.0, 37536.0, 54430.0, 73634.0, 94972.0, 111130.0, 119327.0, 115411.0, 100828.0, 80612.0, 60443.0, 42453.0, 29389.0, 19350.0, 12775.0, 8290.0, 5364.0, 3431.0, 2163.0, 1458.0, 891.0, 591.0, 414.0, 251.0, 155.0, 93.0, 72.0, 42.0, 25.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.49609375, -6.30316162109375, -6.1102294921875, -5.91729736328125, -5.724365234375, -5.53143310546875, -5.3385009765625, -5.14556884765625, -4.95263671875, -4.75970458984375, -4.5667724609375, -4.37384033203125, -4.180908203125, -3.98797607421875, -3.7950439453125, -3.60211181640625, -3.4091796875, -3.21624755859375, -3.0233154296875, -2.83038330078125, -2.637451171875, -2.44451904296875, -2.2515869140625, -2.05865478515625, -1.86572265625, -1.67279052734375, -1.4798583984375, -1.28692626953125, -1.093994140625, -0.90106201171875, -0.7081298828125, -0.51519775390625, -0.322265625, -0.12933349609375, 0.0635986328125, 0.25653076171875, 0.449462890625, 0.64239501953125, 0.8353271484375, 1.02825927734375, 1.22119140625, 1.41412353515625, 1.6070556640625, 1.79998779296875, 1.992919921875, 2.18585205078125, 2.3787841796875, 2.57171630859375, 2.7646484375, 2.95758056640625, 3.1505126953125, 3.34344482421875, 3.536376953125, 3.72930908203125, 3.9222412109375, 4.11517333984375, 4.30810546875, 4.50103759765625, 4.6939697265625, 4.88690185546875, 5.079833984375, 5.27276611328125, 5.4656982421875, 5.65863037109375, 5.8515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 3.0, 10.0, 10.0, 6.0, 23.0, 17.0, 20.0, 19.0, 30.0, 25.0, 35.0, 45.0, 27.0, 45.0, 37.0, 35.0, 42.0, 50.0, 47.0, 41.0, 31.0, 41.0, 31.0, 39.0, 35.0, 21.0, 32.0, 20.0, 27.0, 25.0, 13.0, 22.0, 11.0, 16.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.546875, -27.660888671875, -26.77490234375, -25.888916015625, -25.0029296875, -24.116943359375, -23.23095703125, -22.344970703125, -21.458984375, -20.572998046875, -19.68701171875, -18.801025390625, -17.9150390625, -17.029052734375, -16.14306640625, -15.257080078125, -14.37109375, -13.485107421875, -12.59912109375, -11.713134765625, -10.8271484375, -9.941162109375, -9.05517578125, -8.169189453125, -7.283203125, -6.397216796875, -5.51123046875, -4.625244140625, -3.7392578125, -2.853271484375, -1.96728515625, -1.081298828125, -0.1953125, 0.690673828125, 1.57666015625, 2.462646484375, 3.3486328125, 4.234619140625, 5.12060546875, 6.006591796875, 6.892578125, 7.778564453125, 8.66455078125, 9.550537109375, 10.4365234375, 11.322509765625, 12.20849609375, 13.094482421875, 13.98046875, 14.866455078125, 15.75244140625, 16.638427734375, 17.5244140625, 18.410400390625, 19.29638671875, 20.182373046875, 21.068359375, 21.954345703125, 22.84033203125, 23.726318359375, 24.6123046875, 25.498291015625, 26.38427734375, 27.270263671875, 28.15625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 13.0, 18.0, 36.0, 37.0, 59.0, 99.0, 161.0, 230.0, 341.0, 523.0, 883.0, 1398.0, 2152.0, 3448.0, 5679.0, 9046.0, 14517.0, 22993.0, 35972.0, 54971.0, 79985.0, 109308.0, 134091.0, 141628.0, 127690.0, 99628.0, 71374.0, 48002.0, 31244.0, 19742.0, 12434.0, 7759.0, 4869.0, 3019.0, 1915.0, 1200.0, 737.0, 485.0, 311.0, 184.0, 132.0, 69.0, 51.0, 36.0, 23.0, 13.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0], "bins": [-8.046875, -7.80548095703125, -7.5640869140625, -7.32269287109375, -7.081298828125, -6.83990478515625, -6.5985107421875, -6.35711669921875, -6.11572265625, -5.87432861328125, -5.6329345703125, -5.39154052734375, -5.150146484375, -4.90875244140625, -4.6673583984375, -4.42596435546875, -4.1845703125, -3.94317626953125, -3.7017822265625, -3.46038818359375, -3.218994140625, -2.97760009765625, -2.7362060546875, -2.49481201171875, -2.25341796875, -2.01202392578125, -1.7706298828125, -1.52923583984375, -1.287841796875, -1.04644775390625, -0.8050537109375, -0.56365966796875, -0.322265625, -0.08087158203125, 0.1605224609375, 0.40191650390625, 0.643310546875, 0.88470458984375, 1.1260986328125, 1.36749267578125, 1.60888671875, 1.85028076171875, 2.0916748046875, 2.33306884765625, 2.574462890625, 2.81585693359375, 3.0572509765625, 3.29864501953125, 3.5400390625, 3.78143310546875, 4.0228271484375, 4.26422119140625, 4.505615234375, 4.74700927734375, 4.9884033203125, 5.22979736328125, 5.47119140625, 5.71258544921875, 5.9539794921875, 6.19537353515625, 6.436767578125, 6.67816162109375, 6.9195556640625, 7.16094970703125, 7.40234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 10.0, 4.0, 7.0, 9.0, 10.0, 15.0, 12.0, 18.0, 19.0, 26.0, 29.0, 35.0, 33.0, 33.0, 38.0, 37.0, 28.0, 47.0, 40.0, 28.0, 35.0, 32.0, 24.0, 28.0, 28.0, 38.0, 26.0, 37.0, 31.0, 29.0, 29.0, 23.0, 18.0, 23.0, 25.0, 23.0, 18.0, 9.0, 14.0, 6.0, 3.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.7734375, -14.3060302734375, -13.838623046875, -13.3712158203125, -12.90380859375, -12.4364013671875, -11.968994140625, -11.5015869140625, -11.0341796875, -10.5667724609375, -10.099365234375, -9.6319580078125, -9.16455078125, -8.6971435546875, -8.229736328125, -7.7623291015625, -7.294921875, -6.8275146484375, -6.360107421875, -5.8927001953125, -5.42529296875, -4.9578857421875, -4.490478515625, -4.0230712890625, -3.5556640625, -3.0882568359375, -2.620849609375, -2.1534423828125, -1.68603515625, -1.2186279296875, -0.751220703125, -0.2838134765625, 0.18359375, 0.6510009765625, 1.118408203125, 1.5858154296875, 2.05322265625, 2.5206298828125, 2.988037109375, 3.4554443359375, 3.9228515625, 4.3902587890625, 4.857666015625, 5.3250732421875, 5.79248046875, 6.2598876953125, 6.727294921875, 7.1947021484375, 7.662109375, 8.1295166015625, 8.596923828125, 9.0643310546875, 9.53173828125, 9.9991455078125, 10.466552734375, 10.9339599609375, 11.4013671875, 11.8687744140625, 12.336181640625, 12.8035888671875, 13.27099609375, 13.7384033203125, 14.205810546875, 14.6732177734375, 15.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 13.0, 10.0, 11.0, 26.0, 56.0, 83.0, 110.0, 180.0, 289.0, 494.0, 712.0, 1250.0, 1971.0, 3293.0, 5689.0, 9912.0, 16694.0, 28237.0, 47612.0, 77638.0, 117963.0, 158467.0, 171625.0, 143955.0, 101730.0, 64297.0, 39233.0, 23429.0, 13796.0, 8090.0, 4699.0, 2778.0, 1651.0, 978.0, 596.0, 366.0, 211.0, 128.0, 98.0, 70.0, 41.0, 27.0, 10.0, 8.0, 8.0, 9.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.109375, -3.989593505859375, -3.86981201171875, -3.750030517578125, -3.6302490234375, -3.510467529296875, -3.39068603515625, -3.270904541015625, -3.151123046875, -3.031341552734375, -2.91156005859375, -2.791778564453125, -2.6719970703125, -2.552215576171875, -2.43243408203125, -2.312652587890625, -2.19287109375, -2.073089599609375, -1.95330810546875, -1.833526611328125, -1.7137451171875, -1.593963623046875, -1.47418212890625, -1.354400634765625, -1.234619140625, -1.114837646484375, -0.99505615234375, -0.875274658203125, -0.7554931640625, -0.635711669921875, -0.51593017578125, -0.396148681640625, -0.2763671875, -0.156585693359375, -0.03680419921875, 0.082977294921875, 0.2027587890625, 0.322540283203125, 0.44232177734375, 0.562103271484375, 0.681884765625, 0.801666259765625, 0.92144775390625, 1.041229248046875, 1.1610107421875, 1.280792236328125, 1.40057373046875, 1.520355224609375, 1.64013671875, 1.759918212890625, 1.87969970703125, 1.999481201171875, 2.1192626953125, 2.239044189453125, 2.35882568359375, 2.478607177734375, 2.598388671875, 2.718170166015625, 2.83795166015625, 2.957733154296875, 3.0775146484375, 3.197296142578125, 3.31707763671875, 3.436859130859375, 3.556640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 8.0, 3.0, 7.0, 10.0, 9.0, 16.0, 25.0, 20.0, 25.0, 34.0, 30.0, 35.0, 56.0, 37.0, 51.0, 69.0, 66.0, 56.0, 41.0, 48.0, 50.0, 45.0, 41.0, 36.0, 37.0, 22.0, 27.0, 23.0, 12.0, 14.0, 13.0, 6.0, 3.0, 1.0, 4.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002262592315673828, -0.00021835044026374817, -0.00021044164896011353, -0.00020253285765647888, -0.00019462406635284424, -0.0001867152750492096, -0.00017880648374557495, -0.0001708976924419403, -0.00016298890113830566, -0.00015508010983467102, -0.00014717131853103638, -0.00013926252722740173, -0.0001313537359237671, -0.00012344494462013245, -0.0001155361533164978, -0.00010762736201286316, -9.971857070922852e-05, -9.180977940559387e-05, -8.390098810195923e-05, -7.599219679832458e-05, -6.808340549468994e-05, -6.01746141910553e-05, -5.2265822887420654e-05, -4.435703158378601e-05, -3.644824028015137e-05, -2.8539448976516724e-05, -2.063065767288208e-05, -1.2721866369247437e-05, -4.813075065612793e-06, 3.0957162380218506e-06, 1.1004507541656494e-05, 1.8913298845291138e-05, 2.682209014892578e-05, 3.4730881452560425e-05, 4.263967275619507e-05, 5.054846405982971e-05, 5.8457255363464355e-05, 6.6366046667099e-05, 7.427483797073364e-05, 8.218362927436829e-05, 9.009242057800293e-05, 9.800121188163757e-05, 0.00010591000318527222, 0.00011381879448890686, 0.0001217275857925415, 0.00012963637709617615, 0.0001375451683998108, 0.00014545395970344543, 0.00015336275100708008, 0.00016127154231071472, 0.00016918033361434937, 0.000177089124917984, 0.00018499791622161865, 0.0001929067075252533, 0.00020081549882888794, 0.00020872429013252258, 0.00021663308143615723, 0.00022454187273979187, 0.00023245066404342651, 0.00024035945534706116, 0.0002482682466506958, 0.00025617703795433044, 0.0002640858292579651, 0.00027199462056159973, 0.0002799034118652344]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 7.0, 13.0, 8.0, 7.0, 22.0, 41.0, 52.0, 97.0, 131.0, 190.0, 246.0, 390.0, 599.0, 912.0, 1341.0, 2129.0, 2989.0, 4683.0, 6872.0, 10370.0, 15507.0, 22303.0, 32284.0, 45226.0, 61291.0, 79274.0, 96217.0, 107887.0, 111222.0, 104138.0, 89454.0, 72116.0, 54069.0, 39663.0, 27924.0, 19410.0, 12998.0, 8858.0, 5929.0, 3912.0, 2511.0, 1774.0, 1146.0, 783.0, 509.0, 330.0, 256.0, 164.0, 99.0, 66.0, 58.0, 41.0, 25.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.872650146484375, -2.77459716796875, -2.676544189453125, -2.5784912109375, -2.480438232421875, -2.38238525390625, -2.284332275390625, -2.186279296875, -2.088226318359375, -1.99017333984375, -1.892120361328125, -1.7940673828125, -1.696014404296875, -1.59796142578125, -1.499908447265625, -1.40185546875, -1.303802490234375, -1.20574951171875, -1.107696533203125, -1.0096435546875, -0.911590576171875, -0.81353759765625, -0.715484619140625, -0.617431640625, -0.519378662109375, -0.42132568359375, -0.323272705078125, -0.2252197265625, -0.127166748046875, -0.02911376953125, 0.068939208984375, 0.1669921875, 0.265045166015625, 0.36309814453125, 0.461151123046875, 0.5592041015625, 0.657257080078125, 0.75531005859375, 0.853363037109375, 0.951416015625, 1.049468994140625, 1.14752197265625, 1.245574951171875, 1.3436279296875, 1.441680908203125, 1.53973388671875, 1.637786865234375, 1.73583984375, 1.833892822265625, 1.93194580078125, 2.029998779296875, 2.1280517578125, 2.226104736328125, 2.32415771484375, 2.422210693359375, 2.520263671875, 2.618316650390625, 2.71636962890625, 2.814422607421875, 2.9124755859375, 3.010528564453125, 3.10858154296875, 3.206634521484375, 3.3046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 5.0, 13.0, 12.0, 14.0, 15.0, 22.0, 35.0, 25.0, 23.0, 38.0, 46.0, 41.0, 40.0, 47.0, 58.0, 57.0, 53.0, 44.0, 50.0, 45.0, 34.0, 44.0, 25.0, 35.0, 28.0, 20.0, 26.0, 14.0, 14.0, 10.0, 9.0, 13.0, 8.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.482421875, -1.4344482421875, -1.386474609375, -1.3385009765625, -1.29052734375, -1.2425537109375, -1.194580078125, -1.1466064453125, -1.0986328125, -1.0506591796875, -1.002685546875, -0.9547119140625, -0.90673828125, -0.8587646484375, -0.810791015625, -0.7628173828125, -0.71484375, -0.6668701171875, -0.618896484375, -0.5709228515625, -0.52294921875, -0.4749755859375, -0.427001953125, -0.3790283203125, -0.3310546875, -0.2830810546875, -0.235107421875, -0.1871337890625, -0.13916015625, -0.0911865234375, -0.043212890625, 0.0047607421875, 0.052734375, 0.1007080078125, 0.148681640625, 0.1966552734375, 0.24462890625, 0.2926025390625, 0.340576171875, 0.3885498046875, 0.4365234375, 0.4844970703125, 0.532470703125, 0.5804443359375, 0.62841796875, 0.6763916015625, 0.724365234375, 0.7723388671875, 0.8203125, 0.8682861328125, 0.916259765625, 0.9642333984375, 1.01220703125, 1.0601806640625, 1.108154296875, 1.1561279296875, 1.2041015625, 1.2520751953125, 1.300048828125, 1.3480224609375, 1.39599609375, 1.4439697265625, 1.491943359375, 1.5399169921875, 1.587890625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 6.0, 8.0, 11.0, 13.0, 17.0, 10.0, 21.0, 17.0, 20.0, 28.0, 38.0, 37.0, 41.0, 43.0, 44.0, 39.0, 39.0, 52.0, 42.0, 54.0, 46.0, 38.0, 42.0, 34.0, 40.0, 34.0, 29.0, 31.0, 17.0, 25.0, 11.0, 8.0, 15.0, 13.0, 11.0, 6.0, 1.0, 3.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.4010066986084, -23.616025924682617, -22.83104705810547, -22.046066284179688, -21.261085510253906, -20.476104736328125, -19.691125869750977, -18.906145095825195, -18.121166229248047, -17.336185455322266, -16.551206588745117, -15.766225814819336, -14.981245040893555, -14.19626522064209, -13.411285400390625, -12.626304626464844, -11.841323852539062, -11.056344032287598, -10.271363258361816, -9.486383438110352, -8.70140266418457, -7.9164228439331055, -7.131443023681641, -6.346462726593018, -5.5614824295043945, -4.7765021324157715, -3.9915220737457275, -3.2065420150756836, -2.4215617179870605, -1.6365814208984375, -0.8516016006469727, -0.06662130355834961, 0.7183609008789062, 1.5033410787582397, 2.2883212566375732, 3.073301315307617, 3.8582816123962402, 4.643261909484863, 5.428241729736328, 6.213222026824951, 6.998202323913574, 7.783182621002197, 8.56816291809082, 9.353142738342285, 10.13812255859375, 10.923103332519531, 11.708083152770996, 12.493062973022461, 13.278043746948242, 14.063023567199707, 14.848004341125488, 15.632984161376953, 16.417964935302734, 17.202945709228516, 17.987924575805664, 18.772905349731445, 19.557884216308594, 20.342864990234375, 21.127843856811523, 21.912824630737305, 22.697805404663086, 23.482784271240234, 24.267765045166016, 25.052745819091797, 25.837726593017578]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 6.0, 1.0, 7.0, 3.0, 13.0, 7.0, 13.0, 13.0, 23.0, 20.0, 26.0, 26.0, 34.0, 30.0, 32.0, 32.0, 42.0, 51.0, 36.0, 44.0, 41.0, 43.0, 46.0, 46.0, 41.0, 25.0, 25.0, 46.0, 27.0, 19.0, 29.0, 22.0, 21.0, 16.0, 20.0, 14.0, 11.0, 9.0, 8.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.532257080078125, -26.670007705688477, -25.807758331298828, -24.945510864257812, -24.083261489868164, -23.221012115478516, -22.358762741088867, -21.49651336669922, -20.63426399230957, -19.772014617919922, -18.909765243530273, -18.047515869140625, -17.18526840209961, -16.32301902770996, -15.460769653320312, -14.598520278930664, -13.736271858215332, -12.874022483825684, -12.011774063110352, -11.149524688720703, -10.287275314331055, -9.425025939941406, -8.562777519226074, -7.700528144836426, -6.8382792472839355, -5.976030349731445, -5.113780975341797, -4.251532077789307, -3.3892829418182373, -2.527033805847168, -1.6647849082946777, -0.8025355339050293, 0.05971336364746094, 0.9219624400138855, 1.78421151638031, 2.64646053314209, 3.508709669113159, 4.3709588050842285, 5.233207702636719, 6.095457077026367, 6.957705974578857, 7.819954872131348, 8.682204246520996, 9.544452667236328, 10.406702041625977, 11.268951416015625, 12.131200790405273, 12.993450164794922, 13.855698585510254, 14.717947959899902, 15.580196380615234, 16.442445755004883, 17.30469512939453, 18.16694450378418, 19.029193878173828, 19.891441345214844, 20.753690719604492, 21.61594009399414, 22.47818946838379, 23.340438842773438, 24.202686309814453, 25.0649356842041, 25.92718505859375, 26.7894344329834, 27.651683807373047]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 10.0, 12.0, 14.0, 29.0, 46.0, 57.0, 96.0, 188.0, 266.0, 400.0, 730.0, 1154.0, 1775.0, 2920.0, 4478.0, 7081.0, 11092.0, 16888.0, 24953.0, 36283.0, 49771.0, 66355.0, 82756.0, 96606.0, 105579.0, 107513.0, 100503.0, 86836.0, 71121.0, 54122.0, 38891.0, 27570.0, 18525.0, 12246.0, 7941.0, 5113.0, 3253.0, 1951.0, 1297.0, 822.0, 514.0, 281.0, 176.0, 122.0, 78.0, 47.0, 38.0, 15.0, 14.0, 10.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-12.671875, -12.2774658203125, -11.883056640625, -11.4886474609375, -11.09423828125, -10.6998291015625, -10.305419921875, -9.9110107421875, -9.5166015625, -9.1221923828125, -8.727783203125, -8.3333740234375, -7.93896484375, -7.5445556640625, -7.150146484375, -6.7557373046875, -6.361328125, -5.9669189453125, -5.572509765625, -5.1781005859375, -4.78369140625, -4.3892822265625, -3.994873046875, -3.6004638671875, -3.2060546875, -2.8116455078125, -2.417236328125, -2.0228271484375, -1.62841796875, -1.2340087890625, -0.839599609375, -0.4451904296875, -0.05078125, 0.3436279296875, 0.738037109375, 1.1324462890625, 1.52685546875, 1.9212646484375, 2.315673828125, 2.7100830078125, 3.1044921875, 3.4989013671875, 3.893310546875, 4.2877197265625, 4.68212890625, 5.0765380859375, 5.470947265625, 5.8653564453125, 6.259765625, 6.6541748046875, 7.048583984375, 7.4429931640625, 7.83740234375, 8.2318115234375, 8.626220703125, 9.0206298828125, 9.4150390625, 9.8094482421875, 10.203857421875, 10.5982666015625, 10.99267578125, 11.3870849609375, 11.781494140625, 12.1759033203125, 12.5703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 9.0, 5.0, 11.0, 8.0, 12.0, 20.0, 17.0, 29.0, 22.0, 17.0, 22.0, 39.0, 29.0, 40.0, 37.0, 42.0, 40.0, 28.0, 47.0, 51.0, 44.0, 42.0, 48.0, 37.0, 33.0, 28.0, 29.0, 25.0, 19.0, 23.0, 18.0, 22.0, 15.0, 20.0, 15.0, 8.0, 7.0, 5.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.5, -25.6240234375, -24.748046875, -23.8720703125, -22.99609375, -22.1201171875, -21.244140625, -20.3681640625, -19.4921875, -18.6162109375, -17.740234375, -16.8642578125, -15.98828125, -15.1123046875, -14.236328125, -13.3603515625, -12.484375, -11.6083984375, -10.732421875, -9.8564453125, -8.98046875, -8.1044921875, -7.228515625, -6.3525390625, -5.4765625, -4.6005859375, -3.724609375, -2.8486328125, -1.97265625, -1.0966796875, -0.220703125, 0.6552734375, 1.53125, 2.4072265625, 3.283203125, 4.1591796875, 5.03515625, 5.9111328125, 6.787109375, 7.6630859375, 8.5390625, 9.4150390625, 10.291015625, 11.1669921875, 12.04296875, 12.9189453125, 13.794921875, 14.6708984375, 15.546875, 16.4228515625, 17.298828125, 18.1748046875, 19.05078125, 19.9267578125, 20.802734375, 21.6787109375, 22.5546875, 23.4306640625, 24.306640625, 25.1826171875, 26.05859375, 26.9345703125, 27.810546875, 28.6865234375, 29.5625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 10.0, 16.0, 15.0, 42.0, 31.0, 70.0, 139.0, 211.0, 337.0, 529.0, 780.0, 1152.0, 1713.0, 2755.0, 4023.0, 5995.0, 8935.0, 13314.0, 19242.0, 27810.0, 39028.0, 52383.0, 67010.0, 81468.0, 93777.0, 100553.0, 100761.0, 94135.0, 82591.0, 67765.0, 52871.0, 39525.0, 28443.0, 19889.0, 13728.0, 9359.0, 6208.0, 4075.0, 2782.0, 1765.0, 1143.0, 734.0, 520.0, 345.0, 203.0, 143.0, 85.0, 53.0, 40.0, 32.0, 12.0, 10.0, 9.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3436279296875, -10.952880859375, -10.5621337890625, -10.17138671875, -9.7806396484375, -9.389892578125, -8.9991455078125, -8.6083984375, -8.2176513671875, -7.826904296875, -7.4361572265625, -7.04541015625, -6.6546630859375, -6.263916015625, -5.8731689453125, -5.482421875, -5.0916748046875, -4.700927734375, -4.3101806640625, -3.91943359375, -3.5286865234375, -3.137939453125, -2.7471923828125, -2.3564453125, -1.9656982421875, -1.574951171875, -1.1842041015625, -0.79345703125, -0.4027099609375, -0.011962890625, 0.3787841796875, 0.76953125, 1.1602783203125, 1.551025390625, 1.9417724609375, 2.33251953125, 2.7232666015625, 3.114013671875, 3.5047607421875, 3.8955078125, 4.2862548828125, 4.677001953125, 5.0677490234375, 5.45849609375, 5.8492431640625, 6.239990234375, 6.6307373046875, 7.021484375, 7.4122314453125, 7.802978515625, 8.1937255859375, 8.58447265625, 8.9752197265625, 9.365966796875, 9.7567138671875, 10.1474609375, 10.5382080078125, 10.928955078125, 11.3197021484375, 11.71044921875, 12.1011962890625, 12.491943359375, 12.8826904296875, 13.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 8.0, 15.0, 11.0, 12.0, 13.0, 22.0, 18.0, 24.0, 19.0, 22.0, 31.0, 22.0, 35.0, 38.0, 41.0, 31.0, 29.0, 36.0, 42.0, 32.0, 41.0, 44.0, 33.0, 43.0, 25.0, 40.0, 23.0, 34.0, 24.0, 21.0, 22.0, 16.0, 20.0, 13.0, 15.0, 13.0, 11.0, 8.0, 6.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.066162109375, -12.56982421875, -12.073486328125, -11.5771484375, -11.080810546875, -10.58447265625, -10.088134765625, -9.591796875, -9.095458984375, -8.59912109375, -8.102783203125, -7.6064453125, -7.110107421875, -6.61376953125, -6.117431640625, -5.62109375, -5.124755859375, -4.62841796875, -4.132080078125, -3.6357421875, -3.139404296875, -2.64306640625, -2.146728515625, -1.650390625, -1.154052734375, -0.65771484375, -0.161376953125, 0.3349609375, 0.831298828125, 1.32763671875, 1.823974609375, 2.3203125, 2.816650390625, 3.31298828125, 3.809326171875, 4.3056640625, 4.802001953125, 5.29833984375, 5.794677734375, 6.291015625, 6.787353515625, 7.28369140625, 7.780029296875, 8.2763671875, 8.772705078125, 9.26904296875, 9.765380859375, 10.26171875, 10.758056640625, 11.25439453125, 11.750732421875, 12.2470703125, 12.743408203125, 13.23974609375, 13.736083984375, 14.232421875, 14.728759765625, 15.22509765625, 15.721435546875, 16.2177734375, 16.714111328125, 17.21044921875, 17.706787109375, 18.203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 15.0, 27.0, 42.0, 74.0, 96.0, 144.0, 247.0, 328.0, 486.0, 851.0, 1190.0, 1766.0, 2719.0, 4174.0, 6138.0, 9119.0, 13227.0, 19049.0, 26978.0, 37099.0, 48331.0, 61940.0, 75041.0, 87133.0, 94485.0, 96041.0, 92990.0, 83942.0, 71359.0, 57904.0, 44974.0, 33436.0, 24088.0, 17176.0, 11685.0, 7989.0, 5400.0, 3776.0, 2358.0, 1628.0, 1043.0, 710.0, 465.0, 278.0, 228.0, 125.0, 90.0, 52.0, 38.0, 26.0, 14.0, 7.0, 12.0, 2.0, 3.0, 4.0, 2.0], "bins": [-4.74609375, -4.599365234375, -4.45263671875, -4.305908203125, -4.1591796875, -4.012451171875, -3.86572265625, -3.718994140625, -3.572265625, -3.425537109375, -3.27880859375, -3.132080078125, -2.9853515625, -2.838623046875, -2.69189453125, -2.545166015625, -2.3984375, -2.251708984375, -2.10498046875, -1.958251953125, -1.8115234375, -1.664794921875, -1.51806640625, -1.371337890625, -1.224609375, -1.077880859375, -0.93115234375, -0.784423828125, -0.6376953125, -0.490966796875, -0.34423828125, -0.197509765625, -0.05078125, 0.095947265625, 0.24267578125, 0.389404296875, 0.5361328125, 0.682861328125, 0.82958984375, 0.976318359375, 1.123046875, 1.269775390625, 1.41650390625, 1.563232421875, 1.7099609375, 1.856689453125, 2.00341796875, 2.150146484375, 2.296875, 2.443603515625, 2.59033203125, 2.737060546875, 2.8837890625, 3.030517578125, 3.17724609375, 3.323974609375, 3.470703125, 3.617431640625, 3.76416015625, 3.910888671875, 4.0576171875, 4.204345703125, 4.35107421875, 4.497802734375, 4.64453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 8.0, 9.0, 14.0, 7.0, 14.0, 20.0, 26.0, 26.0, 38.0, 36.0, 46.0, 42.0, 46.0, 54.0, 52.0, 62.0, 53.0, 52.0, 41.0, 61.0, 47.0, 45.0, 27.0, 26.0, 30.0, 28.0, 17.0, 14.0, 10.0, 8.0, 13.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008568763732910156, -0.0008325502276420593, -0.000808224081993103, -0.0007838979363441467, -0.0007595717906951904, -0.0007352456450462341, -0.0007109194993972778, -0.0006865933537483215, -0.0006622672080993652, -0.0006379410624504089, -0.0006136149168014526, -0.0005892887711524963, -0.00056496262550354, -0.0005406364798545837, -0.0005163103342056274, -0.0004919841885566711, -0.00046765804290771484, -0.00044333189725875854, -0.00041900575160980225, -0.00039467960596084595, -0.00037035346031188965, -0.00034602731466293335, -0.00032170116901397705, -0.00029737502336502075, -0.00027304887771606445, -0.00024872273206710815, -0.00022439658641815186, -0.00020007044076919556, -0.00017574429512023926, -0.00015141814947128296, -0.00012709200382232666, -0.00010276585817337036, -7.843971252441406e-05, -5.4113566875457764e-05, -2.9787421226501465e-05, -5.461275577545166e-06, 1.8864870071411133e-05, 4.319101572036743e-05, 6.751716136932373e-05, 9.184330701828003e-05, 0.00011616945266723633, 0.00014049559831619263, 0.00016482174396514893, 0.00018914788961410522, 0.00021347403526306152, 0.00023780018091201782, 0.0002621263265609741, 0.0002864524722099304, 0.0003107786178588867, 0.000335104763507843, 0.0003594309091567993, 0.0003837570548057556, 0.0004080832004547119, 0.0004324093461036682, 0.0004567354917526245, 0.0004810616374015808, 0.0005053877830505371, 0.0005297139286994934, 0.0005540400743484497, 0.000578366219997406, 0.0006026923656463623, 0.0006270185112953186, 0.0006513446569442749, 0.0006756708025932312, 0.0006999969482421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 5.0, 8.0, 18.0, 14.0, 22.0, 45.0, 55.0, 80.0, 146.0, 196.0, 259.0, 405.0, 663.0, 961.0, 1494.0, 2276.0, 3593.0, 5282.0, 7793.0, 11674.0, 17082.0, 24875.0, 34828.0, 47599.0, 62167.0, 77511.0, 91029.0, 99671.0, 102343.0, 97613.0, 86560.0, 72687.0, 57106.0, 43278.0, 31297.0, 22184.0, 15198.0, 10332.0, 6904.0, 4500.0, 3021.0, 2005.0, 1311.0, 837.0, 528.0, 367.0, 253.0, 153.0, 98.0, 70.0, 55.0, 32.0, 27.0, 22.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-5.15625, -4.99169921875, -4.8271484375, -4.66259765625, -4.498046875, -4.33349609375, -4.1689453125, -4.00439453125, -3.83984375, -3.67529296875, -3.5107421875, -3.34619140625, -3.181640625, -3.01708984375, -2.8525390625, -2.68798828125, -2.5234375, -2.35888671875, -2.1943359375, -2.02978515625, -1.865234375, -1.70068359375, -1.5361328125, -1.37158203125, -1.20703125, -1.04248046875, -0.8779296875, -0.71337890625, -0.548828125, -0.38427734375, -0.2197265625, -0.05517578125, 0.109375, 0.27392578125, 0.4384765625, 0.60302734375, 0.767578125, 0.93212890625, 1.0966796875, 1.26123046875, 1.42578125, 1.59033203125, 1.7548828125, 1.91943359375, 2.083984375, 2.24853515625, 2.4130859375, 2.57763671875, 2.7421875, 2.90673828125, 3.0712890625, 3.23583984375, 3.400390625, 3.56494140625, 3.7294921875, 3.89404296875, 4.05859375, 4.22314453125, 4.3876953125, 4.55224609375, 4.716796875, 4.88134765625, 5.0458984375, 5.21044921875, 5.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 7.0, 7.0, 14.0, 15.0, 16.0, 22.0, 23.0, 27.0, 31.0, 28.0, 38.0, 41.0, 39.0, 38.0, 67.0, 54.0, 69.0, 43.0, 50.0, 33.0, 48.0, 32.0, 47.0, 22.0, 25.0, 35.0, 15.0, 13.0, 12.0, 13.0, 12.0, 6.0, 6.0, 8.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.080078125, -2.9876708984375, -2.895263671875, -2.8028564453125, -2.71044921875, -2.6180419921875, -2.525634765625, -2.4332275390625, -2.3408203125, -2.2484130859375, -2.156005859375, -2.0635986328125, -1.97119140625, -1.8787841796875, -1.786376953125, -1.6939697265625, -1.6015625, -1.5091552734375, -1.416748046875, -1.3243408203125, -1.23193359375, -1.1395263671875, -1.047119140625, -0.9547119140625, -0.8623046875, -0.7698974609375, -0.677490234375, -0.5850830078125, -0.49267578125, -0.4002685546875, -0.307861328125, -0.2154541015625, -0.123046875, -0.0306396484375, 0.061767578125, 0.1541748046875, 0.24658203125, 0.3389892578125, 0.431396484375, 0.5238037109375, 0.6162109375, 0.7086181640625, 0.801025390625, 0.8934326171875, 0.98583984375, 1.0782470703125, 1.170654296875, 1.2630615234375, 1.35546875, 1.4478759765625, 1.540283203125, 1.6326904296875, 1.72509765625, 1.8175048828125, 1.909912109375, 2.0023193359375, 2.0947265625, 2.1871337890625, 2.279541015625, 2.3719482421875, 2.46435546875, 2.5567626953125, 2.649169921875, 2.7415771484375, 2.833984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 13.0, 11.0, 14.0, 21.0, 18.0, 22.0, 25.0, 28.0, 39.0, 42.0, 36.0, 47.0, 45.0, 55.0, 46.0, 44.0, 55.0, 44.0, 47.0, 51.0, 39.0, 33.0, 35.0, 34.0, 23.0, 17.0, 26.0, 12.0, 19.0, 10.0, 7.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.06755828857422, -25.234371185302734, -24.401185989379883, -23.5679988861084, -22.734811782836914, -21.901626586914062, -21.068439483642578, -20.235252380371094, -19.40206527709961, -18.568878173828125, -17.735692977905273, -16.90250587463379, -16.069318771362305, -15.236132621765137, -14.402946472167969, -13.569759368896484, -12.736574172973633, -11.903388023376465, -11.07020092010498, -10.237014770507812, -9.403827667236328, -8.57064151763916, -7.737455368041992, -6.904268741607666, -6.07108211517334, -5.237895488739014, -4.4047088623046875, -3.5715227127075195, -2.7383360862731934, -1.9051494598388672, -1.0719633102416992, -0.23877668380737305, 0.5944080352783203, 1.427594542503357, 2.2607810497283936, 3.0939674377441406, 3.927154064178467, 4.760340690612793, 5.593526840209961, 6.426713466644287, 7.259900093078613, 8.093086242675781, 8.926273345947266, 9.759459495544434, 10.592645645141602, 11.425832748413086, 12.259018898010254, 13.092205047607422, 13.925392150878906, 14.758578300476074, 15.591765403747559, 16.424951553344727, 17.25813865661621, 18.091323852539062, 18.924510955810547, 19.75769805908203, 20.590885162353516, 21.424072265625, 22.25725746154785, 23.090444564819336, 23.92363166809082, 24.756816864013672, 25.590003967285156, 26.42319107055664, 27.256376266479492]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 3.0, 10.0, 13.0, 21.0, 17.0, 19.0, 22.0, 18.0, 38.0, 42.0, 31.0, 36.0, 36.0, 46.0, 48.0, 42.0, 46.0, 46.0, 33.0, 51.0, 47.0, 45.0, 28.0, 32.0, 39.0, 27.0, 30.0, 13.0, 21.0, 16.0, 15.0, 16.0, 13.0, 10.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.075557708740234, -31.07522201538086, -30.074886322021484, -29.07455062866211, -28.074214935302734, -27.07387924194336, -26.073545455932617, -25.073209762573242, -24.072874069213867, -23.072538375854492, -22.072202682495117, -21.071866989135742, -20.071533203125, -19.071197509765625, -18.07086181640625, -17.070526123046875, -16.0701904296875, -15.069854736328125, -14.06951904296875, -13.069184303283691, -12.068848609924316, -11.068512916564941, -10.068178176879883, -9.067842483520508, -8.067506790161133, -7.067171096801758, -6.066835880279541, -5.066500663757324, -4.066164970397949, -3.065829277038574, -2.0654940605163574, -1.0651588439941406, -0.06482124328613281, 0.9355142116546631, 1.935849666595459, 2.936185121536255, 3.936520576477051, 4.936856269836426, 5.937191486358643, 6.937526702880859, 7.937862396240234, 8.93819808959961, 9.938533782958984, 10.938868522644043, 11.939204216003418, 12.939539909362793, 13.939874649047852, 14.940210342407227, 15.940546035766602, 16.940881729125977, 17.94121742248535, 18.941553115844727, 19.94188690185547, 20.942222595214844, 21.94255828857422, 22.942893981933594, 23.94322967529297, 24.943565368652344, 25.94390106201172, 26.944236755371094, 27.94457244873047, 28.944908142089844, 29.945241928100586, 30.94557762145996, 31.945913314819336]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 16.0, 24.0, 38.0, 41.0, 76.0, 131.0, 208.0, 284.0, 472.0, 720.0, 1187.0, 1884.0, 3099.0, 4823.0, 8032.0, 13397.0, 21877.0, 36263.0, 58998.0, 95589.0, 150510.0, 230285.0, 331372.0, 438991.0, 521952.0, 544422.0, 496578.0, 401689.0, 293403.0, 198392.0, 128964.0, 80839.0, 50005.0, 30536.0, 18804.0, 11480.0, 7141.0, 4320.0, 2718.0, 1685.0, 1024.0, 701.0, 457.0, 301.0, 208.0, 131.0, 72.0, 60.0, 34.0, 16.0, 12.0, 8.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-21.5625, -20.874267578125, -20.18603515625, -19.497802734375, -18.8095703125, -18.121337890625, -17.43310546875, -16.744873046875, -16.056640625, -15.368408203125, -14.68017578125, -13.991943359375, -13.3037109375, -12.615478515625, -11.92724609375, -11.239013671875, -10.55078125, -9.862548828125, -9.17431640625, -8.486083984375, -7.7978515625, -7.109619140625, -6.42138671875, -5.733154296875, -5.044921875, -4.356689453125, -3.66845703125, -2.980224609375, -2.2919921875, -1.603759765625, -0.91552734375, -0.227294921875, 0.4609375, 1.149169921875, 1.83740234375, 2.525634765625, 3.2138671875, 3.902099609375, 4.59033203125, 5.278564453125, 5.966796875, 6.655029296875, 7.34326171875, 8.031494140625, 8.7197265625, 9.407958984375, 10.09619140625, 10.784423828125, 11.47265625, 12.160888671875, 12.84912109375, 13.537353515625, 14.2255859375, 14.913818359375, 15.60205078125, 16.290283203125, 16.978515625, 17.666748046875, 18.35498046875, 19.043212890625, 19.7314453125, 20.419677734375, 21.10791015625, 21.796142578125, 22.484375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 6.0, 10.0, 8.0, 12.0, 22.0, 16.0, 22.0, 21.0, 22.0, 26.0, 25.0, 22.0, 40.0, 37.0, 38.0, 44.0, 27.0, 29.0, 45.0, 36.0, 38.0, 34.0, 39.0, 40.0, 37.0, 34.0, 30.0, 31.0, 24.0, 19.0, 17.0, 22.0, 17.0, 11.0, 18.0, 9.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-22.640625, -21.90966796875, -21.1787109375, -20.44775390625, -19.716796875, -18.98583984375, -18.2548828125, -17.52392578125, -16.79296875, -16.06201171875, -15.3310546875, -14.60009765625, -13.869140625, -13.13818359375, -12.4072265625, -11.67626953125, -10.9453125, -10.21435546875, -9.4833984375, -8.75244140625, -8.021484375, -7.29052734375, -6.5595703125, -5.82861328125, -5.09765625, -4.36669921875, -3.6357421875, -2.90478515625, -2.173828125, -1.44287109375, -0.7119140625, 0.01904296875, 0.75, 1.48095703125, 2.2119140625, 2.94287109375, 3.673828125, 4.40478515625, 5.1357421875, 5.86669921875, 6.59765625, 7.32861328125, 8.0595703125, 8.79052734375, 9.521484375, 10.25244140625, 10.9833984375, 11.71435546875, 12.4453125, 13.17626953125, 13.9072265625, 14.63818359375, 15.369140625, 16.10009765625, 16.8310546875, 17.56201171875, 18.29296875, 19.02392578125, 19.7548828125, 20.48583984375, 21.216796875, 21.94775390625, 22.6787109375, 23.40966796875, 24.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 16.0, 13.0, 27.0, 50.0, 97.0, 117.0, 190.0, 348.0, 561.0, 860.0, 1431.0, 2614.0, 4233.0, 7167.0, 12161.0, 20381.0, 33601.0, 56078.0, 90238.0, 140936.0, 213376.0, 302174.0, 397807.0, 476931.0, 514797.0, 493017.0, 425719.0, 332778.0, 238705.0, 161573.0, 103016.0, 65076.0, 39695.0, 23625.0, 14126.0, 8343.0, 5000.0, 2908.0, 1792.0, 1096.0, 639.0, 389.0, 212.0, 146.0, 81.0, 48.0, 32.0, 28.0, 15.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.296875, -22.536865234375, -21.77685546875, -21.016845703125, -20.2568359375, -19.496826171875, -18.73681640625, -17.976806640625, -17.216796875, -16.456787109375, -15.69677734375, -14.936767578125, -14.1767578125, -13.416748046875, -12.65673828125, -11.896728515625, -11.13671875, -10.376708984375, -9.61669921875, -8.856689453125, -8.0966796875, -7.336669921875, -6.57666015625, -5.816650390625, -5.056640625, -4.296630859375, -3.53662109375, -2.776611328125, -2.0166015625, -1.256591796875, -0.49658203125, 0.263427734375, 1.0234375, 1.783447265625, 2.54345703125, 3.303466796875, 4.0634765625, 4.823486328125, 5.58349609375, 6.343505859375, 7.103515625, 7.863525390625, 8.62353515625, 9.383544921875, 10.1435546875, 10.903564453125, 11.66357421875, 12.423583984375, 13.18359375, 13.943603515625, 14.70361328125, 15.463623046875, 16.2236328125, 16.983642578125, 17.74365234375, 18.503662109375, 19.263671875, 20.023681640625, 20.78369140625, 21.543701171875, 22.3037109375, 23.063720703125, 23.82373046875, 24.583740234375, 25.34375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 15.0, 15.0, 23.0, 23.0, 29.0, 40.0, 42.0, 73.0, 88.0, 108.0, 124.0, 131.0, 158.0, 181.0, 200.0, 211.0, 229.0, 242.0, 249.0, 221.0, 217.0, 231.0, 209.0, 162.0, 143.0, 121.0, 115.0, 97.0, 64.0, 72.0, 62.0, 39.0, 26.0, 30.0, 20.0, 19.0, 8.0, 12.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.8741455078125, -11.443603515625, -11.0130615234375, -10.58251953125, -10.1519775390625, -9.721435546875, -9.2908935546875, -8.8603515625, -8.4298095703125, -7.999267578125, -7.5687255859375, -7.13818359375, -6.7076416015625, -6.277099609375, -5.8465576171875, -5.416015625, -4.9854736328125, -4.554931640625, -4.1243896484375, -3.69384765625, -3.2633056640625, -2.832763671875, -2.4022216796875, -1.9716796875, -1.5411376953125, -1.110595703125, -0.6800537109375, -0.24951171875, 0.1810302734375, 0.611572265625, 1.0421142578125, 1.47265625, 1.9031982421875, 2.333740234375, 2.7642822265625, 3.19482421875, 3.6253662109375, 4.055908203125, 4.4864501953125, 4.9169921875, 5.3475341796875, 5.778076171875, 6.2086181640625, 6.63916015625, 7.0697021484375, 7.500244140625, 7.9307861328125, 8.361328125, 8.7918701171875, 9.222412109375, 9.6529541015625, 10.08349609375, 10.5140380859375, 10.944580078125, 11.3751220703125, 11.8056640625, 12.2362060546875, 12.666748046875, 13.0972900390625, 13.52783203125, 13.9583740234375, 14.388916015625, 14.8194580078125, 15.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 9.0, 8.0, 15.0, 22.0, 15.0, 31.0, 45.0, 42.0, 45.0, 46.0, 59.0, 53.0, 60.0, 46.0, 65.0, 63.0, 47.0, 43.0, 36.0, 38.0, 37.0, 29.0, 31.0, 23.0, 21.0, 15.0, 11.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.91691589355469, -33.7827033996582, -32.64848709106445, -31.514272689819336, -30.38005828857422, -29.2458438873291, -28.111629486083984, -26.9774169921875, -25.84320068359375, -24.708986282348633, -23.574771881103516, -22.4405574798584, -21.30634307861328, -20.172128677368164, -19.037914276123047, -17.903701782226562, -16.769487380981445, -15.635272979736328, -14.501058578491211, -13.366844177246094, -12.232629776000977, -11.09841537475586, -9.964201927185059, -8.829987525939941, -7.695773124694824, -6.561558723449707, -5.42734432220459, -4.293130397796631, -3.1589159965515137, -2.0247015953063965, -0.8904876708984375, 0.2437267303466797, 1.3779411315917969, 2.512155532836914, 3.646369695663452, 4.78058385848999, 5.914798259735107, 7.049012660980225, 8.183226585388184, 9.3174409866333, 10.451655387878418, 11.585869789123535, 12.720084190368652, 13.854297637939453, 14.98851203918457, 16.122726440429688, 17.256940841674805, 18.391155242919922, 19.52536964416504, 20.659584045410156, 21.793798446655273, 22.92801284790039, 24.062227249145508, 25.196441650390625, 26.33065414428711, 27.46487045288086, 28.599082946777344, 29.73329734802246, 30.867511749267578, 32.00172424316406, 33.13594055175781, 34.2701530456543, 35.40436935424805, 36.53858184814453, 37.67279815673828]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 11.0, 8.0, 10.0, 6.0, 15.0, 18.0, 18.0, 24.0, 33.0, 36.0, 31.0, 53.0, 45.0, 49.0, 56.0, 43.0, 69.0, 52.0, 36.0, 47.0, 36.0, 38.0, 36.0, 34.0, 31.0, 27.0, 22.0, 28.0, 16.0, 20.0, 12.0, 14.0, 7.0, 2.0, 9.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.79008865356445, -33.54605484008789, -32.30202102661133, -31.057987213134766, -29.813953399658203, -28.56991958618164, -27.325883865356445, -26.081850051879883, -24.83781623840332, -23.593782424926758, -22.349748611450195, -21.105714797973633, -19.861679077148438, -18.617645263671875, -17.373611450195312, -16.12957763671875, -14.885543823242188, -13.641510009765625, -12.397476196289062, -11.153441429138184, -9.909407615661621, -8.665373802185059, -7.421339511871338, -6.177305221557617, -4.933271408081055, -3.689237356185913, -2.4452033042907715, -1.2011692523956299, 0.04286479949951172, 1.2868986129760742, 2.530932903289795, 3.7749671936035156, 5.019004821777344, 6.263038635253906, 7.507072925567627, 8.751107215881348, 9.99514102935791, 11.239174842834473, 12.483209609985352, 13.727243423461914, 14.971277236938477, 16.21531105041504, 17.4593448638916, 18.703378677368164, 19.94741439819336, 21.191448211669922, 22.435482025146484, 23.679515838623047, 24.92354965209961, 26.167583465576172, 27.411617279052734, 28.655651092529297, 29.89968490600586, 31.143718719482422, 32.387752532958984, 33.63179016113281, 34.875823974609375, 36.11985778808594, 37.3638916015625, 38.60792541503906, 39.851959228515625, 41.09599304199219, 42.34002685546875, 43.58406066894531, 44.828094482421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 25.0, 41.0, 100.0, 143.0, 223.0, 330.0, 599.0, 1104.0, 1888.0, 3131.0, 5522.0, 10008.0, 17834.0, 30884.0, 51831.0, 82168.0, 117576.0, 148072.0, 157064.0, 139132.0, 106039.0, 71185.0, 43904.0, 25919.0, 14518.0, 8364.0, 4597.0, 2797.0, 1430.0, 834.0, 505.0, 287.0, 190.0, 114.0, 66.0, 38.0, 23.0, 14.0, 8.0, 9.0, 3.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7127685546875, -8.425537109375, -8.1383056640625, -7.85107421875, -7.5638427734375, -7.276611328125, -6.9893798828125, -6.7021484375, -6.4149169921875, -6.127685546875, -5.8404541015625, -5.55322265625, -5.2659912109375, -4.978759765625, -4.6915283203125, -4.404296875, -4.1170654296875, -3.829833984375, -3.5426025390625, -3.25537109375, -2.9681396484375, -2.680908203125, -2.3936767578125, -2.1064453125, -1.8192138671875, -1.531982421875, -1.2447509765625, -0.95751953125, -0.6702880859375, -0.383056640625, -0.0958251953125, 0.19140625, 0.4786376953125, 0.765869140625, 1.0531005859375, 1.34033203125, 1.6275634765625, 1.914794921875, 2.2020263671875, 2.4892578125, 2.7764892578125, 3.063720703125, 3.3509521484375, 3.63818359375, 3.9254150390625, 4.212646484375, 4.4998779296875, 4.787109375, 5.0743408203125, 5.361572265625, 5.6488037109375, 5.93603515625, 6.2232666015625, 6.510498046875, 6.7977294921875, 7.0849609375, 7.3721923828125, 7.659423828125, 7.9466552734375, 8.23388671875, 8.5211181640625, 8.808349609375, 9.0955810546875, 9.3828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 3.0, 4.0, 5.0, 13.0, 9.0, 13.0, 19.0, 17.0, 20.0, 29.0, 35.0, 49.0, 51.0, 45.0, 46.0, 51.0, 48.0, 60.0, 54.0, 47.0, 41.0, 39.0, 33.0, 40.0, 36.0, 32.0, 30.0, 20.0, 19.0, 21.0, 22.0, 9.0, 15.0, 5.0, 5.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.0517578125, -34.759765625, -33.4677734375, -32.17578125, -30.8837890625, -29.591796875, -28.2998046875, -27.0078125, -25.7158203125, -24.423828125, -23.1318359375, -21.83984375, -20.5478515625, -19.255859375, -17.9638671875, -16.671875, -15.3798828125, -14.087890625, -12.7958984375, -11.50390625, -10.2119140625, -8.919921875, -7.6279296875, -6.3359375, -5.0439453125, -3.751953125, -2.4599609375, -1.16796875, 0.1240234375, 1.416015625, 2.7080078125, 4.0, 5.2919921875, 6.583984375, 7.8759765625, 9.16796875, 10.4599609375, 11.751953125, 13.0439453125, 14.3359375, 15.6279296875, 16.919921875, 18.2119140625, 19.50390625, 20.7958984375, 22.087890625, 23.3798828125, 24.671875, 25.9638671875, 27.255859375, 28.5478515625, 29.83984375, 31.1318359375, 32.423828125, 33.7158203125, 35.0078125, 36.2998046875, 37.591796875, 38.8837890625, 40.17578125, 41.4677734375, 42.759765625, 44.0517578125, 45.34375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 14.0, 10.0, 16.0, 32.0, 46.0, 73.0, 77.0, 141.0, 227.0, 337.0, 548.0, 831.0, 1311.0, 2099.0, 3420.0, 5489.0, 9195.0, 14906.0, 24105.0, 38481.0, 60985.0, 90174.0, 124276.0, 149165.0, 148183.0, 124056.0, 89444.0, 60079.0, 38597.0, 23927.0, 14810.0, 9113.0, 5388.0, 3385.0, 2023.0, 1247.0, 845.0, 501.0, 336.0, 190.0, 147.0, 103.0, 65.0, 43.0, 32.0, 17.0, 14.0, 14.0, 18.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.765625, -9.4696044921875, -9.173583984375, -8.8775634765625, -8.58154296875, -8.2855224609375, -7.989501953125, -7.6934814453125, -7.3974609375, -7.1014404296875, -6.805419921875, -6.5093994140625, -6.21337890625, -5.9173583984375, -5.621337890625, -5.3253173828125, -5.029296875, -4.7332763671875, -4.437255859375, -4.1412353515625, -3.84521484375, -3.5491943359375, -3.253173828125, -2.9571533203125, -2.6611328125, -2.3651123046875, -2.069091796875, -1.7730712890625, -1.47705078125, -1.1810302734375, -0.885009765625, -0.5889892578125, -0.29296875, 0.0030517578125, 0.299072265625, 0.5950927734375, 0.89111328125, 1.1871337890625, 1.483154296875, 1.7791748046875, 2.0751953125, 2.3712158203125, 2.667236328125, 2.9632568359375, 3.25927734375, 3.5552978515625, 3.851318359375, 4.1473388671875, 4.443359375, 4.7393798828125, 5.035400390625, 5.3314208984375, 5.62744140625, 5.9234619140625, 6.219482421875, 6.5155029296875, 6.8115234375, 7.1075439453125, 7.403564453125, 7.6995849609375, 7.99560546875, 8.2916259765625, 8.587646484375, 8.8836669921875, 9.1796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 7.0, 5.0, 4.0, 10.0, 11.0, 6.0, 13.0, 19.0, 13.0, 18.0, 13.0, 24.0, 27.0, 32.0, 42.0, 39.0, 37.0, 48.0, 41.0, 49.0, 39.0, 42.0, 33.0, 39.0, 43.0, 41.0, 35.0, 30.0, 24.0, 39.0, 36.0, 24.0, 12.0, 17.0, 15.0, 18.0, 16.0, 3.0, 4.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.46875, -18.85986328125, -18.2509765625, -17.64208984375, -17.033203125, -16.42431640625, -15.8154296875, -15.20654296875, -14.59765625, -13.98876953125, -13.3798828125, -12.77099609375, -12.162109375, -11.55322265625, -10.9443359375, -10.33544921875, -9.7265625, -9.11767578125, -8.5087890625, -7.89990234375, -7.291015625, -6.68212890625, -6.0732421875, -5.46435546875, -4.85546875, -4.24658203125, -3.6376953125, -3.02880859375, -2.419921875, -1.81103515625, -1.2021484375, -0.59326171875, 0.015625, 0.62451171875, 1.2333984375, 1.84228515625, 2.451171875, 3.06005859375, 3.6689453125, 4.27783203125, 4.88671875, 5.49560546875, 6.1044921875, 6.71337890625, 7.322265625, 7.93115234375, 8.5400390625, 9.14892578125, 9.7578125, 10.36669921875, 10.9755859375, 11.58447265625, 12.193359375, 12.80224609375, 13.4111328125, 14.02001953125, 14.62890625, 15.23779296875, 15.8466796875, 16.45556640625, 17.064453125, 17.67333984375, 18.2822265625, 18.89111328125, 19.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 25.0, 34.0, 54.0, 80.0, 100.0, 185.0, 288.0, 504.0, 838.0, 1297.0, 2203.0, 3787.0, 6606.0, 11617.0, 19980.0, 34755.0, 57603.0, 93602.0, 139546.0, 174101.0, 168569.0, 126701.0, 83616.0, 50908.0, 29839.0, 17303.0, 9978.0, 5982.0, 3332.0, 2015.0, 1187.0, 719.0, 446.0, 245.0, 165.0, 107.0, 74.0, 49.0, 40.0, 20.0, 11.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.29071044921875, -4.1517333984375, -4.01275634765625, -3.873779296875, -3.73480224609375, -3.5958251953125, -3.45684814453125, -3.31787109375, -3.17889404296875, -3.0399169921875, -2.90093994140625, -2.761962890625, -2.62298583984375, -2.4840087890625, -2.34503173828125, -2.2060546875, -2.06707763671875, -1.9281005859375, -1.78912353515625, -1.650146484375, -1.51116943359375, -1.3721923828125, -1.23321533203125, -1.09423828125, -0.95526123046875, -0.8162841796875, -0.67730712890625, -0.538330078125, -0.39935302734375, -0.2603759765625, -0.12139892578125, 0.017578125, 0.15655517578125, 0.2955322265625, 0.43450927734375, 0.573486328125, 0.71246337890625, 0.8514404296875, 0.99041748046875, 1.12939453125, 1.26837158203125, 1.4073486328125, 1.54632568359375, 1.685302734375, 1.82427978515625, 1.9632568359375, 2.10223388671875, 2.2412109375, 2.38018798828125, 2.5191650390625, 2.65814208984375, 2.797119140625, 2.93609619140625, 3.0750732421875, 3.21405029296875, 3.35302734375, 3.49200439453125, 3.6309814453125, 3.76995849609375, 3.908935546875, 4.04791259765625, 4.1868896484375, 4.32586669921875, 4.46484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 7.0, 6.0, 14.0, 12.0, 15.0, 19.0, 15.0, 19.0, 16.0, 25.0, 32.0, 29.0, 42.0, 41.0, 50.0, 47.0, 58.0, 50.0, 45.0, 44.0, 45.0, 47.0, 45.0, 39.0, 38.0, 38.0, 25.0, 19.0, 17.0, 23.0, 18.0, 12.0, 10.0, 7.0, 9.0, 5.0, 5.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00028514862060546875, -0.0002774149179458618, -0.0002696812152862549, -0.00026194751262664795, -0.000254213809967041, -0.0002464801073074341, -0.00023874640464782715, -0.00023101270198822021, -0.00022327899932861328, -0.00021554529666900635, -0.00020781159400939941, -0.00020007789134979248, -0.00019234418869018555, -0.0001846104860305786, -0.00017687678337097168, -0.00016914308071136475, -0.0001614093780517578, -0.00015367567539215088, -0.00014594197273254395, -0.000138208270072937, -0.00013047456741333008, -0.00012274086475372314, -0.00011500716209411621, -0.00010727345943450928, -9.953975677490234e-05, -9.180605411529541e-05, -8.407235145568848e-05, -7.633864879608154e-05, -6.860494613647461e-05, -6.0871243476867676e-05, -5.313754081726074e-05, -4.540383815765381e-05, -3.7670135498046875e-05, -2.993643283843994e-05, -2.2202730178833008e-05, -1.4469027519226074e-05, -6.735324859619141e-06, 9.98377799987793e-07, 8.732080459594727e-06, 1.646578311920166e-05, 2.4199485778808594e-05, 3.193318843841553e-05, 3.966689109802246e-05, 4.7400593757629395e-05, 5.513429641723633e-05, 6.286799907684326e-05, 7.06017017364502e-05, 7.833540439605713e-05, 8.606910705566406e-05, 9.3802809715271e-05, 0.00010153651237487793, 0.00010927021503448486, 0.0001170039176940918, 0.00012473762035369873, 0.00013247132301330566, 0.0001402050256729126, 0.00014793872833251953, 0.00015567243099212646, 0.0001634061336517334, 0.00017113983631134033, 0.00017887353897094727, 0.0001866072416305542, 0.00019434094429016113, 0.00020207464694976807, 0.000209808349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 8.0, 15.0, 20.0, 42.0, 44.0, 67.0, 89.0, 157.0, 219.0, 357.0, 564.0, 756.0, 1299.0, 1931.0, 2881.0, 4486.0, 6820.0, 9907.0, 14869.0, 21441.0, 30608.0, 43147.0, 58303.0, 74589.0, 92083.0, 104036.0, 109370.0, 104684.0, 91804.0, 75513.0, 58169.0, 43214.0, 30981.0, 21474.0, 14814.0, 10074.0, 6729.0, 4371.0, 2972.0, 1981.0, 1264.0, 790.0, 567.0, 364.0, 220.0, 156.0, 115.0, 66.0, 56.0, 27.0, 19.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-3.703125, -3.589202880859375, -3.47528076171875, -3.361358642578125, -3.2474365234375, -3.133514404296875, -3.01959228515625, -2.905670166015625, -2.791748046875, -2.677825927734375, -2.56390380859375, -2.449981689453125, -2.3360595703125, -2.222137451171875, -2.10821533203125, -1.994293212890625, -1.88037109375, -1.766448974609375, -1.65252685546875, -1.538604736328125, -1.4246826171875, -1.310760498046875, -1.19683837890625, -1.082916259765625, -0.968994140625, -0.855072021484375, -0.74114990234375, -0.627227783203125, -0.5133056640625, -0.399383544921875, -0.28546142578125, -0.171539306640625, -0.0576171875, 0.056304931640625, 0.17022705078125, 0.284149169921875, 0.3980712890625, 0.511993408203125, 0.62591552734375, 0.739837646484375, 0.853759765625, 0.967681884765625, 1.08160400390625, 1.195526123046875, 1.3094482421875, 1.423370361328125, 1.53729248046875, 1.651214599609375, 1.76513671875, 1.879058837890625, 1.99298095703125, 2.106903076171875, 2.2208251953125, 2.334747314453125, 2.44866943359375, 2.562591552734375, 2.676513671875, 2.790435791015625, 2.90435791015625, 3.018280029296875, 3.1322021484375, 3.246124267578125, 3.36004638671875, 3.473968505859375, 3.587890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 7.0, 13.0, 8.0, 9.0, 10.0, 11.0, 20.0, 26.0, 24.0, 33.0, 29.0, 37.0, 40.0, 42.0, 44.0, 49.0, 57.0, 49.0, 40.0, 54.0, 47.0, 35.0, 50.0, 39.0, 41.0, 33.0, 20.0, 35.0, 16.0, 12.0, 14.0, 6.0, 7.0, 12.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.720489501953125, -1.65972900390625, -1.598968505859375, -1.5382080078125, -1.477447509765625, -1.41668701171875, -1.355926513671875, -1.295166015625, -1.234405517578125, -1.17364501953125, -1.112884521484375, -1.0521240234375, -0.991363525390625, -0.93060302734375, -0.869842529296875, -0.80908203125, -0.748321533203125, -0.68756103515625, -0.626800537109375, -0.5660400390625, -0.505279541015625, -0.44451904296875, -0.383758544921875, -0.322998046875, -0.262237548828125, -0.20147705078125, -0.140716552734375, -0.0799560546875, -0.019195556640625, 0.04156494140625, 0.102325439453125, 0.1630859375, 0.223846435546875, 0.28460693359375, 0.345367431640625, 0.4061279296875, 0.466888427734375, 0.52764892578125, 0.588409423828125, 0.649169921875, 0.709930419921875, 0.77069091796875, 0.831451416015625, 0.8922119140625, 0.952972412109375, 1.01373291015625, 1.074493408203125, 1.13525390625, 1.196014404296875, 1.25677490234375, 1.317535400390625, 1.3782958984375, 1.439056396484375, 1.49981689453125, 1.560577392578125, 1.621337890625, 1.682098388671875, 1.74285888671875, 1.803619384765625, 1.8643798828125, 1.925140380859375, 1.98590087890625, 2.046661376953125, 2.107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 7.0, 19.0, 22.0, 38.0, 44.0, 43.0, 36.0, 64.0, 48.0, 59.0, 50.0, 55.0, 64.0, 56.0, 53.0, 40.0, 34.0, 39.0, 36.0, 39.0, 18.0, 26.0, 20.0, 11.0, 7.0, 9.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.52968978881836, -33.39360809326172, -32.257530212402344, -31.121450424194336, -29.985370635986328, -28.84929084777832, -27.713211059570312, -26.577131271362305, -25.441051483154297, -24.30497169494629, -23.16889190673828, -22.032812118530273, -20.896732330322266, -19.760652542114258, -18.62457275390625, -17.488492965698242, -16.352413177490234, -15.216333389282227, -14.080253601074219, -12.944173812866211, -11.808094024658203, -10.672014236450195, -9.535934448242188, -8.39985466003418, -7.263774871826172, -6.127695083618164, -4.991615295410156, -3.8555355072021484, -2.7194557189941406, -1.5833759307861328, -0.447296142578125, 0.6887836456298828, 1.8248634338378906, 2.9609432220458984, 4.097023010253906, 5.233102798461914, 6.369182586669922, 7.50526237487793, 8.641342163085938, 9.777421951293945, 10.913501739501953, 12.049581527709961, 13.185661315917969, 14.321741104125977, 15.457820892333984, 16.593900680541992, 17.72998046875, 18.866060256958008, 20.002140045166016, 21.138219833374023, 22.27429962158203, 23.41037940979004, 24.546459197998047, 25.682538986206055, 26.818618774414062, 27.95469856262207, 29.090778350830078, 30.226858139038086, 31.362937927246094, 32.49901580810547, 33.63509750366211, 34.77117919921875, 35.907257080078125, 37.0433349609375, 38.17941665649414]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 12.0, 8.0, 11.0, 10.0, 13.0, 18.0, 18.0, 27.0, 33.0, 35.0, 40.0, 50.0, 41.0, 55.0, 54.0, 55.0, 58.0, 43.0, 37.0, 52.0, 33.0, 43.0, 32.0, 32.0, 35.0, 21.0, 26.0, 23.0, 24.0, 15.0, 12.0, 13.0, 3.0, 3.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3465576171875, -33.103755950927734, -31.86095428466797, -30.618152618408203, -29.375350952148438, -28.132549285888672, -26.88974952697754, -25.646947860717773, -24.404146194458008, -23.161344528198242, -21.918542861938477, -20.67574119567871, -19.432941436767578, -18.190139770507812, -16.947338104248047, -15.704536437988281, -14.461734771728516, -13.21893310546875, -11.976131439208984, -10.733330726623535, -9.49052906036377, -8.247727394104004, -7.0049262046813965, -5.762125015258789, -4.519323348999023, -3.276521921157837, -2.0337204933166504, -0.7909190654754639, 0.45188236236572266, 1.6946840286254883, 2.9374852180480957, 4.180286407470703, 5.423091888427734, 6.6658935546875, 7.908694744110107, 9.151495933532715, 10.39429759979248, 11.637099266052246, 12.879899978637695, 14.122701644897461, 15.365503311157227, 16.608304977416992, 17.851106643676758, 19.093908309936523, 20.336708068847656, 21.579509735107422, 22.822311401367188, 24.065113067626953, 25.30791473388672, 26.550716400146484, 27.79351806640625, 29.036319732666016, 30.27912139892578, 31.521923065185547, 32.76472473144531, 34.00752258300781, 35.250328063964844, 36.49312973022461, 37.735931396484375, 38.97873306274414, 40.221534729003906, 41.46433639526367, 42.70713806152344, 43.94993591308594, 45.1927375793457]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 12.0, 18.0, 30.0, 48.0, 66.0, 90.0, 135.0, 252.0, 406.0, 654.0, 1018.0, 1665.0, 2831.0, 4456.0, 7146.0, 11734.0, 18496.0, 28629.0, 42315.0, 59616.0, 79857.0, 98414.0, 112014.0, 117248.0, 111166.0, 97452.0, 77805.0, 58322.0, 41169.0, 27771.0, 17977.0, 11252.0, 7151.0, 4398.0, 2626.0, 1608.0, 1008.0, 645.0, 370.0, 238.0, 156.0, 99.0, 63.0, 31.0, 33.0, 20.0, 12.0, 15.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.03125, -14.537841796875, -14.04443359375, -13.551025390625, -13.0576171875, -12.564208984375, -12.07080078125, -11.577392578125, -11.083984375, -10.590576171875, -10.09716796875, -9.603759765625, -9.1103515625, -8.616943359375, -8.12353515625, -7.630126953125, -7.13671875, -6.643310546875, -6.14990234375, -5.656494140625, -5.1630859375, -4.669677734375, -4.17626953125, -3.682861328125, -3.189453125, -2.696044921875, -2.20263671875, -1.709228515625, -1.2158203125, -0.722412109375, -0.22900390625, 0.264404296875, 0.7578125, 1.251220703125, 1.74462890625, 2.238037109375, 2.7314453125, 3.224853515625, 3.71826171875, 4.211669921875, 4.705078125, 5.198486328125, 5.69189453125, 6.185302734375, 6.6787109375, 7.172119140625, 7.66552734375, 8.158935546875, 8.65234375, 9.145751953125, 9.63916015625, 10.132568359375, 10.6259765625, 11.119384765625, 11.61279296875, 12.106201171875, 12.599609375, 13.093017578125, 13.58642578125, 14.079833984375, 14.5732421875, 15.066650390625, 15.56005859375, 16.053466796875, 16.546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 8.0, 10.0, 11.0, 15.0, 15.0, 11.0, 20.0, 22.0, 28.0, 48.0, 43.0, 43.0, 49.0, 50.0, 38.0, 49.0, 36.0, 38.0, 45.0, 37.0, 44.0, 36.0, 35.0, 32.0, 30.0, 36.0, 15.0, 21.0, 27.0, 21.0, 10.0, 15.0, 10.0, 7.0, 4.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.5302734375, -32.373046875, -31.2158203125, -30.05859375, -28.9013671875, -27.744140625, -26.5869140625, -25.4296875, -24.2724609375, -23.115234375, -21.9580078125, -20.80078125, -19.6435546875, -18.486328125, -17.3291015625, -16.171875, -15.0146484375, -13.857421875, -12.7001953125, -11.54296875, -10.3857421875, -9.228515625, -8.0712890625, -6.9140625, -5.7568359375, -4.599609375, -3.4423828125, -2.28515625, -1.1279296875, 0.029296875, 1.1865234375, 2.34375, 3.5009765625, 4.658203125, 5.8154296875, 6.97265625, 8.1298828125, 9.287109375, 10.4443359375, 11.6015625, 12.7587890625, 13.916015625, 15.0732421875, 16.23046875, 17.3876953125, 18.544921875, 19.7021484375, 20.859375, 22.0166015625, 23.173828125, 24.3310546875, 25.48828125, 26.6455078125, 27.802734375, 28.9599609375, 30.1171875, 31.2744140625, 32.431640625, 33.5888671875, 34.74609375, 35.9033203125, 37.060546875, 38.2177734375, 39.375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 14.0, 17.0, 15.0, 29.0, 43.0, 63.0, 124.0, 199.0, 256.0, 447.0, 707.0, 1073.0, 1656.0, 2542.0, 4102.0, 6134.0, 9546.0, 14955.0, 22631.0, 33951.0, 48538.0, 66161.0, 85109.0, 102529.0, 112968.0, 114024.0, 104854.0, 88678.0, 69493.0, 51400.0, 36281.0, 24284.0, 16187.0, 10597.0, 6784.0, 4243.0, 2862.0, 1788.0, 1125.0, 739.0, 459.0, 320.0, 223.0, 147.0, 87.0, 63.0, 39.0, 25.0, 19.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.546875, -16.03125, -15.515625, -15.0, -14.484375, -13.96875, -13.453125, -12.9375, -12.421875, -11.90625, -11.390625, -10.875, -10.359375, -9.84375, -9.328125, -8.8125, -8.296875, -7.78125, -7.265625, -6.75, -6.234375, -5.71875, -5.203125, -4.6875, -4.171875, -3.65625, -3.140625, -2.625, -2.109375, -1.59375, -1.078125, -0.5625, -0.046875, 0.46875, 0.984375, 1.5, 2.015625, 2.53125, 3.046875, 3.5625, 4.078125, 4.59375, 5.109375, 5.625, 6.140625, 6.65625, 7.171875, 7.6875, 8.203125, 8.71875, 9.234375, 9.75, 10.265625, 10.78125, 11.296875, 11.8125, 12.328125, 12.84375, 13.359375, 13.875, 14.390625, 14.90625, 15.421875, 15.9375, 16.453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 6.0, 11.0, 11.0, 10.0, 15.0, 22.0, 20.0, 18.0, 21.0, 31.0, 31.0, 30.0, 31.0, 22.0, 50.0, 43.0, 38.0, 37.0, 39.0, 40.0, 43.0, 40.0, 34.0, 36.0, 36.0, 31.0, 34.0, 28.0, 33.0, 18.0, 13.0, 16.0, 15.0, 15.0, 10.0, 9.0, 10.0, 7.0, 7.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.4658203125, -19.791015625, -19.1162109375, -18.44140625, -17.7666015625, -17.091796875, -16.4169921875, -15.7421875, -15.0673828125, -14.392578125, -13.7177734375, -13.04296875, -12.3681640625, -11.693359375, -11.0185546875, -10.34375, -9.6689453125, -8.994140625, -8.3193359375, -7.64453125, -6.9697265625, -6.294921875, -5.6201171875, -4.9453125, -4.2705078125, -3.595703125, -2.9208984375, -2.24609375, -1.5712890625, -0.896484375, -0.2216796875, 0.453125, 1.1279296875, 1.802734375, 2.4775390625, 3.15234375, 3.8271484375, 4.501953125, 5.1767578125, 5.8515625, 6.5263671875, 7.201171875, 7.8759765625, 8.55078125, 9.2255859375, 9.900390625, 10.5751953125, 11.25, 11.9248046875, 12.599609375, 13.2744140625, 13.94921875, 14.6240234375, 15.298828125, 15.9736328125, 16.6484375, 17.3232421875, 17.998046875, 18.6728515625, 19.34765625, 20.0224609375, 20.697265625, 21.3720703125, 22.046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 10.0, 2.0, 11.0, 13.0, 23.0, 32.0, 46.0, 87.0, 141.0, 195.0, 365.0, 666.0, 1079.0, 1972.0, 3456.0, 6194.0, 11210.0, 19711.0, 34952.0, 57210.0, 88300.0, 122387.0, 147706.0, 152725.0, 133437.0, 101158.0, 68218.0, 41749.0, 24152.0, 13847.0, 7666.0, 4269.0, 2410.0, 1308.0, 747.0, 416.0, 272.0, 162.0, 93.0, 73.0, 38.0, 24.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.90283203125, -8.5869140625, -8.27099609375, -7.955078125, -7.63916015625, -7.3232421875, -7.00732421875, -6.69140625, -6.37548828125, -6.0595703125, -5.74365234375, -5.427734375, -5.11181640625, -4.7958984375, -4.47998046875, -4.1640625, -3.84814453125, -3.5322265625, -3.21630859375, -2.900390625, -2.58447265625, -2.2685546875, -1.95263671875, -1.63671875, -1.32080078125, -1.0048828125, -0.68896484375, -0.373046875, -0.05712890625, 0.2587890625, 0.57470703125, 0.890625, 1.20654296875, 1.5224609375, 1.83837890625, 2.154296875, 2.47021484375, 2.7861328125, 3.10205078125, 3.41796875, 3.73388671875, 4.0498046875, 4.36572265625, 4.681640625, 4.99755859375, 5.3134765625, 5.62939453125, 5.9453125, 6.26123046875, 6.5771484375, 6.89306640625, 7.208984375, 7.52490234375, 7.8408203125, 8.15673828125, 8.47265625, 8.78857421875, 9.1044921875, 9.42041015625, 9.736328125, 10.05224609375, 10.3681640625, 10.68408203125, 11.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 10.0, 13.0, 14.0, 17.0, 21.0, 21.0, 27.0, 27.0, 37.0, 37.0, 50.0, 46.0, 60.0, 59.0, 53.0, 65.0, 63.0, 55.0, 51.0, 43.0, 40.0, 40.0, 27.0, 26.0, 19.0, 11.0, 10.0, 17.0, 6.0, 6.0, 3.0, 0.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000888824462890625, -0.000855565071105957, -0.0008223056793212891, -0.0007890462875366211, -0.0007557868957519531, -0.0007225275039672852, -0.0006892681121826172, -0.0006560087203979492, -0.0006227493286132812, -0.0005894899368286133, -0.0005562305450439453, -0.0005229711532592773, -0.0004897117614746094, -0.0004564523696899414, -0.00042319297790527344, -0.00038993358612060547, -0.0003566741943359375, -0.00032341480255126953, -0.00029015541076660156, -0.0002568960189819336, -0.00022363662719726562, -0.00019037723541259766, -0.0001571178436279297, -0.00012385845184326172, -9.059906005859375e-05, -5.733966827392578e-05, -2.4080276489257812e-05, 9.179115295410156e-06, 4.2438507080078125e-05, 7.56978988647461e-05, 0.00010895729064941406, 0.00014221668243408203, 0.00017547607421875, 0.00020873546600341797, 0.00024199485778808594, 0.0002752542495727539, 0.0003085136413574219, 0.00034177303314208984, 0.0003750324249267578, 0.0004082918167114258, 0.00044155120849609375, 0.0004748106002807617, 0.0005080699920654297, 0.0005413293838500977, 0.0005745887756347656, 0.0006078481674194336, 0.0006411075592041016, 0.0006743669509887695, 0.0007076263427734375, 0.0007408857345581055, 0.0007741451263427734, 0.0008074045181274414, 0.0008406639099121094, 0.0008739233016967773, 0.0009071826934814453, 0.0009404420852661133, 0.0009737014770507812, 0.0010069608688354492, 0.0010402202606201172, 0.0010734796524047852, 0.0011067390441894531, 0.001139998435974121, 0.001173257827758789, 0.001206517219543457, 0.001239776611328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 16.0, 11.0, 23.0, 36.0, 39.0, 85.0, 116.0, 201.0, 310.0, 424.0, 688.0, 1049.0, 1735.0, 2674.0, 4234.0, 6888.0, 11120.0, 18093.0, 28202.0, 43413.0, 64689.0, 89271.0, 113665.0, 128876.0, 130095.0, 115574.0, 92367.0, 67716.0, 45991.0, 29863.0, 19203.0, 12039.0, 7413.0, 4436.0, 2806.0, 1844.0, 1158.0, 740.0, 493.0, 298.0, 228.0, 149.0, 89.0, 72.0, 35.0, 28.0, 15.0, 9.0, 12.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-9.5625, -9.2733154296875, -8.984130859375, -8.6949462890625, -8.40576171875, -8.1165771484375, -7.827392578125, -7.5382080078125, -7.2490234375, -6.9598388671875, -6.670654296875, -6.3814697265625, -6.09228515625, -5.8031005859375, -5.513916015625, -5.2247314453125, -4.935546875, -4.6463623046875, -4.357177734375, -4.0679931640625, -3.77880859375, -3.4896240234375, -3.200439453125, -2.9112548828125, -2.6220703125, -2.3328857421875, -2.043701171875, -1.7545166015625, -1.46533203125, -1.1761474609375, -0.886962890625, -0.5977783203125, -0.30859375, -0.0194091796875, 0.269775390625, 0.5589599609375, 0.84814453125, 1.1373291015625, 1.426513671875, 1.7156982421875, 2.0048828125, 2.2940673828125, 2.583251953125, 2.8724365234375, 3.16162109375, 3.4508056640625, 3.739990234375, 4.0291748046875, 4.318359375, 4.6075439453125, 4.896728515625, 5.1859130859375, 5.47509765625, 5.7642822265625, 6.053466796875, 6.3426513671875, 6.6318359375, 6.9210205078125, 7.210205078125, 7.4993896484375, 7.78857421875, 8.0777587890625, 8.366943359375, 8.6561279296875, 8.9453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 10.0, 7.0, 14.0, 11.0, 13.0, 15.0, 28.0, 39.0, 42.0, 38.0, 51.0, 60.0, 53.0, 65.0, 62.0, 70.0, 64.0, 45.0, 58.0, 47.0, 47.0, 34.0, 22.0, 18.0, 21.0, 22.0, 10.0, 5.0, 9.0, 7.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0], "bins": [-6.64453125, -6.48004150390625, -6.3155517578125, -6.15106201171875, -5.986572265625, -5.82208251953125, -5.6575927734375, -5.49310302734375, -5.32861328125, -5.16412353515625, -4.9996337890625, -4.83514404296875, -4.670654296875, -4.50616455078125, -4.3416748046875, -4.17718505859375, -4.0126953125, -3.84820556640625, -3.6837158203125, -3.51922607421875, -3.354736328125, -3.19024658203125, -3.0257568359375, -2.86126708984375, -2.69677734375, -2.53228759765625, -2.3677978515625, -2.20330810546875, -2.038818359375, -1.87432861328125, -1.7098388671875, -1.54534912109375, -1.380859375, -1.21636962890625, -1.0518798828125, -0.88739013671875, -0.722900390625, -0.55841064453125, -0.3939208984375, -0.22943115234375, -0.06494140625, 0.09954833984375, 0.2640380859375, 0.42852783203125, 0.593017578125, 0.75750732421875, 0.9219970703125, 1.08648681640625, 1.2509765625, 1.41546630859375, 1.5799560546875, 1.74444580078125, 1.908935546875, 2.07342529296875, 2.2379150390625, 2.40240478515625, 2.56689453125, 2.73138427734375, 2.8958740234375, 3.06036376953125, 3.224853515625, 3.38934326171875, 3.5538330078125, 3.71832275390625, 3.8828125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 4.0, 3.0, 4.0, 5.0, 11.0, 11.0, 11.0, 15.0, 20.0, 15.0, 49.0, 37.0, 47.0, 57.0, 54.0, 58.0, 46.0, 61.0, 57.0, 52.0, 62.0, 44.0, 42.0, 38.0, 43.0, 31.0, 29.0, 31.0, 10.0, 13.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.94009017944336, -31.797508239746094, -30.654924392700195, -29.51234245300293, -28.36975860595703, -27.227176666259766, -26.0845947265625, -24.9420108795166, -23.799427032470703, -22.656845092773438, -21.51426124572754, -20.371679306030273, -19.229095458984375, -18.08651351928711, -16.943931579589844, -15.801347732543945, -14.65876579284668, -13.516182899475098, -12.373600006103516, -11.23101806640625, -10.088434219360352, -8.945852279663086, -7.803269386291504, -6.660686492919922, -5.51810359954834, -4.375520706176758, -3.232938051223755, -2.090355396270752, -0.9477725028991699, 0.1948103904724121, 1.337392807006836, 2.479975700378418, 3.62255859375, 4.765141487121582, 5.907724380493164, 7.050306797027588, 8.192890167236328, 9.335472106933594, 10.478055000305176, 11.620637893676758, 12.76322078704834, 13.905803680419922, 15.048386573791504, 16.190969467163086, 17.33355140686035, 18.47613525390625, 19.618717193603516, 20.76129913330078, 21.90388298034668, 23.046464920043945, 24.189048767089844, 25.33163070678711, 26.474214553833008, 27.616796493530273, 28.759380340576172, 29.901962280273438, 31.044544219970703, 32.18712615966797, 33.329708099365234, 34.472293853759766, 35.61487579345703, 36.7574577331543, 37.90003967285156, 39.042625427246094, 40.18520736694336]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 13.0, 15.0, 21.0, 21.0, 28.0, 34.0, 37.0, 44.0, 42.0, 56.0, 59.0, 60.0, 47.0, 73.0, 49.0, 52.0, 50.0, 35.0, 41.0, 27.0, 16.0, 37.0, 26.0, 25.0, 15.0, 15.0, 9.0, 7.0, 6.0, 7.0, 1.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.05831527709961, -48.4994010925293, -46.94048309326172, -45.381568908691406, -43.82265090942383, -42.263736724853516, -40.70481872558594, -39.145904541015625, -37.58699035644531, -36.028076171875, -34.46915817260742, -32.91024398803711, -31.35132598876953, -29.79241180419922, -28.233495712280273, -26.674579620361328, -25.11566162109375, -23.556745529174805, -21.99782943725586, -20.438915252685547, -18.87999725341797, -17.321083068847656, -15.762166976928711, -14.203250885009766, -12.64433479309082, -11.085418701171875, -9.52650260925293, -7.967587471008301, -6.4086713790893555, -4.84975528717041, -3.2908401489257812, -1.731924057006836, -0.173004150390625, 1.3859117031097412, 2.9448275566101074, 4.5037431716918945, 6.06265926361084, 7.621575355529785, 9.180490493774414, 10.73940658569336, 12.298322677612305, 13.85723876953125, 15.416154861450195, 16.97507095336914, 18.533985137939453, 20.09290313720703, 21.651817321777344, 23.21073341369629, 24.769649505615234, 26.32856559753418, 27.887481689453125, 29.446395874023438, 31.005313873291016, 32.56422805786133, 34.123146057128906, 35.68206024169922, 37.24097442626953, 38.799888610839844, 40.35880661010742, 41.917720794677734, 43.47663879394531, 45.035552978515625, 46.59446716308594, 48.153385162353516, 49.712303161621094]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 18.0, 17.0, 30.0, 46.0, 72.0, 121.0, 227.0, 341.0, 547.0, 922.0, 1571.0, 2795.0, 4870.0, 8688.0, 15593.0, 27452.0, 49519.0, 88699.0, 155416.0, 258335.0, 400011.0, 549270.0, 641133.0, 620428.0, 501551.0, 350854.0, 220338.0, 129351.0, 73118.0, 40687.0, 22643.0, 12751.0, 7219.0, 4053.0, 2312.0, 1310.0, 806.0, 464.0, 278.0, 167.0, 103.0, 57.0, 36.0, 30.0, 9.0, 7.0, 12.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.81298828125, -32.7509765625, -31.68896484375, -30.626953125, -29.56494140625, -28.5029296875, -27.44091796875, -26.37890625, -25.31689453125, -24.2548828125, -23.19287109375, -22.130859375, -21.06884765625, -20.0068359375, -18.94482421875, -17.8828125, -16.82080078125, -15.7587890625, -14.69677734375, -13.634765625, -12.57275390625, -11.5107421875, -10.44873046875, -9.38671875, -8.32470703125, -7.2626953125, -6.20068359375, -5.138671875, -4.07666015625, -3.0146484375, -1.95263671875, -0.890625, 0.17138671875, 1.2333984375, 2.29541015625, 3.357421875, 4.41943359375, 5.4814453125, 6.54345703125, 7.60546875, 8.66748046875, 9.7294921875, 10.79150390625, 11.853515625, 12.91552734375, 13.9775390625, 15.03955078125, 16.1015625, 17.16357421875, 18.2255859375, 19.28759765625, 20.349609375, 21.41162109375, 22.4736328125, 23.53564453125, 24.59765625, 25.65966796875, 26.7216796875, 27.78369140625, 28.845703125, 29.90771484375, 30.9697265625, 32.03173828125, 33.09375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 10.0, 6.0, 21.0, 20.0, 17.0, 25.0, 31.0, 45.0, 29.0, 48.0, 64.0, 44.0, 55.0, 62.0, 55.0, 56.0, 52.0, 63.0, 36.0, 42.0, 28.0, 32.0, 28.0, 23.0, 23.0, 12.0, 8.0, 14.0, 15.0, 6.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.03125, -45.57470703125, -44.1181640625, -42.66162109375, -41.205078125, -39.74853515625, -38.2919921875, -36.83544921875, -35.37890625, -33.92236328125, -32.4658203125, -31.00927734375, -29.552734375, -28.09619140625, -26.6396484375, -25.18310546875, -23.7265625, -22.27001953125, -20.8134765625, -19.35693359375, -17.900390625, -16.44384765625, -14.9873046875, -13.53076171875, -12.07421875, -10.61767578125, -9.1611328125, -7.70458984375, -6.248046875, -4.79150390625, -3.3349609375, -1.87841796875, -0.421875, 1.03466796875, 2.4912109375, 3.94775390625, 5.404296875, 6.86083984375, 8.3173828125, 9.77392578125, 11.23046875, 12.68701171875, 14.1435546875, 15.60009765625, 17.056640625, 18.51318359375, 19.9697265625, 21.42626953125, 22.8828125, 24.33935546875, 25.7958984375, 27.25244140625, 28.708984375, 30.16552734375, 31.6220703125, 33.07861328125, 34.53515625, 35.99169921875, 37.4482421875, 38.90478515625, 40.361328125, 41.81787109375, 43.2744140625, 44.73095703125, 46.1875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 12.0, 19.0, 35.0, 58.0, 79.0, 136.0, 243.0, 407.0, 795.0, 1330.0, 2466.0, 4420.0, 8003.0, 15068.0, 27536.0, 51110.0, 92518.0, 161927.0, 268590.0, 409556.0, 550052.0, 631987.0, 610142.0, 496639.0, 349306.0, 221494.0, 130474.0, 73004.0, 39752.0, 21510.0, 11801.0, 6180.0, 3328.0, 1804.0, 1062.0, 578.0, 328.0, 233.0, 107.0, 70.0, 43.0, 19.0, 26.0, 12.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.53125, -42.2802734375, -41.029296875, -39.7783203125, -38.52734375, -37.2763671875, -36.025390625, -34.7744140625, -33.5234375, -32.2724609375, -31.021484375, -29.7705078125, -28.51953125, -27.2685546875, -26.017578125, -24.7666015625, -23.515625, -22.2646484375, -21.013671875, -19.7626953125, -18.51171875, -17.2607421875, -16.009765625, -14.7587890625, -13.5078125, -12.2568359375, -11.005859375, -9.7548828125, -8.50390625, -7.2529296875, -6.001953125, -4.7509765625, -3.5, -2.2490234375, -0.998046875, 0.2529296875, 1.50390625, 2.7548828125, 4.005859375, 5.2568359375, 6.5078125, 7.7587890625, 9.009765625, 10.2607421875, 11.51171875, 12.7626953125, 14.013671875, 15.2646484375, 16.515625, 17.7666015625, 19.017578125, 20.2685546875, 21.51953125, 22.7705078125, 24.021484375, 25.2724609375, 26.5234375, 27.7744140625, 29.025390625, 30.2763671875, 31.52734375, 32.7783203125, 34.029296875, 35.2802734375, 36.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 11.0, 5.0, 9.0, 8.0, 14.0, 6.0, 15.0, 13.0, 21.0, 33.0, 32.0, 41.0, 50.0, 52.0, 88.0, 91.0, 97.0, 111.0, 130.0, 167.0, 173.0, 156.0, 184.0, 192.0, 208.0, 216.0, 203.0, 203.0, 187.0, 185.0, 165.0, 154.0, 147.0, 123.0, 113.0, 89.0, 73.0, 58.0, 53.0, 51.0, 33.0, 34.0, 27.0, 17.0, 11.0, 7.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.60546875, -15.0703125, -14.53515625, -14.0, -13.46484375, -12.9296875, -12.39453125, -11.859375, -11.32421875, -10.7890625, -10.25390625, -9.71875, -9.18359375, -8.6484375, -8.11328125, -7.578125, -7.04296875, -6.5078125, -5.97265625, -5.4375, -4.90234375, -4.3671875, -3.83203125, -3.296875, -2.76171875, -2.2265625, -1.69140625, -1.15625, -0.62109375, -0.0859375, 0.44921875, 0.984375, 1.51953125, 2.0546875, 2.58984375, 3.125, 3.66015625, 4.1953125, 4.73046875, 5.265625, 5.80078125, 6.3359375, 6.87109375, 7.40625, 7.94140625, 8.4765625, 9.01171875, 9.546875, 10.08203125, 10.6171875, 11.15234375, 11.6875, 12.22265625, 12.7578125, 13.29296875, 13.828125, 14.36328125, 14.8984375, 15.43359375, 15.96875, 16.50390625, 17.0390625, 17.57421875, 18.109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 10.0, 10.0, 14.0, 15.0, 22.0, 19.0, 31.0, 35.0, 44.0, 38.0, 47.0, 46.0, 53.0, 63.0, 62.0, 69.0, 59.0, 55.0, 49.0, 34.0, 28.0, 37.0, 27.0, 23.0, 20.0, 17.0, 10.0, 14.0, 10.0, 9.0, 4.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.68342971801758, -50.09819412231445, -48.51295471191406, -46.92771911621094, -45.34248352050781, -43.75724411010742, -42.1720085144043, -40.586769104003906, -39.00153350830078, -37.416297912597656, -35.831058502197266, -34.24582290649414, -32.66058349609375, -31.075347900390625, -29.4901123046875, -27.904874801635742, -26.319637298583984, -24.734399795532227, -23.14916229248047, -21.563926696777344, -19.978689193725586, -18.393451690673828, -16.808216094970703, -15.222978591918945, -13.637741088867188, -12.05250358581543, -10.467267036437988, -8.882030487060547, -7.296792984008789, -5.7115559577941895, -4.12631893157959, -2.5410823822021484, -0.955841064453125, 0.6293959617614746, 2.214632987976074, 3.799870014190674, 5.385107040405273, 6.970344066619873, 8.555581092834473, 10.140817642211914, 11.726055145263672, 13.31129264831543, 14.896529197692871, 16.481765747070312, 18.06700325012207, 19.652240753173828, 21.237476348876953, 22.82271385192871, 24.40795135498047, 25.993188858032227, 27.578426361083984, 29.16366195678711, 30.748899459838867, 32.334136962890625, 33.91937255859375, 35.504608154296875, 37.089847564697266, 38.67508316040039, 40.26032257080078, 41.845558166503906, 43.43079376220703, 45.01603317260742, 46.60126876831055, 48.18650817871094, 49.77174377441406]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 3.0, 9.0, 6.0, 3.0, 13.0, 16.0, 21.0, 19.0, 16.0, 32.0, 30.0, 27.0, 21.0, 31.0, 42.0, 45.0, 42.0, 47.0, 43.0, 38.0, 38.0, 38.0, 43.0, 30.0, 22.0, 35.0, 40.0, 30.0, 32.0, 23.0, 27.0, 34.0, 8.0, 13.0, 19.0, 14.0, 10.0, 7.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-55.67958450317383, -53.94290542602539, -52.20622253417969, -50.46954345703125, -48.73286437988281, -46.996185302734375, -45.25950241088867, -43.522823333740234, -41.78614044189453, -40.049461364746094, -38.31277847290039, -36.57609939575195, -34.839420318603516, -33.10273742675781, -31.366058349609375, -29.629379272460938, -27.8927001953125, -26.15601921081543, -24.419340133666992, -22.682659149169922, -20.945980072021484, -19.209299087524414, -17.472618103027344, -15.73593807220459, -13.999258041381836, -12.262578010559082, -10.525897979736328, -8.789216995239258, -7.052536964416504, -5.31585693359375, -3.5791759490966797, -1.8424959182739258, -0.10581207275390625, 1.6308681964874268, 3.3675484657287598, 5.104228973388672, 6.840909004211426, 8.57758903503418, 10.31427001953125, 12.050950050354004, 13.787630081176758, 15.524310111999512, 17.260990142822266, 18.997671127319336, 20.734352111816406, 22.471031188964844, 24.207712173461914, 25.944393157958984, 27.681072235107422, 29.417753219604492, 31.15443229675293, 32.89111328125, 34.62779235839844, 36.364471435546875, 38.10115432739258, 39.837833404541016, 41.57451629638672, 43.311195373535156, 45.04787826538086, 46.7845573425293, 48.521236419677734, 50.25791931152344, 51.994598388671875, 53.73127746582031, 55.46795654296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 2.0, 13.0, 14.0, 12.0, 28.0, 46.0, 46.0, 61.0, 107.0, 141.0, 206.0, 349.0, 500.0, 833.0, 1283.0, 2045.0, 3273.0, 5157.0, 8415.0, 13729.0, 21914.0, 34654.0, 54487.0, 79892.0, 109445.0, 133399.0, 142959.0, 129049.0, 101980.0, 72945.0, 48525.0, 30994.0, 19613.0, 12053.0, 7657.0, 4649.0, 2923.0, 1829.0, 1165.0, 769.0, 486.0, 329.0, 186.0, 122.0, 89.0, 59.0, 32.0, 29.0, 25.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.71875, -12.300048828125, -11.88134765625, -11.462646484375, -11.0439453125, -10.625244140625, -10.20654296875, -9.787841796875, -9.369140625, -8.950439453125, -8.53173828125, -8.113037109375, -7.6943359375, -7.275634765625, -6.85693359375, -6.438232421875, -6.01953125, -5.600830078125, -5.18212890625, -4.763427734375, -4.3447265625, -3.926025390625, -3.50732421875, -3.088623046875, -2.669921875, -2.251220703125, -1.83251953125, -1.413818359375, -0.9951171875, -0.576416015625, -0.15771484375, 0.260986328125, 0.6796875, 1.098388671875, 1.51708984375, 1.935791015625, 2.3544921875, 2.773193359375, 3.19189453125, 3.610595703125, 4.029296875, 4.447998046875, 4.86669921875, 5.285400390625, 5.7041015625, 6.122802734375, 6.54150390625, 6.960205078125, 7.37890625, 7.797607421875, 8.21630859375, 8.635009765625, 9.0537109375, 9.472412109375, 9.89111328125, 10.309814453125, 10.728515625, 11.147216796875, 11.56591796875, 11.984619140625, 12.4033203125, 12.822021484375, 13.24072265625, 13.659423828125, 14.078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 9.0, 10.0, 12.0, 12.0, 13.0, 14.0, 31.0, 31.0, 29.0, 29.0, 30.0, 47.0, 37.0, 39.0, 37.0, 46.0, 38.0, 53.0, 38.0, 42.0, 30.0, 33.0, 31.0, 33.0, 26.0, 26.0, 28.0, 33.0, 29.0, 21.0, 17.0, 15.0, 9.0, 12.0, 6.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-57.0625, -55.30322265625, -53.5439453125, -51.78466796875, -50.025390625, -48.26611328125, -46.5068359375, -44.74755859375, -42.98828125, -41.22900390625, -39.4697265625, -37.71044921875, -35.951171875, -34.19189453125, -32.4326171875, -30.67333984375, -28.9140625, -27.15478515625, -25.3955078125, -23.63623046875, -21.876953125, -20.11767578125, -18.3583984375, -16.59912109375, -14.83984375, -13.08056640625, -11.3212890625, -9.56201171875, -7.802734375, -6.04345703125, -4.2841796875, -2.52490234375, -0.765625, 0.99365234375, 2.7529296875, 4.51220703125, 6.271484375, 8.03076171875, 9.7900390625, 11.54931640625, 13.30859375, 15.06787109375, 16.8271484375, 18.58642578125, 20.345703125, 22.10498046875, 23.8642578125, 25.62353515625, 27.3828125, 29.14208984375, 30.9013671875, 32.66064453125, 34.419921875, 36.17919921875, 37.9384765625, 39.69775390625, 41.45703125, 43.21630859375, 44.9755859375, 46.73486328125, 48.494140625, 50.25341796875, 52.0126953125, 53.77197265625, 55.53125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 10.0, 19.0, 25.0, 30.0, 41.0, 60.0, 106.0, 143.0, 209.0, 362.0, 539.0, 760.0, 1230.0, 1975.0, 2883.0, 4648.0, 7382.0, 11724.0, 19272.0, 30639.0, 49092.0, 76731.0, 112030.0, 146614.0, 158208.0, 138167.0, 102087.0, 68465.0, 42989.0, 26723.0, 16784.0, 10536.0, 6498.0, 3982.0, 2712.0, 1665.0, 1114.0, 701.0, 453.0, 310.0, 210.0, 123.0, 101.0, 60.0, 44.0, 27.0, 16.0, 9.0, 7.0, 9.0, 6.0, 0.0, 4.0, 5.0, 0.0, 4.0], "bins": [-15.3984375, -14.9227294921875, -14.447021484375, -13.9713134765625, -13.49560546875, -13.0198974609375, -12.544189453125, -12.0684814453125, -11.5927734375, -11.1170654296875, -10.641357421875, -10.1656494140625, -9.68994140625, -9.2142333984375, -8.738525390625, -8.2628173828125, -7.787109375, -7.3114013671875, -6.835693359375, -6.3599853515625, -5.88427734375, -5.4085693359375, -4.932861328125, -4.4571533203125, -3.9814453125, -3.5057373046875, -3.030029296875, -2.5543212890625, -2.07861328125, -1.6029052734375, -1.127197265625, -0.6514892578125, -0.17578125, 0.2999267578125, 0.775634765625, 1.2513427734375, 1.72705078125, 2.2027587890625, 2.678466796875, 3.1541748046875, 3.6298828125, 4.1055908203125, 4.581298828125, 5.0570068359375, 5.53271484375, 6.0084228515625, 6.484130859375, 6.9598388671875, 7.435546875, 7.9112548828125, 8.386962890625, 8.8626708984375, 9.33837890625, 9.8140869140625, 10.289794921875, 10.7655029296875, 11.2412109375, 11.7169189453125, 12.192626953125, 12.6683349609375, 13.14404296875, 13.6197509765625, 14.095458984375, 14.5711669921875, 15.046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 9.0, 6.0, 17.0, 9.0, 19.0, 35.0, 18.0, 21.0, 38.0, 28.0, 29.0, 51.0, 42.0, 47.0, 63.0, 46.0, 47.0, 37.0, 46.0, 47.0, 46.0, 33.0, 41.0, 38.0, 32.0, 24.0, 17.0, 18.0, 16.0, 9.0, 17.0, 15.0, 8.0, 9.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.8125, -28.76220703125, -27.7119140625, -26.66162109375, -25.611328125, -24.56103515625, -23.5107421875, -22.46044921875, -21.41015625, -20.35986328125, -19.3095703125, -18.25927734375, -17.208984375, -16.15869140625, -15.1083984375, -14.05810546875, -13.0078125, -11.95751953125, -10.9072265625, -9.85693359375, -8.806640625, -7.75634765625, -6.7060546875, -5.65576171875, -4.60546875, -3.55517578125, -2.5048828125, -1.45458984375, -0.404296875, 0.64599609375, 1.6962890625, 2.74658203125, 3.796875, 4.84716796875, 5.8974609375, 6.94775390625, 7.998046875, 9.04833984375, 10.0986328125, 11.14892578125, 12.19921875, 13.24951171875, 14.2998046875, 15.35009765625, 16.400390625, 17.45068359375, 18.5009765625, 19.55126953125, 20.6015625, 21.65185546875, 22.7021484375, 23.75244140625, 24.802734375, 25.85302734375, 26.9033203125, 27.95361328125, 29.00390625, 30.05419921875, 31.1044921875, 32.15478515625, 33.205078125, 34.25537109375, 35.3056640625, 36.35595703125, 37.40625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 15.0, 13.0, 17.0, 34.0, 51.0, 80.0, 90.0, 157.0, 211.0, 359.0, 543.0, 831.0, 1296.0, 2078.0, 3180.0, 5166.0, 8168.0, 13035.0, 21084.0, 32819.0, 51255.0, 77714.0, 111632.0, 143928.0, 153151.0, 133768.0, 99796.0, 67922.0, 44230.0, 28325.0, 17635.0, 11025.0, 6778.0, 4383.0, 2821.0, 1711.0, 1090.0, 749.0, 493.0, 311.0, 181.0, 145.0, 97.0, 55.0, 38.0, 30.0, 20.0, 12.0, 7.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0], "bins": [-5.6484375, -5.4681396484375, -5.287841796875, -5.1075439453125, -4.92724609375, -4.7469482421875, -4.566650390625, -4.3863525390625, -4.2060546875, -4.0257568359375, -3.845458984375, -3.6651611328125, -3.48486328125, -3.3045654296875, -3.124267578125, -2.9439697265625, -2.763671875, -2.5833740234375, -2.403076171875, -2.2227783203125, -2.04248046875, -1.8621826171875, -1.681884765625, -1.5015869140625, -1.3212890625, -1.1409912109375, -0.960693359375, -0.7803955078125, -0.60009765625, -0.4197998046875, -0.239501953125, -0.0592041015625, 0.12109375, 0.3013916015625, 0.481689453125, 0.6619873046875, 0.84228515625, 1.0225830078125, 1.202880859375, 1.3831787109375, 1.5634765625, 1.7437744140625, 1.924072265625, 2.1043701171875, 2.28466796875, 2.4649658203125, 2.645263671875, 2.8255615234375, 3.005859375, 3.1861572265625, 3.366455078125, 3.5467529296875, 3.72705078125, 3.9073486328125, 4.087646484375, 4.2679443359375, 4.4482421875, 4.6285400390625, 4.808837890625, 4.9891357421875, 5.16943359375, 5.3497314453125, 5.530029296875, 5.7103271484375, 5.890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 4.0, 7.0, 14.0, 15.0, 22.0, 26.0, 28.0, 22.0, 21.0, 42.0, 51.0, 36.0, 59.0, 57.0, 43.0, 57.0, 46.0, 46.0, 49.0, 40.0, 37.0, 39.0, 33.0, 41.0, 35.0, 29.0, 23.0, 16.0, 10.0, 10.0, 7.0, 11.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036144256591796875, -0.0003485381603240967, -0.0003356337547302246, -0.00032272934913635254, -0.00030982494354248047, -0.0002969205379486084, -0.00028401613235473633, -0.00027111172676086426, -0.0002582073211669922, -0.0002453029155731201, -0.00023239850997924805, -0.00021949410438537598, -0.0002065896987915039, -0.00019368529319763184, -0.00018078088760375977, -0.0001678764820098877, -0.00015497207641601562, -0.00014206767082214355, -0.00012916326522827148, -0.00011625885963439941, -0.00010335445404052734, -9.045004844665527e-05, -7.75456428527832e-05, -6.464123725891113e-05, -5.173683166503906e-05, -3.883242607116699e-05, -2.5928020477294922e-05, -1.3023614883422852e-05, -1.1920928955078125e-07, 1.2785196304321289e-05, 2.568960189819336e-05, 3.859400749206543e-05, 5.14984130859375e-05, 6.440281867980957e-05, 7.730722427368164e-05, 9.021162986755371e-05, 0.00010311603546142578, 0.00011602044105529785, 0.00012892484664916992, 0.000141829252243042, 0.00015473365783691406, 0.00016763806343078613, 0.0001805424690246582, 0.00019344687461853027, 0.00020635128021240234, 0.00021925568580627441, 0.00023216009140014648, 0.00024506449699401855, 0.0002579689025878906, 0.0002708733081817627, 0.00028377771377563477, 0.00029668211936950684, 0.0003095865249633789, 0.000322490930557251, 0.00033539533615112305, 0.0003482997417449951, 0.0003612041473388672, 0.00037410855293273926, 0.00038701295852661133, 0.0003999173641204834, 0.00041282176971435547, 0.00042572617530822754, 0.0004386305809020996, 0.0004515349864959717, 0.00046443939208984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 3.0, 6.0, 10.0, 15.0, 27.0, 29.0, 55.0, 51.0, 95.0, 123.0, 166.0, 268.0, 387.0, 606.0, 865.0, 1329.0, 1890.0, 2902.0, 4400.0, 6715.0, 10033.0, 15325.0, 23453.0, 34838.0, 51409.0, 73350.0, 97299.0, 118036.0, 128454.0, 123092.0, 103452.0, 79164.0, 56327.0, 38417.0, 25763.0, 16997.0, 11130.0, 7435.0, 4876.0, 3224.0, 2094.0, 1441.0, 994.0, 625.0, 440.0, 318.0, 189.0, 148.0, 102.0, 59.0, 43.0, 24.0, 26.0, 13.0, 13.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.40625, -6.20367431640625, -6.0010986328125, -5.79852294921875, -5.595947265625, -5.39337158203125, -5.1907958984375, -4.98822021484375, -4.78564453125, -4.58306884765625, -4.3804931640625, -4.17791748046875, -3.975341796875, -3.77276611328125, -3.5701904296875, -3.36761474609375, -3.1650390625, -2.96246337890625, -2.7598876953125, -2.55731201171875, -2.354736328125, -2.15216064453125, -1.9495849609375, -1.74700927734375, -1.54443359375, -1.34185791015625, -1.1392822265625, -0.93670654296875, -0.734130859375, -0.53155517578125, -0.3289794921875, -0.12640380859375, 0.076171875, 0.27874755859375, 0.4813232421875, 0.68389892578125, 0.886474609375, 1.08905029296875, 1.2916259765625, 1.49420166015625, 1.69677734375, 1.89935302734375, 2.1019287109375, 2.30450439453125, 2.507080078125, 2.70965576171875, 2.9122314453125, 3.11480712890625, 3.3173828125, 3.51995849609375, 3.7225341796875, 3.92510986328125, 4.127685546875, 4.33026123046875, 4.5328369140625, 4.73541259765625, 4.93798828125, 5.14056396484375, 5.3431396484375, 5.54571533203125, 5.748291015625, 5.95086669921875, 6.1534423828125, 6.35601806640625, 6.55859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 11.0, 9.0, 9.0, 14.0, 10.0, 19.0, 16.0, 27.0, 23.0, 39.0, 34.0, 44.0, 57.0, 46.0, 57.0, 62.0, 52.0, 49.0, 66.0, 42.0, 63.0, 38.0, 35.0, 25.0, 25.0, 28.0, 22.0, 22.0, 7.0, 12.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.97265625, -3.84490966796875, -3.7171630859375, -3.58941650390625, -3.461669921875, -3.33392333984375, -3.2061767578125, -3.07843017578125, -2.95068359375, -2.82293701171875, -2.6951904296875, -2.56744384765625, -2.439697265625, -2.31195068359375, -2.1842041015625, -2.05645751953125, -1.9287109375, -1.80096435546875, -1.6732177734375, -1.54547119140625, -1.417724609375, -1.28997802734375, -1.1622314453125, -1.03448486328125, -0.90673828125, -0.77899169921875, -0.6512451171875, -0.52349853515625, -0.395751953125, -0.26800537109375, -0.1402587890625, -0.01251220703125, 0.115234375, 0.24298095703125, 0.3707275390625, 0.49847412109375, 0.626220703125, 0.75396728515625, 0.8817138671875, 1.00946044921875, 1.13720703125, 1.26495361328125, 1.3927001953125, 1.52044677734375, 1.648193359375, 1.77593994140625, 1.9036865234375, 2.03143310546875, 2.1591796875, 2.28692626953125, 2.4146728515625, 2.54241943359375, 2.670166015625, 2.79791259765625, 2.9256591796875, 3.05340576171875, 3.18115234375, 3.30889892578125, 3.4366455078125, 3.56439208984375, 3.692138671875, 3.81988525390625, 3.9476318359375, 4.07537841796875, 4.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 11.0, 4.0, 12.0, 15.0, 11.0, 17.0, 22.0, 18.0, 34.0, 37.0, 37.0, 41.0, 50.0, 65.0, 45.0, 61.0, 70.0, 63.0, 51.0, 55.0, 56.0, 28.0, 34.0, 29.0, 26.0, 22.0, 24.0, 12.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.71332550048828, -49.083213806152344, -47.453102111816406, -45.82299041748047, -44.19287872314453, -42.562767028808594, -40.932655334472656, -39.30253982543945, -37.672428131103516, -36.04231643676758, -34.41220474243164, -32.7820930480957, -31.151979446411133, -29.521867752075195, -27.891756057739258, -26.261642456054688, -24.631532669067383, -23.001420974731445, -21.371309280395508, -19.741195678710938, -18.111083984375, -16.480972290039062, -14.850860595703125, -13.220747947692871, -11.590636253356934, -9.960524559020996, -8.330411911010742, -6.700300216674805, -5.070188045501709, -3.4400758743286133, -1.8099641799926758, -0.17985153198242188, 1.4502601623535156, 3.0803723335266113, 4.710484504699707, 6.3405961990356445, 7.97070837020874, 9.600820541381836, 11.230932235717773, 12.861044883728027, 14.491156578063965, 16.12126922607422, 17.751380920410156, 19.381492614746094, 21.01160430908203, 22.64171600341797, 24.271827697753906, 25.901941299438477, 27.532052993774414, 29.16216468811035, 30.79227638244629, 32.42238998413086, 34.0525016784668, 35.682613372802734, 37.31272506713867, 38.94283676147461, 40.57294845581055, 42.203060150146484, 43.83317184448242, 45.46328353881836, 47.0933952331543, 48.7235107421875, 50.35362243652344, 51.983734130859375, 53.61384582519531]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 3.0, 4.0, 11.0, 2.0, 5.0, 13.0, 16.0, 21.0, 20.0, 19.0, 32.0, 23.0, 24.0, 22.0, 30.0, 46.0, 47.0, 39.0, 45.0, 37.0, 43.0, 36.0, 34.0, 39.0, 38.0, 23.0, 27.0, 37.0, 36.0, 34.0, 19.0, 31.0, 27.0, 15.0, 15.0, 16.0, 16.0, 10.0, 10.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-53.97252655029297, -52.24657440185547, -50.52062225341797, -48.79467010498047, -47.068721771240234, -45.342769622802734, -43.616817474365234, -41.890865325927734, -40.1649169921875, -38.43896484375, -36.7130126953125, -34.987060546875, -33.261112213134766, -31.535160064697266, -29.809207916259766, -28.083255767822266, -26.357303619384766, -24.631351470947266, -22.9054012298584, -21.1794490814209, -19.45349884033203, -17.72754669189453, -16.00159454345703, -14.275643348693848, -12.549692153930664, -10.82374095916748, -9.097789764404297, -7.371837615966797, -5.645886421203613, -3.9199352264404297, -2.1939830780029297, -0.4680318832397461, 1.2579154968261719, 2.9838669300079346, 4.709818363189697, 6.435770034790039, 8.161721229553223, 9.887672424316406, 11.613624572753906, 13.33957576751709, 15.065526962280273, 16.791479110717773, 18.51742935180664, 20.24338150024414, 21.96933364868164, 23.695283889770508, 25.421236038208008, 27.147186279296875, 28.873138427734375, 30.599090576171875, 32.325042724609375, 34.050994873046875, 35.77694320678711, 37.50289535522461, 39.22884750366211, 40.95479965209961, 42.680747985839844, 44.406700134277344, 46.132652282714844, 47.858604431152344, 49.58455276489258, 51.31050491333008, 53.03645706176758, 54.76240921020508, 56.48836135864258]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 9.0, 17.0, 25.0, 23.0, 55.0, 69.0, 104.0, 157.0, 207.0, 363.0, 579.0, 789.0, 1169.0, 1941.0, 3070.0, 4589.0, 7265.0, 11283.0, 17494.0, 27459.0, 41583.0, 59980.0, 82030.0, 105450.0, 120806.0, 125331.0, 115902.0, 96177.0, 73314.0, 51982.0, 35156.0, 23039.0, 14859.0, 9357.0, 5803.0, 3905.0, 2483.0, 1641.0, 1060.0, 688.0, 455.0, 298.0, 206.0, 139.0, 86.0, 50.0, 42.0, 22.0, 14.0, 13.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-25.328125, -24.5439453125, -23.759765625, -22.9755859375, -22.19140625, -21.4072265625, -20.623046875, -19.8388671875, -19.0546875, -18.2705078125, -17.486328125, -16.7021484375, -15.91796875, -15.1337890625, -14.349609375, -13.5654296875, -12.78125, -11.9970703125, -11.212890625, -10.4287109375, -9.64453125, -8.8603515625, -8.076171875, -7.2919921875, -6.5078125, -5.7236328125, -4.939453125, -4.1552734375, -3.37109375, -2.5869140625, -1.802734375, -1.0185546875, -0.234375, 0.5498046875, 1.333984375, 2.1181640625, 2.90234375, 3.6865234375, 4.470703125, 5.2548828125, 6.0390625, 6.8232421875, 7.607421875, 8.3916015625, 9.17578125, 9.9599609375, 10.744140625, 11.5283203125, 12.3125, 13.0966796875, 13.880859375, 14.6650390625, 15.44921875, 16.2333984375, 17.017578125, 17.8017578125, 18.5859375, 19.3701171875, 20.154296875, 20.9384765625, 21.72265625, 22.5068359375, 23.291015625, 24.0751953125, 24.859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 11.0, 15.0, 16.0, 26.0, 22.0, 25.0, 21.0, 30.0, 34.0, 32.0, 41.0, 45.0, 53.0, 42.0, 40.0, 50.0, 48.0, 39.0, 35.0, 29.0, 36.0, 44.0, 42.0, 25.0, 29.0, 24.0, 16.0, 24.0, 13.0, 14.0, 15.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-56.40625, -54.56591796875, -52.7255859375, -50.88525390625, -49.044921875, -47.20458984375, -45.3642578125, -43.52392578125, -41.68359375, -39.84326171875, -38.0029296875, -36.16259765625, -34.322265625, -32.48193359375, -30.6416015625, -28.80126953125, -26.9609375, -25.12060546875, -23.2802734375, -21.43994140625, -19.599609375, -17.75927734375, -15.9189453125, -14.07861328125, -12.23828125, -10.39794921875, -8.5576171875, -6.71728515625, -4.876953125, -3.03662109375, -1.1962890625, 0.64404296875, 2.484375, 4.32470703125, 6.1650390625, 8.00537109375, 9.845703125, 11.68603515625, 13.5263671875, 15.36669921875, 17.20703125, 19.04736328125, 20.8876953125, 22.72802734375, 24.568359375, 26.40869140625, 28.2490234375, 30.08935546875, 31.9296875, 33.77001953125, 35.6103515625, 37.45068359375, 39.291015625, 41.13134765625, 42.9716796875, 44.81201171875, 46.65234375, 48.49267578125, 50.3330078125, 52.17333984375, 54.013671875, 55.85400390625, 57.6943359375, 59.53466796875, 61.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 18.0, 22.0, 43.0, 68.0, 81.0, 157.0, 202.0, 315.0, 478.0, 753.0, 1189.0, 1700.0, 2714.0, 4131.0, 6692.0, 10587.0, 17266.0, 27814.0, 45550.0, 71667.0, 105218.0, 138583.0, 153942.0, 143022.0, 111162.0, 76184.0, 48605.0, 30063.0, 18661.0, 11599.0, 7167.0, 4547.0, 2881.0, 1908.0, 1238.0, 817.0, 512.0, 314.0, 228.0, 152.0, 72.0, 65.0, 50.0, 39.0, 25.0, 14.0, 4.0, 10.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.52294921875, -36.2958984375, -35.06884765625, -33.841796875, -32.61474609375, -31.3876953125, -30.16064453125, -28.93359375, -27.70654296875, -26.4794921875, -25.25244140625, -24.025390625, -22.79833984375, -21.5712890625, -20.34423828125, -19.1171875, -17.89013671875, -16.6630859375, -15.43603515625, -14.208984375, -12.98193359375, -11.7548828125, -10.52783203125, -9.30078125, -8.07373046875, -6.8466796875, -5.61962890625, -4.392578125, -3.16552734375, -1.9384765625, -0.71142578125, 0.515625, 1.74267578125, 2.9697265625, 4.19677734375, 5.423828125, 6.65087890625, 7.8779296875, 9.10498046875, 10.33203125, 11.55908203125, 12.7861328125, 14.01318359375, 15.240234375, 16.46728515625, 17.6943359375, 18.92138671875, 20.1484375, 21.37548828125, 22.6025390625, 23.82958984375, 25.056640625, 26.28369140625, 27.5107421875, 28.73779296875, 29.96484375, 31.19189453125, 32.4189453125, 33.64599609375, 34.873046875, 36.10009765625, 37.3271484375, 38.55419921875, 39.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 9.0, 5.0, 10.0, 14.0, 20.0, 30.0, 26.0, 39.0, 27.0, 34.0, 46.0, 38.0, 47.0, 50.0, 51.0, 37.0, 42.0, 42.0, 54.0, 61.0, 44.0, 35.0, 38.0, 37.0, 17.0, 22.0, 22.0, 21.0, 13.0, 11.0, 11.0, 10.0, 7.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.125, -34.6796875, -33.234375, -31.7890625, -30.34375, -28.8984375, -27.453125, -26.0078125, -24.5625, -23.1171875, -21.671875, -20.2265625, -18.78125, -17.3359375, -15.890625, -14.4453125, -13.0, -11.5546875, -10.109375, -8.6640625, -7.21875, -5.7734375, -4.328125, -2.8828125, -1.4375, 0.0078125, 1.453125, 2.8984375, 4.34375, 5.7890625, 7.234375, 8.6796875, 10.125, 11.5703125, 13.015625, 14.4609375, 15.90625, 17.3515625, 18.796875, 20.2421875, 21.6875, 23.1328125, 24.578125, 26.0234375, 27.46875, 28.9140625, 30.359375, 31.8046875, 33.25, 34.6953125, 36.140625, 37.5859375, 39.03125, 40.4765625, 41.921875, 43.3671875, 44.8125, 46.2578125, 47.703125, 49.1484375, 50.59375, 52.0390625, 53.484375, 54.9296875, 56.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 10.0, 9.0, 10.0, 6.0, 13.0, 27.0, 41.0, 71.0, 85.0, 161.0, 219.0, 294.0, 487.0, 809.0, 1238.0, 2098.0, 3443.0, 5772.0, 10127.0, 17813.0, 31120.0, 55235.0, 92221.0, 137407.0, 173065.0, 170995.0, 134411.0, 88052.0, 52596.0, 29971.0, 16854.0, 9777.0, 5605.0, 3285.0, 1904.0, 1172.0, 762.0, 488.0, 321.0, 188.0, 125.0, 87.0, 68.0, 35.0, 33.0, 19.0, 9.0, 13.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.431396484375, -20.80029296875, -20.169189453125, -19.5380859375, -18.906982421875, -18.27587890625, -17.644775390625, -17.013671875, -16.382568359375, -15.75146484375, -15.120361328125, -14.4892578125, -13.858154296875, -13.22705078125, -12.595947265625, -11.96484375, -11.333740234375, -10.70263671875, -10.071533203125, -9.4404296875, -8.809326171875, -8.17822265625, -7.547119140625, -6.916015625, -6.284912109375, -5.65380859375, -5.022705078125, -4.3916015625, -3.760498046875, -3.12939453125, -2.498291015625, -1.8671875, -1.236083984375, -0.60498046875, 0.026123046875, 0.6572265625, 1.288330078125, 1.91943359375, 2.550537109375, 3.181640625, 3.812744140625, 4.44384765625, 5.074951171875, 5.7060546875, 6.337158203125, 6.96826171875, 7.599365234375, 8.23046875, 8.861572265625, 9.49267578125, 10.123779296875, 10.7548828125, 11.385986328125, 12.01708984375, 12.648193359375, 13.279296875, 13.910400390625, 14.54150390625, 15.172607421875, 15.8037109375, 16.434814453125, 17.06591796875, 17.697021484375, 18.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 8.0, 12.0, 21.0, 15.0, 24.0, 29.0, 31.0, 33.0, 50.0, 53.0, 54.0, 58.0, 59.0, 62.0, 56.0, 73.0, 65.0, 45.0, 39.0, 47.0, 27.0, 23.0, 20.0, 20.0, 13.0, 9.0, 8.0, 7.0, 10.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022411346435546875, -0.0021737217903137207, -0.002106308937072754, -0.002038896083831787, -0.0019714832305908203, -0.0019040703773498535, -0.0018366575241088867, -0.00176924467086792, -0.0017018318176269531, -0.0016344189643859863, -0.0015670061111450195, -0.0014995932579040527, -0.001432180404663086, -0.0013647675514221191, -0.0012973546981811523, -0.0012299418449401855, -0.0011625289916992188, -0.001095116138458252, -0.0010277032852172852, -0.0009602904319763184, -0.0008928775787353516, -0.0008254647254943848, -0.000758051872253418, -0.0006906390190124512, -0.0006232261657714844, -0.0005558133125305176, -0.0004884004592895508, -0.000420987606048584, -0.0003535747528076172, -0.0002861618995666504, -0.0002187490463256836, -0.0001513361930847168, -8.392333984375e-05, -1.6510486602783203e-05, 5.0902366638183594e-05, 0.00011831521987915039, 0.0001857280731201172, 0.000253140926361084, 0.0003205537796020508, 0.0003879666328430176, 0.0004553794860839844, 0.0005227923393249512, 0.000590205192565918, 0.0006576180458068848, 0.0007250308990478516, 0.0007924437522888184, 0.0008598566055297852, 0.000927269458770752, 0.0009946823120117188, 0.0010620951652526855, 0.0011295080184936523, 0.0011969208717346191, 0.001264333724975586, 0.0013317465782165527, 0.0013991594314575195, 0.0014665722846984863, 0.0015339851379394531, 0.00160139799118042, 0.0016688108444213867, 0.0017362236976623535, 0.0018036365509033203, 0.0018710494041442871, 0.001938462257385254, 0.0020058751106262207, 0.0020732879638671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 17.0, 20.0, 37.0, 54.0, 76.0, 108.0, 174.0, 234.0, 392.0, 564.0, 844.0, 1254.0, 2235.0, 3543.0, 5808.0, 9516.0, 16474.0, 28041.0, 47888.0, 77234.0, 117933.0, 153671.0, 165824.0, 144616.0, 105422.0, 66957.0, 40417.0, 23882.0, 13807.0, 8329.0, 4949.0, 2985.0, 1838.0, 1127.0, 767.0, 502.0, 321.0, 214.0, 143.0, 91.0, 75.0, 52.0, 42.0, 22.0, 20.0, 9.0, 9.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.21875, -17.618408203125, -17.01806640625, -16.417724609375, -15.8173828125, -15.217041015625, -14.61669921875, -14.016357421875, -13.416015625, -12.815673828125, -12.21533203125, -11.614990234375, -11.0146484375, -10.414306640625, -9.81396484375, -9.213623046875, -8.61328125, -8.012939453125, -7.41259765625, -6.812255859375, -6.2119140625, -5.611572265625, -5.01123046875, -4.410888671875, -3.810546875, -3.210205078125, -2.60986328125, -2.009521484375, -1.4091796875, -0.808837890625, -0.20849609375, 0.391845703125, 0.9921875, 1.592529296875, 2.19287109375, 2.793212890625, 3.3935546875, 3.993896484375, 4.59423828125, 5.194580078125, 5.794921875, 6.395263671875, 6.99560546875, 7.595947265625, 8.1962890625, 8.796630859375, 9.39697265625, 9.997314453125, 10.59765625, 11.197998046875, 11.79833984375, 12.398681640625, 12.9990234375, 13.599365234375, 14.19970703125, 14.800048828125, 15.400390625, 16.000732421875, 16.60107421875, 17.201416015625, 17.8017578125, 18.402099609375, 19.00244140625, 19.602783203125, 20.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 15.0, 21.0, 24.0, 21.0, 38.0, 44.0, 35.0, 45.0, 46.0, 49.0, 51.0, 66.0, 74.0, 68.0, 59.0, 43.0, 42.0, 33.0, 32.0, 33.0, 27.0, 15.0, 13.0, 10.0, 8.0, 8.0, 6.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.3890380859375, -7.156982421875, -6.9249267578125, -6.69287109375, -6.4608154296875, -6.228759765625, -5.9967041015625, -5.7646484375, -5.5325927734375, -5.300537109375, -5.0684814453125, -4.83642578125, -4.6043701171875, -4.372314453125, -4.1402587890625, -3.908203125, -3.6761474609375, -3.444091796875, -3.2120361328125, -2.97998046875, -2.7479248046875, -2.515869140625, -2.2838134765625, -2.0517578125, -1.8197021484375, -1.587646484375, -1.3555908203125, -1.12353515625, -0.8914794921875, -0.659423828125, -0.4273681640625, -0.1953125, 0.0367431640625, 0.268798828125, 0.5008544921875, 0.73291015625, 0.9649658203125, 1.197021484375, 1.4290771484375, 1.6611328125, 1.8931884765625, 2.125244140625, 2.3572998046875, 2.58935546875, 2.8214111328125, 3.053466796875, 3.2855224609375, 3.517578125, 3.7496337890625, 3.981689453125, 4.2137451171875, 4.44580078125, 4.6778564453125, 4.909912109375, 5.1419677734375, 5.3740234375, 5.6060791015625, 5.838134765625, 6.0701904296875, 6.30224609375, 6.5343017578125, 6.766357421875, 6.9984130859375, 7.23046875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 8.0, 9.0, 7.0, 15.0, 20.0, 17.0, 17.0, 33.0, 26.0, 32.0, 39.0, 35.0, 46.0, 57.0, 45.0, 57.0, 63.0, 40.0, 51.0, 34.0, 36.0, 45.0, 47.0, 28.0, 31.0, 23.0, 20.0, 21.0, 11.0, 11.0, 7.0, 10.0, 8.0, 8.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.3460807800293, -46.90038299560547, -45.454689025878906, -44.00899124145508, -42.56329345703125, -41.11759948730469, -39.67190170288086, -38.22620391845703, -36.78050994873047, -35.33481216430664, -33.88911819458008, -32.44342041015625, -30.997724533081055, -29.55202865600586, -28.10633087158203, -26.660634994506836, -25.21493911743164, -23.769243240356445, -22.32354736328125, -20.877849578857422, -19.432153701782227, -17.98645782470703, -16.540760040283203, -15.095064163208008, -13.649368286132812, -12.203672409057617, -10.757975578308105, -9.312278747558594, -7.866582870483398, -6.420886516571045, -4.975190162658691, -3.5294933319091797, -2.0837974548339844, -0.6381011009216309, 0.8075952529907227, 2.253291606903076, 3.6989879608154297, 5.144684314727783, 6.590380668640137, 8.036077499389648, 9.481773376464844, 10.927469253540039, 12.37316608428955, 13.818862915039062, 15.264558792114258, 16.710254669189453, 18.15595245361328, 19.601648330688477, 21.047344207763672, 22.493040084838867, 23.938735961914062, 25.38443374633789, 26.830129623413086, 28.27582550048828, 29.72152328491211, 31.167219161987305, 32.6129150390625, 34.05861282348633, 35.50430679321289, 36.95000457763672, 38.39569854736328, 39.84139633178711, 41.28709411621094, 42.7327880859375, 44.17848587036133]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 4.0, 3.0, 3.0, 12.0, 16.0, 19.0, 5.0, 21.0, 17.0, 21.0, 22.0, 19.0, 28.0, 30.0, 24.0, 33.0, 29.0, 28.0, 33.0, 43.0, 42.0, 45.0, 30.0, 44.0, 32.0, 35.0, 54.0, 28.0, 40.0, 31.0, 25.0, 22.0, 31.0, 13.0, 25.0, 10.0, 22.0, 11.0, 7.0, 10.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-75.282470703125, -72.97908020019531, -70.6756820678711, -68.3722915649414, -66.06889343261719, -63.7655029296875, -61.46210861206055, -59.158714294433594, -56.855323791503906, -54.55192947387695, -52.24853515625, -49.94514465332031, -47.64175033569336, -45.338356018066406, -43.03496170043945, -40.7315673828125, -38.42817306518555, -36.124778747558594, -33.82138442993164, -31.51799201965332, -29.214599609375, -26.911205291748047, -24.607810974121094, -22.304418563842773, -20.00102424621582, -17.697629928588867, -15.394237518310547, -13.090843200683594, -10.787449836730957, -8.48405647277832, -6.180662155151367, -3.877269744873047, -1.5738754272460938, 0.7295181751251221, 3.032911777496338, 5.336305618286133, 7.6396989822387695, 9.943092346191406, 12.24648666381836, 14.54987907409668, 16.853273391723633, 19.156667709350586, 21.460060119628906, 23.76345443725586, 26.066848754882812, 28.370241165161133, 30.673635482788086, 32.977027893066406, 35.28042221069336, 37.58381652832031, 39.887210845947266, 42.19060516357422, 44.493995666503906, 46.79738998413086, 49.10078430175781, 51.4041748046875, 53.70757293701172, 56.01096725463867, 58.314361572265625, 60.61775207519531, 62.921146392822266, 65.22454071044922, 67.52793884277344, 69.83132934570312, 72.13471984863281]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 10.0, 13.0, 16.0, 20.0, 23.0, 46.0, 41.0, 65.0, 68.0, 113.0, 145.0, 222.0, 285.0, 440.0, 666.0, 1031.0, 1796.0, 2905.0, 4238.0, 6475.0, 1017905.0, 4935.0, 3345.0, 2044.0, 1293.0, 805.0, 467.0, 322.0, 230.0, 171.0, 128.0, 79.0, 68.0, 56.0, 37.0, 25.0, 23.0, 9.0, 9.0, 10.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.8341064453125, -641.8236083984375, -619.8131713867188, -597.8026733398438, -575.792236328125, -553.78173828125, -531.771240234375, -509.76080322265625, -487.75030517578125, -465.7398376464844, -443.7293701171875, -421.7188720703125, -399.7084045410156, -377.69793701171875, -355.6874694824219, -333.677001953125, -311.6665344238281, -289.65606689453125, -267.6455993652344, -245.63511657714844, -223.6246337890625, -201.61416625976562, -179.60369873046875, -157.5932159423828, -135.58274841308594, -113.57227325439453, -91.56179809570312, -69.55133056640625, -47.540855407714844, -25.530380249023438, -3.5199127197265625, 18.490570068359375, 40.50103759765625, 62.511512756347656, 84.52198791503906, 106.53245544433594, 128.54293823242188, 150.55340576171875, 172.56387329101562, 194.57435607910156, 216.58482360839844, 238.5952911376953, 260.60577392578125, 282.6162414550781, 304.626708984375, 326.63720703125, 348.64764404296875, 370.65814208984375, 392.6686096191406, 414.6790771484375, 436.6895446777344, 458.70001220703125, 480.71051025390625, 502.7209777832031, 524.7314453125, 546.741943359375, 568.7523803710938, 590.7628784179688, 612.7733154296875, 634.7838134765625, 656.7942504882812, 678.8047485351562, 700.815185546875, 722.82568359375, 744.836181640625]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 8.0, 12.0, 24.0, 25.0, 31.0, 49.0, 42.0, 65.0, 100.0, 147.0, 208.0, 288.0, 403.0, 555.0, 813.0, 1402.0, 2355.0, 4689.0, 9104.0, 16414.0, 32120.0, 51279416.0, 70747.0, 23923.0, 12841.0, 6687.0, 3520.0, 1867.0, 1132.0, 680.0, 418.0, 361.0, 200.0, 186.0, 131.0, 95.0, 70.0, 43.0, 48.0, 31.0, 19.0, 12.0, 11.0, 6.0, 9.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-520.4613037109375, -504.0864562988281, -487.71160888671875, -471.3367614746094, -454.9619140625, -438.5870361328125, -422.2121887207031, -405.83734130859375, -389.4624938964844, -373.087646484375, -356.7127990722656, -340.33795166015625, -323.96307373046875, -307.5882568359375, -291.21337890625, -274.8385314941406, -258.46368408203125, -242.08883666992188, -225.7139892578125, -209.33912658691406, -192.9642791748047, -176.5894317626953, -160.21456909179688, -143.8397216796875, -127.46487426757812, -111.09002685546875, -94.71517181396484, -78.34031677246094, -61.96546936035156, -45.59062194824219, -29.21576690673828, -12.840911865234375, 3.533935546875, 19.90878677368164, 36.28363800048828, 52.65848922729492, 69.03334045410156, 85.40818786621094, 101.78304290771484, 118.15789794921875, 134.53274536132812, 150.9075927734375, 167.28244018554688, 183.6573028564453, 200.0321502685547, 216.40699768066406, 232.7818603515625, 249.15670776367188, 265.53155517578125, 281.9064025878906, 298.28125, 314.6560974121094, 331.03094482421875, 347.40582275390625, 363.7806701660156, 380.155517578125, 396.5303649902344, 412.90521240234375, 429.2800598144531, 445.6549072265625, 462.02978515625, 478.40460205078125, 494.77947998046875, 511.1543273925781, 527.5291748046875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 11.0, 18.0, 23.0, 23.0, 44.0, 73.0, 90.0, 205.0, 276.0, 481.0, 729.0, 1192.0, 2091.0, 3673.0, 6792.0, 12649.0, 24810.0, 50468.0, 105060.0, 229071.0, 525489.0, 1329326.0, 2191610.0, 1029271.0, 418198.0, 186790.0, 86637.0, 41471.0, 20717.0, 10733.0, 5672.0, 3225.0, 1790.0, 1067.0, 614.0, 378.0, 219.0, 151.0, 105.0, 66.0, 46.0, 34.0, 21.0, 13.0, 5.0, 1.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.9375, -58.1416015625, -56.345703125, -54.5498046875, -52.75390625, -50.9580078125, -49.162109375, -47.3662109375, -45.5703125, -43.7744140625, -41.978515625, -40.1826171875, -38.38671875, -36.5908203125, -34.794921875, -32.9990234375, -31.203125, -29.4072265625, -27.611328125, -25.8154296875, -24.01953125, -22.2236328125, -20.427734375, -18.6318359375, -16.8359375, -15.0400390625, -13.244140625, -11.4482421875, -9.65234375, -7.8564453125, -6.060546875, -4.2646484375, -2.46875, -0.6728515625, 1.123046875, 2.9189453125, 4.71484375, 6.5107421875, 8.306640625, 10.1025390625, 11.8984375, 13.6943359375, 15.490234375, 17.2861328125, 19.08203125, 20.8779296875, 22.673828125, 24.4697265625, 26.265625, 28.0615234375, 29.857421875, 31.6533203125, 33.44921875, 35.2451171875, 37.041015625, 38.8369140625, 40.6328125, 42.4287109375, 44.224609375, 46.0205078125, 47.81640625, 49.6123046875, 51.408203125, 53.2041015625, 55.0]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 6.0, 6.0, 8.0, 9.0, 10.0, 21.0, 25.0, 19.0, 25.0, 21.0, 34.0, 46.0, 48.0, 67.0, 77.0, 102.0, 142.0, 194.0, 217.0, 226.0, 150.0, 124.0, 87.0, 67.0, 62.0, 39.0, 33.0, 33.0, 17.0, 20.0, 11.0, 20.0, 12.0, 12.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0439453125, -37.712890625, -36.3818359375, -35.05078125, -33.7197265625, -32.388671875, -31.0576171875, -29.7265625, -28.3955078125, -27.064453125, -25.7333984375, -24.40234375, -23.0712890625, -21.740234375, -20.4091796875, -19.078125, -17.7470703125, -16.416015625, -15.0849609375, -13.75390625, -12.4228515625, -11.091796875, -9.7607421875, -8.4296875, -7.0986328125, -5.767578125, -4.4365234375, -3.10546875, -1.7744140625, -0.443359375, 0.8876953125, 2.21875, 3.5498046875, 4.880859375, 6.2119140625, 7.54296875, 8.8740234375, 10.205078125, 11.5361328125, 12.8671875, 14.1982421875, 15.529296875, 16.8603515625, 18.19140625, 19.5224609375, 20.853515625, 22.1845703125, 23.515625, 24.8466796875, 26.177734375, 27.5087890625, 28.83984375, 30.1708984375, 31.501953125, 32.8330078125, 34.1640625, 35.4951171875, 36.826171875, 38.1572265625, 39.48828125, 40.8193359375, 42.150390625, 43.4814453125, 44.8125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 12.0, 19.0, 40.0, 36.0, 62.0, 66.0, 87.0, 147.0, 244.0, 371.0, 564.0, 1048.0, 1634.0, 2856.0, 4437.0, 7804.0, 13213.0, 22393.0, 36600.0, 60408.0, 96115.0, 152450.0, 237408.0, 383416.0, 815431.0, 1952018.0, 1241952.0, 494450.0, 283598.0, 182168.0, 116852.0, 71807.0, 44470.0, 26613.0, 16433.0, 9698.0, 5741.0, 3478.0, 2041.0, 1218.0, 753.0, 442.0, 284.0, 195.0, 115.0, 82.0, 45.0, 35.0, 21.0, 19.0, 12.0, 7.0, 11.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-24.84375, -24.06005859375, -23.2763671875, -22.49267578125, -21.708984375, -20.92529296875, -20.1416015625, -19.35791015625, -18.57421875, -17.79052734375, -17.0068359375, -16.22314453125, -15.439453125, -14.65576171875, -13.8720703125, -13.08837890625, -12.3046875, -11.52099609375, -10.7373046875, -9.95361328125, -9.169921875, -8.38623046875, -7.6025390625, -6.81884765625, -6.03515625, -5.25146484375, -4.4677734375, -3.68408203125, -2.900390625, -2.11669921875, -1.3330078125, -0.54931640625, 0.234375, 1.01806640625, 1.8017578125, 2.58544921875, 3.369140625, 4.15283203125, 4.9365234375, 5.72021484375, 6.50390625, 7.28759765625, 8.0712890625, 8.85498046875, 9.638671875, 10.42236328125, 11.2060546875, 11.98974609375, 12.7734375, 13.55712890625, 14.3408203125, 15.12451171875, 15.908203125, 16.69189453125, 17.4755859375, 18.25927734375, 19.04296875, 19.82666015625, 20.6103515625, 21.39404296875, 22.177734375, 22.96142578125, 23.7451171875, 24.52880859375, 25.3125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 8.0, 6.0, 4.0, 5.0, 10.0, 15.0, 13.0, 14.0, 22.0, 24.0, 22.0, 39.0, 40.0, 55.0, 51.0, 69.0, 125.0, 253.0, 375.0, 267.0, 169.0, 111.0, 68.0, 49.0, 49.0, 30.0, 30.0, 26.0, 16.0, 16.0, 16.0, 11.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -46.7568359375, -44.576171875, -42.3955078125, -40.21484375, -38.0341796875, -35.853515625, -33.6728515625, -31.4921875, -29.3115234375, -27.130859375, -24.9501953125, -22.76953125, -20.5888671875, -18.408203125, -16.2275390625, -14.046875, -11.8662109375, -9.685546875, -7.5048828125, -5.32421875, -3.1435546875, -0.962890625, 1.2177734375, 3.3984375, 5.5791015625, 7.759765625, 9.9404296875, 12.12109375, 14.3017578125, 16.482421875, 18.6630859375, 20.84375, 23.0244140625, 25.205078125, 27.3857421875, 29.56640625, 31.7470703125, 33.927734375, 36.1083984375, 38.2890625, 40.4697265625, 42.650390625, 44.8310546875, 47.01171875, 49.1923828125, 51.373046875, 53.5537109375, 55.734375, 57.9150390625, 60.095703125, 62.2763671875, 64.45703125, 66.6376953125, 68.818359375, 70.9990234375, 73.1796875, 75.3603515625, 77.541015625, 79.7216796875, 81.90234375, 84.0830078125, 86.263671875, 88.4443359375, 90.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 0.0, 4.0, 6.0, 7.0, 13.0, 25.0, 21.0, 30.0, 36.0, 53.0, 69.0, 133.0, 172.0, 241.0, 335.0, 540.0, 824.0, 1173.0, 1979.0, 3606.0, 6422.0, 11941.0, 23327.0, 47449.0, 104083.0, 3984642.0, 1903583.0, 102592.0, 46949.0, 23351.0, 11828.0, 6459.0, 3595.0, 2064.0, 1297.0, 811.0, 529.0, 324.0, 266.0, 168.0, 134.0, 96.0, 74.0, 41.0, 30.0, 34.0, 25.0, 21.0, 11.0, 11.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.625, -82.671875, -79.71875, -76.765625, -73.8125, -70.859375, -67.90625, -64.953125, -62.0, -59.046875, -56.09375, -53.140625, -50.1875, -47.234375, -44.28125, -41.328125, -38.375, -35.421875, -32.46875, -29.515625, -26.5625, -23.609375, -20.65625, -17.703125, -14.75, -11.796875, -8.84375, -5.890625, -2.9375, 0.015625, 2.96875, 5.921875, 8.875, 11.828125, 14.78125, 17.734375, 20.6875, 23.640625, 26.59375, 29.546875, 32.5, 35.453125, 38.40625, 41.359375, 44.3125, 47.265625, 50.21875, 53.171875, 56.125, 59.078125, 62.03125, 64.984375, 67.9375, 70.890625, 73.84375, 76.796875, 79.75, 82.703125, 85.65625, 88.609375, 91.5625, 94.515625, 97.46875, 100.421875, 103.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 11.0, 16.0, 21.0, 21.0, 22.0, 23.0, 33.0, 36.0, 47.0, 45.0, 43.0, 55.0, 115.0, 388.0, 442.0, 210.0, 94.0, 70.0, 47.0, 41.0, 33.0, 30.0, 35.0, 22.0, 18.0, 16.0, 15.0, 11.0, 12.0, 5.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.875, -110.5380859375, -107.201171875, -103.8642578125, -100.52734375, -97.1904296875, -93.853515625, -90.5166015625, -87.1796875, -83.8427734375, -80.505859375, -77.1689453125, -73.83203125, -70.4951171875, -67.158203125, -63.8212890625, -60.484375, -57.1474609375, -53.810546875, -50.4736328125, -47.13671875, -43.7998046875, -40.462890625, -37.1259765625, -33.7890625, -30.4521484375, -27.115234375, -23.7783203125, -20.44140625, -17.1044921875, -13.767578125, -10.4306640625, -7.09375, -3.7568359375, -0.419921875, 2.9169921875, 6.25390625, 9.5908203125, 12.927734375, 16.2646484375, 19.6015625, 22.9384765625, 26.275390625, 29.6123046875, 32.94921875, 36.2861328125, 39.623046875, 42.9599609375, 46.296875, 49.6337890625, 52.970703125, 56.3076171875, 59.64453125, 62.9814453125, 66.318359375, 69.6552734375, 72.9921875, 76.3291015625, 79.666015625, 83.0029296875, 86.33984375, 89.6767578125, 93.013671875, 96.3505859375, 99.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 7.0, 3.0, 18.0, 25.0, 38.0, 63.0, 99.0, 171.0, 243.0, 101.0, 76.0, 48.0, 39.0, 14.0, 11.0, 12.0, 7.0, 4.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2903.458740234375, -2837.835693359375, -2772.212890625, -2706.58984375, -2640.967041015625, -2575.343994140625, -2509.72119140625, -2444.09814453125, -2378.47509765625, -2312.85205078125, -2247.229248046875, -2181.606201171875, -2115.9833984375, -2050.3603515625, -1984.7374267578125, -1919.114501953125, -1853.4915771484375, -1787.86865234375, -1722.2457275390625, -1656.622802734375, -1590.999755859375, -1525.3768310546875, -1459.75390625, -1394.1309814453125, -1328.508056640625, -1262.8851318359375, -1197.26220703125, -1131.63916015625, -1066.0162353515625, -1000.393310546875, -934.7703857421875, -869.1474609375, -803.5244140625, -737.9014892578125, -672.2785034179688, -606.6555786132812, -541.0325927734375, -475.40966796875, -409.7867431640625, -344.1637878417969, -278.54083251953125, -212.91787719726562, -147.29493713378906, -81.6719970703125, -16.049041748046875, 49.57391357421875, 115.19683837890625, 180.81979370117188, 246.4427490234375, 312.0657043457031, 377.68865966796875, 443.31158447265625, 508.9345397949219, 574.5574951171875, 640.180419921875, 705.8033447265625, 771.4263305664062, 837.0492553710938, 902.6722412109375, 968.295166015625, 1033.9180908203125, 1099.541015625, 1165.1640625, 1230.7869873046875, 1296.409912109375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 7.0, 16.0, 10.0, 22.0, 12.0, 16.0, 10.0, 20.0, 12.0, 28.0, 28.0, 33.0, 40.0, 52.0, 81.0, 101.0, 92.0, 69.0, 51.0, 50.0, 30.0, 27.0, 18.0, 24.0, 23.0, 13.0, 18.0, 15.0, 15.0, 5.0, 8.0, 9.0, 2.0, 7.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1565.72216796875, -1518.025146484375, -1470.328125, -1422.631103515625, -1374.93408203125, -1327.237060546875, -1279.5400390625, -1231.8428955078125, -1184.1458740234375, -1136.4488525390625, -1088.7518310546875, -1041.0548095703125, -993.3577270507812, -945.6607055664062, -897.9636840820312, -850.2666015625, -802.5696411132812, -754.8726196289062, -707.1755981445312, -659.478515625, -611.781494140625, -564.08447265625, -516.387451171875, -468.6903991699219, -420.9933776855469, -373.2963562011719, -325.59930419921875, -277.90228271484375, -230.2052459716797, -182.50820922851562, -134.81118774414062, -87.1141357421875, -39.4171142578125, 8.279918670654297, 55.976951599121094, 103.67398071289062, 151.3710174560547, 199.06805419921875, 246.76507568359375, 294.4621276855469, 342.1591491699219, 389.8561706542969, 437.55322265625, 485.250244140625, 532.947265625, 580.644287109375, 628.34130859375, 676.0383911132812, 723.7354125976562, 771.4324340820312, 819.1294555664062, 866.8265380859375, 914.5235595703125, 962.2205810546875, 1009.9176025390625, 1057.6146240234375, 1105.3116455078125, 1153.0086669921875, 1200.7056884765625, 1248.4027099609375, 1296.0997314453125, 1343.796875, 1391.493896484375, 1439.19091796875, 1486.887939453125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 10.0, 14.0, 17.0, 22.0, 27.0, 38.0, 51.0, 88.0, 103.0, 175.0, 220.0, 290.0, 464.0, 657.0, 961.0, 1489.0, 2420.0, 3903.0, 6620.0, 11605.0, 22780.0, 51125.0, 175954.0, 3290695.0, 481977.0, 80014.0, 30502.0, 14254.0, 7553.0, 4074.0, 2331.0, 1413.0, 830.0, 546.0, 351.0, 264.0, 133.0, 98.0, 77.0, 41.0, 32.0, 23.0, 14.0, 9.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.40625, -13.0198974609375, -12.633544921875, -12.2471923828125, -11.86083984375, -11.4744873046875, -11.088134765625, -10.7017822265625, -10.3154296875, -9.9290771484375, -9.542724609375, -9.1563720703125, -8.77001953125, -8.3836669921875, -7.997314453125, -7.6109619140625, -7.224609375, -6.8382568359375, -6.451904296875, -6.0655517578125, -5.67919921875, -5.2928466796875, -4.906494140625, -4.5201416015625, -4.1337890625, -3.7474365234375, -3.361083984375, -2.9747314453125, -2.58837890625, -2.2020263671875, -1.815673828125, -1.4293212890625, -1.04296875, -0.6566162109375, -0.270263671875, 0.1160888671875, 0.50244140625, 0.8887939453125, 1.275146484375, 1.6614990234375, 2.0478515625, 2.4342041015625, 2.820556640625, 3.2069091796875, 3.59326171875, 3.9796142578125, 4.365966796875, 4.7523193359375, 5.138671875, 5.5250244140625, 5.911376953125, 6.2977294921875, 6.68408203125, 7.0704345703125, 7.456787109375, 7.8431396484375, 8.2294921875, 8.6158447265625, 9.002197265625, 9.3885498046875, 9.77490234375, 10.1612548828125, 10.547607421875, 10.9339599609375, 11.3203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 4.0, 11.0, 6.0, 8.0, 10.0, 11.0, 26.0, 59.0, 137.0, 264.0, 200.0, 98.0, 42.0, 20.0, 17.0, 18.0, 11.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.488616943359375, -2.41473388671875, -2.340850830078125, -2.2669677734375, -2.193084716796875, -2.11920166015625, -2.045318603515625, -1.971435546875, -1.897552490234375, -1.82366943359375, -1.749786376953125, -1.6759033203125, -1.602020263671875, -1.52813720703125, -1.454254150390625, -1.38037109375, -1.306488037109375, -1.23260498046875, -1.158721923828125, -1.0848388671875, -1.010955810546875, -0.93707275390625, -0.863189697265625, -0.789306640625, -0.715423583984375, -0.64154052734375, -0.567657470703125, -0.4937744140625, -0.419891357421875, -0.34600830078125, -0.272125244140625, -0.1982421875, -0.124359130859375, -0.05047607421875, 0.023406982421875, 0.0972900390625, 0.171173095703125, 0.24505615234375, 0.318939208984375, 0.392822265625, 0.466705322265625, 0.54058837890625, 0.614471435546875, 0.6883544921875, 0.762237548828125, 0.83612060546875, 0.910003662109375, 0.98388671875, 1.057769775390625, 1.13165283203125, 1.205535888671875, 1.2794189453125, 1.353302001953125, 1.42718505859375, 1.501068115234375, 1.574951171875, 1.648834228515625, 1.72271728515625, 1.796600341796875, 1.8704833984375, 1.944366455078125, 2.01824951171875, 2.092132568359375, 2.166015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 12.0, 14.0, 29.0, 32.0, 41.0, 81.0, 88.0, 188.0, 312.0, 525.0, 940.0, 1708.0, 3596.0, 8327.0, 21471.0, 65492.0, 245330.0, 1159490.0, 2072843.0, 447925.0, 109711.0, 33391.0, 12359.0, 5161.0, 2366.0, 1143.0, 651.0, 353.0, 208.0, 146.0, 93.0, 73.0, 45.0, 35.0, 20.0, 19.0, 10.0, 4.0, 16.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.135009765625, -8.83251953125, -8.530029296875, -8.2275390625, -7.925048828125, -7.62255859375, -7.320068359375, -7.017578125, -6.715087890625, -6.41259765625, -6.110107421875, -5.8076171875, -5.505126953125, -5.20263671875, -4.900146484375, -4.59765625, -4.295166015625, -3.99267578125, -3.690185546875, -3.3876953125, -3.085205078125, -2.78271484375, -2.480224609375, -2.177734375, -1.875244140625, -1.57275390625, -1.270263671875, -0.9677734375, -0.665283203125, -0.36279296875, -0.060302734375, 0.2421875, 0.544677734375, 0.84716796875, 1.149658203125, 1.4521484375, 1.754638671875, 2.05712890625, 2.359619140625, 2.662109375, 2.964599609375, 3.26708984375, 3.569580078125, 3.8720703125, 4.174560546875, 4.47705078125, 4.779541015625, 5.08203125, 5.384521484375, 5.68701171875, 5.989501953125, 6.2919921875, 6.594482421875, 6.89697265625, 7.199462890625, 7.501953125, 7.804443359375, 8.10693359375, 8.409423828125, 8.7119140625, 9.014404296875, 9.31689453125, 9.619384765625, 9.921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 7.0, 8.0, 9.0, 15.0, 20.0, 21.0, 43.0, 53.0, 58.0, 98.0, 125.0, 167.0, 219.0, 294.0, 408.0, 583.0, 487.0, 376.0, 273.0, 207.0, 146.0, 113.0, 96.0, 68.0, 42.0, 37.0, 19.0, 16.0, 14.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68359375, -3.56744384765625, -3.4512939453125, -3.33514404296875, -3.218994140625, -3.10284423828125, -2.9866943359375, -2.87054443359375, -2.75439453125, -2.63824462890625, -2.5220947265625, -2.40594482421875, -2.289794921875, -2.17364501953125, -2.0574951171875, -1.94134521484375, -1.8251953125, -1.70904541015625, -1.5928955078125, -1.47674560546875, -1.360595703125, -1.24444580078125, -1.1282958984375, -1.01214599609375, -0.89599609375, -0.77984619140625, -0.6636962890625, -0.54754638671875, -0.431396484375, -0.31524658203125, -0.1990966796875, -0.08294677734375, 0.033203125, 0.14935302734375, 0.2655029296875, 0.38165283203125, 0.497802734375, 0.61395263671875, 0.7301025390625, 0.84625244140625, 0.96240234375, 1.07855224609375, 1.1947021484375, 1.31085205078125, 1.427001953125, 1.54315185546875, 1.6593017578125, 1.77545166015625, 1.8916015625, 2.00775146484375, 2.1239013671875, 2.24005126953125, 2.356201171875, 2.47235107421875, 2.5885009765625, 2.70465087890625, 2.82080078125, 2.93695068359375, 3.0531005859375, 3.16925048828125, 3.285400390625, 3.40155029296875, 3.5177001953125, 3.63385009765625, 3.75]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 9.0, 14.0, 44.0, 79.0, 140.0, 217.0, 245.0, 123.0, 66.0, 35.0, 16.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.758819580078125, -45.90781021118164, -44.056800842285156, -42.205787658691406, -40.35477828979492, -38.50376892089844, -36.65275955200195, -34.80175018310547, -32.95073699951172, -31.099727630615234, -29.248716354370117, -27.397706985473633, -25.546695709228516, -23.69568634033203, -21.844676971435547, -19.993667602539062, -18.142658233642578, -16.291648864746094, -14.440637588500977, -12.589628219604492, -10.738617897033691, -8.88760757446289, -7.036598205566406, -5.1855878829956055, -3.3345775604248047, -1.483567476272583, 0.36744260787963867, 2.2184524536132812, 4.069462776184082, 5.920473098754883, 7.771482467651367, 9.622492790222168, 11.473503112792969, 13.32451343536377, 15.17552375793457, 17.026533126831055, 18.877544403076172, 20.728553771972656, 22.57956314086914, 24.430572509765625, 26.281583786010742, 28.132593154907227, 29.983604431152344, 31.834613800048828, 33.68562316894531, 35.53663635253906, 37.38764190673828, 39.23865509033203, 41.089664459228516, 42.940673828125, 44.791683197021484, 46.64269256591797, 48.49370574951172, 50.3447151184082, 52.19572448730469, 54.04673385620117, 55.897743225097656, 57.74875259399414, 59.599761962890625, 61.450775146484375, 63.30178451538086, 65.15279388427734, 67.00379943847656, 68.85481262207031, 70.70582580566406]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 5.0, 7.0, 20.0, 15.0, 10.0, 18.0, 36.0, 30.0, 33.0, 42.0, 50.0, 54.0, 73.0, 55.0, 64.0, 62.0, 58.0, 62.0, 47.0, 43.0, 37.0, 33.0, 29.0, 24.0, 17.0, 14.0, 13.0, 14.0, 13.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.553367614746094, -23.76286506652832, -22.972362518310547, -22.181861877441406, -21.391359329223633, -20.60085678100586, -19.81035614013672, -19.019853591918945, -18.229351043701172, -17.4388484954834, -16.648345947265625, -15.857845306396484, -15.067342758178711, -14.276840209960938, -13.48633861541748, -12.695837020874023, -11.90533447265625, -11.114831924438477, -10.32433032989502, -9.533828735351562, -8.743326187133789, -7.952824115753174, -7.162322044372559, -6.371819972991943, -5.581317901611328, -4.790815830230713, -4.000313758850098, -3.2098116874694824, -2.419309616088867, -1.628807544708252, -0.8383054733276367, -0.047803401947021484, 0.7426986694335938, 1.533200740814209, 2.323702812194824, 3.1142048835754395, 3.9047069549560547, 4.69520902633667, 5.485711097717285, 6.2762131690979, 7.066715240478516, 7.857217311859131, 8.647719383239746, 9.438220977783203, 10.228723526000977, 11.01922607421875, 11.809727668762207, 12.600229263305664, 13.390731811523438, 14.181234359741211, 14.971735954284668, 15.762237548828125, 16.5527400970459, 17.343242645263672, 18.133743286132812, 18.924245834350586, 19.71474838256836, 20.505250930786133, 21.295753479003906, 22.086254119873047, 22.87675666809082, 23.667259216308594, 24.457759857177734, 25.248262405395508, 26.03876495361328]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 9.0, 16.0, 17.0, 20.0, 28.0, 43.0, 52.0, 74.0, 80.0, 115.0, 176.0, 223.0, 296.0, 397.0, 578.0, 831.0, 1318.0, 2031.0, 3015.0, 4913.0, 8477.0, 17031.0, 44282.0, 210940.0, 588909.0, 103831.0, 29265.0, 12650.0, 7018.0, 3999.0, 2609.0, 1619.0, 1074.0, 737.0, 516.0, 386.0, 239.0, 166.0, 132.0, 103.0, 96.0, 61.0, 51.0, 37.0, 25.0, 22.0, 18.0, 9.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.14453125, -5.954345703125, -5.76416015625, -5.573974609375, -5.3837890625, -5.193603515625, -5.00341796875, -4.813232421875, -4.623046875, -4.432861328125, -4.24267578125, -4.052490234375, -3.8623046875, -3.672119140625, -3.48193359375, -3.291748046875, -3.1015625, -2.911376953125, -2.72119140625, -2.531005859375, -2.3408203125, -2.150634765625, -1.96044921875, -1.770263671875, -1.580078125, -1.389892578125, -1.19970703125, -1.009521484375, -0.8193359375, -0.629150390625, -0.43896484375, -0.248779296875, -0.05859375, 0.131591796875, 0.32177734375, 0.511962890625, 0.7021484375, 0.892333984375, 1.08251953125, 1.272705078125, 1.462890625, 1.653076171875, 1.84326171875, 2.033447265625, 2.2236328125, 2.413818359375, 2.60400390625, 2.794189453125, 2.984375, 3.174560546875, 3.36474609375, 3.554931640625, 3.7451171875, 3.935302734375, 4.12548828125, 4.315673828125, 4.505859375, 4.696044921875, 4.88623046875, 5.076416015625, 5.2666015625, 5.456787109375, 5.64697265625, 5.837158203125, 6.02734375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 12.0, 6.0, 8.0, 5.0, 8.0, 18.0, 37.0, 56.0, 93.0, 140.0, 171.0, 152.0, 105.0, 58.0, 30.0, 20.0, 17.0, 11.0, 7.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.748046875, -2.67462158203125, -2.6011962890625, -2.52777099609375, -2.454345703125, -2.38092041015625, -2.3074951171875, -2.23406982421875, -2.16064453125, -2.08721923828125, -2.0137939453125, -1.94036865234375, -1.866943359375, -1.79351806640625, -1.7200927734375, -1.64666748046875, -1.5732421875, -1.49981689453125, -1.4263916015625, -1.35296630859375, -1.279541015625, -1.20611572265625, -1.1326904296875, -1.05926513671875, -0.98583984375, -0.91241455078125, -0.8389892578125, -0.76556396484375, -0.692138671875, -0.61871337890625, -0.5452880859375, -0.47186279296875, -0.3984375, -0.32501220703125, -0.2515869140625, -0.17816162109375, -0.104736328125, -0.03131103515625, 0.0421142578125, 0.11553955078125, 0.18896484375, 0.26239013671875, 0.3358154296875, 0.40924072265625, 0.482666015625, 0.55609130859375, 0.6295166015625, 0.70294189453125, 0.7763671875, 0.84979248046875, 0.9232177734375, 0.99664306640625, 1.070068359375, 1.14349365234375, 1.2169189453125, 1.29034423828125, 1.36376953125, 1.43719482421875, 1.5106201171875, 1.58404541015625, 1.657470703125, 1.73089599609375, 1.8043212890625, 1.87774658203125, 1.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 8.0, 8.0, 14.0, 18.0, 22.0, 27.0, 46.0, 63.0, 116.0, 158.0, 269.0, 456.0, 773.0, 1532.0, 2802.0, 5273.0, 10787.0, 22862.0, 53739.0, 148931.0, 422857.0, 238597.0, 78224.0, 31718.0, 14232.0, 6901.0, 3607.0, 1947.0, 1044.0, 582.0, 354.0, 185.0, 134.0, 66.0, 59.0, 43.0, 28.0, 18.0, 15.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.95703125, -5.77484130859375, -5.5926513671875, -5.41046142578125, -5.228271484375, -5.04608154296875, -4.8638916015625, -4.68170166015625, -4.49951171875, -4.31732177734375, -4.1351318359375, -3.95294189453125, -3.770751953125, -3.58856201171875, -3.4063720703125, -3.22418212890625, -3.0419921875, -2.85980224609375, -2.6776123046875, -2.49542236328125, -2.313232421875, -2.13104248046875, -1.9488525390625, -1.76666259765625, -1.58447265625, -1.40228271484375, -1.2200927734375, -1.03790283203125, -0.855712890625, -0.67352294921875, -0.4913330078125, -0.30914306640625, -0.126953125, 0.05523681640625, 0.2374267578125, 0.41961669921875, 0.601806640625, 0.78399658203125, 0.9661865234375, 1.14837646484375, 1.33056640625, 1.51275634765625, 1.6949462890625, 1.87713623046875, 2.059326171875, 2.24151611328125, 2.4237060546875, 2.60589599609375, 2.7880859375, 2.97027587890625, 3.1524658203125, 3.33465576171875, 3.516845703125, 3.69903564453125, 3.8812255859375, 4.06341552734375, 4.24560546875, 4.42779541015625, 4.6099853515625, 4.79217529296875, 4.974365234375, 5.15655517578125, 5.3387451171875, 5.52093505859375, 5.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 4.0, 9.0, 10.0, 9.0, 7.0, 11.0, 25.0, 19.0, 15.0, 18.0, 27.0, 37.0, 29.0, 34.0, 36.0, 45.0, 38.0, 47.0, 55.0, 58.0, 40.0, 39.0, 53.0, 32.0, 30.0, 31.0, 43.0, 23.0, 36.0, 31.0, 20.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.1761474609375, -7.914794921875, -7.6534423828125, -7.39208984375, -7.1307373046875, -6.869384765625, -6.6080322265625, -6.3466796875, -6.0853271484375, -5.823974609375, -5.5626220703125, -5.30126953125, -5.0399169921875, -4.778564453125, -4.5172119140625, -4.255859375, -3.9945068359375, -3.733154296875, -3.4718017578125, -3.21044921875, -2.9490966796875, -2.687744140625, -2.4263916015625, -2.1650390625, -1.9036865234375, -1.642333984375, -1.3809814453125, -1.11962890625, -0.8582763671875, -0.596923828125, -0.3355712890625, -0.07421875, 0.1871337890625, 0.448486328125, 0.7098388671875, 0.97119140625, 1.2325439453125, 1.493896484375, 1.7552490234375, 2.0166015625, 2.2779541015625, 2.539306640625, 2.8006591796875, 3.06201171875, 3.3233642578125, 3.584716796875, 3.8460693359375, 4.107421875, 4.3687744140625, 4.630126953125, 4.8914794921875, 5.15283203125, 5.4141845703125, 5.675537109375, 5.9368896484375, 6.1982421875, 6.4595947265625, 6.720947265625, 6.9822998046875, 7.24365234375, 7.5050048828125, 7.766357421875, 8.0277099609375, 8.2890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 11.0, 6.0, 13.0, 19.0, 22.0, 31.0, 74.0, 126.0, 290.0, 841.0, 2939.0, 16283.0, 310297.0, 683451.0, 27826.0, 4428.0, 1116.0, 370.0, 173.0, 72.0, 59.0, 25.0, 20.0, 9.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 7.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-17.765625, -17.3228759765625, -16.880126953125, -16.4373779296875, -15.99462890625, -15.5518798828125, -15.109130859375, -14.6663818359375, -14.2236328125, -13.7808837890625, -13.338134765625, -12.8953857421875, -12.45263671875, -12.0098876953125, -11.567138671875, -11.1243896484375, -10.681640625, -10.2388916015625, -9.796142578125, -9.3533935546875, -8.91064453125, -8.4678955078125, -8.025146484375, -7.5823974609375, -7.1396484375, -6.6968994140625, -6.254150390625, -5.8114013671875, -5.36865234375, -4.9259033203125, -4.483154296875, -4.0404052734375, -3.59765625, -3.1549072265625, -2.712158203125, -2.2694091796875, -1.82666015625, -1.3839111328125, -0.941162109375, -0.4984130859375, -0.0556640625, 0.3870849609375, 0.829833984375, 1.2725830078125, 1.71533203125, 2.1580810546875, 2.600830078125, 3.0435791015625, 3.486328125, 3.9290771484375, 4.371826171875, 4.8145751953125, 5.25732421875, 5.7000732421875, 6.142822265625, 6.5855712890625, 7.0283203125, 7.4710693359375, 7.913818359375, 8.3565673828125, 8.79931640625, 9.2420654296875, 9.684814453125, 10.1275634765625, 10.5703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 15.0, 14.0, 12.0, 22.0, 37.0, 38.0, 41.0, 53.0, 48.0, 73.0, 78.0, 74.0, 54.0, 68.0, 58.0, 57.0, 34.0, 40.0, 35.0, 23.0, 25.0, 11.0, 16.0, 12.0, 6.0, 6.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002601146697998047, -0.0002533774822950363, -0.00024664029479026794, -0.00023990310728549957, -0.0002331659197807312, -0.00022642873227596283, -0.00021969154477119446, -0.00021295435726642609, -0.00020621716976165771, -0.00019947998225688934, -0.00019274279475212097, -0.0001860056072473526, -0.00017926841974258423, -0.00017253123223781586, -0.00016579404473304749, -0.00015905685722827911, -0.00015231966972351074, -0.00014558248221874237, -0.000138845294713974, -0.00013210810720920563, -0.00012537091970443726, -0.00011863373219966888, -0.00011189654469490051, -0.00010515935719013214, -9.842216968536377e-05, -9.16849821805954e-05, -8.494779467582703e-05, -7.821060717105865e-05, -7.147341966629028e-05, -6.473623216152191e-05, -5.799904465675354e-05, -5.126185715198517e-05, -4.45246696472168e-05, -3.7787482142448425e-05, -3.1050294637680054e-05, -2.4313107132911682e-05, -1.757591962814331e-05, -1.0838732123374939e-05, -4.101544618606567e-06, 2.635642886161804e-06, 9.372830390930176e-06, 1.6110017895698547e-05, 2.284720540046692e-05, 2.958439290523529e-05, 3.632158041000366e-05, 4.3058767914772034e-05, 4.9795955419540405e-05, 5.653314292430878e-05, 6.327033042907715e-05, 7.000751793384552e-05, 7.674470543861389e-05, 8.348189294338226e-05, 9.021908044815063e-05, 9.6956267952919e-05, 0.00010369345545768738, 0.00011043064296245575, 0.00011716783046722412, 0.0001239050179719925, 0.00013064220547676086, 0.00013737939298152924, 0.0001441165804862976, 0.00015085376799106598, 0.00015759095549583435, 0.00016432814300060272, 0.0001710653305053711]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 9.0, 16.0, 18.0, 42.0, 57.0, 135.0, 208.0, 425.0, 954.0, 2160.0, 6407.0, 24009.0, 155704.0, 688232.0, 138121.0, 22180.0, 6036.0, 2037.0, 886.0, 418.0, 181.0, 119.0, 68.0, 32.0, 27.0, 23.0, 17.0, 10.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.0859375, -10.79779052734375, -10.5096435546875, -10.22149658203125, -9.933349609375, -9.64520263671875, -9.3570556640625, -9.06890869140625, -8.78076171875, -8.49261474609375, -8.2044677734375, -7.91632080078125, -7.628173828125, -7.34002685546875, -7.0518798828125, -6.76373291015625, -6.4755859375, -6.18743896484375, -5.8992919921875, -5.61114501953125, -5.322998046875, -5.03485107421875, -4.7467041015625, -4.45855712890625, -4.17041015625, -3.88226318359375, -3.5941162109375, -3.30596923828125, -3.017822265625, -2.72967529296875, -2.4415283203125, -2.15338134765625, -1.865234375, -1.57708740234375, -1.2889404296875, -1.00079345703125, -0.712646484375, -0.42449951171875, -0.1363525390625, 0.15179443359375, 0.43994140625, 0.72808837890625, 1.0162353515625, 1.30438232421875, 1.592529296875, 1.88067626953125, 2.1688232421875, 2.45697021484375, 2.7451171875, 3.03326416015625, 3.3214111328125, 3.60955810546875, 3.897705078125, 4.18585205078125, 4.4739990234375, 4.76214599609375, 5.05029296875, 5.33843994140625, 5.6265869140625, 5.91473388671875, 6.202880859375, 6.49102783203125, 6.7791748046875, 7.06732177734375, 7.35546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 7.0, 11.0, 2.0, 6.0, 15.0, 20.0, 16.0, 35.0, 41.0, 47.0, 54.0, 65.0, 72.0, 83.0, 82.0, 71.0, 88.0, 64.0, 37.0, 38.0, 32.0, 32.0, 18.0, 18.0, 12.0, 9.0, 5.0, 4.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.22918701171875, -4.0638427734375, -3.89849853515625, -3.733154296875, -3.56781005859375, -3.4024658203125, -3.23712158203125, -3.07177734375, -2.90643310546875, -2.7410888671875, -2.57574462890625, -2.410400390625, -2.24505615234375, -2.0797119140625, -1.91436767578125, -1.7490234375, -1.58367919921875, -1.4183349609375, -1.25299072265625, -1.087646484375, -0.92230224609375, -0.7569580078125, -0.59161376953125, -0.42626953125, -0.26092529296875, -0.0955810546875, 0.06976318359375, 0.235107421875, 0.40045166015625, 0.5657958984375, 0.73114013671875, 0.896484375, 1.06182861328125, 1.2271728515625, 1.39251708984375, 1.557861328125, 1.72320556640625, 1.8885498046875, 2.05389404296875, 2.21923828125, 2.38458251953125, 2.5499267578125, 2.71527099609375, 2.880615234375, 3.04595947265625, 3.2113037109375, 3.37664794921875, 3.5419921875, 3.70733642578125, 3.8726806640625, 4.03802490234375, 4.203369140625, 4.36871337890625, 4.5340576171875, 4.69940185546875, 4.86474609375, 5.03009033203125, 5.1954345703125, 5.36077880859375, 5.526123046875, 5.69146728515625, 5.8568115234375, 6.02215576171875, 6.1875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 10.0, 20.0, 84.0, 518.0, 298.0, 49.0, 11.0, 10.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-295.17803955078125, -286.9461364746094, -278.7142028808594, -270.4822998046875, -262.2503662109375, -254.01844787597656, -245.78652954101562, -237.55462646484375, -229.32269287109375, -221.0907745361328, -212.85885620117188, -204.62693786621094, -196.39501953125, -188.16310119628906, -179.93118286132812, -171.69927978515625, -163.4673614501953, -155.23544311523438, -147.00352478027344, -138.7716064453125, -130.53968811035156, -122.30776977539062, -114.07585906982422, -105.84394073486328, -97.61202239990234, -89.3801040649414, -81.14818572998047, -72.91627502441406, -64.68435668945312, -56.45243453979492, -48.22052001953125, -39.98860168457031, -31.756698608398438, -23.5247802734375, -15.292863845825195, -7.060947418212891, 1.1709709167480469, 9.402889251708984, 17.634803771972656, 25.866722106933594, 34.09864044189453, 42.33055877685547, 50.562477111816406, 58.79439163208008, 67.02630615234375, 75.25822448730469, 83.49014282226562, 91.72206115722656, 99.9539794921875, 108.18589782714844, 116.41781616210938, 124.64973449707031, 132.88165283203125, 141.1135711669922, 149.34548950195312, 157.577392578125, 165.809326171875, 174.04124450683594, 182.27316284179688, 190.5050811767578, 198.73699951171875, 206.9689178466797, 215.20083618164062, 223.4327392578125, 231.66465759277344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 9.0, 13.0, 9.0, 22.0, 27.0, 55.0, 66.0, 85.0, 129.0, 133.0, 111.0, 98.0, 62.0, 47.0, 25.0, 22.0, 7.0, 12.0, 6.0, 6.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-128.66307067871094, -124.70231628417969, -120.74156188964844, -116.78080749511719, -112.82006072998047, -108.85930633544922, -104.89855194091797, -100.93779754638672, -96.97705078125, -93.01629638671875, -89.0555419921875, -85.09478759765625, -81.13404083251953, -77.17328643798828, -73.21253204345703, -69.25177764892578, -65.29102325439453, -61.33026885986328, -57.3695182800293, -53.40876388549805, -49.44801330566406, -45.48725891113281, -41.52650451660156, -37.56575012207031, -33.60499954223633, -29.64424705505371, -25.683494567871094, -21.722740173339844, -17.761987686157227, -13.80123519897461, -9.84048080444336, -5.879728317260742, -1.918975830078125, 2.0417771339416504, 6.002530097961426, 9.96328353881836, 13.924036026000977, 17.884788513183594, 21.845542907714844, 25.80629539489746, 29.767047882080078, 33.72780227661133, 37.68855285644531, 41.64930725097656, 45.61006164550781, 49.5708122253418, 53.53156661987305, 57.49231719970703, 61.45307159423828, 65.41382598876953, 69.37458038330078, 73.3353271484375, 77.29608154296875, 81.2568359375, 85.21759033203125, 89.1783447265625, 93.13909912109375, 97.099853515625, 101.06060791015625, 105.0213623046875, 108.98210906982422, 112.94286346435547, 116.90361785888672, 120.86437225341797, 124.82511901855469]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 15.0, 17.0, 27.0, 40.0, 52.0, 99.0, 247.0, 551.0, 1181.0, 3166.0, 10961.0, 78101.0, 3971843.0, 111784.0, 11549.0, 2906.0, 993.0, 354.0, 184.0, 83.0, 45.0, 15.0, 12.0, 13.0, 6.0, 3.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.6875, -52.21875, -50.75, -49.28125, -47.8125, -46.34375, -44.875, -43.40625, -41.9375, -40.46875, -39.0, -37.53125, -36.0625, -34.59375, -33.125, -31.65625, -30.1875, -28.71875, -27.25, -25.78125, -24.3125, -22.84375, -21.375, -19.90625, -18.4375, -16.96875, -15.5, -14.03125, -12.5625, -11.09375, -9.625, -8.15625, -6.6875, -5.21875, -3.75, -2.28125, -0.8125, 0.65625, 2.125, 3.59375, 5.0625, 6.53125, 8.0, 9.46875, 10.9375, 12.40625, 13.875, 15.34375, 16.8125, 18.28125, 19.75, 21.21875, 22.6875, 24.15625, 25.625, 27.09375, 28.5625, 30.03125, 31.5, 32.96875, 34.4375, 35.90625, 37.375, 38.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 7.0, 8.0, 15.0, 32.0, 48.0, 54.0, 83.0, 123.0, 135.0, 114.0, 103.0, 67.0, 59.0, 27.0, 15.0, 17.0, 10.0, 7.0, 7.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.412109375, -2.347686767578125, -2.28326416015625, -2.218841552734375, -2.1544189453125, -2.089996337890625, -2.02557373046875, -1.961151123046875, -1.896728515625, -1.832305908203125, -1.76788330078125, -1.703460693359375, -1.6390380859375, -1.574615478515625, -1.51019287109375, -1.445770263671875, -1.38134765625, -1.316925048828125, -1.25250244140625, -1.188079833984375, -1.1236572265625, -1.059234619140625, -0.99481201171875, -0.930389404296875, -0.865966796875, -0.801544189453125, -0.73712158203125, -0.672698974609375, -0.6082763671875, -0.543853759765625, -0.47943115234375, -0.415008544921875, -0.3505859375, -0.286163330078125, -0.22174072265625, -0.157318115234375, -0.0928955078125, -0.028472900390625, 0.03594970703125, 0.100372314453125, 0.164794921875, 0.229217529296875, 0.29364013671875, 0.358062744140625, 0.4224853515625, 0.486907958984375, 0.55133056640625, 0.615753173828125, 0.68017578125, 0.744598388671875, 0.80902099609375, 0.873443603515625, 0.9378662109375, 1.002288818359375, 1.06671142578125, 1.131134033203125, 1.195556640625, 1.259979248046875, 1.32440185546875, 1.388824462890625, 1.4532470703125, 1.517669677734375, 1.58209228515625, 1.646514892578125, 1.7109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 10.0, 5.0, 7.0, 14.0, 21.0, 39.0, 46.0, 92.0, 147.0, 299.0, 560.0, 1151.0, 2689.0, 7132.0, 25024.0, 130501.0, 2371462.0, 1508711.0, 112021.0, 22554.0, 6824.0, 2618.0, 1126.0, 535.0, 298.0, 164.0, 84.0, 48.0, 33.0, 11.0, 21.0, 6.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.53125, -17.868408203125, -17.20556640625, -16.542724609375, -15.8798828125, -15.217041015625, -14.55419921875, -13.891357421875, -13.228515625, -12.565673828125, -11.90283203125, -11.239990234375, -10.5771484375, -9.914306640625, -9.25146484375, -8.588623046875, -7.92578125, -7.262939453125, -6.60009765625, -5.937255859375, -5.2744140625, -4.611572265625, -3.94873046875, -3.285888671875, -2.623046875, -1.960205078125, -1.29736328125, -0.634521484375, 0.0283203125, 0.691162109375, 1.35400390625, 2.016845703125, 2.6796875, 3.342529296875, 4.00537109375, 4.668212890625, 5.3310546875, 5.993896484375, 6.65673828125, 7.319580078125, 7.982421875, 8.645263671875, 9.30810546875, 9.970947265625, 10.6337890625, 11.296630859375, 11.95947265625, 12.622314453125, 13.28515625, 13.947998046875, 14.61083984375, 15.273681640625, 15.9365234375, 16.599365234375, 17.26220703125, 17.925048828125, 18.587890625, 19.250732421875, 19.91357421875, 20.576416015625, 21.2392578125, 21.902099609375, 22.56494140625, 23.227783203125, 23.890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 18.0, 16.0, 26.0, 43.0, 63.0, 112.0, 159.0, 310.0, 539.0, 1380.0, 594.0, 274.0, 180.0, 94.0, 70.0, 51.0, 30.0, 20.0, 15.0, 20.0, 7.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.126953125, -3.0208740234375, -2.914794921875, -2.8087158203125, -2.70263671875, -2.5965576171875, -2.490478515625, -2.3843994140625, -2.2783203125, -2.1722412109375, -2.066162109375, -1.9600830078125, -1.85400390625, -1.7479248046875, -1.641845703125, -1.5357666015625, -1.4296875, -1.3236083984375, -1.217529296875, -1.1114501953125, -1.00537109375, -0.8992919921875, -0.793212890625, -0.6871337890625, -0.5810546875, -0.4749755859375, -0.368896484375, -0.2628173828125, -0.15673828125, -0.0506591796875, 0.055419921875, 0.1614990234375, 0.267578125, 0.3736572265625, 0.479736328125, 0.5858154296875, 0.69189453125, 0.7979736328125, 0.904052734375, 1.0101318359375, 1.1162109375, 1.2222900390625, 1.328369140625, 1.4344482421875, 1.54052734375, 1.6466064453125, 1.752685546875, 1.8587646484375, 1.96484375, 2.0709228515625, 2.177001953125, 2.2830810546875, 2.38916015625, 2.4952392578125, 2.601318359375, 2.7073974609375, 2.8134765625, 2.9195556640625, 3.025634765625, 3.1317138671875, 3.23779296875, 3.3438720703125, 3.449951171875, 3.5560302734375, 3.662109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 11.0, 28.0, 70.0, 164.0, 259.0, 257.0, 122.0, 46.0, 18.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.38623046875, -34.19475173950195, -33.00327682495117, -31.811798095703125, -30.62032127380371, -29.428844451904297, -28.23736572265625, -27.045888900756836, -25.854412078857422, -24.662935256958008, -23.471458435058594, -22.279979705810547, -21.088502883911133, -19.89702606201172, -18.705547332763672, -17.514070510864258, -16.322593688964844, -15.13111686706543, -13.9396390914917, -12.748161315917969, -11.556684494018555, -10.36520767211914, -9.17372989654541, -7.98225212097168, -6.790775299072266, -5.599298000335693, -4.407820701599121, -3.216343402862549, -2.0248661041259766, -0.8333888053894043, 0.35808849334716797, 1.5495662689208984, 2.741039276123047, 3.932516574859619, 5.123993873596191, 6.315471172332764, 7.506948471069336, 8.69842529296875, 9.88990306854248, 11.081380844116211, 12.272857666015625, 13.464334487915039, 14.65581226348877, 15.8472900390625, 17.038766860961914, 18.230243682861328, 19.421722412109375, 20.61319923400879, 21.804676055908203, 22.996152877807617, 24.18762969970703, 25.379108428955078, 26.570585250854492, 27.762062072753906, 28.953540802001953, 30.145017623901367, 31.33649444580078, 32.52797317504883, 33.71944808959961, 34.910926818847656, 36.10240173339844, 37.293880462646484, 38.48535919189453, 39.67683410644531, 40.86831283569336]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 11.0, 22.0, 22.0, 35.0, 64.0, 43.0, 70.0, 70.0, 92.0, 69.0, 89.0, 88.0, 58.0, 56.0, 45.0, 40.0, 31.0, 24.0, 15.0, 7.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-21.577701568603516, -20.988906860351562, -20.400110244750977, -19.81131362915039, -19.222518920898438, -18.633724212646484, -18.0449275970459, -17.456130981445312, -16.86733627319336, -16.278541564941406, -15.68974494934082, -15.10094928741455, -14.512153625488281, -13.923357963562012, -13.334562301635742, -12.745766639709473, -12.156970977783203, -11.568175315856934, -10.979379653930664, -10.390583992004395, -9.801788330078125, -9.212992668151855, -8.624197006225586, -8.035401344299316, -7.446605682373047, -6.857810020446777, -6.269014358520508, -5.680218696594238, -5.091423034667969, -4.502627372741699, -3.9138317108154297, -3.32503604888916, -2.736238479614258, -2.1474428176879883, -1.5586471557617188, -0.9698514938354492, -0.3810558319091797, 0.20773983001708984, 0.7965354919433594, 1.385331153869629, 1.9741268157958984, 2.562922477722168, 3.1517181396484375, 3.740513801574707, 4.329309463500977, 4.918105125427246, 5.506900787353516, 6.095696449279785, 6.684492111206055, 7.273287773132324, 7.862083435058594, 8.450879096984863, 9.039674758911133, 9.628470420837402, 10.217266082763672, 10.806061744689941, 11.394857406616211, 11.98365306854248, 12.57244873046875, 13.16124439239502, 13.750040054321289, 14.338835716247559, 14.927631378173828, 15.516427040100098, 16.105222702026367]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 5.0, 11.0, 16.0, 29.0, 44.0, 81.0, 146.0, 194.0, 387.0, 659.0, 1400.0, 3454.0, 9922.0, 40703.0, 393430.0, 528203.0, 51022.0, 11532.0, 3912.0, 1495.0, 753.0, 408.0, 221.0, 175.0, 106.0, 73.0, 55.0, 29.0, 19.0, 18.0, 10.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.578125, -20.925537109375, -20.27294921875, -19.620361328125, -18.9677734375, -18.315185546875, -17.66259765625, -17.010009765625, -16.357421875, -15.704833984375, -15.05224609375, -14.399658203125, -13.7470703125, -13.094482421875, -12.44189453125, -11.789306640625, -11.13671875, -10.484130859375, -9.83154296875, -9.178955078125, -8.5263671875, -7.873779296875, -7.22119140625, -6.568603515625, -5.916015625, -5.263427734375, -4.61083984375, -3.958251953125, -3.3056640625, -2.653076171875, -2.00048828125, -1.347900390625, -0.6953125, -0.042724609375, 0.60986328125, 1.262451171875, 1.9150390625, 2.567626953125, 3.22021484375, 3.872802734375, 4.525390625, 5.177978515625, 5.83056640625, 6.483154296875, 7.1357421875, 7.788330078125, 8.44091796875, 9.093505859375, 9.74609375, 10.398681640625, 11.05126953125, 11.703857421875, 12.3564453125, 13.009033203125, 13.66162109375, 14.314208984375, 14.966796875, 15.619384765625, 16.27197265625, 16.924560546875, 17.5771484375, 18.229736328125, 18.88232421875, 19.534912109375, 20.1875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 6.0, 6.0, 1.0, 11.0, 20.0, 25.0, 31.0, 42.0, 78.0, 96.0, 109.0, 149.0, 105.0, 89.0, 65.0, 46.0, 29.0, 15.0, 16.0, 11.0, 9.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.86328125, -2.79840087890625, -2.7335205078125, -2.66864013671875, -2.603759765625, -2.53887939453125, -2.4739990234375, -2.40911865234375, -2.34423828125, -2.27935791015625, -2.2144775390625, -2.14959716796875, -2.084716796875, -2.01983642578125, -1.9549560546875, -1.89007568359375, -1.8251953125, -1.76031494140625, -1.6954345703125, -1.63055419921875, -1.565673828125, -1.50079345703125, -1.4359130859375, -1.37103271484375, -1.30615234375, -1.24127197265625, -1.1763916015625, -1.11151123046875, -1.046630859375, -0.98175048828125, -0.9168701171875, -0.85198974609375, -0.787109375, -0.72222900390625, -0.6573486328125, -0.59246826171875, -0.527587890625, -0.46270751953125, -0.3978271484375, -0.33294677734375, -0.26806640625, -0.20318603515625, -0.1383056640625, -0.07342529296875, -0.008544921875, 0.05633544921875, 0.1212158203125, 0.18609619140625, 0.2509765625, 0.31585693359375, 0.3807373046875, 0.44561767578125, 0.510498046875, 0.57537841796875, 0.6402587890625, 0.70513916015625, 0.77001953125, 0.83489990234375, 0.8997802734375, 0.96466064453125, 1.029541015625, 1.09442138671875, 1.1593017578125, 1.22418212890625, 1.2890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 11.0, 10.0, 17.0, 29.0, 36.0, 74.0, 88.0, 145.0, 242.0, 403.0, 691.0, 1445.0, 2993.0, 6926.0, 17842.0, 54122.0, 208733.0, 504358.0, 174221.0, 47506.0, 16354.0, 6302.0, 2787.0, 1408.0, 752.0, 383.0, 245.0, 134.0, 84.0, 65.0, 28.0, 23.0, 19.0, 25.0, 11.0, 6.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.09716796875, -8.7880859375, -8.47900390625, -8.169921875, -7.86083984375, -7.5517578125, -7.24267578125, -6.93359375, -6.62451171875, -6.3154296875, -6.00634765625, -5.697265625, -5.38818359375, -5.0791015625, -4.77001953125, -4.4609375, -4.15185546875, -3.8427734375, -3.53369140625, -3.224609375, -2.91552734375, -2.6064453125, -2.29736328125, -1.98828125, -1.67919921875, -1.3701171875, -1.06103515625, -0.751953125, -0.44287109375, -0.1337890625, 0.17529296875, 0.484375, 0.79345703125, 1.1025390625, 1.41162109375, 1.720703125, 2.02978515625, 2.3388671875, 2.64794921875, 2.95703125, 3.26611328125, 3.5751953125, 3.88427734375, 4.193359375, 4.50244140625, 4.8115234375, 5.12060546875, 5.4296875, 5.73876953125, 6.0478515625, 6.35693359375, 6.666015625, 6.97509765625, 7.2841796875, 7.59326171875, 7.90234375, 8.21142578125, 8.5205078125, 8.82958984375, 9.138671875, 9.44775390625, 9.7568359375, 10.06591796875, 10.375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 9.0, 12.0, 14.0, 20.0, 16.0, 42.0, 26.0, 47.0, 60.0, 67.0, 59.0, 57.0, 59.0, 64.0, 69.0, 47.0, 56.0, 63.0, 52.0, 41.0, 17.0, 31.0, 23.0, 5.0, 9.0, 10.0, 5.0, 4.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.486083984375, -8.19091796875, -7.895751953125, -7.6005859375, -7.305419921875, -7.01025390625, -6.715087890625, -6.419921875, -6.124755859375, -5.82958984375, -5.534423828125, -5.2392578125, -4.944091796875, -4.64892578125, -4.353759765625, -4.05859375, -3.763427734375, -3.46826171875, -3.173095703125, -2.8779296875, -2.582763671875, -2.28759765625, -1.992431640625, -1.697265625, -1.402099609375, -1.10693359375, -0.811767578125, -0.5166015625, -0.221435546875, 0.07373046875, 0.368896484375, 0.6640625, 0.959228515625, 1.25439453125, 1.549560546875, 1.8447265625, 2.139892578125, 2.43505859375, 2.730224609375, 3.025390625, 3.320556640625, 3.61572265625, 3.910888671875, 4.2060546875, 4.501220703125, 4.79638671875, 5.091552734375, 5.38671875, 5.681884765625, 5.97705078125, 6.272216796875, 6.5673828125, 6.862548828125, 7.15771484375, 7.452880859375, 7.748046875, 8.043212890625, 8.33837890625, 8.633544921875, 8.9287109375, 9.223876953125, 9.51904296875, 9.814208984375, 10.109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 10.0, 16.0, 13.0, 23.0, 65.0, 107.0, 267.0, 942.0, 5141.0, 91816.0, 910216.0, 35800.0, 3027.0, 696.0, 236.0, 78.0, 44.0, 26.0, 13.0, 12.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.09375, -48.75341796875, -47.4130859375, -46.07275390625, -44.732421875, -43.39208984375, -42.0517578125, -40.71142578125, -39.37109375, -38.03076171875, -36.6904296875, -35.35009765625, -34.009765625, -32.66943359375, -31.3291015625, -29.98876953125, -28.6484375, -27.30810546875, -25.9677734375, -24.62744140625, -23.287109375, -21.94677734375, -20.6064453125, -19.26611328125, -17.92578125, -16.58544921875, -15.2451171875, -13.90478515625, -12.564453125, -11.22412109375, -9.8837890625, -8.54345703125, -7.203125, -5.86279296875, -4.5224609375, -3.18212890625, -1.841796875, -0.50146484375, 0.8388671875, 2.17919921875, 3.51953125, 4.85986328125, 6.2001953125, 7.54052734375, 8.880859375, 10.22119140625, 11.5615234375, 12.90185546875, 14.2421875, 15.58251953125, 16.9228515625, 18.26318359375, 19.603515625, 20.94384765625, 22.2841796875, 23.62451171875, 24.96484375, 26.30517578125, 27.6455078125, 28.98583984375, 30.326171875, 31.66650390625, 33.0068359375, 34.34716796875, 35.6875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 7.0, 23.0, 45.0, 85.0, 104.0, 143.0, 162.0, 144.0, 81.0, 58.0, 35.0, 27.0, 11.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013637542724609375, -0.001328207552433014, -0.0012926608324050903, -0.0012571141123771667, -0.0012215673923492432, -0.0011860206723213196, -0.001150473952293396, -0.0011149272322654724, -0.0010793805122375488, -0.0010438337922096252, -0.0010082870721817017, -0.0009727403521537781, -0.0009371936321258545, -0.0009016469120979309, -0.0008661001920700073, -0.0008305534720420837, -0.0007950067520141602, -0.0007594600319862366, -0.000723913311958313, -0.0006883665919303894, -0.0006528198719024658, -0.0006172731518745422, -0.0005817264318466187, -0.0005461797118186951, -0.0005106329917907715, -0.0004750862717628479, -0.0004395395517349243, -0.00040399283170700073, -0.00036844611167907715, -0.00033289939165115356, -0.00029735267162323, -0.0002618059515953064, -0.0002262592315673828, -0.00019071251153945923, -0.00015516579151153564, -0.00011961907148361206, -8.407235145568848e-05, -4.852563142776489e-05, -1.2978911399841309e-05, 2.2567808628082275e-05, 5.811452865600586e-05, 9.366124868392944e-05, 0.00012920796871185303, 0.0001647546887397766, 0.0002003014087677002, 0.00023584812879562378, 0.00027139484882354736, 0.00030694156885147095, 0.00034248828887939453, 0.0003780350089073181, 0.0004135817289352417, 0.0004491284489631653, 0.00048467516899108887, 0.0005202218890190125, 0.000555768609046936, 0.0005913153290748596, 0.0006268620491027832, 0.0006624087691307068, 0.0006979554891586304, 0.000733502209186554, 0.0007690489292144775, 0.0008045956492424011, 0.0008401423692703247, 0.0008756890892982483, 0.0009112358093261719]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 16.0, 24.0, 30.0, 63.0, 104.0, 166.0, 335.0, 885.0, 2468.0, 9451.0, 54211.0, 511893.0, 414725.0, 42821.0, 7759.0, 2204.0, 741.0, 294.0, 150.0, 83.0, 44.0, 31.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.078369140625, -19.35986328125, -18.641357421875, -17.9228515625, -17.204345703125, -16.48583984375, -15.767333984375, -15.048828125, -14.330322265625, -13.61181640625, -12.893310546875, -12.1748046875, -11.456298828125, -10.73779296875, -10.019287109375, -9.30078125, -8.582275390625, -7.86376953125, -7.145263671875, -6.4267578125, -5.708251953125, -4.98974609375, -4.271240234375, -3.552734375, -2.834228515625, -2.11572265625, -1.397216796875, -0.6787109375, 0.039794921875, 0.75830078125, 1.476806640625, 2.1953125, 2.913818359375, 3.63232421875, 4.350830078125, 5.0693359375, 5.787841796875, 6.50634765625, 7.224853515625, 7.943359375, 8.661865234375, 9.38037109375, 10.098876953125, 10.8173828125, 11.535888671875, 12.25439453125, 12.972900390625, 13.69140625, 14.409912109375, 15.12841796875, 15.846923828125, 16.5654296875, 17.283935546875, 18.00244140625, 18.720947265625, 19.439453125, 20.157958984375, 20.87646484375, 21.594970703125, 22.3134765625, 23.031982421875, 23.75048828125, 24.468994140625, 25.1875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 17.0, 32.0, 28.0, 47.0, 63.0, 70.0, 109.0, 151.0, 126.0, 107.0, 71.0, 46.0, 37.0, 24.0, 15.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.7166748046875, -17.292724609375, -16.8687744140625, -16.44482421875, -16.0208740234375, -15.596923828125, -15.1729736328125, -14.7490234375, -14.3250732421875, -13.901123046875, -13.4771728515625, -13.05322265625, -12.6292724609375, -12.205322265625, -11.7813720703125, -11.357421875, -10.9334716796875, -10.509521484375, -10.0855712890625, -9.66162109375, -9.2376708984375, -8.813720703125, -8.3897705078125, -7.9658203125, -7.5418701171875, -7.117919921875, -6.6939697265625, -6.27001953125, -5.8460693359375, -5.422119140625, -4.9981689453125, -4.57421875, -4.1502685546875, -3.726318359375, -3.3023681640625, -2.87841796875, -2.4544677734375, -2.030517578125, -1.6065673828125, -1.1826171875, -0.7586669921875, -0.334716796875, 0.0892333984375, 0.51318359375, 0.9371337890625, 1.361083984375, 1.7850341796875, 2.208984375, 2.6329345703125, 3.056884765625, 3.4808349609375, 3.90478515625, 4.3287353515625, 4.752685546875, 5.1766357421875, 5.6005859375, 6.0245361328125, 6.448486328125, 6.8724365234375, 7.29638671875, 7.7203369140625, 8.144287109375, 8.5682373046875, 8.9921875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 15.0, 35.0, 100.0, 225.0, 281.0, 179.0, 85.0, 39.0, 13.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.6260528564453, -127.67518615722656, -123.72432708740234, -119.7734603881836, -115.82260131835938, -111.87173461914062, -107.92086791992188, -103.97000885009766, -100.0191421508789, -96.06827545166016, -92.11741638183594, -88.16654968261719, -84.21569061279297, -80.26482391357422, -76.31396484375, -72.36309814453125, -68.4122314453125, -64.46136474609375, -60.51050567626953, -56.55963897705078, -52.6087760925293, -48.65791320800781, -44.70705032348633, -40.756187438964844, -36.805328369140625, -32.85446548461914, -28.903600692749023, -24.95273780822754, -21.001873016357422, -17.051010131835938, -13.100147247314453, -9.149282455444336, -5.198417663574219, -1.247554063796997, 2.7033095359802246, 6.654172897338867, 10.605036735534668, 14.555900573730469, 18.506763458251953, 22.45762825012207, 26.408491134643555, 30.35935401916504, 34.310218811035156, 38.26108169555664, 42.211944580078125, 46.162811279296875, 50.113670349121094, 54.064537048339844, 58.01539993286133, 61.96626281738281, 65.91712951660156, 69.86798858642578, 73.81885528564453, 77.76971435546875, 81.7205810546875, 85.67144775390625, 89.62230682373047, 93.57317352294922, 97.52403259277344, 101.47489929199219, 105.4257583618164, 109.37662506103516, 113.32748413085938, 117.27835083007812, 121.22921752929688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 7.0, 13.0, 20.0, 19.0, 31.0, 36.0, 62.0, 56.0, 60.0, 76.0, 78.0, 78.0, 86.0, 86.0, 80.0, 42.0, 36.0, 19.0, 22.0, 21.0, 13.0, 14.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.03410339355469, -73.37730407714844, -70.72050476074219, -68.0636978149414, -65.40689849853516, -62.750099182128906, -60.093299865722656, -57.43649673461914, -54.779693603515625, -52.122894287109375, -49.46609115600586, -46.80929183959961, -44.152488708496094, -41.495689392089844, -38.838890075683594, -36.18208694458008, -33.52528762817383, -30.868486404418945, -28.211685180664062, -25.554885864257812, -22.898082733154297, -20.241283416748047, -17.584482192993164, -14.927680969238281, -12.270879745483398, -9.614078521728516, -6.957277774810791, -4.300477027893066, -1.6436758041381836, 1.0131254196166992, 3.6699256896972656, 6.326726913452148, 8.983528137207031, 11.640329360961914, 14.297130584716797, 16.953929901123047, 19.610733032226562, 22.267532348632812, 24.924333572387695, 27.581134796142578, 30.23793601989746, 32.894737243652344, 35.551536560058594, 38.20833969116211, 40.86513900756836, 43.521942138671875, 46.178741455078125, 48.835540771484375, 51.49234390258789, 54.14914321899414, 56.805946350097656, 59.462745666503906, 62.11954879760742, 64.77635192871094, 67.43315124511719, 70.08995056152344, 72.74674987792969, 75.40354919433594, 78.06034851074219, 80.71715545654297, 83.37395477294922, 86.03075408935547, 88.68755340576172, 91.3443603515625, 94.00115966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 14.0, 15.0, 9.0, 17.0, 19.0, 24.0, 29.0, 34.0, 58.0, 50.0, 65.0, 81.0, 108.0, 148.0, 198.0, 268.0, 402.0, 622.0, 1022.0, 1667.0, 3230.0, 6808.0, 17930.0, 68856.0, 824590.0, 3109400.0, 119175.0, 24694.0, 7918.0, 3383.0, 1620.0, 794.0, 414.0, 232.0, 138.0, 87.0, 53.0, 35.0, 19.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0], "bins": [-41.34375, -40.406982421875, -39.47021484375, -38.533447265625, -37.5966796875, -36.659912109375, -35.72314453125, -34.786376953125, -33.849609375, -32.912841796875, -31.97607421875, -31.039306640625, -30.1025390625, -29.165771484375, -28.22900390625, -27.292236328125, -26.35546875, -25.418701171875, -24.48193359375, -23.545166015625, -22.6083984375, -21.671630859375, -20.73486328125, -19.798095703125, -18.861328125, -17.924560546875, -16.98779296875, -16.051025390625, -15.1142578125, -14.177490234375, -13.24072265625, -12.303955078125, -11.3671875, -10.430419921875, -9.49365234375, -8.556884765625, -7.6201171875, -6.683349609375, -5.74658203125, -4.809814453125, -3.873046875, -2.936279296875, -1.99951171875, -1.062744140625, -0.1259765625, 0.810791015625, 1.74755859375, 2.684326171875, 3.62109375, 4.557861328125, 5.49462890625, 6.431396484375, 7.3681640625, 8.304931640625, 9.24169921875, 10.178466796875, 11.115234375, 12.052001953125, 12.98876953125, 13.925537109375, 14.8623046875, 15.799072265625, 16.73583984375, 17.672607421875, 18.609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 18.0, 9.0, 39.0, 40.0, 53.0, 74.0, 96.0, 116.0, 97.0, 91.0, 72.0, 80.0, 51.0, 28.0, 33.0, 13.0, 23.0, 9.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.76953125, -2.7081451416015625, -2.646759033203125, -2.5853729248046875, -2.52398681640625, -2.4626007080078125, -2.401214599609375, -2.3398284912109375, -2.2784423828125, -2.2170562744140625, -2.155670166015625, -2.0942840576171875, -2.03289794921875, -1.9715118408203125, -1.910125732421875, -1.8487396240234375, -1.787353515625, -1.7259674072265625, -1.664581298828125, -1.6031951904296875, -1.54180908203125, -1.4804229736328125, -1.419036865234375, -1.3576507568359375, -1.2962646484375, -1.2348785400390625, -1.173492431640625, -1.1121063232421875, -1.05072021484375, -0.9893341064453125, -0.927947998046875, -0.8665618896484375, -0.80517578125, -0.7437896728515625, -0.682403564453125, -0.6210174560546875, -0.55963134765625, -0.4982452392578125, -0.436859130859375, -0.3754730224609375, -0.3140869140625, -0.2527008056640625, -0.191314697265625, -0.1299285888671875, -0.06854248046875, -0.0071563720703125, 0.054229736328125, 0.1156158447265625, 0.177001953125, 0.2383880615234375, 0.299774169921875, 0.3611602783203125, 0.42254638671875, 0.4839324951171875, 0.545318603515625, 0.6067047119140625, 0.6680908203125, 0.7294769287109375, 0.790863037109375, 0.8522491455078125, 0.91363525390625, 0.9750213623046875, 1.036407470703125, 1.0977935791015625, 1.1591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 6.0, 6.0, 8.0, 19.0, 11.0, 30.0, 37.0, 55.0, 62.0, 103.0, 193.0, 493.0, 1899.0, 11675.0, 348297.0, 3767097.0, 57874.0, 4699.0, 936.0, 301.0, 143.0, 80.0, 61.0, 44.0, 41.0, 27.0, 11.0, 15.0, 15.0, 6.0, 9.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.0, -47.267578125, -45.53515625, -43.802734375, -42.0703125, -40.337890625, -38.60546875, -36.873046875, -35.140625, -33.408203125, -31.67578125, -29.943359375, -28.2109375, -26.478515625, -24.74609375, -23.013671875, -21.28125, -19.548828125, -17.81640625, -16.083984375, -14.3515625, -12.619140625, -10.88671875, -9.154296875, -7.421875, -5.689453125, -3.95703125, -2.224609375, -0.4921875, 1.240234375, 2.97265625, 4.705078125, 6.4375, 8.169921875, 9.90234375, 11.634765625, 13.3671875, 15.099609375, 16.83203125, 18.564453125, 20.296875, 22.029296875, 23.76171875, 25.494140625, 27.2265625, 28.958984375, 30.69140625, 32.423828125, 34.15625, 35.888671875, 37.62109375, 39.353515625, 41.0859375, 42.818359375, 44.55078125, 46.283203125, 48.015625, 49.748046875, 51.48046875, 53.212890625, 54.9453125, 56.677734375, 58.41015625, 60.142578125, 61.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 8.0, 10.0, 3.0, 12.0, 23.0, 30.0, 42.0, 42.0, 62.0, 81.0, 116.0, 169.0, 236.0, 382.0, 775.0, 806.0, 391.0, 262.0, 180.0, 140.0, 75.0, 59.0, 33.0, 29.0, 27.0, 18.0, 13.0, 6.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.13714599609375, -3.0360107421875, -2.93487548828125, -2.833740234375, -2.73260498046875, -2.6314697265625, -2.53033447265625, -2.42919921875, -2.32806396484375, -2.2269287109375, -2.12579345703125, -2.024658203125, -1.92352294921875, -1.8223876953125, -1.72125244140625, -1.6201171875, -1.51898193359375, -1.4178466796875, -1.31671142578125, -1.215576171875, -1.11444091796875, -1.0133056640625, -0.91217041015625, -0.81103515625, -0.70989990234375, -0.6087646484375, -0.50762939453125, -0.406494140625, -0.30535888671875, -0.2042236328125, -0.10308837890625, -0.001953125, 0.09918212890625, 0.2003173828125, 0.30145263671875, 0.402587890625, 0.50372314453125, 0.6048583984375, 0.70599365234375, 0.80712890625, 0.90826416015625, 1.0093994140625, 1.11053466796875, 1.211669921875, 1.31280517578125, 1.4139404296875, 1.51507568359375, 1.6162109375, 1.71734619140625, 1.8184814453125, 1.91961669921875, 2.020751953125, 2.12188720703125, 2.2230224609375, 2.32415771484375, 2.42529296875, 2.52642822265625, 2.6275634765625, 2.72869873046875, 2.829833984375, 2.93096923828125, 3.0321044921875, 3.13323974609375, 3.234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 1.0, 12.0, 34.0, 43.0, 94.0, 161.0, 186.0, 189.0, 149.0, 78.0, 26.0, 17.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.10785484313965, -21.94831085205078, -20.788766860961914, -19.629222869873047, -18.469680786132812, -17.310136795043945, -16.150592803955078, -14.991049766540527, -13.83150577545166, -12.671961784362793, -11.512418746948242, -10.352874755859375, -9.193330764770508, -8.033787727355957, -6.87424373626709, -5.714700698852539, -4.555156707763672, -3.395613193511963, -2.236069440841675, -1.0765256881713867, 0.08301782608032227, 1.2425613403320312, 2.4021053314208984, 3.561648368835449, 4.721192359924316, 5.880735874176025, 7.040279388427734, 8.199823379516602, 9.359367370605469, 10.51891040802002, 11.678454399108887, 12.837997436523438, 13.997539520263672, 15.157083511352539, 16.316627502441406, 17.47616958618164, 18.635713577270508, 19.795257568359375, 20.954801559448242, 22.11434555053711, 23.273887634277344, 24.43343162536621, 25.592975616455078, 26.752517700195312, 27.91206169128418, 29.071605682373047, 30.231149673461914, 31.39069366455078, 32.55023956298828, 33.709781646728516, 34.869327545166016, 36.02886962890625, 37.18841552734375, 38.347957611083984, 39.50749969482422, 40.66704559326172, 41.82658767700195, 42.98612976074219, 44.14567565917969, 45.30521774291992, 46.46476364135742, 47.624305725097656, 48.783851623535156, 49.94339370727539, 51.102935791015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 16.0, 20.0, 20.0, 22.0, 39.0, 32.0, 38.0, 47.0, 45.0, 50.0, 52.0, 59.0, 62.0, 51.0, 51.0, 50.0, 58.0, 41.0, 41.0, 36.0, 27.0, 23.0, 22.0, 14.0, 9.0, 11.0, 14.0, 6.0, 4.0, 10.0, 0.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.380228042602539, -11.859716415405273, -11.339204788208008, -10.818693161010742, -10.298181533813477, -9.777669906616211, -9.257158279418945, -8.73664665222168, -8.216135025024414, -7.695623397827148, -7.175111770629883, -6.654600143432617, -6.134088516235352, -5.613576889038086, -5.093064785003662, -4.5725531578063965, -4.052041053771973, -3.531529426574707, -3.0110177993774414, -2.4905059337615967, -1.969994306564331, -1.4494826793670654, -0.9289708137512207, -0.4084591865539551, 0.11205244064331055, 0.632564127445221, 1.1530758142471313, 1.6735875606536865, 2.194099187850952, 2.7146108150482178, 3.2351226806640625, 3.755634307861328, 4.276145935058594, 4.796657562255859, 5.317169189453125, 5.837680816650391, 6.358192443847656, 6.878704071044922, 7.399216175079346, 7.919727802276611, 8.440238952636719, 8.960750579833984, 9.48126220703125, 10.001773834228516, 10.522285461425781, 11.042797088623047, 11.563308715820312, 12.083820343017578, 12.60433292388916, 13.124844551086426, 13.645356178283691, 14.165867805480957, 14.686379432678223, 15.206891059875488, 15.72740364074707, 16.247915267944336, 16.7684268951416, 17.288938522338867, 17.809450149536133, 18.3299617767334, 18.850473403930664, 19.37098503112793, 19.891496658325195, 20.41200828552246, 20.932519912719727]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 9.0, 15.0, 28.0, 26.0, 44.0, 45.0, 49.0, 84.0, 130.0, 214.0, 303.0, 471.0, 912.0, 1815.0, 4298.0, 11933.0, 38116.0, 141802.0, 473137.0, 274610.0, 67828.0, 20019.0, 6905.0, 2762.0, 1193.0, 649.0, 375.0, 237.0, 153.0, 84.0, 73.0, 73.0, 39.0, 27.0, 27.0, 12.0, 12.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.5, -16.96533203125, -16.4306640625, -15.89599609375, -15.361328125, -14.82666015625, -14.2919921875, -13.75732421875, -13.22265625, -12.68798828125, -12.1533203125, -11.61865234375, -11.083984375, -10.54931640625, -10.0146484375, -9.47998046875, -8.9453125, -8.41064453125, -7.8759765625, -7.34130859375, -6.806640625, -6.27197265625, -5.7373046875, -5.20263671875, -4.66796875, -4.13330078125, -3.5986328125, -3.06396484375, -2.529296875, -1.99462890625, -1.4599609375, -0.92529296875, -0.390625, 0.14404296875, 0.6787109375, 1.21337890625, 1.748046875, 2.28271484375, 2.8173828125, 3.35205078125, 3.88671875, 4.42138671875, 4.9560546875, 5.49072265625, 6.025390625, 6.56005859375, 7.0947265625, 7.62939453125, 8.1640625, 8.69873046875, 9.2333984375, 9.76806640625, 10.302734375, 10.83740234375, 11.3720703125, 11.90673828125, 12.44140625, 12.97607421875, 13.5107421875, 14.04541015625, 14.580078125, 15.11474609375, 15.6494140625, 16.18408203125, 16.71875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 12.0, 24.0, 28.0, 36.0, 43.0, 61.0, 85.0, 111.0, 94.0, 112.0, 89.0, 76.0, 57.0, 50.0, 42.0, 28.0, 12.0, 10.0, 6.0, 3.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.8828125, -2.8168792724609375, -2.750946044921875, -2.6850128173828125, -2.61907958984375, -2.5531463623046875, -2.487213134765625, -2.4212799072265625, -2.3553466796875, -2.2894134521484375, -2.223480224609375, -2.1575469970703125, -2.09161376953125, -2.0256805419921875, -1.959747314453125, -1.8938140869140625, -1.827880859375, -1.7619476318359375, -1.696014404296875, -1.6300811767578125, -1.56414794921875, -1.4982147216796875, -1.432281494140625, -1.3663482666015625, -1.3004150390625, -1.2344818115234375, -1.168548583984375, -1.1026153564453125, -1.03668212890625, -0.9707489013671875, -0.904815673828125, -0.8388824462890625, -0.77294921875, -0.7070159912109375, -0.641082763671875, -0.5751495361328125, -0.50921630859375, -0.4432830810546875, -0.377349853515625, -0.3114166259765625, -0.2454833984375, -0.1795501708984375, -0.113616943359375, -0.0476837158203125, 0.01824951171875, 0.0841827392578125, 0.150115966796875, 0.2160491943359375, 0.281982421875, 0.3479156494140625, 0.413848876953125, 0.4797821044921875, 0.54571533203125, 0.6116485595703125, 0.677581787109375, 0.7435150146484375, 0.8094482421875, 0.8753814697265625, 0.941314697265625, 1.0072479248046875, 1.07318115234375, 1.1391143798828125, 1.205047607421875, 1.2709808349609375, 1.3369140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 7.0, 9.0, 10.0, 12.0, 15.0, 14.0, 27.0, 43.0, 48.0, 68.0, 107.0, 135.0, 237.0, 313.0, 600.0, 965.0, 2003.0, 4672.0, 12323.0, 36868.0, 125439.0, 384489.0, 330549.0, 100539.0, 30336.0, 10273.0, 4129.0, 1847.0, 907.0, 522.0, 331.0, 208.0, 122.0, 101.0, 60.0, 54.0, 49.0, 36.0, 27.0, 16.0, 11.0, 8.0, 10.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.875, -14.377685546875, -13.88037109375, -13.383056640625, -12.8857421875, -12.388427734375, -11.89111328125, -11.393798828125, -10.896484375, -10.399169921875, -9.90185546875, -9.404541015625, -8.9072265625, -8.409912109375, -7.91259765625, -7.415283203125, -6.91796875, -6.420654296875, -5.92333984375, -5.426025390625, -4.9287109375, -4.431396484375, -3.93408203125, -3.436767578125, -2.939453125, -2.442138671875, -1.94482421875, -1.447509765625, -0.9501953125, -0.452880859375, 0.04443359375, 0.541748046875, 1.0390625, 1.536376953125, 2.03369140625, 2.531005859375, 3.0283203125, 3.525634765625, 4.02294921875, 4.520263671875, 5.017578125, 5.514892578125, 6.01220703125, 6.509521484375, 7.0068359375, 7.504150390625, 8.00146484375, 8.498779296875, 8.99609375, 9.493408203125, 9.99072265625, 10.488037109375, 10.9853515625, 11.482666015625, 11.97998046875, 12.477294921875, 12.974609375, 13.471923828125, 13.96923828125, 14.466552734375, 14.9638671875, 15.461181640625, 15.95849609375, 16.455810546875, 16.953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 13.0, 14.0, 13.0, 16.0, 15.0, 21.0, 29.0, 28.0, 37.0, 38.0, 37.0, 37.0, 35.0, 47.0, 50.0, 55.0, 46.0, 41.0, 43.0, 45.0, 40.0, 44.0, 31.0, 32.0, 28.0, 29.0, 20.0, 11.0, 11.0, 11.0, 8.0, 14.0, 6.0, 6.0, 5.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.32421875, -7.06890869140625, -6.8135986328125, -6.55828857421875, -6.302978515625, -6.04766845703125, -5.7923583984375, -5.53704833984375, -5.28173828125, -5.02642822265625, -4.7711181640625, -4.51580810546875, -4.260498046875, -4.00518798828125, -3.7498779296875, -3.49456787109375, -3.2392578125, -2.98394775390625, -2.7286376953125, -2.47332763671875, -2.218017578125, -1.96270751953125, -1.7073974609375, -1.45208740234375, -1.19677734375, -0.94146728515625, -0.6861572265625, -0.43084716796875, -0.175537109375, 0.07977294921875, 0.3350830078125, 0.59039306640625, 0.845703125, 1.10101318359375, 1.3563232421875, 1.61163330078125, 1.866943359375, 2.12225341796875, 2.3775634765625, 2.63287353515625, 2.88818359375, 3.14349365234375, 3.3988037109375, 3.65411376953125, 3.909423828125, 4.16473388671875, 4.4200439453125, 4.67535400390625, 4.9306640625, 5.18597412109375, 5.4412841796875, 5.69659423828125, 5.951904296875, 6.20721435546875, 6.4625244140625, 6.71783447265625, 6.97314453125, 7.22845458984375, 7.4837646484375, 7.73907470703125, 7.994384765625, 8.24969482421875, 8.5050048828125, 8.76031494140625, 9.015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 9.0, 13.0, 36.0, 31.0, 51.0, 79.0, 103.0, 210.0, 448.0, 870.0, 2238.0, 6717.0, 24025.0, 99964.0, 423339.0, 374594.0, 85384.0, 21017.0, 5773.0, 1992.0, 786.0, 350.0, 191.0, 99.0, 68.0, 42.0, 33.0, 31.0, 13.0, 7.0, 11.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.4688720703125, -16.968994140625, -16.4691162109375, -15.96923828125, -15.4693603515625, -14.969482421875, -14.4696044921875, -13.9697265625, -13.4698486328125, -12.969970703125, -12.4700927734375, -11.97021484375, -11.4703369140625, -10.970458984375, -10.4705810546875, -9.970703125, -9.4708251953125, -8.970947265625, -8.4710693359375, -7.97119140625, -7.4713134765625, -6.971435546875, -6.4715576171875, -5.9716796875, -5.4718017578125, -4.971923828125, -4.4720458984375, -3.97216796875, -3.4722900390625, -2.972412109375, -2.4725341796875, -1.97265625, -1.4727783203125, -0.972900390625, -0.4730224609375, 0.02685546875, 0.5267333984375, 1.026611328125, 1.5264892578125, 2.0263671875, 2.5262451171875, 3.026123046875, 3.5260009765625, 4.02587890625, 4.5257568359375, 5.025634765625, 5.5255126953125, 6.025390625, 6.5252685546875, 7.025146484375, 7.5250244140625, 8.02490234375, 8.5247802734375, 9.024658203125, 9.5245361328125, 10.0244140625, 10.5242919921875, 11.024169921875, 11.5240478515625, 12.02392578125, 12.5238037109375, 13.023681640625, 13.5235595703125, 14.0234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 5.0, 9.0, 8.0, 11.0, 11.0, 10.0, 22.0, 19.0, 36.0, 39.0, 41.0, 46.0, 70.0, 81.0, 112.0, 99.0, 61.0, 67.0, 58.0, 40.0, 25.0, 25.0, 24.0, 15.0, 6.0, 5.0, 5.0, 9.0, 5.0, 3.0, 3.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001453399658203125, -0.0014092177152633667, -0.0013650357723236084, -0.00132085382938385, -0.0012766718864440918, -0.0012324899435043335, -0.0011883080005645752, -0.001144126057624817, -0.0010999441146850586, -0.0010557621717453003, -0.001011580228805542, -0.0009673982858657837, -0.0009232163429260254, -0.0008790343999862671, -0.0008348524570465088, -0.0007906705141067505, -0.0007464885711669922, -0.0007023066282272339, -0.0006581246852874756, -0.0006139427423477173, -0.000569760799407959, -0.0005255788564682007, -0.0004813969135284424, -0.0004372149705886841, -0.0003930330276489258, -0.0003488510847091675, -0.0003046691417694092, -0.0002604871988296509, -0.00021630525588989258, -0.00017212331295013428, -0.00012794137001037598, -8.375942707061768e-05, -3.9577484130859375e-05, 4.604458808898926e-06, 4.8786401748657227e-05, 9.296834468841553e-05, 0.00013715028762817383, 0.00018133223056793213, 0.00022551417350769043, 0.00026969611644744873, 0.00031387805938720703, 0.00035806000232696533, 0.00040224194526672363, 0.00044642388820648193, 0.0004906058311462402, 0.0005347877740859985, 0.0005789697170257568, 0.0006231516599655151, 0.0006673336029052734, 0.0007115155458450317, 0.00075569748878479, 0.0007998794317245483, 0.0008440613746643066, 0.0008882433176040649, 0.0009324252605438232, 0.0009766072034835815, 0.0010207891464233398, 0.0010649710893630981, 0.0011091530323028564, 0.0011533349752426147, 0.001197516918182373, 0.0012416988611221313, 0.0012858808040618896, 0.001330062747001648, 0.0013742446899414062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 24.0, 29.0, 42.0, 74.0, 114.0, 202.0, 402.0, 800.0, 1782.0, 5003.0, 16189.0, 66501.0, 387106.0, 461757.0, 79841.0, 19124.0, 5658.0, 2054.0, 840.0, 424.0, 244.0, 102.0, 76.0, 42.0, 21.0, 25.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.671875, -21.07080078125, -20.4697265625, -19.86865234375, -19.267578125, -18.66650390625, -18.0654296875, -17.46435546875, -16.86328125, -16.26220703125, -15.6611328125, -15.06005859375, -14.458984375, -13.85791015625, -13.2568359375, -12.65576171875, -12.0546875, -11.45361328125, -10.8525390625, -10.25146484375, -9.650390625, -9.04931640625, -8.4482421875, -7.84716796875, -7.24609375, -6.64501953125, -6.0439453125, -5.44287109375, -4.841796875, -4.24072265625, -3.6396484375, -3.03857421875, -2.4375, -1.83642578125, -1.2353515625, -0.63427734375, -0.033203125, 0.56787109375, 1.1689453125, 1.77001953125, 2.37109375, 2.97216796875, 3.5732421875, 4.17431640625, 4.775390625, 5.37646484375, 5.9775390625, 6.57861328125, 7.1796875, 7.78076171875, 8.3818359375, 8.98291015625, 9.583984375, 10.18505859375, 10.7861328125, 11.38720703125, 11.98828125, 12.58935546875, 13.1904296875, 13.79150390625, 14.392578125, 14.99365234375, 15.5947265625, 16.19580078125, 16.796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 9.0, 9.0, 28.0, 23.0, 31.0, 36.0, 65.0, 62.0, 86.0, 118.0, 95.0, 97.0, 78.0, 62.0, 31.0, 28.0, 21.0, 20.0, 18.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.375, -9.10675048828125, -8.8385009765625, -8.57025146484375, -8.302001953125, -8.03375244140625, -7.7655029296875, -7.49725341796875, -7.22900390625, -6.96075439453125, -6.6925048828125, -6.42425537109375, -6.156005859375, -5.88775634765625, -5.6195068359375, -5.35125732421875, -5.0830078125, -4.81475830078125, -4.5465087890625, -4.27825927734375, -4.010009765625, -3.74176025390625, -3.4735107421875, -3.20526123046875, -2.93701171875, -2.66876220703125, -2.4005126953125, -2.13226318359375, -1.864013671875, -1.59576416015625, -1.3275146484375, -1.05926513671875, -0.791015625, -0.52276611328125, -0.2545166015625, 0.01373291015625, 0.281982421875, 0.55023193359375, 0.8184814453125, 1.08673095703125, 1.35498046875, 1.62322998046875, 1.8914794921875, 2.15972900390625, 2.427978515625, 2.69622802734375, 2.9644775390625, 3.23272705078125, 3.5009765625, 3.76922607421875, 4.0374755859375, 4.30572509765625, 4.573974609375, 4.84222412109375, 5.1104736328125, 5.37872314453125, 5.64697265625, 5.91522216796875, 6.1834716796875, 6.45172119140625, 6.719970703125, 6.98822021484375, 7.2564697265625, 7.52471923828125, 7.79296875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 3.0, 5.0, 16.0, 20.0, 48.0, 76.0, 137.0, 165.0, 204.0, 138.0, 79.0, 36.0, 29.0, 18.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-148.98036193847656, -144.6322479248047, -140.28414916992188, -135.93603515625, -131.58792114257812, -127.23981475830078, -122.89170837402344, -118.54359436035156, -114.19548797607422, -109.84738159179688, -105.499267578125, -101.15116119384766, -96.80305480957031, -92.45494079589844, -88.1068344116211, -83.75872802734375, -79.41061401367188, -75.06250762939453, -70.71439361572266, -66.36628723144531, -62.0181770324707, -57.670066833496094, -53.32196044921875, -48.97385025024414, -44.62574005126953, -40.27762985229492, -35.92951965332031, -31.58141326904297, -27.23330307006836, -22.88519287109375, -18.537084579467773, -14.188976287841797, -9.84088134765625, -5.492772102355957, -1.144662857055664, 3.203446388244629, 7.551555633544922, 11.899665832519531, 16.247774124145508, 20.595882415771484, 24.943992614746094, 29.292102813720703, 33.64021301269531, 37.988319396972656, 42.336429595947266, 46.684539794921875, 51.03264617919922, 55.38075637817383, 59.72886657714844, 64.07697296142578, 68.42508697509766, 72.773193359375, 77.12130737304688, 81.46941375732422, 85.81752014160156, 90.16563415527344, 94.51374053955078, 98.86184692382812, 103.2099609375, 107.55806732177734, 111.90617370605469, 116.25428771972656, 120.6023941040039, 124.95050048828125, 129.29861450195312]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 5.0, 7.0, 12.0, 13.0, 17.0, 18.0, 22.0, 30.0, 30.0, 35.0, 52.0, 41.0, 42.0, 50.0, 66.0, 63.0, 58.0, 46.0, 51.0, 49.0, 51.0, 35.0, 30.0, 25.0, 28.0, 26.0, 15.0, 18.0, 16.0, 8.0, 5.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.22288513183594, -73.91661834716797, -71.6103515625, -69.30408477783203, -66.99781799316406, -64.6915512084961, -62.385284423828125, -60.079017639160156, -57.77275085449219, -55.46648406982422, -53.16021728515625, -50.85395050048828, -48.54768371582031, -46.241416931152344, -43.935150146484375, -41.628883361816406, -39.32261276245117, -37.0163459777832, -34.710079193115234, -32.403812408447266, -30.097545623779297, -27.791278839111328, -25.485010147094727, -23.178743362426758, -20.87247657775879, -18.56620979309082, -16.25994300842285, -13.953675270080566, -11.647408485412598, -9.341141700744629, -7.034873962402344, -4.728607177734375, -2.4223403930664062, -0.1160733699798584, 2.1901936531066895, 4.496460914611816, 6.802727699279785, 9.108994483947754, 11.415262222290039, 13.721529006958008, 16.027795791625977, 18.334062576293945, 20.640329360961914, 22.946598052978516, 25.252864837646484, 27.559131622314453, 29.865398406982422, 32.17166519165039, 34.47793197631836, 36.78419876098633, 39.0904655456543, 41.396732330322266, 43.702999114990234, 46.0092658996582, 48.31553649902344, 50.621803283691406, 52.928070068359375, 55.234336853027344, 57.54060363769531, 59.84687042236328, 62.15313720703125, 64.45940399169922, 66.76567077636719, 69.07193756103516, 71.37820434570312]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 5.0, 5.0, 8.0, 10.0, 6.0, 6.0, 16.0, 25.0, 37.0, 32.0, 60.0, 63.0, 111.0, 154.0, 223.0, 338.0, 565.0, 993.0, 2021.0, 4594.0, 14486.0, 78625.0, 2861533.0, 1147720.0, 64432.0, 12128.0, 3512.0, 1375.0, 598.0, 253.0, 141.0, 73.0, 53.0, 28.0, 12.0, 14.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.09375, -47.864501953125, -46.63525390625, -45.406005859375, -44.1767578125, -42.947509765625, -41.71826171875, -40.489013671875, -39.259765625, -38.030517578125, -36.80126953125, -35.572021484375, -34.3427734375, -33.113525390625, -31.88427734375, -30.655029296875, -29.42578125, -28.196533203125, -26.96728515625, -25.738037109375, -24.5087890625, -23.279541015625, -22.05029296875, -20.821044921875, -19.591796875, -18.362548828125, -17.13330078125, -15.904052734375, -14.6748046875, -13.445556640625, -12.21630859375, -10.987060546875, -9.7578125, -8.528564453125, -7.29931640625, -6.070068359375, -4.8408203125, -3.611572265625, -2.38232421875, -1.153076171875, 0.076171875, 1.305419921875, 2.53466796875, 3.763916015625, 4.9931640625, 6.222412109375, 7.45166015625, 8.680908203125, 9.91015625, 11.139404296875, 12.36865234375, 13.597900390625, 14.8271484375, 16.056396484375, 17.28564453125, 18.514892578125, 19.744140625, 20.973388671875, 22.20263671875, 23.431884765625, 24.6611328125, 25.890380859375, 27.11962890625, 28.348876953125, 29.578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 13.0, 25.0, 31.0, 54.0, 68.0, 103.0, 90.0, 117.0, 124.0, 88.0, 71.0, 65.0, 51.0, 33.0, 26.0, 9.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951171875, -3.854095458984375, -3.75701904296875, -3.659942626953125, -3.5628662109375, -3.465789794921875, -3.36871337890625, -3.271636962890625, -3.174560546875, -3.077484130859375, -2.98040771484375, -2.883331298828125, -2.7862548828125, -2.689178466796875, -2.59210205078125, -2.495025634765625, -2.39794921875, -2.300872802734375, -2.20379638671875, -2.106719970703125, -2.0096435546875, -1.912567138671875, -1.81549072265625, -1.718414306640625, -1.621337890625, -1.524261474609375, -1.42718505859375, -1.330108642578125, -1.2330322265625, -1.135955810546875, -1.03887939453125, -0.941802978515625, -0.8447265625, -0.747650146484375, -0.65057373046875, -0.553497314453125, -0.4564208984375, -0.359344482421875, -0.26226806640625, -0.165191650390625, -0.068115234375, 0.028961181640625, 0.12603759765625, 0.223114013671875, 0.3201904296875, 0.417266845703125, 0.51434326171875, 0.611419677734375, 0.70849609375, 0.805572509765625, 0.90264892578125, 0.999725341796875, 1.0968017578125, 1.193878173828125, 1.29095458984375, 1.388031005859375, 1.485107421875, 1.582183837890625, 1.67926025390625, 1.776336669921875, 1.8734130859375, 1.970489501953125, 2.06756591796875, 2.164642333984375, 2.26171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 9.0, 19.0, 46.0, 65.0, 109.0, 330.0, 804.0, 2691.0, 12782.0, 112649.0, 3515481.0, 511030.0, 30732.0, 5217.0, 1398.0, 475.0, 239.0, 93.0, 57.0, 37.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09375, -54.52392578125, -52.9541015625, -51.38427734375, -49.814453125, -48.24462890625, -46.6748046875, -45.10498046875, -43.53515625, -41.96533203125, -40.3955078125, -38.82568359375, -37.255859375, -35.68603515625, -34.1162109375, -32.54638671875, -30.9765625, -29.40673828125, -27.8369140625, -26.26708984375, -24.697265625, -23.12744140625, -21.5576171875, -19.98779296875, -18.41796875, -16.84814453125, -15.2783203125, -13.70849609375, -12.138671875, -10.56884765625, -8.9990234375, -7.42919921875, -5.859375, -4.28955078125, -2.7197265625, -1.14990234375, 0.419921875, 1.98974609375, 3.5595703125, 5.12939453125, 6.69921875, 8.26904296875, 9.8388671875, 11.40869140625, 12.978515625, 14.54833984375, 16.1181640625, 17.68798828125, 19.2578125, 20.82763671875, 22.3974609375, 23.96728515625, 25.537109375, 27.10693359375, 28.6767578125, 30.24658203125, 31.81640625, 33.38623046875, 34.9560546875, 36.52587890625, 38.095703125, 39.66552734375, 41.2353515625, 42.80517578125, 44.375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 12.0, 22.0, 25.0, 34.0, 49.0, 92.0, 125.0, 218.0, 446.0, 1312.0, 841.0, 336.0, 190.0, 127.0, 73.0, 44.0, 34.0, 23.0, 15.0, 12.0, 4.0, 3.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.898193359375, -7.67138671875, -7.444580078125, -7.2177734375, -6.990966796875, -6.76416015625, -6.537353515625, -6.310546875, -6.083740234375, -5.85693359375, -5.630126953125, -5.4033203125, -5.176513671875, -4.94970703125, -4.722900390625, -4.49609375, -4.269287109375, -4.04248046875, -3.815673828125, -3.5888671875, -3.362060546875, -3.13525390625, -2.908447265625, -2.681640625, -2.454833984375, -2.22802734375, -2.001220703125, -1.7744140625, -1.547607421875, -1.32080078125, -1.093994140625, -0.8671875, -0.640380859375, -0.41357421875, -0.186767578125, 0.0400390625, 0.266845703125, 0.49365234375, 0.720458984375, 0.947265625, 1.174072265625, 1.40087890625, 1.627685546875, 1.8544921875, 2.081298828125, 2.30810546875, 2.534912109375, 2.76171875, 2.988525390625, 3.21533203125, 3.442138671875, 3.6689453125, 3.895751953125, 4.12255859375, 4.349365234375, 4.576171875, 4.802978515625, 5.02978515625, 5.256591796875, 5.4833984375, 5.710205078125, 5.93701171875, 6.163818359375, 6.390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 14.0, 13.0, 35.0, 92.0, 175.0, 227.0, 185.0, 143.0, 85.0, 25.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.08839416503906, -114.83235931396484, -112.57633209228516, -110.32029724121094, -108.06426239013672, -105.80823516845703, -103.55220031738281, -101.2961654663086, -99.0401382446289, -96.78410339355469, -94.528076171875, -92.27204132080078, -90.01600646972656, -87.75997924804688, -85.50394439697266, -83.24790954589844, -80.99188232421875, -78.73584747314453, -76.47982025146484, -74.22378540039062, -71.9677505493164, -69.71172332763672, -67.4556884765625, -65.19965362548828, -62.94361877441406, -60.68758773803711, -58.43155288696289, -56.17552185058594, -53.919490814208984, -51.66345977783203, -49.40742492675781, -47.15139389038086, -44.895355224609375, -42.63932418823242, -40.3832893371582, -38.12725830078125, -35.8712272644043, -33.615196228027344, -31.359161376953125, -29.103130340576172, -26.84709930419922, -24.591066360473633, -22.33503532409668, -20.079002380371094, -17.82297134399414, -15.566938400268555, -13.310905456542969, -11.0548734664917, -8.79884147644043, -6.54280948638916, -4.286777019500732, -2.0307445526123047, 0.22528743743896484, 2.4813194274902344, 4.73735237121582, 6.99338436126709, 9.24941635131836, 11.505448341369629, 13.761480331420898, 16.017513275146484, 18.273544311523438, 20.529577255249023, 22.78561019897461, 25.041641235351562, 27.29767417907715]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 9.0, 6.0, 8.0, 15.0, 18.0, 11.0, 19.0, 22.0, 28.0, 25.0, 30.0, 25.0, 26.0, 40.0, 39.0, 44.0, 49.0, 39.0, 43.0, 33.0, 40.0, 64.0, 44.0, 41.0, 48.0, 36.0, 30.0, 35.0, 24.0, 16.0, 22.0, 10.0, 13.0, 8.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.254213333129883, -25.470956802368164, -24.687698364257812, -23.904441833496094, -23.121185302734375, -22.337926864624023, -21.554670333862305, -20.771411895751953, -19.988155364990234, -19.204898834228516, -18.421640396118164, -17.638383865356445, -16.855125427246094, -16.071868896484375, -15.288612365722656, -14.505354881286621, -13.722097396850586, -12.93883991241455, -12.155582427978516, -11.372325897216797, -10.589068412780762, -9.805810928344727, -9.022554397583008, -8.239296913146973, -7.4560394287109375, -6.672781944274902, -5.889524936676025, -5.106267929077148, -4.323010444641113, -3.5397531986236572, -2.756495952606201, -1.9732389450073242, -1.1899833679199219, -0.4067261219024658, 0.37653112411499023, 1.1597883701324463, 1.9430456161499023, 2.7263028621673584, 3.5095601081848145, 4.292817115783691, 5.076074600219727, 5.859332084655762, 6.642589092254639, 7.425846099853516, 8.20910358428955, 8.992361068725586, 9.775617599487305, 10.55887508392334, 11.342132568359375, 12.12539005279541, 12.908647537231445, 13.691904067993164, 14.4751615524292, 15.258419036865234, 16.041675567626953, 16.824932098388672, 17.608190536499023, 18.391447067260742, 19.174705505371094, 19.957962036132812, 20.74121856689453, 21.524477005004883, 22.3077335357666, 23.090991973876953, 23.874248504638672]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 5.0, 10.0, 10.0, 25.0, 22.0, 40.0, 43.0, 45.0, 104.0, 128.0, 209.0, 335.0, 547.0, 1071.0, 2251.0, 5937.0, 15702.0, 47059.0, 141891.0, 357928.0, 305531.0, 111171.0, 36980.0, 12537.0, 4697.0, 2017.0, 917.0, 462.0, 283.0, 176.0, 133.0, 68.0, 57.0, 41.0, 36.0, 17.0, 18.0, 14.0, 9.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.2110595703125, -16.687744140625, -16.1644287109375, -15.64111328125, -15.1177978515625, -14.594482421875, -14.0711669921875, -13.5478515625, -13.0245361328125, -12.501220703125, -11.9779052734375, -11.45458984375, -10.9312744140625, -10.407958984375, -9.8846435546875, -9.361328125, -8.8380126953125, -8.314697265625, -7.7913818359375, -7.26806640625, -6.7447509765625, -6.221435546875, -5.6981201171875, -5.1748046875, -4.6514892578125, -4.128173828125, -3.6048583984375, -3.08154296875, -2.5582275390625, -2.034912109375, -1.5115966796875, -0.98828125, -0.4649658203125, 0.058349609375, 0.5816650390625, 1.10498046875, 1.6282958984375, 2.151611328125, 2.6749267578125, 3.1982421875, 3.7215576171875, 4.244873046875, 4.7681884765625, 5.29150390625, 5.8148193359375, 6.338134765625, 6.8614501953125, 7.384765625, 7.9080810546875, 8.431396484375, 8.9547119140625, 9.47802734375, 10.0013427734375, 10.524658203125, 11.0479736328125, 11.5712890625, 12.0946044921875, 12.617919921875, 13.1412353515625, 13.66455078125, 14.1878662109375, 14.711181640625, 15.2344970703125, 15.7578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 14.0, 20.0, 24.0, 35.0, 35.0, 65.0, 49.0, 63.0, 64.0, 78.0, 77.0, 84.0, 89.0, 62.0, 53.0, 64.0, 24.0, 29.0, 15.0, 11.0, 9.0, 12.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.81640625, -3.7277984619140625, -3.639190673828125, -3.5505828857421875, -3.46197509765625, -3.3733673095703125, -3.284759521484375, -3.1961517333984375, -3.1075439453125, -3.0189361572265625, -2.930328369140625, -2.8417205810546875, -2.75311279296875, -2.6645050048828125, -2.575897216796875, -2.4872894287109375, -2.398681640625, -2.3100738525390625, -2.221466064453125, -2.1328582763671875, -2.04425048828125, -1.9556427001953125, -1.867034912109375, -1.7784271240234375, -1.6898193359375, -1.6012115478515625, -1.512603759765625, -1.4239959716796875, -1.33538818359375, -1.2467803955078125, -1.158172607421875, -1.0695648193359375, -0.98095703125, -0.8923492431640625, -0.803741455078125, -0.7151336669921875, -0.62652587890625, -0.5379180908203125, -0.449310302734375, -0.3607025146484375, -0.2720947265625, -0.1834869384765625, -0.094879150390625, -0.0062713623046875, 0.08233642578125, 0.1709442138671875, 0.259552001953125, 0.3481597900390625, 0.436767578125, 0.5253753662109375, 0.613983154296875, 0.7025909423828125, 0.79119873046875, 0.8798065185546875, 0.968414306640625, 1.0570220947265625, 1.1456298828125, 1.2342376708984375, 1.322845458984375, 1.4114532470703125, 1.50006103515625, 1.5886688232421875, 1.677276611328125, 1.7658843994140625, 1.8544921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 13.0, 7.0, 20.0, 19.0, 18.0, 33.0, 41.0, 51.0, 75.0, 89.0, 144.0, 177.0, 306.0, 405.0, 662.0, 1130.0, 2067.0, 3892.0, 8247.0, 19208.0, 50337.0, 140519.0, 358524.0, 290649.0, 104792.0, 37907.0, 14986.0, 6585.0, 3220.0, 1669.0, 957.0, 581.0, 347.0, 242.0, 172.0, 99.0, 109.0, 63.0, 63.0, 24.0, 29.0, 18.0, 14.0, 13.0, 7.0, 9.0, 3.0, 4.0, 0.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.52587890625, -16.9580078125, -16.39013671875, -15.822265625, -15.25439453125, -14.6865234375, -14.11865234375, -13.55078125, -12.98291015625, -12.4150390625, -11.84716796875, -11.279296875, -10.71142578125, -10.1435546875, -9.57568359375, -9.0078125, -8.43994140625, -7.8720703125, -7.30419921875, -6.736328125, -6.16845703125, -5.6005859375, -5.03271484375, -4.46484375, -3.89697265625, -3.3291015625, -2.76123046875, -2.193359375, -1.62548828125, -1.0576171875, -0.48974609375, 0.078125, 0.64599609375, 1.2138671875, 1.78173828125, 2.349609375, 2.91748046875, 3.4853515625, 4.05322265625, 4.62109375, 5.18896484375, 5.7568359375, 6.32470703125, 6.892578125, 7.46044921875, 8.0283203125, 8.59619140625, 9.1640625, 9.73193359375, 10.2998046875, 10.86767578125, 11.435546875, 12.00341796875, 12.5712890625, 13.13916015625, 13.70703125, 14.27490234375, 14.8427734375, 15.41064453125, 15.978515625, 16.54638671875, 17.1142578125, 17.68212890625, 18.25]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 8.0, 19.0, 13.0, 6.0, 14.0, 22.0, 27.0, 33.0, 27.0, 34.0, 35.0, 47.0, 60.0, 48.0, 47.0, 50.0, 55.0, 33.0, 45.0, 57.0, 39.0, 38.0, 46.0, 33.0, 26.0, 19.0, 19.0, 17.0, 13.0, 7.0, 12.0, 9.0, 6.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.86767578125, -11.4306640625, -10.99365234375, -10.556640625, -10.11962890625, -9.6826171875, -9.24560546875, -8.80859375, -8.37158203125, -7.9345703125, -7.49755859375, -7.060546875, -6.62353515625, -6.1865234375, -5.74951171875, -5.3125, -4.87548828125, -4.4384765625, -4.00146484375, -3.564453125, -3.12744140625, -2.6904296875, -2.25341796875, -1.81640625, -1.37939453125, -0.9423828125, -0.50537109375, -0.068359375, 0.36865234375, 0.8056640625, 1.24267578125, 1.6796875, 2.11669921875, 2.5537109375, 2.99072265625, 3.427734375, 3.86474609375, 4.3017578125, 4.73876953125, 5.17578125, 5.61279296875, 6.0498046875, 6.48681640625, 6.923828125, 7.36083984375, 7.7978515625, 8.23486328125, 8.671875, 9.10888671875, 9.5458984375, 9.98291015625, 10.419921875, 10.85693359375, 11.2939453125, 11.73095703125, 12.16796875, 12.60498046875, 13.0419921875, 13.47900390625, 13.916015625, 14.35302734375, 14.7900390625, 15.22705078125, 15.6640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 15.0, 18.0, 38.0, 55.0, 64.0, 99.0, 148.0, 236.0, 371.0, 653.0, 1185.0, 2173.0, 4298.0, 9130.0, 20738.0, 49181.0, 124468.0, 328038.0, 309094.0, 115485.0, 45873.0, 19349.0, 8690.0, 4139.0, 2150.0, 1175.0, 634.0, 375.0, 216.0, 138.0, 77.0, 61.0, 47.0, 29.0, 18.0, 21.0, 16.0, 13.0, 5.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.15625, -9.87384033203125, -9.5914306640625, -9.30902099609375, -9.026611328125, -8.74420166015625, -8.4617919921875, -8.17938232421875, -7.89697265625, -7.61456298828125, -7.3321533203125, -7.04974365234375, -6.767333984375, -6.48492431640625, -6.2025146484375, -5.92010498046875, -5.6376953125, -5.35528564453125, -5.0728759765625, -4.79046630859375, -4.508056640625, -4.22564697265625, -3.9432373046875, -3.66082763671875, -3.37841796875, -3.09600830078125, -2.8135986328125, -2.53118896484375, -2.248779296875, -1.96636962890625, -1.6839599609375, -1.40155029296875, -1.119140625, -0.83673095703125, -0.5543212890625, -0.27191162109375, 0.010498046875, 0.29290771484375, 0.5753173828125, 0.85772705078125, 1.14013671875, 1.42254638671875, 1.7049560546875, 1.98736572265625, 2.269775390625, 2.55218505859375, 2.8345947265625, 3.11700439453125, 3.3994140625, 3.68182373046875, 3.9642333984375, 4.24664306640625, 4.529052734375, 4.81146240234375, 5.0938720703125, 5.37628173828125, 5.65869140625, 5.94110107421875, 6.2235107421875, 6.50592041015625, 6.788330078125, 7.07073974609375, 7.3531494140625, 7.63555908203125, 7.91796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 7.0, 2.0, 12.0, 8.0, 4.0, 13.0, 18.0, 8.0, 13.0, 23.0, 26.0, 22.0, 29.0, 51.0, 69.0, 115.0, 117.0, 104.0, 69.0, 41.0, 53.0, 30.0, 28.0, 27.0, 15.0, 11.0, 12.0, 7.0, 12.0, 9.0, 8.0, 5.0, 7.0, 6.0, 3.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018377304077148438, -0.0017860978841781616, -0.0017344653606414795, -0.0016828328371047974, -0.0016312003135681152, -0.001579567790031433, -0.001527935266494751, -0.0014763027429580688, -0.0014246702194213867, -0.0013730376958847046, -0.0013214051723480225, -0.0012697726488113403, -0.0012181401252746582, -0.001166507601737976, -0.001114875078201294, -0.0010632425546646118, -0.0010116100311279297, -0.0009599775075912476, -0.0009083449840545654, -0.0008567124605178833, -0.0008050799369812012, -0.000753447413444519, -0.0007018148899078369, -0.0006501823663711548, -0.0005985498428344727, -0.0005469173192977905, -0.0004952847957611084, -0.00044365227222442627, -0.00039201974868774414, -0.000340387225151062, -0.0002887547016143799, -0.00023712217807769775, -0.00018548965454101562, -0.0001338571310043335, -8.222460746765137e-05, -3.059208393096924e-05, 2.104043960571289e-05, 7.267296314239502e-05, 0.00012430548667907715, 0.00017593801021575928, 0.0002275705337524414, 0.00027920305728912354, 0.00033083558082580566, 0.0003824681043624878, 0.0004341006278991699, 0.00048573315143585205, 0.0005373656749725342, 0.0005889981985092163, 0.0006406307220458984, 0.0006922632455825806, 0.0007438957691192627, 0.0007955282926559448, 0.000847160816192627, 0.0008987933397293091, 0.0009504258632659912, 0.0010020583868026733, 0.0010536909103393555, 0.0011053234338760376, 0.0011569559574127197, 0.0012085884809494019, 0.001260221004486084, 0.0013118535280227661, 0.0013634860515594482, 0.0014151185750961304, 0.0014667510986328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 10.0, 21.0, 16.0, 28.0, 35.0, 56.0, 73.0, 114.0, 161.0, 242.0, 430.0, 774.0, 1462.0, 3205.0, 7440.0, 20411.0, 64783.0, 252636.0, 501435.0, 133132.0, 38787.0, 13090.0, 5127.0, 2335.0, 1114.0, 648.0, 335.0, 195.0, 130.0, 88.0, 75.0, 40.0, 33.0, 26.0, 17.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.52587890625, -12.0830078125, -11.64013671875, -11.197265625, -10.75439453125, -10.3115234375, -9.86865234375, -9.42578125, -8.98291015625, -8.5400390625, -8.09716796875, -7.654296875, -7.21142578125, -6.7685546875, -6.32568359375, -5.8828125, -5.43994140625, -4.9970703125, -4.55419921875, -4.111328125, -3.66845703125, -3.2255859375, -2.78271484375, -2.33984375, -1.89697265625, -1.4541015625, -1.01123046875, -0.568359375, -0.12548828125, 0.3173828125, 0.76025390625, 1.203125, 1.64599609375, 2.0888671875, 2.53173828125, 2.974609375, 3.41748046875, 3.8603515625, 4.30322265625, 4.74609375, 5.18896484375, 5.6318359375, 6.07470703125, 6.517578125, 6.96044921875, 7.4033203125, 7.84619140625, 8.2890625, 8.73193359375, 9.1748046875, 9.61767578125, 10.060546875, 10.50341796875, 10.9462890625, 11.38916015625, 11.83203125, 12.27490234375, 12.7177734375, 13.16064453125, 13.603515625, 14.04638671875, 14.4892578125, 14.93212890625, 15.375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 4.0, 18.0, 13.0, 15.0, 18.0, 18.0, 37.0, 29.0, 42.0, 53.0, 59.0, 69.0, 83.0, 80.0, 70.0, 58.0, 44.0, 53.0, 30.0, 35.0, 24.0, 15.0, 22.0, 9.0, 11.0, 12.0, 6.0, 11.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.01171875, -6.79290771484375, -6.5740966796875, -6.35528564453125, -6.136474609375, -5.91766357421875, -5.6988525390625, -5.48004150390625, -5.26123046875, -5.04241943359375, -4.8236083984375, -4.60479736328125, -4.385986328125, -4.16717529296875, -3.9483642578125, -3.72955322265625, -3.5107421875, -3.29193115234375, -3.0731201171875, -2.85430908203125, -2.635498046875, -2.41668701171875, -2.1978759765625, -1.97906494140625, -1.76025390625, -1.54144287109375, -1.3226318359375, -1.10382080078125, -0.885009765625, -0.66619873046875, -0.4473876953125, -0.22857666015625, -0.009765625, 0.20904541015625, 0.4278564453125, 0.64666748046875, 0.865478515625, 1.08428955078125, 1.3031005859375, 1.52191162109375, 1.74072265625, 1.95953369140625, 2.1783447265625, 2.39715576171875, 2.615966796875, 2.83477783203125, 3.0535888671875, 3.27239990234375, 3.4912109375, 3.71002197265625, 3.9288330078125, 4.14764404296875, 4.366455078125, 4.58526611328125, 4.8040771484375, 5.02288818359375, 5.24169921875, 5.46051025390625, 5.6793212890625, 5.89813232421875, 6.116943359375, 6.33575439453125, 6.5545654296875, 6.77337646484375, 6.9921875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 16.0, 38.0, 49.0, 58.0, 86.0, 104.0, 112.0, 127.0, 98.0, 80.0, 59.0, 40.0, 28.0, 29.0, 11.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-106.07269287109375, -102.42373657226562, -98.77478790283203, -95.1258316040039, -91.47688293457031, -87.82792663574219, -84.17897033691406, -80.53001403808594, -76.88106536865234, -73.23210906982422, -69.58316040039062, -65.9342041015625, -62.28525161743164, -58.63629913330078, -54.987342834472656, -51.3383903503418, -47.68943786621094, -44.04048538208008, -40.39153289794922, -36.742576599121094, -33.093624114990234, -29.444671630859375, -25.795717239379883, -22.14676284790039, -18.49781036376953, -14.848856925964355, -11.19990348815918, -7.550950050354004, -3.901996612548828, -0.25304412841796875, 3.3959102630615234, 7.044864654541016, 10.693817138671875, 14.34277057647705, 17.991724014282227, 21.64067840576172, 25.289630889892578, 28.938583374023438, 32.58753967285156, 36.23649215698242, 39.88544464111328, 43.53439712524414, 47.183349609375, 50.832305908203125, 54.481258392333984, 58.130210876464844, 61.77916717529297, 65.42811584472656, 69.07707214355469, 72.72602844238281, 76.3749771118164, 80.02393341064453, 83.67288208007812, 87.32183837890625, 90.97079467773438, 94.6197509765625, 98.2686996459961, 101.91765594482422, 105.56660461425781, 109.21556091308594, 112.86451721191406, 116.51346588134766, 120.16242218017578, 123.81137084960938, 127.4603271484375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 3.0, 9.0, 7.0, 7.0, 11.0, 17.0, 18.0, 17.0, 25.0, 23.0, 34.0, 38.0, 41.0, 39.0, 45.0, 55.0, 42.0, 45.0, 50.0, 45.0, 48.0, 38.0, 42.0, 39.0, 36.0, 35.0, 24.0, 35.0, 21.0, 22.0, 12.0, 16.0, 16.0, 12.0, 6.0, 1.0, 7.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-96.41365051269531, -93.451171875, -90.48869323730469, -87.52621459960938, -84.5637435913086, -81.60126495361328, -78.63878631591797, -75.67630767822266, -72.71383666992188, -69.75135803222656, -66.78887939453125, -63.8264045715332, -60.863929748535156, -57.901451110839844, -54.93897247314453, -51.97649383544922, -49.014015197753906, -46.051536560058594, -43.08906173706055, -40.126583099365234, -37.16410827636719, -34.201629638671875, -31.239151000976562, -28.276674270629883, -25.314197540283203, -22.351720809936523, -19.389244079589844, -16.42676544189453, -13.464288711547852, -10.501811981201172, -7.539333343505859, -4.57685661315918, -1.6143798828125, 1.348097324371338, 4.310574531555176, 7.273052215576172, 10.235528945922852, 13.198005676269531, 16.160484313964844, 19.122961044311523, 22.085437774658203, 25.047914505004883, 28.010391235351562, 30.972869873046875, 33.93534851074219, 36.897823333740234, 39.86030197143555, 42.822776794433594, 45.785255432128906, 48.74773406982422, 51.710208892822266, 54.67268753051758, 57.635162353515625, 60.59764099121094, 63.56011962890625, 66.52259826660156, 69.48507690429688, 72.44755554199219, 75.4100341796875, 78.37251281738281, 81.3349838256836, 84.2974624633789, 87.25994110107422, 90.22241973876953, 93.18489074707031]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 11.0, 9.0, 18.0, 23.0, 49.0, 59.0, 105.0, 157.0, 338.0, 665.0, 1667.0, 4888.0, 21297.0, 200803.0, 3806195.0, 135716.0, 16496.0, 3698.0, 1162.0, 474.0, 173.0, 105.0, 57.0, 31.0, 24.0, 20.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-56.90625, -55.595947265625, -54.28564453125, -52.975341796875, -51.6650390625, -50.354736328125, -49.04443359375, -47.734130859375, -46.423828125, -45.113525390625, -43.80322265625, -42.492919921875, -41.1826171875, -39.872314453125, -38.56201171875, -37.251708984375, -35.94140625, -34.631103515625, -33.32080078125, -32.010498046875, -30.7001953125, -29.389892578125, -28.07958984375, -26.769287109375, -25.458984375, -24.148681640625, -22.83837890625, -21.528076171875, -20.2177734375, -18.907470703125, -17.59716796875, -16.286865234375, -14.9765625, -13.666259765625, -12.35595703125, -11.045654296875, -9.7353515625, -8.425048828125, -7.11474609375, -5.804443359375, -4.494140625, -3.183837890625, -1.87353515625, -0.563232421875, 0.7470703125, 2.057373046875, 3.36767578125, 4.677978515625, 5.98828125, 7.298583984375, 8.60888671875, 9.919189453125, 11.2294921875, 12.539794921875, 13.85009765625, 15.160400390625, 16.470703125, 17.781005859375, 19.09130859375, 20.401611328125, 21.7119140625, 23.022216796875, 24.33251953125, 25.642822265625, 26.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 9.0, 5.0, 12.0, 15.0, 16.0, 30.0, 36.0, 48.0, 40.0, 51.0, 64.0, 74.0, 73.0, 85.0, 91.0, 62.0, 60.0, 64.0, 45.0, 40.0, 17.0, 12.0, 19.0, 14.0, 8.0, 5.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.6064453125, -4.494140625, -4.3818359375, -4.26953125, -4.1572265625, -4.044921875, -3.9326171875, -3.8203125, -3.7080078125, -3.595703125, -3.4833984375, -3.37109375, -3.2587890625, -3.146484375, -3.0341796875, -2.921875, -2.8095703125, -2.697265625, -2.5849609375, -2.47265625, -2.3603515625, -2.248046875, -2.1357421875, -2.0234375, -1.9111328125, -1.798828125, -1.6865234375, -1.57421875, -1.4619140625, -1.349609375, -1.2373046875, -1.125, -1.0126953125, -0.900390625, -0.7880859375, -0.67578125, -0.5634765625, -0.451171875, -0.3388671875, -0.2265625, -0.1142578125, -0.001953125, 0.1103515625, 0.22265625, 0.3349609375, 0.447265625, 0.5595703125, 0.671875, 0.7841796875, 0.896484375, 1.0087890625, 1.12109375, 1.2333984375, 1.345703125, 1.4580078125, 1.5703125, 1.6826171875, 1.794921875, 1.9072265625, 2.01953125, 2.1318359375, 2.244140625, 2.3564453125, 2.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 14.0, 24.0, 54.0, 72.0, 109.0, 198.0, 332.0, 778.0, 1857.0, 4829.0, 14686.0, 58498.0, 445392.0, 3374665.0, 236509.0, 38830.0, 10497.0, 3749.0, 1448.0, 688.0, 380.0, 218.0, 152.0, 98.0, 64.0, 41.0, 34.0, 13.0, 16.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.861083984375, -34.84716796875, -33.833251953125, -32.8193359375, -31.805419921875, -30.79150390625, -29.777587890625, -28.763671875, -27.749755859375, -26.73583984375, -25.721923828125, -24.7080078125, -23.694091796875, -22.68017578125, -21.666259765625, -20.65234375, -19.638427734375, -18.62451171875, -17.610595703125, -16.5966796875, -15.582763671875, -14.56884765625, -13.554931640625, -12.541015625, -11.527099609375, -10.51318359375, -9.499267578125, -8.4853515625, -7.471435546875, -6.45751953125, -5.443603515625, -4.4296875, -3.415771484375, -2.40185546875, -1.387939453125, -0.3740234375, 0.639892578125, 1.65380859375, 2.667724609375, 3.681640625, 4.695556640625, 5.70947265625, 6.723388671875, 7.7373046875, 8.751220703125, 9.76513671875, 10.779052734375, 11.79296875, 12.806884765625, 13.82080078125, 14.834716796875, 15.8486328125, 16.862548828125, 17.87646484375, 18.890380859375, 19.904296875, 20.918212890625, 21.93212890625, 22.946044921875, 23.9599609375, 24.973876953125, 25.98779296875, 27.001708984375, 28.015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 10.0, 5.0, 18.0, 16.0, 22.0, 31.0, 42.0, 70.0, 100.0, 165.0, 324.0, 985.0, 1327.0, 374.0, 200.0, 128.0, 74.0, 57.0, 23.0, 21.0, 28.0, 10.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.54144287109375, -4.2899169921875, -4.03839111328125, -3.786865234375, -3.53533935546875, -3.2838134765625, -3.03228759765625, -2.78076171875, -2.52923583984375, -2.2777099609375, -2.02618408203125, -1.774658203125, -1.52313232421875, -1.2716064453125, -1.02008056640625, -0.7685546875, -0.51702880859375, -0.2655029296875, -0.01397705078125, 0.237548828125, 0.48907470703125, 0.7406005859375, 0.99212646484375, 1.24365234375, 1.49517822265625, 1.7467041015625, 1.99822998046875, 2.249755859375, 2.50128173828125, 2.7528076171875, 3.00433349609375, 3.255859375, 3.50738525390625, 3.7589111328125, 4.01043701171875, 4.261962890625, 4.51348876953125, 4.7650146484375, 5.01654052734375, 5.26806640625, 5.51959228515625, 5.7711181640625, 6.02264404296875, 6.274169921875, 6.52569580078125, 6.7772216796875, 7.02874755859375, 7.2802734375, 7.53179931640625, 7.7833251953125, 8.03485107421875, 8.286376953125, 8.53790283203125, 8.7894287109375, 9.04095458984375, 9.29248046875, 9.54400634765625, 9.7955322265625, 10.04705810546875, 10.298583984375, 10.55010986328125, 10.8016357421875, 11.05316162109375, 11.3046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 12.0, 18.0, 16.0, 26.0, 68.0, 104.0, 131.0, 173.0, 137.0, 128.0, 81.0, 40.0, 30.0, 15.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.09375, -62.28982162475586, -60.48588943481445, -58.68196105957031, -56.878028869628906, -55.074100494384766, -53.270172119140625, -51.46623992919922, -49.66231155395508, -47.85838317871094, -46.05445098876953, -44.25052261352539, -42.44659423828125, -40.642662048339844, -38.8387336730957, -37.03480529785156, -35.230873107910156, -33.426944732666016, -31.62301254272461, -29.81908416748047, -28.015153884887695, -26.211223602294922, -24.40729522705078, -22.603364944458008, -20.799434661865234, -18.99550437927246, -17.191574096679688, -15.387645721435547, -13.583715438842773, -11.77978515625, -9.975855827331543, -8.171926498413086, -6.3679962158203125, -4.564066410064697, -2.760136604309082, -0.9562067985534668, 0.8477230072021484, 2.651653289794922, 4.455582618713379, 6.259511947631836, 8.06344223022461, 9.867372512817383, 11.67130184173584, 13.475231170654297, 15.27916145324707, 17.083091735839844, 18.887020111083984, 20.690950393676758, 22.49488067626953, 24.298810958862305, 26.102741241455078, 27.90666961669922, 29.710599899291992, 31.514530181884766, 33.318458557128906, 35.12239074707031, 36.92631912231445, 38.730247497558594, 40.5341796875, 42.33810806274414, 44.14203643798828, 45.94596862792969, 47.74989700317383, 49.55382537841797, 51.357757568359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 14.0, 17.0, 11.0, 18.0, 19.0, 18.0, 26.0, 24.0, 31.0, 15.0, 31.0, 36.0, 35.0, 29.0, 34.0, 43.0, 45.0, 45.0, 44.0, 40.0, 36.0, 40.0, 38.0, 38.0, 35.0, 34.0, 25.0, 21.0, 24.0, 14.0, 7.0, 14.0, 21.0, 9.0, 13.0, 10.0, 11.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.883262634277344, -25.136049270629883, -24.388835906982422, -23.64162254333496, -22.8944091796875, -22.14719581604004, -21.399982452392578, -20.652767181396484, -19.905555725097656, -19.158342361450195, -18.411128997802734, -17.663915634155273, -16.916702270507812, -16.16948890686035, -15.422274589538574, -14.675061225891113, -13.927846908569336, -13.180633544921875, -12.433420181274414, -11.686206817626953, -10.938993453979492, -10.191780090332031, -9.444565773010254, -8.697352409362793, -7.950139045715332, -7.202925682067871, -6.45571231842041, -5.708498477935791, -4.96128511428833, -4.214071750640869, -3.46685791015625, -2.719644546508789, -1.9724311828613281, -1.2252177000045776, -0.47800421714782715, 0.2692093849182129, 1.0164227485656738, 1.7636361122131348, 2.510849952697754, 3.258063316345215, 4.005276679992676, 4.752490043640137, 5.499703407287598, 6.246917247772217, 6.994130611419678, 7.741343975067139, 8.488557815551758, 9.235771179199219, 9.98298454284668, 10.73019790649414, 11.477411270141602, 12.224624633789062, 12.971837997436523, 13.719051361083984, 14.466265678405762, 15.213479042053223, 15.960692405700684, 16.70790672302246, 17.455120086669922, 18.202333450317383, 18.949546813964844, 19.696760177612305, 20.443973541259766, 21.191186904907227, 21.938400268554688]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 17.0, 16.0, 23.0, 41.0, 42.0, 50.0, 67.0, 130.0, 167.0, 300.0, 568.0, 978.0, 1751.0, 3356.0, 6471.0, 13029.0, 27054.0, 56299.0, 118641.0, 226418.0, 276957.0, 162012.0, 79210.0, 37692.0, 18217.0, 8956.0, 4632.0, 2347.0, 1216.0, 736.0, 384.0, 209.0, 167.0, 97.0, 69.0, 59.0, 43.0, 29.0, 27.0, 15.0, 16.0, 11.0, 5.0, 5.0, 2.0, 4.0], "bins": [-12.8984375, -12.56103515625, -12.2236328125, -11.88623046875, -11.548828125, -11.21142578125, -10.8740234375, -10.53662109375, -10.19921875, -9.86181640625, -9.5244140625, -9.18701171875, -8.849609375, -8.51220703125, -8.1748046875, -7.83740234375, -7.5, -7.16259765625, -6.8251953125, -6.48779296875, -6.150390625, -5.81298828125, -5.4755859375, -5.13818359375, -4.80078125, -4.46337890625, -4.1259765625, -3.78857421875, -3.451171875, -3.11376953125, -2.7763671875, -2.43896484375, -2.1015625, -1.76416015625, -1.4267578125, -1.08935546875, -0.751953125, -0.41455078125, -0.0771484375, 0.26025390625, 0.59765625, 0.93505859375, 1.2724609375, 1.60986328125, 1.947265625, 2.28466796875, 2.6220703125, 2.95947265625, 3.296875, 3.63427734375, 3.9716796875, 4.30908203125, 4.646484375, 4.98388671875, 5.3212890625, 5.65869140625, 5.99609375, 6.33349609375, 6.6708984375, 7.00830078125, 7.345703125, 7.68310546875, 8.0205078125, 8.35791015625, 8.6953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 13.0, 17.0, 16.0, 20.0, 23.0, 31.0, 25.0, 39.0, 38.0, 53.0, 43.0, 58.0, 58.0, 58.0, 66.0, 71.0, 50.0, 49.0, 59.0, 42.0, 35.0, 22.0, 23.0, 22.0, 15.0, 13.0, 8.0, 9.0, 3.0, 3.0, 9.0, 2.0, 2.0, 3.0], "bins": [-4.140625, -4.0455474853515625, -3.950469970703125, -3.8553924560546875, -3.76031494140625, -3.6652374267578125, -3.570159912109375, -3.4750823974609375, -3.3800048828125, -3.2849273681640625, -3.189849853515625, -3.0947723388671875, -2.99969482421875, -2.9046173095703125, -2.809539794921875, -2.7144622802734375, -2.619384765625, -2.5243072509765625, -2.429229736328125, -2.3341522216796875, -2.23907470703125, -2.1439971923828125, -2.048919677734375, -1.9538421630859375, -1.8587646484375, -1.7636871337890625, -1.668609619140625, -1.5735321044921875, -1.47845458984375, -1.3833770751953125, -1.288299560546875, -1.1932220458984375, -1.09814453125, -1.0030670166015625, -0.907989501953125, -0.8129119873046875, -0.71783447265625, -0.6227569580078125, -0.527679443359375, -0.4326019287109375, -0.3375244140625, -0.2424468994140625, -0.147369384765625, -0.0522918701171875, 0.04278564453125, 0.1378631591796875, 0.232940673828125, 0.3280181884765625, 0.423095703125, 0.5181732177734375, 0.613250732421875, 0.7083282470703125, 0.80340576171875, 0.8984832763671875, 0.993560791015625, 1.0886383056640625, 1.1837158203125, 1.2787933349609375, 1.373870849609375, 1.4689483642578125, 1.56402587890625, 1.6591033935546875, 1.754180908203125, 1.8492584228515625, 1.9443359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 14.0, 15.0, 25.0, 32.0, 41.0, 50.0, 108.0, 102.0, 152.0, 263.0, 368.0, 569.0, 948.0, 1537.0, 2645.0, 4783.0, 9518.0, 19694.0, 45088.0, 107683.0, 244781.0, 321861.0, 162505.0, 67779.0, 29181.0, 13320.0, 6560.0, 3486.0, 1970.0, 1185.0, 726.0, 463.0, 334.0, 232.0, 154.0, 117.0, 63.0, 46.0, 43.0, 38.0, 16.0, 18.0, 11.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-14.140625, -13.7152099609375, -13.289794921875, -12.8643798828125, -12.43896484375, -12.0135498046875, -11.588134765625, -11.1627197265625, -10.7373046875, -10.3118896484375, -9.886474609375, -9.4610595703125, -9.03564453125, -8.6102294921875, -8.184814453125, -7.7593994140625, -7.333984375, -6.9085693359375, -6.483154296875, -6.0577392578125, -5.63232421875, -5.2069091796875, -4.781494140625, -4.3560791015625, -3.9306640625, -3.5052490234375, -3.079833984375, -2.6544189453125, -2.22900390625, -1.8035888671875, -1.378173828125, -0.9527587890625, -0.52734375, -0.1019287109375, 0.323486328125, 0.7489013671875, 1.17431640625, 1.5997314453125, 2.025146484375, 2.4505615234375, 2.8759765625, 3.3013916015625, 3.726806640625, 4.1522216796875, 4.57763671875, 5.0030517578125, 5.428466796875, 5.8538818359375, 6.279296875, 6.7047119140625, 7.130126953125, 7.5555419921875, 7.98095703125, 8.4063720703125, 8.831787109375, 9.2572021484375, 9.6826171875, 10.1080322265625, 10.533447265625, 10.9588623046875, 11.38427734375, 11.8096923828125, 12.235107421875, 12.6605224609375, 13.0859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 10.0, 10.0, 12.0, 17.0, 18.0, 31.0, 29.0, 31.0, 41.0, 45.0, 48.0, 57.0, 50.0, 62.0, 51.0, 48.0, 51.0, 46.0, 44.0, 48.0, 39.0, 29.0, 33.0, 25.0, 11.0, 19.0, 20.0, 14.0, 7.0, 7.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7381591796875, -13.218505859375, -12.6988525390625, -12.17919921875, -11.6595458984375, -11.139892578125, -10.6202392578125, -10.1005859375, -9.5809326171875, -9.061279296875, -8.5416259765625, -8.02197265625, -7.5023193359375, -6.982666015625, -6.4630126953125, -5.943359375, -5.4237060546875, -4.904052734375, -4.3843994140625, -3.86474609375, -3.3450927734375, -2.825439453125, -2.3057861328125, -1.7861328125, -1.2664794921875, -0.746826171875, -0.2271728515625, 0.29248046875, 0.8121337890625, 1.331787109375, 1.8514404296875, 2.37109375, 2.8907470703125, 3.410400390625, 3.9300537109375, 4.44970703125, 4.9693603515625, 5.489013671875, 6.0086669921875, 6.5283203125, 7.0479736328125, 7.567626953125, 8.0872802734375, 8.60693359375, 9.1265869140625, 9.646240234375, 10.1658935546875, 10.685546875, 11.2052001953125, 11.724853515625, 12.2445068359375, 12.76416015625, 13.2838134765625, 13.803466796875, 14.3231201171875, 14.8427734375, 15.3624267578125, 15.882080078125, 16.4017333984375, 16.92138671875, 17.4410400390625, 17.960693359375, 18.4803466796875, 19.0]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [9.0, 4.0, 3.0, 9.0, 7.0, 10.0, 6.0, 18.0, 17.0, 29.0, 29.0, 64.0, 70.0, 101.0, 152.0, 259.0, 444.0, 857.0, 1758.0, 4285.0, 11703.0, 37229.0, 130444.0, 388931.0, 326909.0, 100161.0, 28910.0, 9295.0, 3548.0, 1448.0, 732.0, 383.0, 222.0, 169.0, 99.0, 57.0, 36.0, 39.0, 29.0, 24.0, 19.0, 13.0, 10.0, 6.0, 4.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.516845703125, -5.27587890625, -5.034912109375, -4.7939453125, -4.552978515625, -4.31201171875, -4.071044921875, -3.830078125, -3.589111328125, -3.34814453125, -3.107177734375, -2.8662109375, -2.625244140625, -2.38427734375, -2.143310546875, -1.90234375, -1.661376953125, -1.42041015625, -1.179443359375, -0.9384765625, -0.697509765625, -0.45654296875, -0.215576171875, 0.025390625, 0.266357421875, 0.50732421875, 0.748291015625, 0.9892578125, 1.230224609375, 1.47119140625, 1.712158203125, 1.953125, 2.194091796875, 2.43505859375, 2.676025390625, 2.9169921875, 3.157958984375, 3.39892578125, 3.639892578125, 3.880859375, 4.121826171875, 4.36279296875, 4.603759765625, 4.8447265625, 5.085693359375, 5.32666015625, 5.567626953125, 5.80859375, 6.049560546875, 6.29052734375, 6.531494140625, 6.7724609375, 7.013427734375, 7.25439453125, 7.495361328125, 7.736328125, 7.977294921875, 8.21826171875, 8.459228515625, 8.7001953125, 8.941162109375, 9.18212890625, 9.423095703125, 9.6640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 7.0, 9.0, 13.0, 12.0, 8.0, 15.0, 17.0, 26.0, 30.0, 37.0, 32.0, 31.0, 40.0, 63.0, 75.0, 101.0, 92.0, 59.0, 40.0, 35.0, 38.0, 29.0, 30.0, 23.0, 19.0, 23.0, 16.0, 14.0, 13.0, 11.0, 5.0, 3.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009675025939941406, -0.0009347125887870789, -0.0009019225835800171, -0.0008691325783729553, -0.0008363425731658936, -0.0008035525679588318, -0.00077076256275177, -0.0007379725575447083, -0.0007051825523376465, -0.0006723925471305847, -0.000639602541923523, -0.0006068125367164612, -0.0005740225315093994, -0.0005412325263023376, -0.0005084425210952759, -0.0004756525158882141, -0.00044286251068115234, -0.0004100725054740906, -0.0003772825002670288, -0.00034449249505996704, -0.0003117024898529053, -0.0002789124846458435, -0.00024612247943878174, -0.00021333247423171997, -0.0001805424690246582, -0.00014775246381759644, -0.00011496245861053467, -8.21724534034729e-05, -4.938244819641113e-05, -1.6592442989349365e-05, 1.6197562217712402e-05, 4.898756742477417e-05, 8.177757263183594e-05, 0.0001145675778388977, 0.00014735758304595947, 0.00018014758825302124, 0.000212937593460083, 0.0002457275986671448, 0.00027851760387420654, 0.0003113076090812683, 0.0003440976142883301, 0.00037688761949539185, 0.0004096776247024536, 0.0004424676299095154, 0.00047525763511657715, 0.0005080476403236389, 0.0005408376455307007, 0.0005736276507377625, 0.0006064176559448242, 0.000639207661151886, 0.0006719976663589478, 0.0007047876715660095, 0.0007375776767730713, 0.0007703676819801331, 0.0008031576871871948, 0.0008359476923942566, 0.0008687376976013184, 0.0009015277028083801, 0.0009343177080154419, 0.0009671077132225037, 0.0009998977184295654, 0.0010326877236366272, 0.001065477728843689, 0.0010982677340507507, 0.0011310577392578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 14.0, 19.0, 31.0, 38.0, 52.0, 83.0, 100.0, 197.0, 247.0, 475.0, 782.0, 1336.0, 2605.0, 5336.0, 12733.0, 34766.0, 105974.0, 317597.0, 365971.0, 130214.0, 42189.0, 14879.0, 6093.0, 2893.0, 1590.0, 888.0, 490.0, 281.0, 208.0, 112.0, 101.0, 67.0, 42.0, 28.0, 27.0, 21.0, 8.0, 12.0, 6.0, 8.0, 1.0, 3.0, 3.0, 1.0, 6.0, 1.0, 5.0, 1.0, 1.0], "bins": [-7.6484375, -7.41729736328125, -7.1861572265625, -6.95501708984375, -6.723876953125, -6.49273681640625, -6.2615966796875, -6.03045654296875, -5.79931640625, -5.56817626953125, -5.3370361328125, -5.10589599609375, -4.874755859375, -4.64361572265625, -4.4124755859375, -4.18133544921875, -3.9501953125, -3.71905517578125, -3.4879150390625, -3.25677490234375, -3.025634765625, -2.79449462890625, -2.5633544921875, -2.33221435546875, -2.10107421875, -1.86993408203125, -1.6387939453125, -1.40765380859375, -1.176513671875, -0.94537353515625, -0.7142333984375, -0.48309326171875, -0.251953125, -0.02081298828125, 0.2103271484375, 0.44146728515625, 0.672607421875, 0.90374755859375, 1.1348876953125, 1.36602783203125, 1.59716796875, 1.82830810546875, 2.0594482421875, 2.29058837890625, 2.521728515625, 2.75286865234375, 2.9840087890625, 3.21514892578125, 3.4462890625, 3.67742919921875, 3.9085693359375, 4.13970947265625, 4.370849609375, 4.60198974609375, 4.8331298828125, 5.06427001953125, 5.29541015625, 5.52655029296875, 5.7576904296875, 5.98883056640625, 6.219970703125, 6.45111083984375, 6.6822509765625, 6.91339111328125, 7.14453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 14.0, 23.0, 16.0, 19.0, 33.0, 54.0, 48.0, 65.0, 76.0, 88.0, 91.0, 79.0, 76.0, 64.0, 71.0, 52.0, 18.0, 34.0, 20.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8359375, -7.6160888671875, -7.396240234375, -7.1763916015625, -6.95654296875, -6.7366943359375, -6.516845703125, -6.2969970703125, -6.0771484375, -5.8572998046875, -5.637451171875, -5.4176025390625, -5.19775390625, -4.9779052734375, -4.758056640625, -4.5382080078125, -4.318359375, -4.0985107421875, -3.878662109375, -3.6588134765625, -3.43896484375, -3.2191162109375, -2.999267578125, -2.7794189453125, -2.5595703125, -2.3397216796875, -2.119873046875, -1.9000244140625, -1.68017578125, -1.4603271484375, -1.240478515625, -1.0206298828125, -0.80078125, -0.5809326171875, -0.361083984375, -0.1412353515625, 0.07861328125, 0.2984619140625, 0.518310546875, 0.7381591796875, 0.9580078125, 1.1778564453125, 1.397705078125, 1.6175537109375, 1.83740234375, 2.0572509765625, 2.277099609375, 2.4969482421875, 2.716796875, 2.9366455078125, 3.156494140625, 3.3763427734375, 3.59619140625, 3.8160400390625, 4.035888671875, 4.2557373046875, 4.4755859375, 4.6954345703125, 4.915283203125, 5.1351318359375, 5.35498046875, 5.5748291015625, 5.794677734375, 6.0145263671875, 6.234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 12.0, 18.0, 40.0, 50.0, 114.0, 116.0, 155.0, 156.0, 107.0, 73.0, 52.0, 38.0, 18.0, 11.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-157.15682983398438, -153.20716857910156, -149.2575225830078, -145.307861328125, -141.35821533203125, -137.40855407714844, -133.4589080810547, -129.50924682617188, -125.55960083007812, -121.60994720458984, -117.66029357910156, -113.71063995361328, -109.760986328125, -105.81133270263672, -101.86167907714844, -97.91202545166016, -93.96237182617188, -90.0127182006836, -86.06306457519531, -82.11341094970703, -78.16375732421875, -74.21410369873047, -70.26445007324219, -66.3147964477539, -62.365135192871094, -58.41548156738281, -54.46582794189453, -50.51617431640625, -46.56652069091797, -42.61686706542969, -38.667213439941406, -34.717559814453125, -30.767906188964844, -26.818252563476562, -22.86859893798828, -18.9189453125, -14.969290733337402, -11.019636154174805, -7.069982528686523, -3.120328903198242, 0.8293247222900391, 4.77897834777832, 8.728631973266602, 12.6782865524292, 16.627941131591797, 20.577594757080078, 24.52724838256836, 28.47690200805664, 32.42655563354492, 36.3762092590332, 40.325862884521484, 44.275516510009766, 48.22517013549805, 52.174827575683594, 56.124481201171875, 60.074134826660156, 64.02378845214844, 67.97344207763672, 71.923095703125, 75.87274932861328, 79.82240295410156, 83.77205657958984, 87.72171020507812, 91.6713638305664, 95.62101745605469]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 4.0, 6.0, 4.0, 21.0, 17.0, 20.0, 20.0, 36.0, 35.0, 37.0, 38.0, 51.0, 46.0, 58.0, 59.0, 55.0, 62.0, 53.0, 51.0, 46.0, 43.0, 38.0, 34.0, 25.0, 20.0, 22.0, 22.0, 20.0, 14.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.13690185546875, -66.1010513305664, -63.0651969909668, -60.02934265136719, -56.99348831176758, -53.95763397216797, -50.921783447265625, -47.885929107666016, -44.850074768066406, -41.8142204284668, -38.77836990356445, -35.742515563964844, -32.706661224365234, -29.670808792114258, -26.63495635986328, -23.599102020263672, -20.563251495361328, -17.52739906311035, -14.491544723510742, -11.455692291259766, -8.419838905334473, -5.38398551940918, -2.348133087158203, 0.6877212524414062, 3.723573684692383, 6.759427070617676, 9.795280456542969, 12.831132888793945, 15.866986274719238, 18.90283966064453, 21.938692092895508, 24.974546432495117, 28.010398864746094, 31.04625129699707, 34.08210372924805, 37.117958068847656, 40.153812408447266, 43.189666748046875, 46.22551727294922, 49.26137161254883, 52.29722595214844, 55.33308029174805, 58.36893081665039, 61.40478515625, 64.44063568115234, 67.47649383544922, 70.51234436035156, 73.54820251464844, 76.58404541015625, 79.6198959350586, 82.65575408935547, 85.69160461425781, 88.72745513916016, 91.76331329345703, 94.79916381835938, 97.83502197265625, 100.8708724975586, 103.90672302246094, 106.94258117675781, 109.97843170166016, 113.0142822265625, 116.05014038085938, 119.08599090576172, 122.12184143066406, 125.15769958496094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 20.0, 11.0, 16.0, 28.0, 46.0, 52.0, 100.0, 142.0, 229.0, 427.0, 696.0, 1256.0, 2507.0, 5246.0, 12704.0, 38009.0, 200166.0, 3635649.0, 230856.0, 41345.0, 13534.0, 5583.0, 2570.0, 1326.0, 740.0, 405.0, 234.0, 133.0, 93.0, 51.0, 28.0, 18.0, 16.0, 17.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.1485595703125, -18.593994140625, -18.0394287109375, -17.48486328125, -16.9302978515625, -16.375732421875, -15.8211669921875, -15.2666015625, -14.7120361328125, -14.157470703125, -13.6029052734375, -13.04833984375, -12.4937744140625, -11.939208984375, -11.3846435546875, -10.830078125, -10.2755126953125, -9.720947265625, -9.1663818359375, -8.61181640625, -8.0572509765625, -7.502685546875, -6.9481201171875, -6.3935546875, -5.8389892578125, -5.284423828125, -4.7298583984375, -4.17529296875, -3.6207275390625, -3.066162109375, -2.5115966796875, -1.95703125, -1.4024658203125, -0.847900390625, -0.2933349609375, 0.26123046875, 0.8157958984375, 1.370361328125, 1.9249267578125, 2.4794921875, 3.0340576171875, 3.588623046875, 4.1431884765625, 4.69775390625, 5.2523193359375, 5.806884765625, 6.3614501953125, 6.916015625, 7.4705810546875, 8.025146484375, 8.5797119140625, 9.13427734375, 9.6888427734375, 10.243408203125, 10.7979736328125, 11.3525390625, 11.9071044921875, 12.461669921875, 13.0162353515625, 13.57080078125, 14.1253662109375, 14.679931640625, 15.2344970703125, 15.7890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 6.0, 9.0, 13.0, 26.0, 30.0, 24.0, 34.0, 43.0, 49.0, 55.0, 52.0, 50.0, 74.0, 65.0, 51.0, 84.0, 50.0, 64.0, 43.0, 43.0, 27.0, 30.0, 21.0, 11.0, 8.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.167236328125, -4.06103515625, -3.954833984375, -3.8486328125, -3.742431640625, -3.63623046875, -3.530029296875, -3.423828125, -3.317626953125, -3.21142578125, -3.105224609375, -2.9990234375, -2.892822265625, -2.78662109375, -2.680419921875, -2.57421875, -2.468017578125, -2.36181640625, -2.255615234375, -2.1494140625, -2.043212890625, -1.93701171875, -1.830810546875, -1.724609375, -1.618408203125, -1.51220703125, -1.406005859375, -1.2998046875, -1.193603515625, -1.08740234375, -0.981201171875, -0.875, -0.768798828125, -0.66259765625, -0.556396484375, -0.4501953125, -0.343994140625, -0.23779296875, -0.131591796875, -0.025390625, 0.080810546875, 0.18701171875, 0.293212890625, 0.3994140625, 0.505615234375, 0.61181640625, 0.718017578125, 0.82421875, 0.930419921875, 1.03662109375, 1.142822265625, 1.2490234375, 1.355224609375, 1.46142578125, 1.567626953125, 1.673828125, 1.780029296875, 1.88623046875, 1.992431640625, 2.0986328125, 2.204833984375, 2.31103515625, 2.417236328125, 2.5234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 11.0, 19.0, 29.0, 34.0, 78.0, 98.0, 135.0, 253.0, 392.0, 598.0, 988.0, 1583.0, 3003.0, 6243.0, 14394.0, 41780.0, 159554.0, 2262233.0, 1493357.0, 144788.0, 38628.0, 13690.0, 5767.0, 2797.0, 1490.0, 863.0, 503.0, 322.0, 206.0, 144.0, 112.0, 62.0, 44.0, 25.0, 18.0, 9.0, 8.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.59375, -17.090576171875, -16.58740234375, -16.084228515625, -15.5810546875, -15.077880859375, -14.57470703125, -14.071533203125, -13.568359375, -13.065185546875, -12.56201171875, -12.058837890625, -11.5556640625, -11.052490234375, -10.54931640625, -10.046142578125, -9.54296875, -9.039794921875, -8.53662109375, -8.033447265625, -7.5302734375, -7.027099609375, -6.52392578125, -6.020751953125, -5.517578125, -5.014404296875, -4.51123046875, -4.008056640625, -3.5048828125, -3.001708984375, -2.49853515625, -1.995361328125, -1.4921875, -0.989013671875, -0.48583984375, 0.017333984375, 0.5205078125, 1.023681640625, 1.52685546875, 2.030029296875, 2.533203125, 3.036376953125, 3.53955078125, 4.042724609375, 4.5458984375, 5.049072265625, 5.55224609375, 6.055419921875, 6.55859375, 7.061767578125, 7.56494140625, 8.068115234375, 8.5712890625, 9.074462890625, 9.57763671875, 10.080810546875, 10.583984375, 11.087158203125, 11.59033203125, 12.093505859375, 12.5966796875, 13.099853515625, 13.60302734375, 14.106201171875, 14.609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 7.0, 9.0, 7.0, 6.0, 9.0, 20.0, 29.0, 40.0, 51.0, 89.0, 148.0, 317.0, 1041.0, 1434.0, 383.0, 181.0, 98.0, 73.0, 34.0, 34.0, 13.0, 16.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.61419677734375, -5.4276123046875, -5.24102783203125, -5.054443359375, -4.86785888671875, -4.6812744140625, -4.49468994140625, -4.30810546875, -4.12152099609375, -3.9349365234375, -3.74835205078125, -3.561767578125, -3.37518310546875, -3.1885986328125, -3.00201416015625, -2.8154296875, -2.62884521484375, -2.4422607421875, -2.25567626953125, -2.069091796875, -1.88250732421875, -1.6959228515625, -1.50933837890625, -1.32275390625, -1.13616943359375, -0.9495849609375, -0.76300048828125, -0.576416015625, -0.38983154296875, -0.2032470703125, -0.01666259765625, 0.169921875, 0.35650634765625, 0.5430908203125, 0.72967529296875, 0.916259765625, 1.10284423828125, 1.2894287109375, 1.47601318359375, 1.66259765625, 1.84918212890625, 2.0357666015625, 2.22235107421875, 2.408935546875, 2.59552001953125, 2.7821044921875, 2.96868896484375, 3.1552734375, 3.34185791015625, 3.5284423828125, 3.71502685546875, 3.901611328125, 4.08819580078125, 4.2747802734375, 4.46136474609375, 4.64794921875, 4.83453369140625, 5.0211181640625, 5.20770263671875, 5.394287109375, 5.58087158203125, 5.7674560546875, 5.95404052734375, 6.140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 10.0, 30.0, 84.0, 214.0, 291.0, 233.0, 100.0, 29.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-135.7429656982422, -133.20912170410156, -130.67526245117188, -128.14141845703125, -125.6075668334961, -123.07371520996094, -120.53986358642578, -118.00601196289062, -115.47216796875, -112.93831634521484, -110.40446472167969, -107.87062072753906, -105.3367691040039, -102.80291748046875, -100.2690658569336, -97.73521423339844, -95.20137023925781, -92.66751861572266, -90.1336669921875, -87.59982299804688, -85.06597137451172, -82.53211975097656, -79.9982681274414, -77.46441650390625, -74.9305648803711, -72.39671325683594, -69.86286163330078, -67.32901763916016, -64.795166015625, -62.261314392089844, -59.72746276855469, -57.1936149597168, -54.65976333618164, -52.125911712646484, -49.592063903808594, -47.05821228027344, -44.52436447143555, -41.99051284790039, -39.4566650390625, -36.922813415527344, -34.38896179199219, -31.855112075805664, -29.32126235961914, -26.787410736083984, -24.253562927246094, -21.719711303710938, -19.185861587524414, -16.65201187133789, -14.1181640625, -11.584314346313477, -9.050464630126953, -6.516613960266113, -3.98276424407959, -1.4489145278930664, 1.0849361419677734, 3.618785858154297, 6.15263557434082, 8.686485290527344, 11.220335006713867, 13.754185676574707, 16.288036346435547, 18.821884155273438, 21.355735778808594, 23.889585494995117, 26.42343521118164]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 9.0, 6.0, 11.0, 14.0, 18.0, 27.0, 32.0, 46.0, 31.0, 41.0, 52.0, 65.0, 78.0, 55.0, 66.0, 54.0, 68.0, 59.0, 39.0, 56.0, 32.0, 35.0, 22.0, 22.0, 20.0, 13.0, 11.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-31.299800872802734, -30.542741775512695, -29.785682678222656, -29.02862548828125, -28.27156639099121, -27.514507293701172, -26.757448196411133, -26.000389099121094, -25.243331909179688, -24.48627281188965, -23.72921371459961, -22.972156524658203, -22.215097427368164, -21.458038330078125, -20.700979232788086, -19.943920135498047, -19.186861038208008, -18.42980194091797, -17.67274284362793, -16.91568374633789, -16.158626556396484, -15.401567459106445, -14.644508361816406, -13.887449264526367, -13.130391120910645, -12.373332023620605, -11.616273880004883, -10.859214782714844, -10.102155685424805, -9.345097541809082, -8.588038444519043, -7.830979824066162, -7.073921203613281, -6.3168625831604, -5.5598039627075195, -4.8027448654174805, -4.0456862449646, -3.2886276245117188, -2.5315685272216797, -1.7745099067687988, -1.017451286315918, -0.26039254665374756, 0.49666619300842285, 1.2537250518798828, 2.0107836723327637, 2.7678422927856445, 3.5249013900756836, 4.2819600105285645, 5.039018630981445, 5.796077251434326, 6.553135871887207, 7.310194969177246, 8.067253112792969, 8.824312210083008, 9.581371307373047, 10.338430404663086, 11.095488548278809, 11.852547645568848, 12.60960578918457, 13.36666488647461, 14.123723983764648, 14.880782127380371, 15.63784122467041, 16.394899368286133, 17.151958465576172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 12.0, 11.0, 9.0, 16.0, 19.0, 35.0, 48.0, 87.0, 118.0, 219.0, 343.0, 558.0, 1144.0, 1993.0, 3828.0, 7886.0, 16771.0, 36886.0, 81388.0, 172695.0, 295911.0, 224315.0, 109908.0, 50128.0, 22923.0, 10503.0, 5041.0, 2573.0, 1360.0, 706.0, 408.0, 257.0, 150.0, 83.0, 61.0, 37.0, 36.0, 22.0, 20.0, 8.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.375, -10.0369873046875, -9.698974609375, -9.3609619140625, -9.02294921875, -8.6849365234375, -8.346923828125, -8.0089111328125, -7.6708984375, -7.3328857421875, -6.994873046875, -6.6568603515625, -6.31884765625, -5.9808349609375, -5.642822265625, -5.3048095703125, -4.966796875, -4.6287841796875, -4.290771484375, -3.9527587890625, -3.61474609375, -3.2767333984375, -2.938720703125, -2.6007080078125, -2.2626953125, -1.9246826171875, -1.586669921875, -1.2486572265625, -0.91064453125, -0.5726318359375, -0.234619140625, 0.1033935546875, 0.44140625, 0.7794189453125, 1.117431640625, 1.4554443359375, 1.79345703125, 2.1314697265625, 2.469482421875, 2.8074951171875, 3.1455078125, 3.4835205078125, 3.821533203125, 4.1595458984375, 4.49755859375, 4.8355712890625, 5.173583984375, 5.5115966796875, 5.849609375, 6.1876220703125, 6.525634765625, 6.8636474609375, 7.20166015625, 7.5396728515625, 7.877685546875, 8.2156982421875, 8.5537109375, 8.8917236328125, 9.229736328125, 9.5677490234375, 9.90576171875, 10.2437744140625, 10.581787109375, 10.9197998046875, 11.2578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 16.0, 20.0, 20.0, 25.0, 19.0, 37.0, 43.0, 49.0, 43.0, 36.0, 48.0, 69.0, 62.0, 65.0, 74.0, 45.0, 41.0, 53.0, 48.0, 43.0, 23.0, 22.0, 26.0, 20.0, 13.0, 7.0, 6.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.2265625, -4.1278076171875, -4.029052734375, -3.9302978515625, -3.83154296875, -3.7327880859375, -3.634033203125, -3.5352783203125, -3.4365234375, -3.3377685546875, -3.239013671875, -3.1402587890625, -3.04150390625, -2.9427490234375, -2.843994140625, -2.7452392578125, -2.646484375, -2.5477294921875, -2.448974609375, -2.3502197265625, -2.25146484375, -2.1527099609375, -2.053955078125, -1.9552001953125, -1.8564453125, -1.7576904296875, -1.658935546875, -1.5601806640625, -1.46142578125, -1.3626708984375, -1.263916015625, -1.1651611328125, -1.06640625, -0.9676513671875, -0.868896484375, -0.7701416015625, -0.67138671875, -0.5726318359375, -0.473876953125, -0.3751220703125, -0.2763671875, -0.1776123046875, -0.078857421875, 0.0198974609375, 0.11865234375, 0.2174072265625, 0.316162109375, 0.4149169921875, 0.513671875, 0.6124267578125, 0.711181640625, 0.8099365234375, 0.90869140625, 1.0074462890625, 1.106201171875, 1.2049560546875, 1.3037109375, 1.4024658203125, 1.501220703125, 1.5999755859375, 1.69873046875, 1.7974853515625, 1.896240234375, 1.9949951171875, 2.09375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 11.0, 21.0, 21.0, 17.0, 28.0, 49.0, 62.0, 70.0, 128.0, 172.0, 299.0, 438.0, 727.0, 1237.0, 2328.0, 4876.0, 11311.0, 28138.0, 78415.0, 215134.0, 389614.0, 198074.0, 71259.0, 25912.0, 10216.0, 4672.0, 2188.0, 1167.0, 689.0, 409.0, 262.0, 186.0, 115.0, 87.0, 59.0, 47.0, 30.0, 20.0, 13.0, 15.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.0859375, -13.6771240234375, -13.268310546875, -12.8594970703125, -12.45068359375, -12.0418701171875, -11.633056640625, -11.2242431640625, -10.8154296875, -10.4066162109375, -9.997802734375, -9.5889892578125, -9.18017578125, -8.7713623046875, -8.362548828125, -7.9537353515625, -7.544921875, -7.1361083984375, -6.727294921875, -6.3184814453125, -5.90966796875, -5.5008544921875, -5.092041015625, -4.6832275390625, -4.2744140625, -3.8656005859375, -3.456787109375, -3.0479736328125, -2.63916015625, -2.2303466796875, -1.821533203125, -1.4127197265625, -1.00390625, -0.5950927734375, -0.186279296875, 0.2225341796875, 0.63134765625, 1.0401611328125, 1.448974609375, 1.8577880859375, 2.2666015625, 2.6754150390625, 3.084228515625, 3.4930419921875, 3.90185546875, 4.3106689453125, 4.719482421875, 5.1282958984375, 5.537109375, 5.9459228515625, 6.354736328125, 6.7635498046875, 7.17236328125, 7.5811767578125, 7.989990234375, 8.3988037109375, 8.8076171875, 9.2164306640625, 9.625244140625, 10.0340576171875, 10.44287109375, 10.8516845703125, 11.260498046875, 11.6693115234375, 12.078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 5.0, 8.0, 14.0, 3.0, 8.0, 8.0, 15.0, 13.0, 22.0, 19.0, 26.0, 29.0, 25.0, 42.0, 35.0, 39.0, 42.0, 34.0, 36.0, 35.0, 47.0, 40.0, 42.0, 45.0, 39.0, 43.0, 43.0, 30.0, 26.0, 28.0, 23.0, 20.0, 15.0, 9.0, 12.0, 18.0, 13.0, 8.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.9296875, -9.596435546875, -9.26318359375, -8.929931640625, -8.5966796875, -8.263427734375, -7.93017578125, -7.596923828125, -7.263671875, -6.930419921875, -6.59716796875, -6.263916015625, -5.9306640625, -5.597412109375, -5.26416015625, -4.930908203125, -4.59765625, -4.264404296875, -3.93115234375, -3.597900390625, -3.2646484375, -2.931396484375, -2.59814453125, -2.264892578125, -1.931640625, -1.598388671875, -1.26513671875, -0.931884765625, -0.5986328125, -0.265380859375, 0.06787109375, 0.401123046875, 0.734375, 1.067626953125, 1.40087890625, 1.734130859375, 2.0673828125, 2.400634765625, 2.73388671875, 3.067138671875, 3.400390625, 3.733642578125, 4.06689453125, 4.400146484375, 4.7333984375, 5.066650390625, 5.39990234375, 5.733154296875, 6.06640625, 6.399658203125, 6.73291015625, 7.066162109375, 7.3994140625, 7.732666015625, 8.06591796875, 8.399169921875, 8.732421875, 9.065673828125, 9.39892578125, 9.732177734375, 10.0654296875, 10.398681640625, 10.73193359375, 11.065185546875, 11.3984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 7.0, 9.0, 15.0, 34.0, 71.0, 158.0, 418.0, 1245.0, 5408.0, 35350.0, 352617.0, 578589.0, 63470.0, 8464.0, 1780.0, 557.0, 193.0, 85.0, 33.0, 17.0, 16.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.234375, -14.8450927734375, -14.455810546875, -14.0665283203125, -13.67724609375, -13.2879638671875, -12.898681640625, -12.5093994140625, -12.1201171875, -11.7308349609375, -11.341552734375, -10.9522705078125, -10.56298828125, -10.1737060546875, -9.784423828125, -9.3951416015625, -9.005859375, -8.6165771484375, -8.227294921875, -7.8380126953125, -7.44873046875, -7.0594482421875, -6.670166015625, -6.2808837890625, -5.8916015625, -5.5023193359375, -5.113037109375, -4.7237548828125, -4.33447265625, -3.9451904296875, -3.555908203125, -3.1666259765625, -2.77734375, -2.3880615234375, -1.998779296875, -1.6094970703125, -1.22021484375, -0.8309326171875, -0.441650390625, -0.0523681640625, 0.3369140625, 0.7261962890625, 1.115478515625, 1.5047607421875, 1.89404296875, 2.2833251953125, 2.672607421875, 3.0618896484375, 3.451171875, 3.8404541015625, 4.229736328125, 4.6190185546875, 5.00830078125, 5.3975830078125, 5.786865234375, 6.1761474609375, 6.5654296875, 6.9547119140625, 7.343994140625, 7.7332763671875, 8.12255859375, 8.5118408203125, 8.901123046875, 9.2904052734375, 9.6796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 12.0, 5.0, 11.0, 10.0, 13.0, 10.0, 23.0, 26.0, 30.0, 37.0, 55.0, 81.0, 112.0, 139.0, 114.0, 80.0, 48.0, 39.0, 38.0, 27.0, 20.0, 12.0, 15.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017251968383789062, -0.0016801655292510986, -0.001635134220123291, -0.0015901029109954834, -0.0015450716018676758, -0.0015000402927398682, -0.0014550089836120605, -0.001409977674484253, -0.0013649463653564453, -0.0013199150562286377, -0.00127488374710083, -0.0012298524379730225, -0.0011848211288452148, -0.0011397898197174072, -0.0010947585105895996, -0.001049727201461792, -0.0010046958923339844, -0.0009596645832061768, -0.0009146332740783691, -0.0008696019649505615, -0.0008245706558227539, -0.0007795393466949463, -0.0007345080375671387, -0.0006894767284393311, -0.0006444454193115234, -0.0005994141101837158, -0.0005543828010559082, -0.0005093514919281006, -0.00046432018280029297, -0.00041928887367248535, -0.00037425756454467773, -0.0003292262554168701, -0.0002841949462890625, -0.00023916363716125488, -0.00019413232803344727, -0.00014910101890563965, -0.00010406970977783203, -5.9038400650024414e-05, -1.4007091522216797e-05, 3.102421760559082e-05, 7.605552673339844e-05, 0.00012108683586120605, 0.00016611814498901367, 0.0002111494541168213, 0.0002561807632446289, 0.0003012120723724365, 0.00034624338150024414, 0.00039127469062805176, 0.0004363059997558594, 0.000481337308883667, 0.0005263686180114746, 0.0005713999271392822, 0.0006164312362670898, 0.0006614625453948975, 0.0007064938545227051, 0.0007515251636505127, 0.0007965564727783203, 0.0008415877819061279, 0.0008866190910339355, 0.0009316504001617432, 0.0009766817092895508, 0.0010217130184173584, 0.001066744327545166, 0.0011117756366729736, 0.0011568069458007812]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 13.0, 21.0, 30.0, 58.0, 102.0, 171.0, 311.0, 640.0, 1673.0, 5375.0, 24355.0, 176053.0, 692659.0, 122014.0, 18249.0, 4204.0, 1332.0, 587.0, 301.0, 158.0, 83.0, 48.0, 38.0, 15.0, 15.0, 7.0, 9.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7890625, -12.39453125, -12.0, -11.60546875, -11.2109375, -10.81640625, -10.421875, -10.02734375, -9.6328125, -9.23828125, -8.84375, -8.44921875, -8.0546875, -7.66015625, -7.265625, -6.87109375, -6.4765625, -6.08203125, -5.6875, -5.29296875, -4.8984375, -4.50390625, -4.109375, -3.71484375, -3.3203125, -2.92578125, -2.53125, -2.13671875, -1.7421875, -1.34765625, -0.953125, -0.55859375, -0.1640625, 0.23046875, 0.625, 1.01953125, 1.4140625, 1.80859375, 2.203125, 2.59765625, 2.9921875, 3.38671875, 3.78125, 4.17578125, 4.5703125, 4.96484375, 5.359375, 5.75390625, 6.1484375, 6.54296875, 6.9375, 7.33203125, 7.7265625, 8.12109375, 8.515625, 8.91015625, 9.3046875, 9.69921875, 10.09375, 10.48828125, 10.8828125, 11.27734375, 11.671875, 12.06640625, 12.4609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 7.0, 13.0, 22.0, 14.0, 32.0, 45.0, 74.0, 87.0, 120.0, 137.0, 125.0, 85.0, 53.0, 50.0, 46.0, 18.0, 19.0, 9.0, 13.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.39794921875, -6.1474609375, -5.89697265625, -5.646484375, -5.39599609375, -5.1455078125, -4.89501953125, -4.64453125, -4.39404296875, -4.1435546875, -3.89306640625, -3.642578125, -3.39208984375, -3.1416015625, -2.89111328125, -2.640625, -2.39013671875, -2.1396484375, -1.88916015625, -1.638671875, -1.38818359375, -1.1376953125, -0.88720703125, -0.63671875, -0.38623046875, -0.1357421875, 0.11474609375, 0.365234375, 0.61572265625, 0.8662109375, 1.11669921875, 1.3671875, 1.61767578125, 1.8681640625, 2.11865234375, 2.369140625, 2.61962890625, 2.8701171875, 3.12060546875, 3.37109375, 3.62158203125, 3.8720703125, 4.12255859375, 4.373046875, 4.62353515625, 4.8740234375, 5.12451171875, 5.375, 5.62548828125, 5.8759765625, 6.12646484375, 6.376953125, 6.62744140625, 6.8779296875, 7.12841796875, 7.37890625, 7.62939453125, 7.8798828125, 8.13037109375, 8.380859375, 8.63134765625, 8.8818359375, 9.13232421875, 9.3828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 18.0, 23.0, 45.0, 83.0, 143.0, 172.0, 170.0, 148.0, 90.0, 42.0, 32.0, 13.0, 8.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.83692932128906, -137.397705078125, -132.95849609375, -128.51927185058594, -124.08004760742188, -119.64082336425781, -115.20160675048828, -110.76239013671875, -106.32316589355469, -101.88394165039062, -97.4447250366211, -93.00550842285156, -88.5662841796875, -84.12705993652344, -79.6878433227539, -75.24862670898438, -70.80940246582031, -66.37017822265625, -61.93096160888672, -57.49174118041992, -53.052520751953125, -48.61330032348633, -44.17407989501953, -39.734859466552734, -35.29563903808594, -30.85641860961914, -26.417198181152344, -21.977977752685547, -17.53875732421875, -13.099536895751953, -8.660316467285156, -4.221096038818359, 0.2181396484375, 4.657360076904297, 9.096580505371094, 13.53580093383789, 17.975021362304688, 22.414241790771484, 26.85346221923828, 31.292682647705078, 35.731903076171875, 40.17112350463867, 44.61034393310547, 49.049564361572266, 53.48878479003906, 57.92800521850586, 62.367225646972656, 66.80644226074219, 71.24566650390625, 75.68489074707031, 80.12410736083984, 84.56332397460938, 89.00254821777344, 93.4417724609375, 97.88098907470703, 102.32020568847656, 106.75942993164062, 111.19865417480469, 115.63787078857422, 120.07708740234375, 124.51631164550781, 128.95553588867188, 133.39474487304688, 137.83396911621094, 142.273193359375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 9.0, 8.0, 5.0, 9.0, 12.0, 7.0, 17.0, 24.0, 31.0, 19.0, 31.0, 35.0, 23.0, 39.0, 23.0, 40.0, 42.0, 37.0, 37.0, 37.0, 43.0, 43.0, 55.0, 53.0, 26.0, 41.0, 33.0, 29.0, 24.0, 36.0, 23.0, 14.0, 9.0, 23.0, 10.0, 9.0, 6.0, 2.0, 2.0, 7.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.4637451171875, -53.53178405761719, -51.599822998046875, -49.66786193847656, -47.73590087890625, -45.80393981933594, -43.871978759765625, -41.94002151489258, -40.008060455322266, -38.07609939575195, -36.14413833618164, -34.21217727661133, -32.280216217041016, -30.348257064819336, -28.416296005249023, -26.484336853027344, -24.5523738861084, -22.620412826538086, -20.688451766967773, -18.756492614746094, -16.82453155517578, -14.892570495605469, -12.960609436035156, -11.02864933013916, -9.096688270568848, -7.164727687835693, -5.232767105102539, -3.3008060455322266, -1.3688454627990723, 0.563115119934082, 2.4950761795043945, 4.427036285400391, 6.358997344970703, 8.290958404541016, 10.222918510437012, 12.154879570007324, 14.08683967590332, 16.018800735473633, 17.950761795043945, 19.882720947265625, 21.814682006835938, 23.74664306640625, 25.678604125976562, 27.610565185546875, 29.542524337768555, 31.474485397338867, 33.40644836425781, 35.33840560913086, 37.27037048339844, 39.20233154296875, 41.13429260253906, 43.066253662109375, 44.99821472167969, 46.93017578125, 48.86213684082031, 50.79409408569336, 52.72605514526367, 54.658016204833984, 56.5899772644043, 58.52193832397461, 60.45389938354492, 62.38585662841797, 64.31781768798828, 66.2497787475586, 68.1817398071289]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 12.0, 17.0, 25.0, 32.0, 49.0, 81.0, 110.0, 154.0, 282.0, 457.0, 761.0, 1406.0, 2593.0, 5568.0, 12903.0, 35093.0, 125368.0, 1723787.0, 2093684.0, 130645.0, 36169.0, 13395.0, 5666.0, 2835.0, 1333.0, 727.0, 419.0, 254.0, 162.0, 99.0, 55.0, 37.0, 27.0, 27.0, 14.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.3984375, -14.9708251953125, -14.543212890625, -14.1156005859375, -13.68798828125, -13.2603759765625, -12.832763671875, -12.4051513671875, -11.9775390625, -11.5499267578125, -11.122314453125, -10.6947021484375, -10.26708984375, -9.8394775390625, -9.411865234375, -8.9842529296875, -8.556640625, -8.1290283203125, -7.701416015625, -7.2738037109375, -6.84619140625, -6.4185791015625, -5.990966796875, -5.5633544921875, -5.1357421875, -4.7081298828125, -4.280517578125, -3.8529052734375, -3.42529296875, -2.9976806640625, -2.570068359375, -2.1424560546875, -1.71484375, -1.2872314453125, -0.859619140625, -0.4320068359375, -0.00439453125, 0.4232177734375, 0.850830078125, 1.2784423828125, 1.7060546875, 2.1336669921875, 2.561279296875, 2.9888916015625, 3.41650390625, 3.8441162109375, 4.271728515625, 4.6993408203125, 5.126953125, 5.5545654296875, 5.982177734375, 6.4097900390625, 6.83740234375, 7.2650146484375, 7.692626953125, 8.1202392578125, 8.5478515625, 8.9754638671875, 9.403076171875, 9.8306884765625, 10.25830078125, 10.6859130859375, 11.113525390625, 11.5411376953125, 11.96875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 14.0, 23.0, 30.0, 25.0, 36.0, 38.0, 53.0, 53.0, 44.0, 43.0, 69.0, 60.0, 69.0, 66.0, 43.0, 68.0, 50.0, 43.0, 34.0, 36.0, 22.0, 22.0, 7.0, 7.0, 7.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-4.078125, -3.977630615234375, -3.87713623046875, -3.776641845703125, -3.6761474609375, -3.575653076171875, -3.47515869140625, -3.374664306640625, -3.274169921875, -3.173675537109375, -3.07318115234375, -2.972686767578125, -2.8721923828125, -2.771697998046875, -2.67120361328125, -2.570709228515625, -2.47021484375, -2.369720458984375, -2.26922607421875, -2.168731689453125, -2.0682373046875, -1.967742919921875, -1.86724853515625, -1.766754150390625, -1.666259765625, -1.565765380859375, -1.46527099609375, -1.364776611328125, -1.2642822265625, -1.163787841796875, -1.06329345703125, -0.962799072265625, -0.8623046875, -0.761810302734375, -0.66131591796875, -0.560821533203125, -0.4603271484375, -0.359832763671875, -0.25933837890625, -0.158843994140625, -0.058349609375, 0.042144775390625, 0.14263916015625, 0.243133544921875, 0.3436279296875, 0.444122314453125, 0.54461669921875, 0.645111083984375, 0.74560546875, 0.846099853515625, 0.94659423828125, 1.047088623046875, 1.1475830078125, 1.248077392578125, 1.34857177734375, 1.449066162109375, 1.549560546875, 1.650054931640625, 1.75054931640625, 1.851043701171875, 1.9515380859375, 2.052032470703125, 2.15252685546875, 2.253021240234375, 2.353515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 4.0, 7.0, 9.0, 12.0, 15.0, 16.0, 27.0, 51.0, 70.0, 100.0, 149.0, 251.0, 367.0, 586.0, 1117.0, 1921.0, 3581.0, 7316.0, 16553.0, 43002.0, 141856.0, 786028.0, 2722212.0, 335258.0, 82095.0, 28064.0, 11524.0, 5522.0, 2819.0, 1442.0, 898.0, 463.0, 343.0, 177.0, 120.0, 86.0, 63.0, 44.0, 37.0, 22.0, 17.0, 12.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.6953125, -12.33544921875, -11.9755859375, -11.61572265625, -11.255859375, -10.89599609375, -10.5361328125, -10.17626953125, -9.81640625, -9.45654296875, -9.0966796875, -8.73681640625, -8.376953125, -8.01708984375, -7.6572265625, -7.29736328125, -6.9375, -6.57763671875, -6.2177734375, -5.85791015625, -5.498046875, -5.13818359375, -4.7783203125, -4.41845703125, -4.05859375, -3.69873046875, -3.3388671875, -2.97900390625, -2.619140625, -2.25927734375, -1.8994140625, -1.53955078125, -1.1796875, -0.81982421875, -0.4599609375, -0.10009765625, 0.259765625, 0.61962890625, 0.9794921875, 1.33935546875, 1.69921875, 2.05908203125, 2.4189453125, 2.77880859375, 3.138671875, 3.49853515625, 3.8583984375, 4.21826171875, 4.578125, 4.93798828125, 5.2978515625, 5.65771484375, 6.017578125, 6.37744140625, 6.7373046875, 7.09716796875, 7.45703125, 7.81689453125, 8.1767578125, 8.53662109375, 8.896484375, 9.25634765625, 9.6162109375, 9.97607421875, 10.3359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 8.0, 8.0, 10.0, 15.0, 14.0, 24.0, 48.0, 73.0, 85.0, 143.0, 245.0, 482.0, 1189.0, 738.0, 365.0, 205.0, 131.0, 82.0, 45.0, 33.0, 22.0, 25.0, 22.0, 13.0, 4.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.72991943359375, -4.5457763671875, -4.36163330078125, -4.177490234375, -3.99334716796875, -3.8092041015625, -3.62506103515625, -3.44091796875, -3.25677490234375, -3.0726318359375, -2.88848876953125, -2.704345703125, -2.52020263671875, -2.3360595703125, -2.15191650390625, -1.9677734375, -1.78363037109375, -1.5994873046875, -1.41534423828125, -1.231201171875, -1.04705810546875, -0.8629150390625, -0.67877197265625, -0.49462890625, -0.31048583984375, -0.1263427734375, 0.05780029296875, 0.241943359375, 0.42608642578125, 0.6102294921875, 0.79437255859375, 0.978515625, 1.16265869140625, 1.3468017578125, 1.53094482421875, 1.715087890625, 1.89923095703125, 2.0833740234375, 2.26751708984375, 2.45166015625, 2.63580322265625, 2.8199462890625, 3.00408935546875, 3.188232421875, 3.37237548828125, 3.5565185546875, 3.74066162109375, 3.9248046875, 4.10894775390625, 4.2930908203125, 4.47723388671875, 4.661376953125, 4.84552001953125, 5.0296630859375, 5.21380615234375, 5.39794921875, 5.58209228515625, 5.7662353515625, 5.95037841796875, 6.134521484375, 6.31866455078125, 6.5028076171875, 6.68695068359375, 6.87109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 9.0, 14.0, 15.0, 24.0, 52.0, 84.0, 79.0, 127.0, 145.0, 105.0, 100.0, 79.0, 61.0, 46.0, 29.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.97651290893555, -38.51361083984375, -37.05070877075195, -35.587806701660156, -34.12490463256836, -32.66200256347656, -31.199098587036133, -29.736196517944336, -28.27329444885254, -26.810392379760742, -25.347490310668945, -23.884586334228516, -22.42168426513672, -20.958782196044922, -19.495880126953125, -18.032978057861328, -16.57007598876953, -15.107173919677734, -13.644271850585938, -12.181368827819824, -10.718466758728027, -9.25556468963623, -7.792661666870117, -6.32975959777832, -4.866857528686523, -3.4039552211761475, -1.9410529136657715, -0.4781503677368164, 0.9847517013549805, 2.4476537704467773, 3.9105567932128906, 5.3734588623046875, 6.836357116699219, 8.299259185791016, 9.762161254882812, 11.225064277648926, 12.687966346740723, 14.15086841583252, 15.613771438598633, 17.07667350769043, 18.539575576782227, 20.002477645874023, 21.46537971496582, 22.92828369140625, 24.391185760498047, 25.854087829589844, 27.31698989868164, 28.779891967773438, 30.242794036865234, 31.70569610595703, 33.16859817504883, 34.631500244140625, 36.09440231323242, 37.55730438232422, 39.02021026611328, 40.48310852050781, 41.946014404296875, 43.40891647338867, 44.87181854248047, 46.334720611572266, 47.79762268066406, 49.26052474975586, 50.723426818847656, 52.18633270263672, 53.64923095703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 2.0, 5.0, 13.0, 12.0, 18.0, 11.0, 18.0, 20.0, 21.0, 28.0, 22.0, 27.0, 34.0, 34.0, 33.0, 43.0, 46.0, 35.0, 47.0, 50.0, 40.0, 40.0, 42.0, 25.0, 42.0, 31.0, 25.0, 32.0, 20.0, 28.0, 24.0, 26.0, 13.0, 14.0, 14.0, 8.0, 15.0, 5.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.687936782836914, -20.018146514892578, -19.348358154296875, -18.67856788635254, -18.008777618408203, -17.338987350463867, -16.66919708251953, -15.999408721923828, -15.329618453979492, -14.659828186035156, -13.990038871765137, -13.320249557495117, -12.650459289550781, -11.980669021606445, -11.310879707336426, -10.641090393066406, -9.97130012512207, -9.301509857177734, -8.631720542907715, -7.961930751800537, -7.292140960693359, -6.622351169586182, -5.952561378479004, -5.282771587371826, -4.612981796264648, -3.9431920051574707, -3.273402214050293, -2.6036124229431152, -1.9338226318359375, -1.2640328407287598, -0.594243049621582, 0.0755467414855957, 0.7453384399414062, 1.415128231048584, 2.0849180221557617, 2.7547078132629395, 3.424497604370117, 4.094287395477295, 4.764077186584473, 5.43386697769165, 6.103656768798828, 6.773446559906006, 7.443236351013184, 8.113025665283203, 8.782815933227539, 9.452606201171875, 10.122395515441895, 10.792184829711914, 11.46197509765625, 12.131765365600586, 12.801554679870605, 13.471343994140625, 14.141134262084961, 14.810924530029297, 15.480713844299316, 16.150503158569336, 16.820293426513672, 17.490083694458008, 18.159873962402344, 18.829662322998047, 19.499452590942383, 20.16924285888672, 20.839031219482422, 21.508821487426758, 22.178611755371094]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 8.0, 9.0, 5.0, 13.0, 26.0, 38.0, 51.0, 97.0, 154.0, 242.0, 492.0, 880.0, 2094.0, 5065.0, 13942.0, 41274.0, 121938.0, 352358.0, 334496.0, 114642.0, 38907.0, 13304.0, 4694.0, 1891.0, 876.0, 433.0, 234.0, 139.0, 100.0, 59.0, 32.0, 22.0, 16.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.17919921875, -14.6552734375, -14.13134765625, -13.607421875, -13.08349609375, -12.5595703125, -12.03564453125, -11.51171875, -10.98779296875, -10.4638671875, -9.93994140625, -9.416015625, -8.89208984375, -8.3681640625, -7.84423828125, -7.3203125, -6.79638671875, -6.2724609375, -5.74853515625, -5.224609375, -4.70068359375, -4.1767578125, -3.65283203125, -3.12890625, -2.60498046875, -2.0810546875, -1.55712890625, -1.033203125, -0.50927734375, 0.0146484375, 0.53857421875, 1.0625, 1.58642578125, 2.1103515625, 2.63427734375, 3.158203125, 3.68212890625, 4.2060546875, 4.72998046875, 5.25390625, 5.77783203125, 6.3017578125, 6.82568359375, 7.349609375, 7.87353515625, 8.3974609375, 8.92138671875, 9.4453125, 9.96923828125, 10.4931640625, 11.01708984375, 11.541015625, 12.06494140625, 12.5888671875, 13.11279296875, 13.63671875, 14.16064453125, 14.6845703125, 15.20849609375, 15.732421875, 16.25634765625, 16.7802734375, 17.30419921875, 17.828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 11.0, 18.0, 26.0, 25.0, 17.0, 33.0, 52.0, 58.0, 50.0, 57.0, 68.0, 56.0, 80.0, 63.0, 59.0, 62.0, 47.0, 50.0, 37.0, 29.0, 29.0, 19.0, 15.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.359375, -4.253326416015625, -4.14727783203125, -4.041229248046875, -3.9351806640625, -3.829132080078125, -3.72308349609375, -3.617034912109375, -3.510986328125, -3.404937744140625, -3.29888916015625, -3.192840576171875, -3.0867919921875, -2.980743408203125, -2.87469482421875, -2.768646240234375, -2.66259765625, -2.556549072265625, -2.45050048828125, -2.344451904296875, -2.2384033203125, -2.132354736328125, -2.02630615234375, -1.920257568359375, -1.814208984375, -1.708160400390625, -1.60211181640625, -1.496063232421875, -1.3900146484375, -1.283966064453125, -1.17791748046875, -1.071868896484375, -0.9658203125, -0.859771728515625, -0.75372314453125, -0.647674560546875, -0.5416259765625, -0.435577392578125, -0.32952880859375, -0.223480224609375, -0.117431640625, -0.011383056640625, 0.09466552734375, 0.200714111328125, 0.3067626953125, 0.412811279296875, 0.51885986328125, 0.624908447265625, 0.73095703125, 0.837005615234375, 0.94305419921875, 1.049102783203125, 1.1551513671875, 1.261199951171875, 1.36724853515625, 1.473297119140625, 1.579345703125, 1.685394287109375, 1.79144287109375, 1.897491455078125, 2.0035400390625, 2.109588623046875, 2.21563720703125, 2.321685791015625, 2.427734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 10.0, 16.0, 22.0, 37.0, 75.0, 99.0, 147.0, 240.0, 458.0, 980.0, 2232.0, 5597.0, 14792.0, 44471.0, 141750.0, 418010.0, 285664.0, 88680.0, 28558.0, 9949.0, 3676.0, 1497.0, 727.0, 350.0, 195.0, 118.0, 64.0, 36.0, 19.0, 23.0, 13.0, 12.0, 10.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.171875, -13.6962890625, -13.220703125, -12.7451171875, -12.26953125, -11.7939453125, -11.318359375, -10.8427734375, -10.3671875, -9.8916015625, -9.416015625, -8.9404296875, -8.46484375, -7.9892578125, -7.513671875, -7.0380859375, -6.5625, -6.0869140625, -5.611328125, -5.1357421875, -4.66015625, -4.1845703125, -3.708984375, -3.2333984375, -2.7578125, -2.2822265625, -1.806640625, -1.3310546875, -0.85546875, -0.3798828125, 0.095703125, 0.5712890625, 1.046875, 1.5224609375, 1.998046875, 2.4736328125, 2.94921875, 3.4248046875, 3.900390625, 4.3759765625, 4.8515625, 5.3271484375, 5.802734375, 6.2783203125, 6.75390625, 7.2294921875, 7.705078125, 8.1806640625, 8.65625, 9.1318359375, 9.607421875, 10.0830078125, 10.55859375, 11.0341796875, 11.509765625, 11.9853515625, 12.4609375, 12.9365234375, 13.412109375, 13.8876953125, 14.36328125, 14.8388671875, 15.314453125, 15.7900390625, 16.265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 9.0, 10.0, 15.0, 16.0, 16.0, 20.0, 12.0, 16.0, 25.0, 24.0, 29.0, 26.0, 36.0, 31.0, 28.0, 43.0, 51.0, 34.0, 51.0, 31.0, 42.0, 43.0, 38.0, 31.0, 37.0, 38.0, 33.0, 28.0, 29.0, 22.0, 22.0, 9.0, 11.0, 13.0, 14.0, 11.0, 12.0, 2.0, 8.0, 7.0, 1.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.046875, -10.710205078125, -10.37353515625, -10.036865234375, -9.7001953125, -9.363525390625, -9.02685546875, -8.690185546875, -8.353515625, -8.016845703125, -7.68017578125, -7.343505859375, -7.0068359375, -6.670166015625, -6.33349609375, -5.996826171875, -5.66015625, -5.323486328125, -4.98681640625, -4.650146484375, -4.3134765625, -3.976806640625, -3.64013671875, -3.303466796875, -2.966796875, -2.630126953125, -2.29345703125, -1.956787109375, -1.6201171875, -1.283447265625, -0.94677734375, -0.610107421875, -0.2734375, 0.063232421875, 0.39990234375, 0.736572265625, 1.0732421875, 1.409912109375, 1.74658203125, 2.083251953125, 2.419921875, 2.756591796875, 3.09326171875, 3.429931640625, 3.7666015625, 4.103271484375, 4.43994140625, 4.776611328125, 5.11328125, 5.449951171875, 5.78662109375, 6.123291015625, 6.4599609375, 6.796630859375, 7.13330078125, 7.469970703125, 7.806640625, 8.143310546875, 8.47998046875, 8.816650390625, 9.1533203125, 9.489990234375, 9.82666015625, 10.163330078125, 10.5]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 7.0, 8.0, 15.0, 25.0, 37.0, 74.0, 123.0, 284.0, 855.0, 3396.0, 20196.0, 212573.0, 723437.0, 75395.0, 9305.0, 1799.0, 539.0, 205.0, 90.0, 56.0, 43.0, 28.0, 8.0, 12.0, 8.0, 2.0, 5.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.2576904296875, -11.773193359375, -11.2886962890625, -10.80419921875, -10.3197021484375, -9.835205078125, -9.3507080078125, -8.8662109375, -8.3817138671875, -7.897216796875, -7.4127197265625, -6.92822265625, -6.4437255859375, -5.959228515625, -5.4747314453125, -4.990234375, -4.5057373046875, -4.021240234375, -3.5367431640625, -3.05224609375, -2.5677490234375, -2.083251953125, -1.5987548828125, -1.1142578125, -0.6297607421875, -0.145263671875, 0.3392333984375, 0.82373046875, 1.3082275390625, 1.792724609375, 2.2772216796875, 2.76171875, 3.2462158203125, 3.730712890625, 4.2152099609375, 4.69970703125, 5.1842041015625, 5.668701171875, 6.1531982421875, 6.6376953125, 7.1221923828125, 7.606689453125, 8.0911865234375, 8.57568359375, 9.0601806640625, 9.544677734375, 10.0291748046875, 10.513671875, 10.9981689453125, 11.482666015625, 11.9671630859375, 12.45166015625, 12.9361572265625, 13.420654296875, 13.9051513671875, 14.3896484375, 14.8741455078125, 15.358642578125, 15.8431396484375, 16.32763671875, 16.8121337890625, 17.296630859375, 17.7811279296875, 18.265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 9.0, 1.0, 2.0, 10.0, 10.0, 15.0, 18.0, 22.0, 19.0, 28.0, 27.0, 46.0, 66.0, 105.0, 143.0, 124.0, 99.0, 58.0, 34.0, 31.0, 28.0, 15.0, 15.0, 12.0, 8.0, 14.0, 5.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012731552124023438, -0.0012291669845581055, -0.0011851787567138672, -0.001141190528869629, -0.0010972023010253906, -0.0010532140731811523, -0.001009225845336914, -0.0009652376174926758, -0.0009212493896484375, -0.0008772611618041992, -0.0008332729339599609, -0.0007892847061157227, -0.0007452964782714844, -0.0007013082504272461, -0.0006573200225830078, -0.0006133317947387695, -0.0005693435668945312, -0.000525355339050293, -0.0004813671112060547, -0.0004373788833618164, -0.0003933906555175781, -0.00034940242767333984, -0.00030541419982910156, -0.0002614259719848633, -0.000217437744140625, -0.00017344951629638672, -0.00012946128845214844, -8.547306060791016e-05, -4.1484832763671875e-05, 2.5033950805664062e-06, 4.649162292480469e-05, 9.047985076904297e-05, 0.00013446807861328125, 0.00017845630645751953, 0.0002224445343017578, 0.0002664327621459961, 0.0003104209899902344, 0.00035440921783447266, 0.00039839744567871094, 0.0004423856735229492, 0.0004863739013671875, 0.0005303621292114258, 0.0005743503570556641, 0.0006183385848999023, 0.0006623268127441406, 0.0007063150405883789, 0.0007503032684326172, 0.0007942914962768555, 0.0008382797241210938, 0.000882267951965332, 0.0009262561798095703, 0.0009702444076538086, 0.0010142326354980469, 0.0010582208633422852, 0.0011022090911865234, 0.0011461973190307617, 0.001190185546875, 0.0012341737747192383, 0.0012781620025634766, 0.0013221502304077148, 0.0013661384582519531, 0.0014101266860961914, 0.0014541149139404297, 0.001498103141784668, 0.0015420913696289062]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 12.0, 10.0, 13.0, 25.0, 16.0, 42.0, 47.0, 56.0, 97.0, 169.0, 252.0, 433.0, 748.0, 1327.0, 3027.0, 7764.0, 24759.0, 109996.0, 556113.0, 271184.0, 49894.0, 13200.0, 4834.0, 2058.0, 1002.0, 548.0, 295.0, 190.0, 123.0, 101.0, 65.0, 45.0, 32.0, 19.0, 15.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.9296875, -8.6295166015625, -8.329345703125, -8.0291748046875, -7.72900390625, -7.4288330078125, -7.128662109375, -6.8284912109375, -6.5283203125, -6.2281494140625, -5.927978515625, -5.6278076171875, -5.32763671875, -5.0274658203125, -4.727294921875, -4.4271240234375, -4.126953125, -3.8267822265625, -3.526611328125, -3.2264404296875, -2.92626953125, -2.6260986328125, -2.325927734375, -2.0257568359375, -1.7255859375, -1.4254150390625, -1.125244140625, -0.8250732421875, -0.52490234375, -0.2247314453125, 0.075439453125, 0.3756103515625, 0.67578125, 0.9759521484375, 1.276123046875, 1.5762939453125, 1.87646484375, 2.1766357421875, 2.476806640625, 2.7769775390625, 3.0771484375, 3.3773193359375, 3.677490234375, 3.9776611328125, 4.27783203125, 4.5780029296875, 4.878173828125, 5.1783447265625, 5.478515625, 5.7786865234375, 6.078857421875, 6.3790283203125, 6.67919921875, 6.9793701171875, 7.279541015625, 7.5797119140625, 7.8798828125, 8.1800537109375, 8.480224609375, 8.7803955078125, 9.08056640625, 9.3807373046875, 9.680908203125, 9.9810791015625, 10.28125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 10.0, 22.0, 44.0, 67.0, 84.0, 129.0, 185.0, 142.0, 92.0, 65.0, 48.0, 29.0, 17.0, 9.0, 7.0, 8.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0228271484375, -7.709716796875, -7.3966064453125, -7.08349609375, -6.7703857421875, -6.457275390625, -6.1441650390625, -5.8310546875, -5.5179443359375, -5.204833984375, -4.8917236328125, -4.57861328125, -4.2655029296875, -3.952392578125, -3.6392822265625, -3.326171875, -3.0130615234375, -2.699951171875, -2.3868408203125, -2.07373046875, -1.7606201171875, -1.447509765625, -1.1343994140625, -0.8212890625, -0.5081787109375, -0.195068359375, 0.1180419921875, 0.43115234375, 0.7442626953125, 1.057373046875, 1.3704833984375, 1.68359375, 1.9967041015625, 2.309814453125, 2.6229248046875, 2.93603515625, 3.2491455078125, 3.562255859375, 3.8753662109375, 4.1884765625, 4.5015869140625, 4.814697265625, 5.1278076171875, 5.44091796875, 5.7540283203125, 6.067138671875, 6.3802490234375, 6.693359375, 7.0064697265625, 7.319580078125, 7.6326904296875, 7.94580078125, 8.2589111328125, 8.572021484375, 8.8851318359375, 9.1982421875, 9.5113525390625, 9.824462890625, 10.1375732421875, 10.45068359375, 10.7637939453125, 11.076904296875, 11.3900146484375, 11.703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 9.0, 12.0, 13.0, 27.0, 36.0, 54.0, 60.0, 88.0, 106.0, 111.0, 93.0, 100.0, 86.0, 55.0, 47.0, 30.0, 26.0, 13.0, 12.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-106.55751037597656, -103.81463623046875, -101.07176971435547, -98.32889556884766, -95.58602142333984, -92.84314727783203, -90.10028076171875, -87.35740661621094, -84.61453247070312, -81.87165832519531, -79.12879180908203, -76.38591766357422, -73.6430435180664, -70.9001693725586, -68.15730285644531, -65.4144287109375, -62.67155838012695, -59.928688049316406, -57.185813903808594, -54.44294357299805, -51.700069427490234, -48.95719909667969, -46.214324951171875, -43.47145462036133, -40.72858428955078, -37.985713958740234, -35.24283981323242, -32.499969482421875, -29.757095336914062, -27.014225006103516, -24.271352767944336, -21.528480529785156, -18.785606384277344, -16.042734146118164, -13.299861907958984, -10.556990623474121, -7.814118385314941, -5.071246147155762, -2.3283748626708984, 0.41449737548828125, 3.157369613647461, 5.900241851806641, 8.64311408996582, 11.385985374450684, 14.128857612609863, 16.87173080444336, 19.614601135253906, 22.357473373413086, 25.100345611572266, 27.843217849731445, 30.586090087890625, 33.32896041870117, 36.071834564208984, 38.81470489501953, 41.557579040527344, 44.30044937133789, 47.04331970214844, 49.786190032958984, 52.5290641784668, 55.271934509277344, 58.014808654785156, 60.7576789855957, 63.50054931640625, 66.24342346191406, 68.98629760742188]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 1.0, 4.0, 6.0, 9.0, 13.0, 16.0, 17.0, 14.0, 20.0, 16.0, 23.0, 30.0, 36.0, 40.0, 26.0, 35.0, 44.0, 45.0, 29.0, 45.0, 44.0, 43.0, 40.0, 53.0, 37.0, 46.0, 37.0, 30.0, 32.0, 25.0, 30.0, 16.0, 18.0, 14.0, 14.0, 6.0, 9.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0], "bins": [-68.12063598632812, -66.09707641601562, -64.07352447509766, -62.04996871948242, -60.02641296386719, -58.00285720825195, -55.97930145263672, -53.95574188232422, -51.93218994140625, -49.908634185791016, -47.88507843017578, -45.86152267456055, -43.83796691894531, -41.81441116333008, -39.790855407714844, -37.767295837402344, -35.74374008178711, -33.720184326171875, -31.69662857055664, -29.673072814941406, -27.649517059326172, -25.625961303710938, -23.60240364074707, -21.578847885131836, -19.5552921295166, -17.531736373901367, -15.508180618286133, -13.484623908996582, -11.461068153381348, -9.437512397766113, -7.4139556884765625, -5.390399932861328, -3.3668479919433594, -1.343291997909546, 0.6802639961242676, 2.70382022857666, 4.7273759841918945, 6.750931739807129, 8.77448844909668, 10.798044204711914, 12.821599960327148, 14.845155715942383, 16.868711471557617, 18.892269134521484, 20.91582489013672, 22.939380645751953, 24.962936401367188, 26.986492156982422, 29.010047912597656, 31.03360366821289, 33.057159423828125, 35.08071517944336, 37.104270935058594, 39.12782669067383, 41.15138244628906, 43.17494201660156, 45.19849395751953, 47.222049713134766, 49.24560546875, 51.269161224365234, 53.29271697998047, 55.3162727355957, 57.33982849121094, 59.36338806152344, 61.38694381713867]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 4.0, 8.0, 11.0, 13.0, 28.0, 29.0, 33.0, 71.0, 85.0, 134.0, 167.0, 318.0, 403.0, 653.0, 1147.0, 2001.0, 3910.0, 8254.0, 20065.0, 63135.0, 375856.0, 3457425.0, 188854.0, 43184.0, 14821.0, 6223.0, 3153.0, 1662.0, 936.0, 546.0, 390.0, 253.0, 159.0, 103.0, 65.0, 45.0, 41.0, 30.0, 16.0, 11.0, 12.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-13.4921875, -13.1209716796875, -12.749755859375, -12.3785400390625, -12.00732421875, -11.6361083984375, -11.264892578125, -10.8936767578125, -10.5224609375, -10.1512451171875, -9.780029296875, -9.4088134765625, -9.03759765625, -8.6663818359375, -8.295166015625, -7.9239501953125, -7.552734375, -7.1815185546875, -6.810302734375, -6.4390869140625, -6.06787109375, -5.6966552734375, -5.325439453125, -4.9542236328125, -4.5830078125, -4.2117919921875, -3.840576171875, -3.4693603515625, -3.09814453125, -2.7269287109375, -2.355712890625, -1.9844970703125, -1.61328125, -1.2420654296875, -0.870849609375, -0.4996337890625, -0.12841796875, 0.2427978515625, 0.614013671875, 0.9852294921875, 1.3564453125, 1.7276611328125, 2.098876953125, 2.4700927734375, 2.84130859375, 3.2125244140625, 3.583740234375, 3.9549560546875, 4.326171875, 4.6973876953125, 5.068603515625, 5.4398193359375, 5.81103515625, 6.1822509765625, 6.553466796875, 6.9246826171875, 7.2958984375, 7.6671142578125, 8.038330078125, 8.4095458984375, 8.78076171875, 9.1519775390625, 9.523193359375, 9.8944091796875, 10.265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 7.0, 12.0, 16.0, 24.0, 14.0, 29.0, 39.0, 55.0, 55.0, 60.0, 65.0, 65.0, 71.0, 75.0, 50.0, 72.0, 62.0, 51.0, 56.0, 31.0, 21.0, 17.0, 15.0, 11.0, 6.0, 9.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.22900390625, -4.1103515625, -3.99169921875, -3.873046875, -3.75439453125, -3.6357421875, -3.51708984375, -3.3984375, -3.27978515625, -3.1611328125, -3.04248046875, -2.923828125, -2.80517578125, -2.6865234375, -2.56787109375, -2.44921875, -2.33056640625, -2.2119140625, -2.09326171875, -1.974609375, -1.85595703125, -1.7373046875, -1.61865234375, -1.5, -1.38134765625, -1.2626953125, -1.14404296875, -1.025390625, -0.90673828125, -0.7880859375, -0.66943359375, -0.55078125, -0.43212890625, -0.3134765625, -0.19482421875, -0.076171875, 0.04248046875, 0.1611328125, 0.27978515625, 0.3984375, 0.51708984375, 0.6357421875, 0.75439453125, 0.873046875, 0.99169921875, 1.1103515625, 1.22900390625, 1.34765625, 1.46630859375, 1.5849609375, 1.70361328125, 1.822265625, 1.94091796875, 2.0595703125, 2.17822265625, 2.296875, 2.41552734375, 2.5341796875, 2.65283203125, 2.771484375, 2.89013671875, 3.0087890625, 3.12744140625, 3.24609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 14.0, 18.0, 36.0, 75.0, 102.0, 199.0, 348.0, 599.0, 1143.0, 2076.0, 4284.0, 9580.0, 24231.0, 75963.0, 396053.0, 3163475.0, 397384.0, 76263.0, 24317.0, 9574.0, 4111.0, 2075.0, 1045.0, 549.0, 316.0, 180.0, 103.0, 68.0, 36.0, 26.0, 18.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.714599609375, -8.35888671875, -8.003173828125, -7.6474609375, -7.291748046875, -6.93603515625, -6.580322265625, -6.224609375, -5.868896484375, -5.51318359375, -5.157470703125, -4.8017578125, -4.446044921875, -4.09033203125, -3.734619140625, -3.37890625, -3.023193359375, -2.66748046875, -2.311767578125, -1.9560546875, -1.600341796875, -1.24462890625, -0.888916015625, -0.533203125, -0.177490234375, 0.17822265625, 0.533935546875, 0.8896484375, 1.245361328125, 1.60107421875, 1.956787109375, 2.3125, 2.668212890625, 3.02392578125, 3.379638671875, 3.7353515625, 4.091064453125, 4.44677734375, 4.802490234375, 5.158203125, 5.513916015625, 5.86962890625, 6.225341796875, 6.5810546875, 6.936767578125, 7.29248046875, 7.648193359375, 8.00390625, 8.359619140625, 8.71533203125, 9.071044921875, 9.4267578125, 9.782470703125, 10.13818359375, 10.493896484375, 10.849609375, 11.205322265625, 11.56103515625, 11.916748046875, 12.2724609375, 12.628173828125, 12.98388671875, 13.339599609375, 13.6953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 7.0, 5.0, 7.0, 8.0, 12.0, 14.0, 22.0, 22.0, 38.0, 43.0, 86.0, 112.0, 232.0, 379.0, 1095.0, 949.0, 385.0, 234.0, 129.0, 63.0, 62.0, 43.0, 27.0, 8.0, 16.0, 19.0, 11.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.33984375, -4.212005615234375, -4.08416748046875, -3.956329345703125, -3.8284912109375, -3.700653076171875, -3.57281494140625, -3.444976806640625, -3.317138671875, -3.189300537109375, -3.06146240234375, -2.933624267578125, -2.8057861328125, -2.677947998046875, -2.55010986328125, -2.422271728515625, -2.29443359375, -2.166595458984375, -2.03875732421875, -1.910919189453125, -1.7830810546875, -1.655242919921875, -1.52740478515625, -1.399566650390625, -1.271728515625, -1.143890380859375, -1.01605224609375, -0.888214111328125, -0.7603759765625, -0.632537841796875, -0.50469970703125, -0.376861572265625, -0.2490234375, -0.121185302734375, 0.00665283203125, 0.134490966796875, 0.2623291015625, 0.390167236328125, 0.51800537109375, 0.645843505859375, 0.773681640625, 0.901519775390625, 1.02935791015625, 1.157196044921875, 1.2850341796875, 1.412872314453125, 1.54071044921875, 1.668548583984375, 1.79638671875, 1.924224853515625, 2.05206298828125, 2.179901123046875, 2.3077392578125, 2.435577392578125, 2.56341552734375, 2.691253662109375, 2.819091796875, 2.946929931640625, 3.07476806640625, 3.202606201171875, 3.3304443359375, 3.458282470703125, 3.58612060546875, 3.713958740234375, 3.841796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 15.0, 30.0, 39.0, 51.0, 68.0, 80.0, 123.0, 86.0, 109.0, 95.0, 77.0, 71.0, 51.0, 34.0, 17.0, 11.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.805009841918945, -28.969240188598633, -28.13347053527832, -27.297700881958008, -26.461933135986328, -25.626163482666016, -24.790393829345703, -23.95462417602539, -23.118854522705078, -22.283084869384766, -21.447315216064453, -20.61154556274414, -19.775775909423828, -18.940006256103516, -18.104238510131836, -17.268468856811523, -16.43269920349121, -15.596929550170898, -14.761159896850586, -13.92539119720459, -13.089621543884277, -12.253851890563965, -11.418083190917969, -10.582313537597656, -9.746543884277344, -8.910774230957031, -8.075004577636719, -7.239235877990723, -6.40346622467041, -5.567696571350098, -4.731927394866943, -3.896158218383789, -3.0603866577148438, -2.2246172428131104, -1.388847827911377, -0.5530784130096436, 0.28269100189208984, 1.1184606552124023, 1.9542298316955566, 2.789999008178711, 3.6257686614990234, 4.461538314819336, 5.29730749130249, 6.1330766677856445, 6.968846321105957, 7.8046159744262695, 8.640384674072266, 9.476154327392578, 10.31192398071289, 11.147693634033203, 11.983463287353516, 12.819231986999512, 13.655001640319824, 14.490771293640137, 15.326539993286133, 16.162309646606445, 16.998079299926758, 17.83384895324707, 18.669618606567383, 19.505388259887695, 20.341156005859375, 21.176925659179688, 22.0126953125, 22.848464965820312, 23.684234619140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 11.0, 8.0, 10.0, 18.0, 18.0, 20.0, 21.0, 25.0, 34.0, 31.0, 32.0, 37.0, 42.0, 48.0, 61.0, 57.0, 58.0, 62.0, 37.0, 47.0, 45.0, 32.0, 39.0, 40.0, 26.0, 25.0, 18.0, 19.0, 13.0, 12.0, 8.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.24041748046875, -13.703510284423828, -13.166603088378906, -12.629695892333984, -12.092788696289062, -11.55588150024414, -11.018974304199219, -10.482067108154297, -9.945159912109375, -9.408252716064453, -8.871345520019531, -8.33443832397461, -7.7975311279296875, -7.260623931884766, -6.723716735839844, -6.186809539794922, -5.64990234375, -5.112995147705078, -4.576087951660156, -4.039180755615234, -3.5022735595703125, -2.9653663635253906, -2.4284591674804688, -1.8915519714355469, -1.354644775390625, -0.8177375793457031, -0.28083038330078125, 0.2560768127441406, 0.7929840087890625, 1.3298912048339844, 1.8667984008789062, 2.403705596923828, 2.940614700317383, 3.4775218963623047, 4.014429092407227, 4.551336288452148, 5.08824348449707, 5.625150680541992, 6.162057876586914, 6.698965072631836, 7.235872268676758, 7.77277946472168, 8.309686660766602, 8.846593856811523, 9.383501052856445, 9.920408248901367, 10.457315444946289, 10.994222640991211, 11.531129837036133, 12.068037033081055, 12.604944229125977, 13.141851425170898, 13.67875862121582, 14.215665817260742, 14.752573013305664, 15.289480209350586, 15.826387405395508, 16.36329460144043, 16.90020179748535, 17.437108993530273, 17.974016189575195, 18.510923385620117, 19.04783058166504, 19.58473777770996, 20.121644973754883]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 6.0, 7.0, 14.0, 17.0, 22.0, 31.0, 68.0, 72.0, 140.0, 227.0, 360.0, 611.0, 1123.0, 1996.0, 3845.0, 8014.0, 16938.0, 38607.0, 89340.0, 207744.0, 342103.0, 189963.0, 81663.0, 34647.0, 15520.0, 7406.0, 3672.0, 1907.0, 1036.0, 535.0, 324.0, 213.0, 119.0, 95.0, 43.0, 39.0, 28.0, 17.0, 14.0, 9.0, 12.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.2239990234375, -10.799560546875, -10.3751220703125, -9.95068359375, -9.5262451171875, -9.101806640625, -8.6773681640625, -8.2529296875, -7.8284912109375, -7.404052734375, -6.9796142578125, -6.55517578125, -6.1307373046875, -5.706298828125, -5.2818603515625, -4.857421875, -4.4329833984375, -4.008544921875, -3.5841064453125, -3.15966796875, -2.7352294921875, -2.310791015625, -1.8863525390625, -1.4619140625, -1.0374755859375, -0.613037109375, -0.1885986328125, 0.23583984375, 0.6602783203125, 1.084716796875, 1.5091552734375, 1.93359375, 2.3580322265625, 2.782470703125, 3.2069091796875, 3.63134765625, 4.0557861328125, 4.480224609375, 4.9046630859375, 5.3291015625, 5.7535400390625, 6.177978515625, 6.6024169921875, 7.02685546875, 7.4512939453125, 7.875732421875, 8.3001708984375, 8.724609375, 9.1490478515625, 9.573486328125, 9.9979248046875, 10.42236328125, 10.8468017578125, 11.271240234375, 11.6956787109375, 12.1201171875, 12.5445556640625, 12.968994140625, 13.3934326171875, 13.81787109375, 14.2423095703125, 14.666748046875, 15.0911865234375, 15.515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 14.0, 16.0, 23.0, 22.0, 30.0, 46.0, 47.0, 66.0, 44.0, 57.0, 71.0, 61.0, 54.0, 64.0, 65.0, 45.0, 43.0, 40.0, 40.0, 43.0, 21.0, 21.0, 9.0, 7.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.880859375, -3.774993896484375, -3.66912841796875, -3.563262939453125, -3.4573974609375, -3.351531982421875, -3.24566650390625, -3.139801025390625, -3.033935546875, -2.928070068359375, -2.82220458984375, -2.716339111328125, -2.6104736328125, -2.504608154296875, -2.39874267578125, -2.292877197265625, -2.18701171875, -2.081146240234375, -1.97528076171875, -1.869415283203125, -1.7635498046875, -1.657684326171875, -1.55181884765625, -1.445953369140625, -1.340087890625, -1.234222412109375, -1.12835693359375, -1.022491455078125, -0.9166259765625, -0.810760498046875, -0.70489501953125, -0.599029541015625, -0.4931640625, -0.387298583984375, -0.28143310546875, -0.175567626953125, -0.0697021484375, 0.036163330078125, 0.14202880859375, 0.247894287109375, 0.353759765625, 0.459625244140625, 0.56549072265625, 0.671356201171875, 0.7772216796875, 0.883087158203125, 0.98895263671875, 1.094818115234375, 1.20068359375, 1.306549072265625, 1.41241455078125, 1.518280029296875, 1.6241455078125, 1.730010986328125, 1.83587646484375, 1.941741943359375, 2.047607421875, 2.153472900390625, 2.25933837890625, 2.365203857421875, 2.4710693359375, 2.576934814453125, 2.68280029296875, 2.788665771484375, 2.89453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 17.0, 16.0, 36.0, 28.0, 61.0, 73.0, 98.0, 140.0, 217.0, 321.0, 454.0, 747.0, 1342.0, 2774.0, 6107.0, 15375.0, 42155.0, 117616.0, 306314.0, 339077.0, 135212.0, 48844.0, 17542.0, 6911.0, 3090.0, 1544.0, 803.0, 472.0, 361.0, 220.0, 173.0, 107.0, 76.0, 51.0, 36.0, 32.0, 15.0, 24.0, 11.0, 13.0, 8.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.546875, -12.16748046875, -11.7880859375, -11.40869140625, -11.029296875, -10.64990234375, -10.2705078125, -9.89111328125, -9.51171875, -9.13232421875, -8.7529296875, -8.37353515625, -7.994140625, -7.61474609375, -7.2353515625, -6.85595703125, -6.4765625, -6.09716796875, -5.7177734375, -5.33837890625, -4.958984375, -4.57958984375, -4.2001953125, -3.82080078125, -3.44140625, -3.06201171875, -2.6826171875, -2.30322265625, -1.923828125, -1.54443359375, -1.1650390625, -0.78564453125, -0.40625, -0.02685546875, 0.3525390625, 0.73193359375, 1.111328125, 1.49072265625, 1.8701171875, 2.24951171875, 2.62890625, 3.00830078125, 3.3876953125, 3.76708984375, 4.146484375, 4.52587890625, 4.9052734375, 5.28466796875, 5.6640625, 6.04345703125, 6.4228515625, 6.80224609375, 7.181640625, 7.56103515625, 7.9404296875, 8.31982421875, 8.69921875, 9.07861328125, 9.4580078125, 9.83740234375, 10.216796875, 10.59619140625, 10.9755859375, 11.35498046875, 11.734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 14.0, 21.0, 37.0, 31.0, 40.0, 37.0, 50.0, 56.0, 50.0, 56.0, 53.0, 51.0, 55.0, 46.0, 50.0, 48.0, 34.0, 43.0, 30.0, 29.0, 22.0, 21.0, 18.0, 9.0, 15.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.726318359375, -11.30419921875, -10.882080078125, -10.4599609375, -10.037841796875, -9.61572265625, -9.193603515625, -8.771484375, -8.349365234375, -7.92724609375, -7.505126953125, -7.0830078125, -6.660888671875, -6.23876953125, -5.816650390625, -5.39453125, -4.972412109375, -4.55029296875, -4.128173828125, -3.7060546875, -3.283935546875, -2.86181640625, -2.439697265625, -2.017578125, -1.595458984375, -1.17333984375, -0.751220703125, -0.3291015625, 0.093017578125, 0.51513671875, 0.937255859375, 1.359375, 1.781494140625, 2.20361328125, 2.625732421875, 3.0478515625, 3.469970703125, 3.89208984375, 4.314208984375, 4.736328125, 5.158447265625, 5.58056640625, 6.002685546875, 6.4248046875, 6.846923828125, 7.26904296875, 7.691162109375, 8.11328125, 8.535400390625, 8.95751953125, 9.379638671875, 9.8017578125, 10.223876953125, 10.64599609375, 11.068115234375, 11.490234375, 11.912353515625, 12.33447265625, 12.756591796875, 13.1787109375, 13.600830078125, 14.02294921875, 14.445068359375, 14.8671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 12.0, 23.0, 19.0, 36.0, 75.0, 93.0, 154.0, 269.0, 494.0, 850.0, 1561.0, 3162.0, 6846.0, 16054.0, 46628.0, 172638.0, 485599.0, 222194.0, 57251.0, 19166.0, 7815.0, 3651.0, 1718.0, 930.0, 489.0, 299.0, 178.0, 110.0, 75.0, 43.0, 27.0, 21.0, 12.0, 14.0, 9.0, 11.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.91015625, -7.66741943359375, -7.4246826171875, -7.18194580078125, -6.939208984375, -6.69647216796875, -6.4537353515625, -6.21099853515625, -5.96826171875, -5.72552490234375, -5.4827880859375, -5.24005126953125, -4.997314453125, -4.75457763671875, -4.5118408203125, -4.26910400390625, -4.0263671875, -3.78363037109375, -3.5408935546875, -3.29815673828125, -3.055419921875, -2.81268310546875, -2.5699462890625, -2.32720947265625, -2.08447265625, -1.84173583984375, -1.5989990234375, -1.35626220703125, -1.113525390625, -0.87078857421875, -0.6280517578125, -0.38531494140625, -0.142578125, 0.10015869140625, 0.3428955078125, 0.58563232421875, 0.828369140625, 1.07110595703125, 1.3138427734375, 1.55657958984375, 1.79931640625, 2.04205322265625, 2.2847900390625, 2.52752685546875, 2.770263671875, 3.01300048828125, 3.2557373046875, 3.49847412109375, 3.7412109375, 3.98394775390625, 4.2266845703125, 4.46942138671875, 4.712158203125, 4.95489501953125, 5.1976318359375, 5.44036865234375, 5.68310546875, 5.92584228515625, 6.1685791015625, 6.41131591796875, 6.654052734375, 6.89678955078125, 7.1395263671875, 7.38226318359375, 7.625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 10.0, 11.0, 9.0, 12.0, 14.0, 20.0, 31.0, 42.0, 41.0, 50.0, 70.0, 142.0, 144.0, 110.0, 58.0, 58.0, 38.0, 33.0, 18.0, 15.0, 12.0, 9.0, 10.0, 14.0, 6.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00148773193359375, -0.0014365911483764648, -0.0013854503631591797, -0.0013343095779418945, -0.0012831687927246094, -0.0012320280075073242, -0.001180887222290039, -0.001129746437072754, -0.0010786056518554688, -0.0010274648666381836, -0.0009763240814208984, -0.0009251832962036133, -0.0008740425109863281, -0.000822901725769043, -0.0007717609405517578, -0.0007206201553344727, -0.0006694793701171875, -0.0006183385848999023, -0.0005671977996826172, -0.000516057014465332, -0.0004649162292480469, -0.0004137754440307617, -0.00036263465881347656, -0.0003114938735961914, -0.00026035308837890625, -0.0002092123031616211, -0.00015807151794433594, -0.00010693073272705078, -5.5789947509765625e-05, -4.649162292480469e-06, 4.649162292480469e-05, 9.763240814208984e-05, 0.000148773193359375, 0.00019991397857666016, 0.0002510547637939453, 0.00030219554901123047, 0.0003533363342285156, 0.0004044771194458008, 0.00045561790466308594, 0.0005067586898803711, 0.0005578994750976562, 0.0006090402603149414, 0.0006601810455322266, 0.0007113218307495117, 0.0007624626159667969, 0.000813603401184082, 0.0008647441864013672, 0.0009158849716186523, 0.0009670257568359375, 0.0010181665420532227, 0.0010693073272705078, 0.001120448112487793, 0.0011715888977050781, 0.0012227296829223633, 0.0012738704681396484, 0.0013250112533569336, 0.0013761520385742188, 0.001427292823791504, 0.001478433609008789, 0.0015295743942260742, 0.0015807151794433594, 0.0016318559646606445, 0.0016829967498779297, 0.0017341375350952148, 0.0017852783203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 11.0, 17.0, 17.0, 31.0, 51.0, 78.0, 114.0, 208.0, 380.0, 803.0, 2010.0, 5398.0, 17116.0, 72650.0, 588651.0, 301219.0, 41896.0, 11265.0, 3707.0, 1484.0, 670.0, 293.0, 158.0, 112.0, 65.0, 46.0, 32.0, 24.0, 14.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3671875, -11.966064453125, -11.56494140625, -11.163818359375, -10.7626953125, -10.361572265625, -9.96044921875, -9.559326171875, -9.158203125, -8.757080078125, -8.35595703125, -7.954833984375, -7.5537109375, -7.152587890625, -6.75146484375, -6.350341796875, -5.94921875, -5.548095703125, -5.14697265625, -4.745849609375, -4.3447265625, -3.943603515625, -3.54248046875, -3.141357421875, -2.740234375, -2.339111328125, -1.93798828125, -1.536865234375, -1.1357421875, -0.734619140625, -0.33349609375, 0.067626953125, 0.46875, 0.869873046875, 1.27099609375, 1.672119140625, 2.0732421875, 2.474365234375, 2.87548828125, 3.276611328125, 3.677734375, 4.078857421875, 4.47998046875, 4.881103515625, 5.2822265625, 5.683349609375, 6.08447265625, 6.485595703125, 6.88671875, 7.287841796875, 7.68896484375, 8.090087890625, 8.4912109375, 8.892333984375, 9.29345703125, 9.694580078125, 10.095703125, 10.496826171875, 10.89794921875, 11.299072265625, 11.7001953125, 12.101318359375, 12.50244140625, 12.903564453125, 13.3046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 13.0, 5.0, 10.0, 20.0, 17.0, 19.0, 29.0, 62.0, 66.0, 92.0, 133.0, 120.0, 119.0, 83.0, 48.0, 40.0, 24.0, 12.0, 20.0, 11.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.25445556640625, -6.9971923828125, -6.73992919921875, -6.482666015625, -6.22540283203125, -5.9681396484375, -5.71087646484375, -5.45361328125, -5.19635009765625, -4.9390869140625, -4.68182373046875, -4.424560546875, -4.16729736328125, -3.9100341796875, -3.65277099609375, -3.3955078125, -3.13824462890625, -2.8809814453125, -2.62371826171875, -2.366455078125, -2.10919189453125, -1.8519287109375, -1.59466552734375, -1.33740234375, -1.08013916015625, -0.8228759765625, -0.56561279296875, -0.308349609375, -0.05108642578125, 0.2061767578125, 0.46343994140625, 0.720703125, 0.97796630859375, 1.2352294921875, 1.49249267578125, 1.749755859375, 2.00701904296875, 2.2642822265625, 2.52154541015625, 2.77880859375, 3.03607177734375, 3.2933349609375, 3.55059814453125, 3.807861328125, 4.06512451171875, 4.3223876953125, 4.57965087890625, 4.8369140625, 5.09417724609375, 5.3514404296875, 5.60870361328125, 5.865966796875, 6.12322998046875, 6.3804931640625, 6.63775634765625, 6.89501953125, 7.15228271484375, 7.4095458984375, 7.66680908203125, 7.924072265625, 8.18133544921875, 8.4385986328125, 8.69586181640625, 8.953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 9.0, 28.0, 31.0, 60.0, 63.0, 131.0, 143.0, 133.0, 108.0, 98.0, 75.0, 36.0, 32.0, 24.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.35137939453125, -72.9698715209961, -69.58836364746094, -66.20685577392578, -62.82535171508789, -59.443843841552734, -56.06233596801758, -52.68083190917969, -49.29932403564453, -45.917816162109375, -42.53630828857422, -39.15480041503906, -35.77329635620117, -32.391788482666016, -29.01028060913086, -25.628774642944336, -22.247264862060547, -18.86575698852539, -15.484251022338867, -12.102743148803711, -8.721236228942871, -5.339729309082031, -1.958221435546875, 1.4232845306396484, 4.804792404174805, 8.186299324035645, 11.567806243896484, 14.94931411743164, 18.330821990966797, 21.71232795715332, 25.093835830688477, 28.475341796875, 31.856849670410156, 35.23835754394531, 38.61986541748047, 42.001373291015625, 45.382877349853516, 48.76438522338867, 52.14589309692383, 55.52739715576172, 58.908905029296875, 62.29041290283203, 65.67192077636719, 69.05342864990234, 72.4349365234375, 75.81643676757812, 79.19795227050781, 82.57945251464844, 85.96096801757812, 89.34247589111328, 92.72398376464844, 96.1054916381836, 99.48699951171875, 102.86849975585938, 106.25001525878906, 109.63151550292969, 113.01302337646484, 116.39453125, 119.77603912353516, 123.15754699707031, 126.53905487060547, 129.92056274414062, 133.30206298828125, 136.68357849121094, 140.06507873535156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 5.0, 10.0, 4.0, 9.0, 16.0, 8.0, 16.0, 19.0, 24.0, 16.0, 24.0, 29.0, 25.0, 22.0, 32.0, 30.0, 39.0, 40.0, 32.0, 35.0, 42.0, 40.0, 49.0, 50.0, 38.0, 38.0, 43.0, 28.0, 33.0, 37.0, 22.0, 20.0, 16.0, 10.0, 24.0, 19.0, 8.0, 6.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-57.708396911621094, -55.993080139160156, -54.27776336669922, -52.56244659423828, -50.847129821777344, -49.131813049316406, -47.41649627685547, -45.70117950439453, -43.985862731933594, -42.270545959472656, -40.55522918701172, -38.83991241455078, -37.124595642089844, -35.409278869628906, -33.69396209716797, -31.97864532470703, -30.263328552246094, -28.548011779785156, -26.83269500732422, -25.11737823486328, -23.402061462402344, -21.686744689941406, -19.97142791748047, -18.25611114501953, -16.540794372558594, -14.825477600097656, -13.110160827636719, -11.394844055175781, -9.679527282714844, -7.964210510253906, -6.248893737792969, -4.533576965332031, -2.818256378173828, -1.1029396057128906, 0.6123771667480469, 2.3276939392089844, 4.043010711669922, 5.758327484130859, 7.473644256591797, 9.188961029052734, 10.904277801513672, 12.61959457397461, 14.334911346435547, 16.050228118896484, 17.765544891357422, 19.48086166381836, 21.196178436279297, 22.911495208740234, 24.626811981201172, 26.34212875366211, 28.057445526123047, 29.772762298583984, 31.488079071044922, 33.20339584350586, 34.9187126159668, 36.634029388427734, 38.34934616088867, 40.06466293334961, 41.77997970581055, 43.495296478271484, 45.21061325073242, 46.92593002319336, 48.6412467956543, 50.356563568115234, 52.07188034057617]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 11.0, 22.0, 25.0, 48.0, 64.0, 90.0, 122.0, 199.0, 314.0, 554.0, 1057.0, 2046.0, 4324.0, 10906.0, 34561.0, 189647.0, 3515955.0, 359953.0, 49769.0, 14057.0, 5388.0, 2399.0, 1185.0, 635.0, 347.0, 194.0, 125.0, 76.0, 47.0, 39.0, 32.0, 23.0, 10.0, 8.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.609375, -17.085693359375, -16.56201171875, -16.038330078125, -15.5146484375, -14.990966796875, -14.46728515625, -13.943603515625, -13.419921875, -12.896240234375, -12.37255859375, -11.848876953125, -11.3251953125, -10.801513671875, -10.27783203125, -9.754150390625, -9.23046875, -8.706787109375, -8.18310546875, -7.659423828125, -7.1357421875, -6.612060546875, -6.08837890625, -5.564697265625, -5.041015625, -4.517333984375, -3.99365234375, -3.469970703125, -2.9462890625, -2.422607421875, -1.89892578125, -1.375244140625, -0.8515625, -0.327880859375, 0.19580078125, 0.719482421875, 1.2431640625, 1.766845703125, 2.29052734375, 2.814208984375, 3.337890625, 3.861572265625, 4.38525390625, 4.908935546875, 5.4326171875, 5.956298828125, 6.47998046875, 7.003662109375, 7.52734375, 8.051025390625, 8.57470703125, 9.098388671875, 9.6220703125, 10.145751953125, 10.66943359375, 11.193115234375, 11.716796875, 12.240478515625, 12.76416015625, 13.287841796875, 13.8115234375, 14.335205078125, 14.85888671875, 15.382568359375, 15.90625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 6.0, 14.0, 9.0, 11.0, 27.0, 21.0, 35.0, 27.0, 37.0, 61.0, 38.0, 51.0, 65.0, 61.0, 77.0, 58.0, 60.0, 58.0, 55.0, 35.0, 42.0, 33.0, 29.0, 18.0, 15.0, 14.0, 10.0, 3.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.931640625, -3.82568359375, -3.7197265625, -3.61376953125, -3.5078125, -3.40185546875, -3.2958984375, -3.18994140625, -3.083984375, -2.97802734375, -2.8720703125, -2.76611328125, -2.66015625, -2.55419921875, -2.4482421875, -2.34228515625, -2.236328125, -2.13037109375, -2.0244140625, -1.91845703125, -1.8125, -1.70654296875, -1.6005859375, -1.49462890625, -1.388671875, -1.28271484375, -1.1767578125, -1.07080078125, -0.96484375, -0.85888671875, -0.7529296875, -0.64697265625, -0.541015625, -0.43505859375, -0.3291015625, -0.22314453125, -0.1171875, -0.01123046875, 0.0947265625, 0.20068359375, 0.306640625, 0.41259765625, 0.5185546875, 0.62451171875, 0.73046875, 0.83642578125, 0.9423828125, 1.04833984375, 1.154296875, 1.26025390625, 1.3662109375, 1.47216796875, 1.578125, 1.68408203125, 1.7900390625, 1.89599609375, 2.001953125, 2.10791015625, 2.2138671875, 2.31982421875, 2.42578125, 2.53173828125, 2.6376953125, 2.74365234375, 2.849609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 11.0, 13.0, 20.0, 27.0, 56.0, 100.0, 133.0, 216.0, 420.0, 734.0, 1327.0, 2507.0, 4854.0, 10061.0, 22645.0, 62673.0, 236404.0, 2126202.0, 1437807.0, 194602.0, 54002.0, 20470.0, 9021.0, 4518.0, 2430.0, 1310.0, 709.0, 393.0, 245.0, 150.0, 80.0, 61.0, 29.0, 19.0, 17.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.832275390625, -8.51611328125, -8.199951171875, -7.8837890625, -7.567626953125, -7.25146484375, -6.935302734375, -6.619140625, -6.302978515625, -5.98681640625, -5.670654296875, -5.3544921875, -5.038330078125, -4.72216796875, -4.406005859375, -4.08984375, -3.773681640625, -3.45751953125, -3.141357421875, -2.8251953125, -2.509033203125, -2.19287109375, -1.876708984375, -1.560546875, -1.244384765625, -0.92822265625, -0.612060546875, -0.2958984375, 0.020263671875, 0.33642578125, 0.652587890625, 0.96875, 1.284912109375, 1.60107421875, 1.917236328125, 2.2333984375, 2.549560546875, 2.86572265625, 3.181884765625, 3.498046875, 3.814208984375, 4.13037109375, 4.446533203125, 4.7626953125, 5.078857421875, 5.39501953125, 5.711181640625, 6.02734375, 6.343505859375, 6.65966796875, 6.975830078125, 7.2919921875, 7.608154296875, 7.92431640625, 8.240478515625, 8.556640625, 8.872802734375, 9.18896484375, 9.505126953125, 9.8212890625, 10.137451171875, 10.45361328125, 10.769775390625, 11.0859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 10.0, 16.0, 28.0, 22.0, 45.0, 55.0, 86.0, 109.0, 172.0, 325.0, 538.0, 950.0, 654.0, 320.0, 207.0, 135.0, 104.0, 72.0, 30.0, 30.0, 21.0, 15.0, 18.0, 12.0, 8.0, 4.0, 7.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.921875, -3.77996826171875, -3.6380615234375, -3.49615478515625, -3.354248046875, -3.21234130859375, -3.0704345703125, -2.92852783203125, -2.78662109375, -2.64471435546875, -2.5028076171875, -2.36090087890625, -2.218994140625, -2.07708740234375, -1.9351806640625, -1.79327392578125, -1.6513671875, -1.50946044921875, -1.3675537109375, -1.22564697265625, -1.083740234375, -0.94183349609375, -0.7999267578125, -0.65802001953125, -0.51611328125, -0.37420654296875, -0.2322998046875, -0.09039306640625, 0.051513671875, 0.19342041015625, 0.3353271484375, 0.47723388671875, 0.619140625, 0.76104736328125, 0.9029541015625, 1.04486083984375, 1.186767578125, 1.32867431640625, 1.4705810546875, 1.61248779296875, 1.75439453125, 1.89630126953125, 2.0382080078125, 2.18011474609375, 2.322021484375, 2.46392822265625, 2.6058349609375, 2.74774169921875, 2.8896484375, 3.03155517578125, 3.1734619140625, 3.31536865234375, 3.457275390625, 3.59918212890625, 3.7410888671875, 3.88299560546875, 4.02490234375, 4.16680908203125, 4.3087158203125, 4.45062255859375, 4.592529296875, 4.73443603515625, 4.8763427734375, 5.01824951171875, 5.16015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 7.0, 5.0, 15.0, 36.0, 36.0, 78.0, 96.0, 121.0, 127.0, 143.0, 110.0, 89.0, 52.0, 29.0, 22.0, 19.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-62.25694274902344, -60.917850494384766, -59.578758239746094, -58.23966979980469, -56.900577545166016, -55.561485290527344, -54.22239303588867, -52.88330078125, -51.544212341308594, -50.20512008666992, -48.86602783203125, -47.526939392089844, -46.18784713745117, -44.8487548828125, -43.50966262817383, -42.170570373535156, -40.831478118896484, -39.49238586425781, -38.15329360961914, -36.81420135498047, -35.47511291503906, -34.13602066040039, -32.79692840576172, -31.457836151123047, -30.118745803833008, -28.779653549194336, -27.440563201904297, -26.101470947265625, -24.762378692626953, -23.423288345336914, -22.084196090698242, -20.745105743408203, -19.4060115814209, -18.066919326782227, -16.727828979492188, -15.388736724853516, -14.04964542388916, -12.710554122924805, -11.371461868286133, -10.032370567321777, -8.693279266357422, -7.354187965393066, -6.015096187591553, -4.676004409790039, -3.3369131088256836, -1.9978218078613281, -0.6587295532226562, 0.6803617477416992, 2.0194530487060547, 3.3585445880889893, 4.697636127471924, 6.0367279052734375, 7.375819206237793, 8.714910507202148, 10.05400276184082, 11.393094062805176, 12.732185363769531, 14.071276664733887, 15.410367965698242, 16.749460220336914, 18.088550567626953, 19.427642822265625, 20.766735076904297, 22.10582733154297, 23.444917678833008]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 4.0, 5.0, 9.0, 11.0, 8.0, 6.0, 18.0, 8.0, 20.0, 17.0, 18.0, 26.0, 44.0, 28.0, 26.0, 33.0, 39.0, 47.0, 49.0, 44.0, 45.0, 42.0, 40.0, 40.0, 40.0, 40.0, 31.0, 27.0, 32.0, 19.0, 23.0, 31.0, 25.0, 11.0, 17.0, 15.0, 12.0, 11.0, 11.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.653610229492188, -17.060409545898438, -16.467206954956055, -15.874006271362305, -15.280805587768555, -14.687603950500488, -14.094402313232422, -13.501201629638672, -12.908000946044922, -12.314799308776855, -11.721598625183105, -11.128396987915039, -10.535196304321289, -9.941994667053223, -9.348793029785156, -8.755592346191406, -8.16239070892334, -7.569189548492432, -6.975988388061523, -6.382786750793457, -5.789586067199707, -5.196384429931641, -4.603183269500732, -4.009982109069824, -3.416780948638916, -2.823579788208008, -2.2303786277770996, -1.6371772289276123, -1.043976068496704, -0.4507749080657959, 0.1424264907836914, 0.7356276512145996, 1.3288288116455078, 1.922029972076416, 2.515231132507324, 3.1084325313568115, 3.7016336917877197, 4.294835090637207, 4.888036251068115, 5.481237411499023, 6.074438571929932, 6.66763973236084, 7.260840892791748, 7.854042053222656, 8.447243690490723, 9.040444374084473, 9.633646011352539, 10.226846694946289, 10.820048332214355, 11.413249969482422, 12.006450653076172, 12.599652290344238, 13.192852973937988, 13.786054611206055, 14.379255294799805, 14.972456932067871, 15.565658569335938, 16.158859252929688, 16.75206184387207, 17.34526252746582, 17.93846321105957, 18.53166389465332, 19.124866485595703, 19.718067169189453, 20.311267852783203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 8.0, 19.0, 27.0, 40.0, 59.0, 102.0, 165.0, 293.0, 516.0, 878.0, 1787.0, 3583.0, 7536.0, 16413.0, 39691.0, 107358.0, 400660.0, 318841.0, 89251.0, 33878.0, 14357.0, 6419.0, 3089.0, 1580.0, 818.0, 476.0, 266.0, 151.0, 105.0, 65.0, 28.0, 23.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.03662109375, -14.5654296875, -14.09423828125, -13.623046875, -13.15185546875, -12.6806640625, -12.20947265625, -11.73828125, -11.26708984375, -10.7958984375, -10.32470703125, -9.853515625, -9.38232421875, -8.9111328125, -8.43994140625, -7.96875, -7.49755859375, -7.0263671875, -6.55517578125, -6.083984375, -5.61279296875, -5.1416015625, -4.67041015625, -4.19921875, -3.72802734375, -3.2568359375, -2.78564453125, -2.314453125, -1.84326171875, -1.3720703125, -0.90087890625, -0.4296875, 0.04150390625, 0.5126953125, 0.98388671875, 1.455078125, 1.92626953125, 2.3974609375, 2.86865234375, 3.33984375, 3.81103515625, 4.2822265625, 4.75341796875, 5.224609375, 5.69580078125, 6.1669921875, 6.63818359375, 7.109375, 7.58056640625, 8.0517578125, 8.52294921875, 8.994140625, 9.46533203125, 9.9365234375, 10.40771484375, 10.87890625, 11.35009765625, 11.8212890625, 12.29248046875, 12.763671875, 13.23486328125, 13.7060546875, 14.17724609375, 14.6484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 14.0, 10.0, 14.0, 29.0, 25.0, 42.0, 52.0, 49.0, 60.0, 54.0, 72.0, 78.0, 52.0, 66.0, 69.0, 66.0, 51.0, 50.0, 44.0, 22.0, 15.0, 16.0, 15.0, 7.0, 5.0, 6.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.19610595703125, -4.0758056640625, -3.95550537109375, -3.835205078125, -3.71490478515625, -3.5946044921875, -3.47430419921875, -3.35400390625, -3.23370361328125, -3.1134033203125, -2.99310302734375, -2.872802734375, -2.75250244140625, -2.6322021484375, -2.51190185546875, -2.3916015625, -2.27130126953125, -2.1510009765625, -2.03070068359375, -1.910400390625, -1.79010009765625, -1.6697998046875, -1.54949951171875, -1.42919921875, -1.30889892578125, -1.1885986328125, -1.06829833984375, -0.947998046875, -0.82769775390625, -0.7073974609375, -0.58709716796875, -0.466796875, -0.34649658203125, -0.2261962890625, -0.10589599609375, 0.014404296875, 0.13470458984375, 0.2550048828125, 0.37530517578125, 0.49560546875, 0.61590576171875, 0.7362060546875, 0.85650634765625, 0.976806640625, 1.09710693359375, 1.2174072265625, 1.33770751953125, 1.4580078125, 1.57830810546875, 1.6986083984375, 1.81890869140625, 1.939208984375, 2.05950927734375, 2.1798095703125, 2.30010986328125, 2.42041015625, 2.54071044921875, 2.6610107421875, 2.78131103515625, 2.901611328125, 3.02191162109375, 3.1422119140625, 3.26251220703125, 3.3828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 27.0, 40.0, 44.0, 63.0, 96.0, 125.0, 219.0, 320.0, 559.0, 1170.0, 2829.0, 7897.0, 27722.0, 123244.0, 613721.0, 209754.0, 42264.0, 11253.0, 3752.0, 1470.0, 728.0, 407.0, 253.0, 181.0, 100.0, 64.0, 62.0, 34.0, 25.0, 23.0, 18.0, 12.0, 5.0, 7.0, 1.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.609375, -19.026611328125, -18.44384765625, -17.861083984375, -17.2783203125, -16.695556640625, -16.11279296875, -15.530029296875, -14.947265625, -14.364501953125, -13.78173828125, -13.198974609375, -12.6162109375, -12.033447265625, -11.45068359375, -10.867919921875, -10.28515625, -9.702392578125, -9.11962890625, -8.536865234375, -7.9541015625, -7.371337890625, -6.78857421875, -6.205810546875, -5.623046875, -5.040283203125, -4.45751953125, -3.874755859375, -3.2919921875, -2.709228515625, -2.12646484375, -1.543701171875, -0.9609375, -0.378173828125, 0.20458984375, 0.787353515625, 1.3701171875, 1.952880859375, 2.53564453125, 3.118408203125, 3.701171875, 4.283935546875, 4.86669921875, 5.449462890625, 6.0322265625, 6.614990234375, 7.19775390625, 7.780517578125, 8.36328125, 8.946044921875, 9.52880859375, 10.111572265625, 10.6943359375, 11.277099609375, 11.85986328125, 12.442626953125, 13.025390625, 13.608154296875, 14.19091796875, 14.773681640625, 15.3564453125, 15.939208984375, 16.52197265625, 17.104736328125, 17.6875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 23.0, 24.0, 31.0, 34.0, 34.0, 42.0, 47.0, 49.0, 51.0, 53.0, 68.0, 50.0, 65.0, 51.0, 45.0, 45.0, 27.0, 40.0, 44.0, 25.0, 18.0, 28.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6744384765625, -11.231689453125, -10.7889404296875, -10.34619140625, -9.9034423828125, -9.460693359375, -9.0179443359375, -8.5751953125, -8.1324462890625, -7.689697265625, -7.2469482421875, -6.80419921875, -6.3614501953125, -5.918701171875, -5.4759521484375, -5.033203125, -4.5904541015625, -4.147705078125, -3.7049560546875, -3.26220703125, -2.8194580078125, -2.376708984375, -1.9339599609375, -1.4912109375, -1.0484619140625, -0.605712890625, -0.1629638671875, 0.27978515625, 0.7225341796875, 1.165283203125, 1.6080322265625, 2.05078125, 2.4935302734375, 2.936279296875, 3.3790283203125, 3.82177734375, 4.2645263671875, 4.707275390625, 5.1500244140625, 5.5927734375, 6.0355224609375, 6.478271484375, 6.9210205078125, 7.36376953125, 7.8065185546875, 8.249267578125, 8.6920166015625, 9.134765625, 9.5775146484375, 10.020263671875, 10.4630126953125, 10.90576171875, 11.3485107421875, 11.791259765625, 12.2340087890625, 12.6767578125, 13.1195068359375, 13.562255859375, 14.0050048828125, 14.44775390625, 14.8905029296875, 15.333251953125, 15.7760009765625, 16.21875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 11.0, 14.0, 17.0, 37.0, 55.0, 151.0, 390.0, 1559.0, 12929.0, 235608.0, 766106.0, 28057.0, 2706.0, 524.0, 191.0, 80.0, 38.0, 22.0, 12.0, 12.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.5888671875, -14.943359375, -14.2978515625, -13.65234375, -13.0068359375, -12.361328125, -11.7158203125, -11.0703125, -10.4248046875, -9.779296875, -9.1337890625, -8.48828125, -7.8427734375, -7.197265625, -6.5517578125, -5.90625, -5.2607421875, -4.615234375, -3.9697265625, -3.32421875, -2.6787109375, -2.033203125, -1.3876953125, -0.7421875, -0.0966796875, 0.548828125, 1.1943359375, 1.83984375, 2.4853515625, 3.130859375, 3.7763671875, 4.421875, 5.0673828125, 5.712890625, 6.3583984375, 7.00390625, 7.6494140625, 8.294921875, 8.9404296875, 9.5859375, 10.2314453125, 10.876953125, 11.5224609375, 12.16796875, 12.8134765625, 13.458984375, 14.1044921875, 14.75, 15.3955078125, 16.041015625, 16.6865234375, 17.33203125, 17.9775390625, 18.623046875, 19.2685546875, 19.9140625, 20.5595703125, 21.205078125, 21.8505859375, 22.49609375, 23.1416015625, 23.787109375, 24.4326171875, 25.078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 13.0, 10.0, 14.0, 11.0, 22.0, 26.0, 36.0, 30.0, 94.0, 171.0, 212.0, 115.0, 47.0, 34.0, 25.0, 18.0, 19.0, 10.0, 18.0, 4.0, 6.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.001926422119140625, -0.0018717795610427856, -0.0018171370029449463, -0.001762494444847107, -0.0017078518867492676, -0.0016532093286514282, -0.0015985667705535889, -0.0015439242124557495, -0.0014892816543579102, -0.0014346390962600708, -0.0013799965381622314, -0.001325353980064392, -0.0012707114219665527, -0.0012160688638687134, -0.001161426305770874, -0.0011067837476730347, -0.0010521411895751953, -0.000997498631477356, -0.0009428560733795166, -0.0008882135152816772, -0.0008335709571838379, -0.0007789283990859985, -0.0007242858409881592, -0.0006696432828903198, -0.0006150007247924805, -0.0005603581666946411, -0.0005057156085968018, -0.0004510730504989624, -0.00039643049240112305, -0.0003417879343032837, -0.00028714537620544434, -0.00023250281810760498, -0.00017786026000976562, -0.00012321770191192627, -6.857514381408691e-05, -1.3932585716247559e-05, 4.07099723815918e-05, 9.535253047943115e-05, 0.0001499950885772705, 0.00020463764667510986, 0.0002592802047729492, 0.0003139227628707886, 0.00036856532096862793, 0.0004232078790664673, 0.00047785043716430664, 0.000532492995262146, 0.0005871355533599854, 0.0006417781114578247, 0.0006964206695556641, 0.0007510632276535034, 0.0008057057857513428, 0.0008603483438491821, 0.0009149909019470215, 0.0009696334600448608, 0.0010242760181427002, 0.0010789185762405396, 0.001133561134338379, 0.0011882036924362183, 0.0012428462505340576, 0.001297488808631897, 0.0013521313667297363, 0.0014067739248275757, 0.001461416482925415, 0.0015160590410232544, 0.0015707015991210938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 17.0, 16.0, 35.0, 41.0, 69.0, 135.0, 294.0, 671.0, 1802.0, 7284.0, 52681.0, 833387.0, 132713.0, 14667.0, 2896.0, 983.0, 399.0, 206.0, 95.0, 60.0, 33.0, 20.0, 12.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.71044921875, -13.1552734375, -12.60009765625, -12.044921875, -11.48974609375, -10.9345703125, -10.37939453125, -9.82421875, -9.26904296875, -8.7138671875, -8.15869140625, -7.603515625, -7.04833984375, -6.4931640625, -5.93798828125, -5.3828125, -4.82763671875, -4.2724609375, -3.71728515625, -3.162109375, -2.60693359375, -2.0517578125, -1.49658203125, -0.94140625, -0.38623046875, 0.1689453125, 0.72412109375, 1.279296875, 1.83447265625, 2.3896484375, 2.94482421875, 3.5, 4.05517578125, 4.6103515625, 5.16552734375, 5.720703125, 6.27587890625, 6.8310546875, 7.38623046875, 7.94140625, 8.49658203125, 9.0517578125, 9.60693359375, 10.162109375, 10.71728515625, 11.2724609375, 11.82763671875, 12.3828125, 12.93798828125, 13.4931640625, 14.04833984375, 14.603515625, 15.15869140625, 15.7138671875, 16.26904296875, 16.82421875, 17.37939453125, 17.9345703125, 18.48974609375, 19.044921875, 19.60009765625, 20.1552734375, 20.71044921875, 21.265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 7.0, 14.0, 17.0, 19.0, 38.0, 53.0, 127.0, 283.0, 199.0, 83.0, 44.0, 22.0, 19.0, 17.0, 11.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9140625, -9.5284423828125, -9.142822265625, -8.7572021484375, -8.37158203125, -7.9859619140625, -7.600341796875, -7.2147216796875, -6.8291015625, -6.4434814453125, -6.057861328125, -5.6722412109375, -5.28662109375, -4.9010009765625, -4.515380859375, -4.1297607421875, -3.744140625, -3.3585205078125, -2.972900390625, -2.5872802734375, -2.20166015625, -1.8160400390625, -1.430419921875, -1.0447998046875, -0.6591796875, -0.2735595703125, 0.112060546875, 0.4976806640625, 0.88330078125, 1.2689208984375, 1.654541015625, 2.0401611328125, 2.42578125, 2.8114013671875, 3.197021484375, 3.5826416015625, 3.96826171875, 4.3538818359375, 4.739501953125, 5.1251220703125, 5.5107421875, 5.8963623046875, 6.281982421875, 6.6676025390625, 7.05322265625, 7.4388427734375, 7.824462890625, 8.2100830078125, 8.595703125, 8.9813232421875, 9.366943359375, 9.7525634765625, 10.13818359375, 10.5238037109375, 10.909423828125, 11.2950439453125, 11.6806640625, 12.0662841796875, 12.451904296875, 12.8375244140625, 13.22314453125, 13.6087646484375, 13.994384765625, 14.3800048828125, 14.765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 19.0, 74.0, 143.0, 228.0, 249.0, 169.0, 67.0, 28.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.49009704589844, -247.62008666992188, -240.75009155273438, -233.8800811767578, -227.01007080078125, -220.14007568359375, -213.2700653076172, -206.40005493164062, -199.53005981445312, -192.66004943847656, -185.79005432128906, -178.9200439453125, -172.050048828125, -165.18003845214844, -158.31002807617188, -151.44003295898438, -144.5700225830078, -137.70001220703125, -130.83001708984375, -123.96000671386719, -117.09000396728516, -110.22000122070312, -103.34999084472656, -96.47998809814453, -89.6099853515625, -82.73998260498047, -75.86997985839844, -68.99996948242188, -62.129966735839844, -55.25996398925781, -48.389957427978516, -41.51995086669922, -34.64996337890625, -27.779958724975586, -20.909954071044922, -14.039949417114258, -7.169944763183594, -0.2999420166015625, 6.570064544677734, 13.440071105957031, 20.310073852539062, 27.180078506469727, 34.05008316040039, 40.92008972167969, 47.79009246826172, 54.66009521484375, 61.53010177612305, 68.40010833740234, 75.27011108398438, 82.1401138305664, 89.01011657714844, 95.880126953125, 102.75012969970703, 109.62013244628906, 116.49014282226562, 123.36014556884766, 130.2301483154297, 137.10015869140625, 143.97015380859375, 150.8401641845703, 157.71017456054688, 164.58016967773438, 171.45018005371094, 178.3201904296875, 185.190185546875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 14.0, 12.0, 22.0, 24.0, 18.0, 38.0, 26.0, 25.0, 37.0, 34.0, 34.0, 44.0, 38.0, 50.0, 39.0, 41.0, 58.0, 30.0, 43.0, 40.0, 36.0, 39.0, 30.0, 24.0, 30.0, 20.0, 35.0, 14.0, 15.0, 11.0, 9.0, 9.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-66.76054382324219, -64.84466552734375, -62.92879104614258, -61.012916564941406, -59.097042083740234, -57.18116760253906, -55.265289306640625, -53.34941482543945, -51.43354034423828, -49.51766586303711, -47.60178756713867, -45.6859130859375, -43.77003860473633, -41.854164123535156, -39.93828582763672, -38.02241134643555, -36.10653305053711, -34.19065856933594, -32.2747802734375, -30.358905792236328, -28.443031311035156, -26.52715492248535, -24.611278533935547, -22.695404052734375, -20.77952766418457, -18.863651275634766, -16.947776794433594, -15.031900405883789, -13.1160249710083, -11.200149536132812, -9.284273147583008, -7.3683977127075195, -5.452518463134766, -3.5366427898406982, -1.6207671165466309, 0.2951087951660156, 2.210984230041504, 4.126859664916992, 6.042736053466797, 7.958611488342285, 9.874486923217773, 11.790362358093262, 13.70623779296875, 15.622114181518555, 17.53799057006836, 19.45386505126953, 21.369741439819336, 23.28561782836914, 25.201492309570312, 27.117368698120117, 29.03324317932129, 30.949119567871094, 32.864994049072266, 34.78086853027344, 36.696746826171875, 38.61262130737305, 40.52849578857422, 42.44437026977539, 44.36024856567383, 46.276123046875, 48.19199752807617, 50.107872009277344, 52.02375030517578, 53.93962478637695, 55.85550308227539]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 20.0, 25.0, 27.0, 39.0, 67.0, 76.0, 109.0, 184.0, 296.0, 491.0, 793.0, 1316.0, 2451.0, 4786.0, 9819.0, 22889.0, 67573.0, 343001.0, 3330379.0, 305200.0, 63589.0, 21758.0, 9246.0, 4486.0, 2408.0, 1292.0, 753.0, 445.0, 280.0, 149.0, 95.0, 72.0, 39.0, 38.0, 20.0, 11.0, 9.0, 5.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.5863037109375, -13.180419921875, -12.7745361328125, -12.36865234375, -11.9627685546875, -11.556884765625, -11.1510009765625, -10.7451171875, -10.3392333984375, -9.933349609375, -9.5274658203125, -9.12158203125, -8.7156982421875, -8.309814453125, -7.9039306640625, -7.498046875, -7.0921630859375, -6.686279296875, -6.2803955078125, -5.87451171875, -5.4686279296875, -5.062744140625, -4.6568603515625, -4.2509765625, -3.8450927734375, -3.439208984375, -3.0333251953125, -2.62744140625, -2.2215576171875, -1.815673828125, -1.4097900390625, -1.00390625, -0.5980224609375, -0.192138671875, 0.2137451171875, 0.61962890625, 1.0255126953125, 1.431396484375, 1.8372802734375, 2.2431640625, 2.6490478515625, 3.054931640625, 3.4608154296875, 3.86669921875, 4.2725830078125, 4.678466796875, 5.0843505859375, 5.490234375, 5.8961181640625, 6.302001953125, 6.7078857421875, 7.11376953125, 7.5196533203125, 7.925537109375, 8.3314208984375, 8.7373046875, 9.1431884765625, 9.549072265625, 9.9549560546875, 10.36083984375, 10.7667236328125, 11.172607421875, 11.5784912109375, 11.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 16.0, 17.0, 23.0, 33.0, 38.0, 47.0, 60.0, 68.0, 59.0, 71.0, 59.0, 70.0, 68.0, 71.0, 51.0, 58.0, 55.0, 34.0, 27.0, 15.0, 15.0, 10.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -5.027069091796875, -4.89007568359375, -4.753082275390625, -4.6160888671875, -4.479095458984375, -4.34210205078125, -4.205108642578125, -4.068115234375, -3.931121826171875, -3.79412841796875, -3.657135009765625, -3.5201416015625, -3.383148193359375, -3.24615478515625, -3.109161376953125, -2.97216796875, -2.835174560546875, -2.69818115234375, -2.561187744140625, -2.4241943359375, -2.287200927734375, -2.15020751953125, -2.013214111328125, -1.876220703125, -1.739227294921875, -1.60223388671875, -1.465240478515625, -1.3282470703125, -1.191253662109375, -1.05426025390625, -0.917266845703125, -0.7802734375, -0.643280029296875, -0.50628662109375, -0.369293212890625, -0.2322998046875, -0.095306396484375, 0.04168701171875, 0.178680419921875, 0.315673828125, 0.452667236328125, 0.58966064453125, 0.726654052734375, 0.8636474609375, 1.000640869140625, 1.13763427734375, 1.274627685546875, 1.41162109375, 1.548614501953125, 1.68560791015625, 1.822601318359375, 1.9595947265625, 2.096588134765625, 2.23358154296875, 2.370574951171875, 2.507568359375, 2.644561767578125, 2.78155517578125, 2.918548583984375, 3.0555419921875, 3.192535400390625, 3.32952880859375, 3.466522216796875, 3.603515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 12.0, 16.0, 18.0, 29.0, 39.0, 72.0, 101.0, 137.0, 208.0, 407.0, 617.0, 1102.0, 1924.0, 3473.0, 7353.0, 15952.0, 42602.0, 165397.0, 1891068.0, 1826654.0, 163784.0, 42355.0, 15865.0, 6970.0, 3515.0, 1855.0, 1082.0, 625.0, 347.0, 226.0, 132.0, 95.0, 73.0, 38.0, 31.0, 26.0, 17.0, 12.0, 13.0, 5.0, 4.0, 5.0, 1.0, 0.0, 3.0, 2.0, 6.0], "bins": [-13.71875, -13.337646484375, -12.95654296875, -12.575439453125, -12.1943359375, -11.813232421875, -11.43212890625, -11.051025390625, -10.669921875, -10.288818359375, -9.90771484375, -9.526611328125, -9.1455078125, -8.764404296875, -8.38330078125, -8.002197265625, -7.62109375, -7.239990234375, -6.85888671875, -6.477783203125, -6.0966796875, -5.715576171875, -5.33447265625, -4.953369140625, -4.572265625, -4.191162109375, -3.81005859375, -3.428955078125, -3.0478515625, -2.666748046875, -2.28564453125, -1.904541015625, -1.5234375, -1.142333984375, -0.76123046875, -0.380126953125, 0.0009765625, 0.382080078125, 0.76318359375, 1.144287109375, 1.525390625, 1.906494140625, 2.28759765625, 2.668701171875, 3.0498046875, 3.430908203125, 3.81201171875, 4.193115234375, 4.57421875, 4.955322265625, 5.33642578125, 5.717529296875, 6.0986328125, 6.479736328125, 6.86083984375, 7.241943359375, 7.623046875, 8.004150390625, 8.38525390625, 8.766357421875, 9.1474609375, 9.528564453125, 9.90966796875, 10.290771484375, 10.671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 7.0, 7.0, 10.0, 19.0, 8.0, 18.0, 40.0, 38.0, 91.0, 136.0, 288.0, 693.0, 1544.0, 585.0, 248.0, 132.0, 77.0, 44.0, 16.0, 23.0, 10.0, 9.0, 12.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53515625, -5.31744384765625, -5.0997314453125, -4.88201904296875, -4.664306640625, -4.44659423828125, -4.2288818359375, -4.01116943359375, -3.79345703125, -3.57574462890625, -3.3580322265625, -3.14031982421875, -2.922607421875, -2.70489501953125, -2.4871826171875, -2.26947021484375, -2.0517578125, -1.83404541015625, -1.6163330078125, -1.39862060546875, -1.180908203125, -0.96319580078125, -0.7454833984375, -0.52777099609375, -0.31005859375, -0.09234619140625, 0.1253662109375, 0.34307861328125, 0.560791015625, 0.77850341796875, 0.9962158203125, 1.21392822265625, 1.431640625, 1.64935302734375, 1.8670654296875, 2.08477783203125, 2.302490234375, 2.52020263671875, 2.7379150390625, 2.95562744140625, 3.17333984375, 3.39105224609375, 3.6087646484375, 3.82647705078125, 4.044189453125, 4.26190185546875, 4.4796142578125, 4.69732666015625, 4.9150390625, 5.13275146484375, 5.3504638671875, 5.56817626953125, 5.785888671875, 6.00360107421875, 6.2213134765625, 6.43902587890625, 6.65673828125, 6.87445068359375, 7.0921630859375, 7.30987548828125, 7.527587890625, 7.74530029296875, 7.9630126953125, 8.18072509765625, 8.3984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 10.0, 11.0, 27.0, 42.0, 63.0, 80.0, 125.0, 131.0, 152.0, 120.0, 92.0, 61.0, 34.0, 19.0, 15.0, 8.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.06793212890625, -44.725563049316406, -43.38319778442383, -42.040828704833984, -40.698463439941406, -39.35609436035156, -38.013729095458984, -36.67136001586914, -35.32899475097656, -33.98662567138672, -32.64426040649414, -31.30189323425293, -29.95952606201172, -28.617158889770508, -27.274791717529297, -25.932422637939453, -24.590055465698242, -23.24768829345703, -21.90532112121582, -20.56295394897461, -19.2205867767334, -17.878219604492188, -16.535850524902344, -15.19348430633545, -13.851117134094238, -12.508749961853027, -11.166382789611816, -9.824014663696289, -8.481647491455078, -7.139280796051025, -5.796913146972656, -4.454545974731445, -3.1121788024902344, -1.7698115110397339, -0.4274442195892334, 0.9149231910705566, 2.2572903633117676, 3.5996575355529785, 4.942025184631348, 6.284392356872559, 7.6267595291137695, 8.96912670135498, 10.311493873596191, 11.653861999511719, 12.99622917175293, 14.33859634399414, 15.680963516235352, 17.023330688476562, 18.365697860717773, 19.708065032958984, 21.050432205200195, 22.392799377441406, 23.735166549682617, 25.077533721923828, 26.419902801513672, 27.76226806640625, 29.104637145996094, 30.447004318237305, 31.789371490478516, 33.13174057006836, 34.47410583496094, 35.81647491455078, 37.15884017944336, 38.5012092590332, 39.84357452392578]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 12.0, 14.0, 21.0, 17.0, 22.0, 29.0, 25.0, 31.0, 35.0, 44.0, 38.0, 25.0, 29.0, 39.0, 36.0, 33.0, 58.0, 39.0, 51.0, 36.0, 33.0, 34.0, 31.0, 30.0, 31.0, 23.0, 21.0, 18.0, 15.0, 15.0, 16.0, 11.0, 8.0, 8.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.29275894165039, -16.720579147338867, -16.148399353027344, -15.576218605041504, -15.004037857055664, -14.43185806274414, -13.859678268432617, -13.287498474121094, -12.715317726135254, -12.14313793182373, -11.57095718383789, -10.998777389526367, -10.426597595214844, -9.854416847229004, -9.28223705291748, -8.71005630493164, -8.137876510620117, -7.5656962394714355, -6.993515968322754, -6.4213361740112305, -5.849155902862549, -5.276975631713867, -4.704795837402344, -4.132615566253662, -3.5604352951049805, -2.988255023956299, -2.4160749912261963, -1.8438948392868042, -1.271714687347412, -0.6995344161987305, -0.12735438346862793, 0.4448256492614746, 1.0170059204101562, 1.5891860723495483, 2.1613662242889404, 2.733546257019043, 3.3057265281677246, 3.8779067993164062, 4.45008659362793, 5.022266864776611, 5.594447135925293, 6.166627407073975, 6.738807678222656, 7.31098747253418, 7.883167743682861, 8.455348014831543, 9.027527809143066, 9.599708557128906, 10.17188835144043, 10.744068145751953, 11.316248893737793, 11.888428688049316, 12.460609436035156, 13.03278923034668, 13.604969024658203, 14.177148818969727, 14.749329566955566, 15.32150936126709, 15.89369010925293, 16.465869903564453, 17.038049697875977, 17.6102294921875, 18.182411193847656, 18.75459098815918, 19.326770782470703]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 11.0, 22.0, 13.0, 34.0, 38.0, 65.0, 98.0, 130.0, 220.0, 366.0, 629.0, 1250.0, 2497.0, 4967.0, 10508.0, 23039.0, 50197.0, 125097.0, 402288.0, 270684.0, 85719.0, 37353.0, 17317.0, 8030.0, 3694.0, 1858.0, 983.0, 539.0, 326.0, 194.0, 140.0, 76.0, 39.0, 34.0, 29.0, 19.0, 15.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-14.1328125, -13.7489013671875, -13.364990234375, -12.9810791015625, -12.59716796875, -12.2132568359375, -11.829345703125, -11.4454345703125, -11.0615234375, -10.6776123046875, -10.293701171875, -9.9097900390625, -9.52587890625, -9.1419677734375, -8.758056640625, -8.3741455078125, -7.990234375, -7.6063232421875, -7.222412109375, -6.8385009765625, -6.45458984375, -6.0706787109375, -5.686767578125, -5.3028564453125, -4.9189453125, -4.5350341796875, -4.151123046875, -3.7672119140625, -3.38330078125, -2.9993896484375, -2.615478515625, -2.2315673828125, -1.84765625, -1.4637451171875, -1.079833984375, -0.6959228515625, -0.31201171875, 0.0718994140625, 0.455810546875, 0.8397216796875, 1.2236328125, 1.6075439453125, 1.991455078125, 2.3753662109375, 2.75927734375, 3.1431884765625, 3.527099609375, 3.9110107421875, 4.294921875, 4.6788330078125, 5.062744140625, 5.4466552734375, 5.83056640625, 6.2144775390625, 6.598388671875, 6.9822998046875, 7.3662109375, 7.7501220703125, 8.134033203125, 8.5179443359375, 8.90185546875, 9.2857666015625, 9.669677734375, 10.0535888671875, 10.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 16.0, 13.0, 11.0, 21.0, 36.0, 46.0, 43.0, 37.0, 53.0, 51.0, 61.0, 59.0, 59.0, 58.0, 56.0, 54.0, 55.0, 45.0, 45.0, 39.0, 30.0, 27.0, 20.0, 10.0, 6.0, 11.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01171875, -3.895416259765625, -3.77911376953125, -3.662811279296875, -3.5465087890625, -3.430206298828125, -3.31390380859375, -3.197601318359375, -3.081298828125, -2.964996337890625, -2.84869384765625, -2.732391357421875, -2.6160888671875, -2.499786376953125, -2.38348388671875, -2.267181396484375, -2.15087890625, -2.034576416015625, -1.91827392578125, -1.801971435546875, -1.6856689453125, -1.569366455078125, -1.45306396484375, -1.336761474609375, -1.220458984375, -1.104156494140625, -0.98785400390625, -0.871551513671875, -0.7552490234375, -0.638946533203125, -0.52264404296875, -0.406341552734375, -0.2900390625, -0.173736572265625, -0.05743408203125, 0.058868408203125, 0.1751708984375, 0.291473388671875, 0.40777587890625, 0.524078369140625, 0.640380859375, 0.756683349609375, 0.87298583984375, 0.989288330078125, 1.1055908203125, 1.221893310546875, 1.33819580078125, 1.454498291015625, 1.57080078125, 1.687103271484375, 1.80340576171875, 1.919708251953125, 2.0360107421875, 2.152313232421875, 2.26861572265625, 2.384918212890625, 2.501220703125, 2.617523193359375, 2.73382568359375, 2.850128173828125, 2.9664306640625, 3.082733154296875, 3.19903564453125, 3.315338134765625, 3.431640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 8.0, 16.0, 16.0, 18.0, 30.0, 30.0, 42.0, 82.0, 80.0, 143.0, 264.0, 562.0, 1228.0, 2922.0, 7550.0, 20582.0, 64269.0, 429683.0, 423983.0, 63578.0, 20574.0, 7574.0, 2879.0, 1110.0, 540.0, 277.0, 169.0, 98.0, 69.0, 43.0, 36.0, 26.0, 19.0, 10.0, 10.0, 7.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.34375, -18.791015625, -18.23828125, -17.685546875, -17.1328125, -16.580078125, -16.02734375, -15.474609375, -14.921875, -14.369140625, -13.81640625, -13.263671875, -12.7109375, -12.158203125, -11.60546875, -11.052734375, -10.5, -9.947265625, -9.39453125, -8.841796875, -8.2890625, -7.736328125, -7.18359375, -6.630859375, -6.078125, -5.525390625, -4.97265625, -4.419921875, -3.8671875, -3.314453125, -2.76171875, -2.208984375, -1.65625, -1.103515625, -0.55078125, 0.001953125, 0.5546875, 1.107421875, 1.66015625, 2.212890625, 2.765625, 3.318359375, 3.87109375, 4.423828125, 4.9765625, 5.529296875, 6.08203125, 6.634765625, 7.1875, 7.740234375, 8.29296875, 8.845703125, 9.3984375, 9.951171875, 10.50390625, 11.056640625, 11.609375, 12.162109375, 12.71484375, 13.267578125, 13.8203125, 14.373046875, 14.92578125, 15.478515625, 16.03125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 4.0, 10.0, 9.0, 7.0, 13.0, 17.0, 25.0, 16.0, 29.0, 31.0, 45.0, 42.0, 44.0, 53.0, 52.0, 57.0, 67.0, 46.0, 50.0, 47.0, 44.0, 50.0, 47.0, 23.0, 31.0, 18.0, 22.0, 18.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.146484375, -11.73046875, -11.314453125, -10.8984375, -10.482421875, -10.06640625, -9.650390625, -9.234375, -8.818359375, -8.40234375, -7.986328125, -7.5703125, -7.154296875, -6.73828125, -6.322265625, -5.90625, -5.490234375, -5.07421875, -4.658203125, -4.2421875, -3.826171875, -3.41015625, -2.994140625, -2.578125, -2.162109375, -1.74609375, -1.330078125, -0.9140625, -0.498046875, -0.08203125, 0.333984375, 0.75, 1.166015625, 1.58203125, 1.998046875, 2.4140625, 2.830078125, 3.24609375, 3.662109375, 4.078125, 4.494140625, 4.91015625, 5.326171875, 5.7421875, 6.158203125, 6.57421875, 6.990234375, 7.40625, 7.822265625, 8.23828125, 8.654296875, 9.0703125, 9.486328125, 9.90234375, 10.318359375, 10.734375, 11.150390625, 11.56640625, 11.982421875, 12.3984375, 12.814453125, 13.23046875, 13.646484375, 14.0625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 9.0, 21.0, 25.0, 39.0, 72.0, 119.0, 301.0, 636.0, 1920.0, 5702.0, 18623.0, 59382.0, 499081.0, 385433.0, 52698.0, 16613.0, 5124.0, 1585.0, 670.0, 258.0, 100.0, 58.0, 28.0, 19.0, 20.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.13330078125, -4.8759765625, -4.61865234375, -4.361328125, -4.10400390625, -3.8466796875, -3.58935546875, -3.33203125, -3.07470703125, -2.8173828125, -2.56005859375, -2.302734375, -2.04541015625, -1.7880859375, -1.53076171875, -1.2734375, -1.01611328125, -0.7587890625, -0.50146484375, -0.244140625, 0.01318359375, 0.2705078125, 0.52783203125, 0.78515625, 1.04248046875, 1.2998046875, 1.55712890625, 1.814453125, 2.07177734375, 2.3291015625, 2.58642578125, 2.84375, 3.10107421875, 3.3583984375, 3.61572265625, 3.873046875, 4.13037109375, 4.3876953125, 4.64501953125, 4.90234375, 5.15966796875, 5.4169921875, 5.67431640625, 5.931640625, 6.18896484375, 6.4462890625, 6.70361328125, 6.9609375, 7.21826171875, 7.4755859375, 7.73291015625, 7.990234375, 8.24755859375, 8.5048828125, 8.76220703125, 9.01953125, 9.27685546875, 9.5341796875, 9.79150390625, 10.048828125, 10.30615234375, 10.5634765625, 10.82080078125, 11.078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 10.0, 8.0, 20.0, 23.0, 22.0, 47.0, 252.0, 383.0, 99.0, 37.0, 22.0, 15.0, 11.0, 13.0, 13.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013904571533203125, -0.0012923777103424072, -0.001194298267364502, -0.0010962188243865967, -0.0009981393814086914, -0.0009000599384307861, -0.0008019804954528809, -0.0007039010524749756, -0.0006058216094970703, -0.000507742166519165, -0.00040966272354125977, -0.0003115832805633545, -0.00021350383758544922, -0.00011542439460754395, -1.7344951629638672e-05, 8.07344913482666e-05, 0.00017881393432617188, 0.00027689337730407715, 0.0003749728202819824, 0.0004730522632598877, 0.000571131706237793, 0.0006692111492156982, 0.0007672905921936035, 0.0008653700351715088, 0.0009634494781494141, 0.0010615289211273193, 0.0011596083641052246, 0.0012576878070831299, 0.0013557672500610352, 0.0014538466930389404, 0.0015519261360168457, 0.001650005578994751, 0.0017480850219726562, 0.0018461644649505615, 0.0019442439079284668, 0.002042323350906372, 0.0021404027938842773, 0.0022384822368621826, 0.002336561679840088, 0.002434641122817993, 0.0025327205657958984, 0.0026308000087738037, 0.002728879451751709, 0.0028269588947296143, 0.0029250383377075195, 0.003023117780685425, 0.00312119722366333, 0.0032192766666412354, 0.0033173561096191406, 0.003415435552597046, 0.003513514995574951, 0.0036115944385528564, 0.0037096738815307617, 0.003807753324508667, 0.0039058327674865723, 0.0040039122104644775, 0.004101991653442383, 0.004200071096420288, 0.004298150539398193, 0.004396229982376099, 0.004494309425354004, 0.004592388868331909, 0.0046904683113098145, 0.00478854775428772, 0.004886627197265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 14.0, 35.0, 26.0, 69.0, 99.0, 209.0, 375.0, 762.0, 2156.0, 6662.0, 22826.0, 90831.0, 765097.0, 120273.0, 26977.0, 7859.0, 2512.0, 910.0, 367.0, 179.0, 104.0, 68.0, 42.0, 30.0, 17.0, 10.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.25091552734375, -9.9705810546875, -9.69024658203125, -9.409912109375, -9.12957763671875, -8.8492431640625, -8.56890869140625, -8.28857421875, -8.00823974609375, -7.7279052734375, -7.44757080078125, -7.167236328125, -6.88690185546875, -6.6065673828125, -6.32623291015625, -6.0458984375, -5.76556396484375, -5.4852294921875, -5.20489501953125, -4.924560546875, -4.64422607421875, -4.3638916015625, -4.08355712890625, -3.80322265625, -3.52288818359375, -3.2425537109375, -2.96221923828125, -2.681884765625, -2.40155029296875, -2.1212158203125, -1.84088134765625, -1.560546875, -1.28021240234375, -0.9998779296875, -0.71954345703125, -0.439208984375, -0.15887451171875, 0.1214599609375, 0.40179443359375, 0.68212890625, 0.96246337890625, 1.2427978515625, 1.52313232421875, 1.803466796875, 2.08380126953125, 2.3641357421875, 2.64447021484375, 2.9248046875, 3.20513916015625, 3.4854736328125, 3.76580810546875, 4.046142578125, 4.32647705078125, 4.6068115234375, 4.88714599609375, 5.16748046875, 5.44781494140625, 5.7281494140625, 6.00848388671875, 6.288818359375, 6.56915283203125, 6.8494873046875, 7.12982177734375, 7.41015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 11.0, 16.0, 20.0, 33.0, 38.0, 108.0, 184.0, 242.0, 145.0, 65.0, 30.0, 24.0, 15.0, 15.0, 10.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.21875, -10.96484375, -10.7109375, -10.45703125, -10.203125, -9.94921875, -9.6953125, -9.44140625, -9.1875, -8.93359375, -8.6796875, -8.42578125, -8.171875, -7.91796875, -7.6640625, -7.41015625, -7.15625, -6.90234375, -6.6484375, -6.39453125, -6.140625, -5.88671875, -5.6328125, -5.37890625, -5.125, -4.87109375, -4.6171875, -4.36328125, -4.109375, -3.85546875, -3.6015625, -3.34765625, -3.09375, -2.83984375, -2.5859375, -2.33203125, -2.078125, -1.82421875, -1.5703125, -1.31640625, -1.0625, -0.80859375, -0.5546875, -0.30078125, -0.046875, 0.20703125, 0.4609375, 0.71484375, 0.96875, 1.22265625, 1.4765625, 1.73046875, 1.984375, 2.23828125, 2.4921875, 2.74609375, 3.0, 3.25390625, 3.5078125, 3.76171875, 4.015625, 4.26953125, 4.5234375, 4.77734375, 5.03125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 16.0, 21.0, 33.0, 44.0, 59.0, 104.0, 109.0, 117.0, 123.0, 103.0, 84.0, 59.0, 38.0, 27.0, 26.0, 19.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.19029235839844, -64.12901306152344, -61.06774139404297, -58.006465911865234, -54.9451904296875, -51.883914947509766, -48.82263946533203, -45.76136016845703, -42.70008850097656, -39.63881301879883, -36.577537536621094, -33.51626205444336, -30.454986572265625, -27.39371109008789, -24.332433700561523, -21.27115821838379, -18.209880828857422, -15.148605346679688, -12.087329864501953, -9.026053428649902, -5.964777946472168, -2.9035024642944336, 0.1577739715576172, 3.2190494537353516, 6.280324935913086, 9.34160041809082, 12.402875900268555, 15.464152336120605, 18.525428771972656, 21.58670425415039, 24.647979736328125, 27.70925521850586, 30.770530700683594, 33.83180618286133, 36.89308166503906, 39.9543571472168, 43.01563262939453, 46.076908111572266, 49.13818359375, 52.199462890625, 55.26073455810547, 58.3220100402832, 61.38328552246094, 64.44456481933594, 67.5058364868164, 70.5671157836914, 73.62838745117188, 76.68966674804688, 79.75094604492188, 82.81222534179688, 85.87349700927734, 88.93477630615234, 91.99604797363281, 95.05732727050781, 98.11859893798828, 101.17987823486328, 104.24114990234375, 107.30242919921875, 110.36370086669922, 113.42498016357422, 116.48625183105469, 119.54753112792969, 122.60880279541016, 125.67008209228516, 128.73135375976562]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 5.0, 6.0, 5.0, 9.0, 8.0, 13.0, 9.0, 16.0, 20.0, 23.0, 26.0, 33.0, 33.0, 28.0, 30.0, 38.0, 41.0, 30.0, 44.0, 49.0, 48.0, 46.0, 38.0, 50.0, 49.0, 40.0, 34.0, 27.0, 25.0, 26.0, 29.0, 23.0, 15.0, 18.0, 19.0, 8.0, 11.0, 5.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.872650146484375, -56.1311149597168, -54.38957595825195, -52.648040771484375, -50.90650177001953, -49.16496658325195, -47.423431396484375, -45.68189239501953, -43.94035720825195, -42.198822021484375, -40.45728302001953, -38.71574783325195, -36.974212646484375, -35.23267364501953, -33.49113845825195, -31.749601364135742, -30.00806427001953, -28.26652717590332, -26.52499008178711, -24.78345489501953, -23.04191780090332, -21.30038070678711, -19.55884552001953, -17.81730842590332, -16.07577133178711, -14.334234237670898, -12.592698097229004, -10.85116195678711, -9.109624862670898, -7.3680877685546875, -5.626551628112793, -3.8850154876708984, -2.143482208251953, -0.4019455909729004, 1.3395910263061523, 3.081127643585205, 4.822664260864258, 6.564201354980469, 8.305737495422363, 10.047273635864258, 11.788810729980469, 13.53034782409668, 15.271883964538574, 17.01342010498047, 18.75495719909668, 20.49649429321289, 22.23802947998047, 23.97956657409668, 25.72110366821289, 27.4626407623291, 29.204177856445312, 30.94571304321289, 32.68724822998047, 34.42878723144531, 36.17032241821289, 37.91185760498047, 39.65339660644531, 41.39493179321289, 43.136470794677734, 44.87800598144531, 46.619544982910156, 48.361080169677734, 50.10261535644531, 51.844154357910156, 53.585689544677734]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 2.0, 11.0, 4.0, 12.0, 22.0, 22.0, 28.0, 61.0, 85.0, 139.0, 235.0, 321.0, 609.0, 1048.0, 2047.0, 4037.0, 8232.0, 19156.0, 53166.0, 239539.0, 3369557.0, 383114.0, 69541.0, 23406.0, 9923.0, 4797.0, 2287.0, 1216.0, 720.0, 376.0, 220.0, 116.0, 79.0, 58.0, 30.0, 16.0, 18.0, 10.0, 6.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.453125, -17.904052734375, -17.35498046875, -16.805908203125, -16.2568359375, -15.707763671875, -15.15869140625, -14.609619140625, -14.060546875, -13.511474609375, -12.96240234375, -12.413330078125, -11.8642578125, -11.315185546875, -10.76611328125, -10.217041015625, -9.66796875, -9.118896484375, -8.56982421875, -8.020751953125, -7.4716796875, -6.922607421875, -6.37353515625, -5.824462890625, -5.275390625, -4.726318359375, -4.17724609375, -3.628173828125, -3.0791015625, -2.530029296875, -1.98095703125, -1.431884765625, -0.8828125, -0.333740234375, 0.21533203125, 0.764404296875, 1.3134765625, 1.862548828125, 2.41162109375, 2.960693359375, 3.509765625, 4.058837890625, 4.60791015625, 5.156982421875, 5.7060546875, 6.255126953125, 6.80419921875, 7.353271484375, 7.90234375, 8.451416015625, 9.00048828125, 9.549560546875, 10.0986328125, 10.647705078125, 11.19677734375, 11.745849609375, 12.294921875, 12.843994140625, 13.39306640625, 13.942138671875, 14.4912109375, 15.040283203125, 15.58935546875, 16.138427734375, 16.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 11.0, 18.0, 27.0, 31.0, 32.0, 43.0, 47.0, 40.0, 61.0, 60.0, 70.0, 71.0, 54.0, 51.0, 58.0, 57.0, 51.0, 45.0, 34.0, 29.0, 32.0, 18.0, 16.0, 5.0, 6.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.8824462890625, -4.749267578125, -4.6160888671875, -4.48291015625, -4.3497314453125, -4.216552734375, -4.0833740234375, -3.9501953125, -3.8170166015625, -3.683837890625, -3.5506591796875, -3.41748046875, -3.2843017578125, -3.151123046875, -3.0179443359375, -2.884765625, -2.7515869140625, -2.618408203125, -2.4852294921875, -2.35205078125, -2.2188720703125, -2.085693359375, -1.9525146484375, -1.8193359375, -1.6861572265625, -1.552978515625, -1.4197998046875, -1.28662109375, -1.1534423828125, -1.020263671875, -0.8870849609375, -0.75390625, -0.6207275390625, -0.487548828125, -0.3543701171875, -0.22119140625, -0.0880126953125, 0.045166015625, 0.1783447265625, 0.3115234375, 0.4447021484375, 0.577880859375, 0.7110595703125, 0.84423828125, 0.9774169921875, 1.110595703125, 1.2437744140625, 1.376953125, 1.5101318359375, 1.643310546875, 1.7764892578125, 1.90966796875, 2.0428466796875, 2.176025390625, 2.3092041015625, 2.4423828125, 2.5755615234375, 2.708740234375, 2.8419189453125, 2.97509765625, 3.1082763671875, 3.241455078125, 3.3746337890625, 3.5078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 16.0, 21.0, 14.0, 31.0, 72.0, 94.0, 148.0, 287.0, 504.0, 848.0, 1484.0, 3053.0, 6121.0, 13811.0, 35051.0, 117224.0, 809706.0, 2903752.0, 211922.0, 54005.0, 19325.0, 8424.0, 3993.0, 1995.0, 1057.0, 584.0, 292.0, 198.0, 109.0, 60.0, 28.0, 24.0, 14.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.731689453125, -13.24462890625, -12.757568359375, -12.2705078125, -11.783447265625, -11.29638671875, -10.809326171875, -10.322265625, -9.835205078125, -9.34814453125, -8.861083984375, -8.3740234375, -7.886962890625, -7.39990234375, -6.912841796875, -6.42578125, -5.938720703125, -5.45166015625, -4.964599609375, -4.4775390625, -3.990478515625, -3.50341796875, -3.016357421875, -2.529296875, -2.042236328125, -1.55517578125, -1.068115234375, -0.5810546875, -0.093994140625, 0.39306640625, 0.880126953125, 1.3671875, 1.854248046875, 2.34130859375, 2.828369140625, 3.3154296875, 3.802490234375, 4.28955078125, 4.776611328125, 5.263671875, 5.750732421875, 6.23779296875, 6.724853515625, 7.2119140625, 7.698974609375, 8.18603515625, 8.673095703125, 9.16015625, 9.647216796875, 10.13427734375, 10.621337890625, 11.1083984375, 11.595458984375, 12.08251953125, 12.569580078125, 13.056640625, 13.543701171875, 14.03076171875, 14.517822265625, 15.0048828125, 15.491943359375, 15.97900390625, 16.466064453125, 16.953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 13.0, 7.0, 9.0, 11.0, 20.0, 23.0, 28.0, 35.0, 69.0, 108.0, 157.0, 269.0, 669.0, 1477.0, 473.0, 226.0, 116.0, 104.0, 76.0, 29.0, 35.0, 24.0, 13.0, 9.0, 9.0, 9.0, 13.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.51953125, -6.32415771484375, -6.1287841796875, -5.93341064453125, -5.738037109375, -5.54266357421875, -5.3472900390625, -5.15191650390625, -4.95654296875, -4.76116943359375, -4.5657958984375, -4.37042236328125, -4.175048828125, -3.97967529296875, -3.7843017578125, -3.58892822265625, -3.3935546875, -3.19818115234375, -3.0028076171875, -2.80743408203125, -2.612060546875, -2.41668701171875, -2.2213134765625, -2.02593994140625, -1.83056640625, -1.63519287109375, -1.4398193359375, -1.24444580078125, -1.049072265625, -0.85369873046875, -0.6583251953125, -0.46295166015625, -0.267578125, -0.07220458984375, 0.1231689453125, 0.31854248046875, 0.513916015625, 0.70928955078125, 0.9046630859375, 1.10003662109375, 1.29541015625, 1.49078369140625, 1.6861572265625, 1.88153076171875, 2.076904296875, 2.27227783203125, 2.4676513671875, 2.66302490234375, 2.8583984375, 3.05377197265625, 3.2491455078125, 3.44451904296875, 3.639892578125, 3.83526611328125, 4.0306396484375, 4.22601318359375, 4.42138671875, 4.61676025390625, 4.8121337890625, 5.00750732421875, 5.202880859375, 5.39825439453125, 5.5936279296875, 5.78900146484375, 5.984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 26.0, 78.0, 181.0, 263.0, 250.0, 137.0, 38.0, 10.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.16787719726562, -127.96488952636719, -124.76190185546875, -121.55892181396484, -118.3559341430664, -115.15294647216797, -111.94995880126953, -108.74697875976562, -105.54399108886719, -102.34100341796875, -99.13801574707031, -95.9350357055664, -92.73204803466797, -89.52906036376953, -86.3260726928711, -83.12309265136719, -79.92010498046875, -76.71711730957031, -73.51412963867188, -70.31114959716797, -67.10816192626953, -63.905174255371094, -60.702186584472656, -57.499202728271484, -54.29621124267578, -51.093223571777344, -47.89023971557617, -44.687252044677734, -41.48426818847656, -38.281280517578125, -35.07829284667969, -31.875308990478516, -28.672325134277344, -25.46933937072754, -22.266353607177734, -19.063365936279297, -15.860381126403809, -12.657394409179688, -9.454408645629883, -6.251422882080078, -3.0484371185302734, 0.15454888343811035, 3.357534885406494, 6.560521125793457, 9.763506889343262, 12.966493606567383, 16.169479370117188, 19.372465133666992, 22.575450897216797, 25.7784366607666, 28.981422424316406, 32.184410095214844, 35.387393951416016, 38.59038162231445, 41.793365478515625, 44.99635314941406, 48.1993408203125, 51.40232849121094, 54.60531234741211, 57.80830001831055, 61.01128387451172, 64.21427154541016, 67.4172592163086, 70.6202392578125, 73.82322692871094]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 1.0, 5.0, 8.0, 12.0, 15.0, 11.0, 22.0, 25.0, 36.0, 43.0, 36.0, 38.0, 53.0, 55.0, 66.0, 71.0, 55.0, 66.0, 51.0, 43.0, 32.0, 41.0, 51.0, 38.0, 23.0, 20.0, 17.0, 18.0, 14.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.87667465209961, -30.93840217590332, -30.0001277923584, -29.06185531616211, -28.123580932617188, -27.1853084564209, -26.24703598022461, -25.308761596679688, -24.370487213134766, -23.432214736938477, -22.493940353393555, -21.555667877197266, -20.617393493652344, -19.679121017456055, -18.740848541259766, -17.802574157714844, -16.864301681518555, -15.92602825164795, -14.987754821777344, -14.049482345581055, -13.111207962036133, -12.172935485839844, -11.234662055969238, -10.296388626098633, -9.358115196228027, -8.419841766357422, -7.481568336486816, -6.543295383453369, -5.605021953582764, -4.666748523712158, -3.728475570678711, -2.7902021408081055, -1.8519287109375, -0.9136554002761841, 0.024617910385131836, 0.9628911018371582, 1.9011645317077637, 2.839437961578369, 3.7777109146118164, 4.715984344482422, 5.654257774353027, 6.592531204223633, 7.530804634094238, 8.469078063964844, 9.407350540161133, 10.345624923706055, 11.283897399902344, 12.22217082977295, 13.160444259643555, 14.09871768951416, 15.036991119384766, 15.975263595581055, 16.913537979125977, 17.851810455322266, 18.790084838867188, 19.728357315063477, 20.666629791259766, 21.604902267456055, 22.543176651000977, 23.481449127197266, 24.419723510742188, 25.357995986938477, 26.296268463134766, 27.234542846679688, 28.17281723022461]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 16.0, 22.0, 35.0, 56.0, 99.0, 197.0, 332.0, 666.0, 1351.0, 2971.0, 7591.0, 19788.0, 53273.0, 132387.0, 353033.0, 294993.0, 110141.0, 44071.0, 16401.0, 6259.0, 2485.0, 1109.0, 548.0, 294.0, 176.0, 83.0, 54.0, 30.0, 31.0, 16.0, 10.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.6875, -16.22265625, -15.7578125, -15.29296875, -14.828125, -14.36328125, -13.8984375, -13.43359375, -12.96875, -12.50390625, -12.0390625, -11.57421875, -11.109375, -10.64453125, -10.1796875, -9.71484375, -9.25, -8.78515625, -8.3203125, -7.85546875, -7.390625, -6.92578125, -6.4609375, -5.99609375, -5.53125, -5.06640625, -4.6015625, -4.13671875, -3.671875, -3.20703125, -2.7421875, -2.27734375, -1.8125, -1.34765625, -0.8828125, -0.41796875, 0.046875, 0.51171875, 0.9765625, 1.44140625, 1.90625, 2.37109375, 2.8359375, 3.30078125, 3.765625, 4.23046875, 4.6953125, 5.16015625, 5.625, 6.08984375, 6.5546875, 7.01953125, 7.484375, 7.94921875, 8.4140625, 8.87890625, 9.34375, 9.80859375, 10.2734375, 10.73828125, 11.203125, 11.66796875, 12.1328125, 12.59765625, 13.0625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 13.0, 16.0, 18.0, 21.0, 32.0, 46.0, 48.0, 55.0, 61.0, 49.0, 61.0, 66.0, 64.0, 56.0, 59.0, 51.0, 62.0, 49.0, 47.0, 32.0, 17.0, 22.0, 14.0, 10.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.564208984375, -4.42529296875, -4.286376953125, -4.1474609375, -4.008544921875, -3.86962890625, -3.730712890625, -3.591796875, -3.452880859375, -3.31396484375, -3.175048828125, -3.0361328125, -2.897216796875, -2.75830078125, -2.619384765625, -2.48046875, -2.341552734375, -2.20263671875, -2.063720703125, -1.9248046875, -1.785888671875, -1.64697265625, -1.508056640625, -1.369140625, -1.230224609375, -1.09130859375, -0.952392578125, -0.8134765625, -0.674560546875, -0.53564453125, -0.396728515625, -0.2578125, -0.118896484375, 0.02001953125, 0.158935546875, 0.2978515625, 0.436767578125, 0.57568359375, 0.714599609375, 0.853515625, 0.992431640625, 1.13134765625, 1.270263671875, 1.4091796875, 1.548095703125, 1.68701171875, 1.825927734375, 1.96484375, 2.103759765625, 2.24267578125, 2.381591796875, 2.5205078125, 2.659423828125, 2.79833984375, 2.937255859375, 3.076171875, 3.215087890625, 3.35400390625, 3.492919921875, 3.6318359375, 3.770751953125, 3.90966796875, 4.048583984375, 4.1875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 12.0, 22.0, 30.0, 44.0, 58.0, 78.0, 118.0, 115.0, 227.0, 307.0, 487.0, 784.0, 1540.0, 4126.0, 17961.0, 87702.0, 456090.0, 382351.0, 74120.0, 15198.0, 3663.0, 1325.0, 697.0, 466.0, 319.0, 196.0, 164.0, 82.0, 64.0, 52.0, 41.0, 21.0, 26.0, 13.0, 9.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.962646484375, -17.36279296875, -16.762939453125, -16.1630859375, -15.563232421875, -14.96337890625, -14.363525390625, -13.763671875, -13.163818359375, -12.56396484375, -11.964111328125, -11.3642578125, -10.764404296875, -10.16455078125, -9.564697265625, -8.96484375, -8.364990234375, -7.76513671875, -7.165283203125, -6.5654296875, -5.965576171875, -5.36572265625, -4.765869140625, -4.166015625, -3.566162109375, -2.96630859375, -2.366455078125, -1.7666015625, -1.166748046875, -0.56689453125, 0.032958984375, 0.6328125, 1.232666015625, 1.83251953125, 2.432373046875, 3.0322265625, 3.632080078125, 4.23193359375, 4.831787109375, 5.431640625, 6.031494140625, 6.63134765625, 7.231201171875, 7.8310546875, 8.430908203125, 9.03076171875, 9.630615234375, 10.23046875, 10.830322265625, 11.43017578125, 12.030029296875, 12.6298828125, 13.229736328125, 13.82958984375, 14.429443359375, 15.029296875, 15.629150390625, 16.22900390625, 16.828857421875, 17.4287109375, 18.028564453125, 18.62841796875, 19.228271484375, 19.828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 8.0, 15.0, 15.0, 17.0, 31.0, 30.0, 21.0, 39.0, 35.0, 47.0, 32.0, 42.0, 55.0, 65.0, 41.0, 50.0, 61.0, 41.0, 57.0, 44.0, 34.0, 31.0, 39.0, 27.0, 27.0, 16.0, 12.0, 16.0, 2.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.875, -17.3690185546875, -16.863037109375, -16.3570556640625, -15.85107421875, -15.3450927734375, -14.839111328125, -14.3331298828125, -13.8271484375, -13.3211669921875, -12.815185546875, -12.3092041015625, -11.80322265625, -11.2972412109375, -10.791259765625, -10.2852783203125, -9.779296875, -9.2733154296875, -8.767333984375, -8.2613525390625, -7.75537109375, -7.2493896484375, -6.743408203125, -6.2374267578125, -5.7314453125, -5.2254638671875, -4.719482421875, -4.2135009765625, -3.70751953125, -3.2015380859375, -2.695556640625, -2.1895751953125, -1.68359375, -1.1776123046875, -0.671630859375, -0.1656494140625, 0.34033203125, 0.8463134765625, 1.352294921875, 1.8582763671875, 2.3642578125, 2.8702392578125, 3.376220703125, 3.8822021484375, 4.38818359375, 4.8941650390625, 5.400146484375, 5.9061279296875, 6.412109375, 6.9180908203125, 7.424072265625, 7.9300537109375, 8.43603515625, 8.9420166015625, 9.447998046875, 9.9539794921875, 10.4599609375, 10.9659423828125, 11.471923828125, 11.9779052734375, 12.48388671875, 12.9898681640625, 13.495849609375, 14.0018310546875, 14.5078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 11.0, 15.0, 26.0, 35.0, 64.0, 117.0, 181.0, 420.0, 1007.0, 2732.0, 9164.0, 36757.0, 147573.0, 580930.0, 200705.0, 50476.0, 12554.0, 3562.0, 1200.0, 477.0, 233.0, 147.0, 64.0, 34.0, 26.0, 16.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.08331298828125, -6.7955322265625, -6.50775146484375, -6.219970703125, -5.93218994140625, -5.6444091796875, -5.35662841796875, -5.06884765625, -4.78106689453125, -4.4932861328125, -4.20550537109375, -3.917724609375, -3.62994384765625, -3.3421630859375, -3.05438232421875, -2.7666015625, -2.47882080078125, -2.1910400390625, -1.90325927734375, -1.615478515625, -1.32769775390625, -1.0399169921875, -0.75213623046875, -0.46435546875, -0.17657470703125, 0.1112060546875, 0.39898681640625, 0.686767578125, 0.97454833984375, 1.2623291015625, 1.55010986328125, 1.837890625, 2.12567138671875, 2.4134521484375, 2.70123291015625, 2.989013671875, 3.27679443359375, 3.5645751953125, 3.85235595703125, 4.14013671875, 4.42791748046875, 4.7156982421875, 5.00347900390625, 5.291259765625, 5.57904052734375, 5.8668212890625, 6.15460205078125, 6.4423828125, 6.73016357421875, 7.0179443359375, 7.30572509765625, 7.593505859375, 7.88128662109375, 8.1690673828125, 8.45684814453125, 8.74462890625, 9.03240966796875, 9.3201904296875, 9.60797119140625, 9.895751953125, 10.18353271484375, 10.4713134765625, 10.75909423828125, 11.046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 4.0, 2.0, 4.0, 6.0, 12.0, 8.0, 17.0, 12.0, 19.0, 11.0, 17.0, 21.0, 25.0, 34.0, 45.0, 43.0, 67.0, 147.0, 121.0, 76.0, 48.0, 34.0, 28.0, 27.0, 20.0, 25.0, 14.0, 12.0, 16.0, 12.0, 4.0, 13.0, 6.0, 10.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001369476318359375, -0.0013265162706375122, -0.0012835562229156494, -0.0012405961751937866, -0.0011976361274719238, -0.001154676079750061, -0.0011117160320281982, -0.0010687559843063354, -0.0010257959365844727, -0.0009828358888626099, -0.0009398758411407471, -0.0008969157934188843, -0.0008539557456970215, -0.0008109956979751587, -0.0007680356502532959, -0.0007250756025314331, -0.0006821155548095703, -0.0006391555070877075, -0.0005961954593658447, -0.0005532354116439819, -0.0005102753639221191, -0.00046731531620025635, -0.00042435526847839355, -0.00038139522075653076, -0.00033843517303466797, -0.0002954751253128052, -0.0002525150775909424, -0.0002095550298690796, -0.0001665949821472168, -0.000123634934425354, -8.067488670349121e-05, -3.771483898162842e-05, 5.245208740234375e-06, 4.820525646209717e-05, 9.116530418395996e-05, 0.00013412535190582275, 0.00017708539962768555, 0.00022004544734954834, 0.00026300549507141113, 0.0003059655427932739, 0.0003489255905151367, 0.0003918856382369995, 0.0004348456859588623, 0.0004778057336807251, 0.0005207657814025879, 0.0005637258291244507, 0.0006066858768463135, 0.0006496459245681763, 0.0006926059722900391, 0.0007355660200119019, 0.0007785260677337646, 0.0008214861154556274, 0.0008644461631774902, 0.000907406210899353, 0.0009503662586212158, 0.0009933263063430786, 0.0010362863540649414, 0.0010792464017868042, 0.001122206449508667, 0.0011651664972305298, 0.0012081265449523926, 0.0012510865926742554, 0.0012940466403961182, 0.001337006688117981, 0.0013799667358398438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 15.0, 21.0, 30.0, 57.0, 81.0, 153.0, 256.0, 406.0, 802.0, 1825.0, 5432.0, 21310.0, 105514.0, 567489.0, 276343.0, 51783.0, 11191.0, 3211.0, 1228.0, 596.0, 325.0, 180.0, 91.0, 64.0, 29.0, 29.0, 24.0, 18.0, 7.0, 7.0, 6.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.84619140625, -10.5048828125, -10.16357421875, -9.822265625, -9.48095703125, -9.1396484375, -8.79833984375, -8.45703125, -8.11572265625, -7.7744140625, -7.43310546875, -7.091796875, -6.75048828125, -6.4091796875, -6.06787109375, -5.7265625, -5.38525390625, -5.0439453125, -4.70263671875, -4.361328125, -4.02001953125, -3.6787109375, -3.33740234375, -2.99609375, -2.65478515625, -2.3134765625, -1.97216796875, -1.630859375, -1.28955078125, -0.9482421875, -0.60693359375, -0.265625, 0.07568359375, 0.4169921875, 0.75830078125, 1.099609375, 1.44091796875, 1.7822265625, 2.12353515625, 2.46484375, 2.80615234375, 3.1474609375, 3.48876953125, 3.830078125, 4.17138671875, 4.5126953125, 4.85400390625, 5.1953125, 5.53662109375, 5.8779296875, 6.21923828125, 6.560546875, 6.90185546875, 7.2431640625, 7.58447265625, 7.92578125, 8.26708984375, 8.6083984375, 8.94970703125, 9.291015625, 9.63232421875, 9.9736328125, 10.31494140625, 10.65625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 6.0, 5.0, 3.0, 7.0, 6.0, 7.0, 9.0, 13.0, 14.0, 28.0, 23.0, 30.0, 30.0, 48.0, 54.0, 64.0, 85.0, 90.0, 103.0, 85.0, 40.0, 44.0, 35.0, 33.0, 26.0, 21.0, 17.0, 12.0, 13.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.78497314453125, -4.5738525390625, -4.36273193359375, -4.151611328125, -3.94049072265625, -3.7293701171875, -3.51824951171875, -3.30712890625, -3.09600830078125, -2.8848876953125, -2.67376708984375, -2.462646484375, -2.25152587890625, -2.0404052734375, -1.82928466796875, -1.6181640625, -1.40704345703125, -1.1959228515625, -0.98480224609375, -0.773681640625, -0.56256103515625, -0.3514404296875, -0.14031982421875, 0.07080078125, 0.28192138671875, 0.4930419921875, 0.70416259765625, 0.915283203125, 1.12640380859375, 1.3375244140625, 1.54864501953125, 1.759765625, 1.97088623046875, 2.1820068359375, 2.39312744140625, 2.604248046875, 2.81536865234375, 3.0264892578125, 3.23760986328125, 3.44873046875, 3.65985107421875, 3.8709716796875, 4.08209228515625, 4.293212890625, 4.50433349609375, 4.7154541015625, 4.92657470703125, 5.1376953125, 5.34881591796875, 5.5599365234375, 5.77105712890625, 5.982177734375, 6.19329833984375, 6.4044189453125, 6.61553955078125, 6.82666015625, 7.03778076171875, 7.2489013671875, 7.46002197265625, 7.671142578125, 7.88226318359375, 8.0933837890625, 8.30450439453125, 8.515625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 11.0, 28.0, 53.0, 104.0, 157.0, 185.0, 158.0, 144.0, 88.0, 37.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.6143341064453, -236.9787139892578, -231.3430938720703, -225.7074737548828, -220.0718536376953, -214.4362335205078, -208.8006134033203, -203.1649932861328, -197.5293731689453, -191.8937530517578, -186.2581329345703, -180.6225128173828, -174.9868927001953, -169.3512725830078, -163.7156524658203, -158.0800323486328, -152.44439697265625, -146.80877685546875, -141.17315673828125, -135.53753662109375, -129.90191650390625, -124.26629638671875, -118.63067626953125, -112.99505615234375, -107.35943603515625, -101.72381591796875, -96.08819580078125, -90.45257568359375, -84.81695556640625, -79.18133544921875, -73.54571533203125, -67.91009521484375, -62.27446746826172, -56.63884735107422, -51.00322723388672, -45.36760711669922, -39.73198699951172, -34.09636688232422, -28.460742950439453, -22.825122833251953, -17.189502716064453, -11.553882598876953, -5.918261528015137, -0.2826404571533203, 5.35297966003418, 10.98859977722168, 16.624221801757812, 22.259841918945312, 27.895462036132812, 33.53108215332031, 39.16670227050781, 44.80232238769531, 50.43794250488281, 56.07356262207031, 61.70918655395508, 67.34480285644531, 72.98042297363281, 78.61604309082031, 84.25166320800781, 89.88728332519531, 95.52290344238281, 101.15852355957031, 106.79414367675781, 112.42976379394531, 118.06539154052734]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 8.0, 3.0, 15.0, 18.0, 14.0, 17.0, 18.0, 16.0, 23.0, 21.0, 30.0, 32.0, 30.0, 35.0, 41.0, 49.0, 44.0, 34.0, 48.0, 46.0, 39.0, 42.0, 43.0, 47.0, 35.0, 25.0, 39.0, 33.0, 30.0, 13.0, 17.0, 16.0, 18.0, 5.0, 9.0, 9.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.42166137695312, -71.0766372680664, -68.73160552978516, -66.38658142089844, -64.04154968261719, -61.69652557373047, -59.35150146484375, -57.006473541259766, -54.66144561767578, -52.3164176940918, -49.97138977050781, -47.626365661621094, -45.28133773803711, -42.936309814453125, -40.591285705566406, -38.24625778198242, -35.90122985839844, -33.55620193481445, -31.2111759185791, -28.86614990234375, -26.521121978759766, -24.17609405517578, -21.83106803894043, -19.486042022705078, -17.141014099121094, -14.795987129211426, -12.450960159301758, -10.10593318939209, -7.760906219482422, -5.415879249572754, -3.070852279663086, -0.7258262634277344, 1.6192092895507812, 3.964236259460449, 6.309263229370117, 8.654290199279785, 10.999317169189453, 13.344344139099121, 15.689371109008789, 18.03439712524414, 20.379425048828125, 22.72445297241211, 25.06947898864746, 27.414505004882812, 29.759532928466797, 32.10456085205078, 34.4495849609375, 36.794612884521484, 39.13964080810547, 41.48466873168945, 43.82969665527344, 46.174720764160156, 48.51974868774414, 50.864776611328125, 53.209800720214844, 55.55482864379883, 57.89985656738281, 60.2448844909668, 62.58991241455078, 64.9349365234375, 67.27996826171875, 69.62499237060547, 71.97001647949219, 74.31504821777344, 76.66007232666016]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 8.0, 8.0, 11.0, 17.0, 21.0, 22.0, 40.0, 71.0, 95.0, 148.0, 254.0, 421.0, 790.0, 1441.0, 2620.0, 5332.0, 11031.0, 25919.0, 70864.0, 267471.0, 2625719.0, 938156.0, 158296.0, 48721.0, 18928.0, 8629.0, 4269.0, 2181.0, 1152.0, 700.0, 374.0, 221.0, 142.0, 74.0, 56.0, 24.0, 17.0, 21.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1171875, -12.7293701171875, -12.341552734375, -11.9537353515625, -11.56591796875, -11.1781005859375, -10.790283203125, -10.4024658203125, -10.0146484375, -9.6268310546875, -9.239013671875, -8.8511962890625, -8.46337890625, -8.0755615234375, -7.687744140625, -7.2999267578125, -6.912109375, -6.5242919921875, -6.136474609375, -5.7486572265625, -5.36083984375, -4.9730224609375, -4.585205078125, -4.1973876953125, -3.8095703125, -3.4217529296875, -3.033935546875, -2.6461181640625, -2.25830078125, -1.8704833984375, -1.482666015625, -1.0948486328125, -0.70703125, -0.3192138671875, 0.068603515625, 0.4564208984375, 0.84423828125, 1.2320556640625, 1.619873046875, 2.0076904296875, 2.3955078125, 2.7833251953125, 3.171142578125, 3.5589599609375, 3.94677734375, 4.3345947265625, 4.722412109375, 5.1102294921875, 5.498046875, 5.8858642578125, 6.273681640625, 6.6614990234375, 7.04931640625, 7.4371337890625, 7.824951171875, 8.2127685546875, 8.6005859375, 8.9884033203125, 9.376220703125, 9.7640380859375, 10.15185546875, 10.5396728515625, 10.927490234375, 11.3153076171875, 11.703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 14.0, 9.0, 18.0, 23.0, 33.0, 31.0, 35.0, 35.0, 55.0, 50.0, 54.0, 71.0, 59.0, 65.0, 72.0, 65.0, 59.0, 46.0, 34.0, 35.0, 29.0, 25.0, 30.0, 12.0, 9.0, 7.0, 6.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.576171875, -4.4375, -4.298828125, -4.16015625, -4.021484375, -3.8828125, -3.744140625, -3.60546875, -3.466796875, -3.328125, -3.189453125, -3.05078125, -2.912109375, -2.7734375, -2.634765625, -2.49609375, -2.357421875, -2.21875, -2.080078125, -1.94140625, -1.802734375, -1.6640625, -1.525390625, -1.38671875, -1.248046875, -1.109375, -0.970703125, -0.83203125, -0.693359375, -0.5546875, -0.416015625, -0.27734375, -0.138671875, 0.0, 0.138671875, 0.27734375, 0.416015625, 0.5546875, 0.693359375, 0.83203125, 0.970703125, 1.109375, 1.248046875, 1.38671875, 1.525390625, 1.6640625, 1.802734375, 1.94140625, 2.080078125, 2.21875, 2.357421875, 2.49609375, 2.634765625, 2.7734375, 2.912109375, 3.05078125, 3.189453125, 3.328125, 3.466796875, 3.60546875, 3.744140625, 3.8828125, 4.021484375, 4.16015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 15.0, 45.0, 41.0, 81.0, 98.0, 156.0, 280.0, 459.0, 824.0, 1504.0, 2870.0, 6087.0, 13132.0, 30932.0, 83482.0, 270308.0, 1324342.0, 1954990.0, 338585.0, 100515.0, 36282.0, 15099.0, 6928.0, 3320.0, 1751.0, 882.0, 462.0, 289.0, 186.0, 106.0, 71.0, 53.0, 27.0, 17.0, 14.0, 6.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.181640625, -7.85546875, -7.529296875, -7.203125, -6.876953125, -6.55078125, -6.224609375, -5.8984375, -5.572265625, -5.24609375, -4.919921875, -4.59375, -4.267578125, -3.94140625, -3.615234375, -3.2890625, -2.962890625, -2.63671875, -2.310546875, -1.984375, -1.658203125, -1.33203125, -1.005859375, -0.6796875, -0.353515625, -0.02734375, 0.298828125, 0.625, 0.951171875, 1.27734375, 1.603515625, 1.9296875, 2.255859375, 2.58203125, 2.908203125, 3.234375, 3.560546875, 3.88671875, 4.212890625, 4.5390625, 4.865234375, 5.19140625, 5.517578125, 5.84375, 6.169921875, 6.49609375, 6.822265625, 7.1484375, 7.474609375, 7.80078125, 8.126953125, 8.453125, 8.779296875, 9.10546875, 9.431640625, 9.7578125, 10.083984375, 10.41015625, 10.736328125, 11.0625, 11.388671875, 11.71484375, 12.041015625, 12.3671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 10.0, 18.0, 20.0, 18.0, 35.0, 68.0, 95.0, 142.0, 221.0, 379.0, 886.0, 977.0, 473.0, 270.0, 167.0, 96.0, 59.0, 31.0, 29.0, 21.0, 13.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1015625, -10.8311767578125, -10.560791015625, -10.2904052734375, -10.02001953125, -9.7496337890625, -9.479248046875, -9.2088623046875, -8.9384765625, -8.6680908203125, -8.397705078125, -8.1273193359375, -7.85693359375, -7.5865478515625, -7.316162109375, -7.0457763671875, -6.775390625, -6.5050048828125, -6.234619140625, -5.9642333984375, -5.69384765625, -5.4234619140625, -5.153076171875, -4.8826904296875, -4.6123046875, -4.3419189453125, -4.071533203125, -3.8011474609375, -3.53076171875, -3.2603759765625, -2.989990234375, -2.7196044921875, -2.44921875, -2.1788330078125, -1.908447265625, -1.6380615234375, -1.36767578125, -1.0972900390625, -0.826904296875, -0.5565185546875, -0.2861328125, -0.0157470703125, 0.254638671875, 0.5250244140625, 0.79541015625, 1.0657958984375, 1.336181640625, 1.6065673828125, 1.876953125, 2.1473388671875, 2.417724609375, 2.6881103515625, 2.95849609375, 3.2288818359375, 3.499267578125, 3.7696533203125, 4.0400390625, 4.3104248046875, 4.580810546875, 4.8511962890625, 5.12158203125, 5.3919677734375, 5.662353515625, 5.9327392578125, 6.203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 17.0, 12.0, 34.0, 47.0, 69.0, 92.0, 113.0, 118.0, 130.0, 101.0, 74.0, 64.0, 41.0, 25.0, 22.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.33293914794922, -58.6876335144043, -57.04232406616211, -55.39701843261719, -53.751712799072266, -52.106407165527344, -50.461097717285156, -48.815792083740234, -47.17048645019531, -45.52518081665039, -43.8798713684082, -42.23456573486328, -40.58926010131836, -38.94395446777344, -37.29864501953125, -35.65333938598633, -34.008033752441406, -32.362728118896484, -30.71742057800293, -29.072113037109375, -27.426807403564453, -25.7814998626709, -24.136192321777344, -22.490886688232422, -20.845577239990234, -19.20026969909668, -17.554964065551758, -15.909656524658203, -14.264350891113281, -12.619043350219727, -10.973736763000488, -9.32843017578125, -7.683124542236328, -6.03781795501709, -4.392511367797852, -2.747204303741455, -1.1018977165222168, 0.5434093475341797, 2.188715934753418, 3.8340225219726562, 5.4793291091918945, 7.124635696411133, 8.769942283630371, 10.41524887084961, 12.060556411743164, 13.705862998962402, 15.35116958618164, 16.996475219726562, 18.641782760620117, 20.287090301513672, 21.932395935058594, 23.57770347595215, 25.22300910949707, 26.868316650390625, 28.513622283935547, 30.1589298248291, 31.804237365722656, 33.44954299926758, 35.094852447509766, 36.74015808105469, 38.38546371459961, 40.03076934814453, 41.67607879638672, 43.32138442993164, 44.96669006347656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 6.0, 3.0, 9.0, 9.0, 15.0, 18.0, 27.0, 17.0, 29.0, 35.0, 37.0, 39.0, 40.0, 41.0, 41.0, 55.0, 42.0, 54.0, 49.0, 43.0, 46.0, 38.0, 33.0, 47.0, 32.0, 29.0, 37.0, 19.0, 16.0, 13.0, 16.0, 11.0, 11.0, 8.0, 9.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.20871353149414, -26.219411849975586, -25.23011016845703, -24.240806579589844, -23.25150489807129, -22.262203216552734, -21.27290153503418, -20.283599853515625, -19.294296264648438, -18.304994583129883, -17.315692901611328, -16.32638931274414, -15.337087631225586, -14.347785949707031, -13.358484268188477, -12.369182586669922, -11.379880905151367, -10.390579223632812, -9.401276588439941, -8.411974906921387, -7.422672748565674, -6.433370590209961, -5.444068908691406, -4.454766750335693, -3.4654645919799805, -2.4761624336242676, -1.4868605136871338, -0.49755859375, 0.4917435646057129, 1.4810457229614258, 2.4703474044799805, 3.4596495628356934, 4.448951721191406, 5.438253879547119, 6.427556037902832, 7.416857719421387, 8.406160354614258, 9.395462036132812, 10.384763717651367, 11.374065399169922, 12.363368034362793, 13.352669715881348, 14.341972351074219, 15.331274032592773, 16.320575714111328, 17.309879302978516, 18.299179077148438, 19.288482666015625, 20.27778434753418, 21.267086029052734, 22.25638771057129, 23.245689392089844, 24.23499298095703, 25.224294662475586, 26.21359634399414, 27.202898025512695, 28.19219970703125, 29.181501388549805, 30.17080307006836, 31.160106658935547, 32.14940643310547, 33.138710021972656, 34.128013610839844, 35.117313385009766, 36.10661697387695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 8.0, 21.0, 23.0, 31.0, 46.0, 94.0, 145.0, 278.0, 469.0, 938.0, 1647.0, 3537.0, 8498.0, 20922.0, 53434.0, 130691.0, 257050.0, 287000.0, 165324.0, 70614.0, 27430.0, 11044.0, 4752.0, 2115.0, 1053.0, 617.0, 283.0, 176.0, 92.0, 64.0, 39.0, 25.0, 23.0, 12.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.9898681640625, -11.628173828125, -11.2664794921875, -10.90478515625, -10.5430908203125, -10.181396484375, -9.8197021484375, -9.4580078125, -9.0963134765625, -8.734619140625, -8.3729248046875, -8.01123046875, -7.6495361328125, -7.287841796875, -6.9261474609375, -6.564453125, -6.2027587890625, -5.841064453125, -5.4793701171875, -5.11767578125, -4.7559814453125, -4.394287109375, -4.0325927734375, -3.6708984375, -3.3092041015625, -2.947509765625, -2.5858154296875, -2.22412109375, -1.8624267578125, -1.500732421875, -1.1390380859375, -0.77734375, -0.4156494140625, -0.053955078125, 0.3077392578125, 0.66943359375, 1.0311279296875, 1.392822265625, 1.7545166015625, 2.1162109375, 2.4779052734375, 2.839599609375, 3.2012939453125, 3.56298828125, 3.9246826171875, 4.286376953125, 4.6480712890625, 5.009765625, 5.3714599609375, 5.733154296875, 6.0948486328125, 6.45654296875, 6.8182373046875, 7.179931640625, 7.5416259765625, 7.9033203125, 8.2650146484375, 8.626708984375, 8.9884033203125, 9.35009765625, 9.7117919921875, 10.073486328125, 10.4351806640625, 10.796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 3.0, 12.0, 14.0, 24.0, 23.0, 17.0, 33.0, 56.0, 38.0, 54.0, 64.0, 72.0, 60.0, 65.0, 63.0, 61.0, 59.0, 48.0, 52.0, 42.0, 43.0, 23.0, 20.0, 15.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.61004638671875, -4.4583740234375, -4.30670166015625, -4.155029296875, -4.00335693359375, -3.8516845703125, -3.70001220703125, -3.54833984375, -3.39666748046875, -3.2449951171875, -3.09332275390625, -2.941650390625, -2.78997802734375, -2.6383056640625, -2.48663330078125, -2.3349609375, -2.18328857421875, -2.0316162109375, -1.87994384765625, -1.728271484375, -1.57659912109375, -1.4249267578125, -1.27325439453125, -1.12158203125, -0.96990966796875, -0.8182373046875, -0.66656494140625, -0.514892578125, -0.36322021484375, -0.2115478515625, -0.05987548828125, 0.091796875, 0.24346923828125, 0.3951416015625, 0.54681396484375, 0.698486328125, 0.85015869140625, 1.0018310546875, 1.15350341796875, 1.30517578125, 1.45684814453125, 1.6085205078125, 1.76019287109375, 1.911865234375, 2.06353759765625, 2.2152099609375, 2.36688232421875, 2.5185546875, 2.67022705078125, 2.8218994140625, 2.97357177734375, 3.125244140625, 3.27691650390625, 3.4285888671875, 3.58026123046875, 3.73193359375, 3.88360595703125, 4.0352783203125, 4.18695068359375, 4.338623046875, 4.49029541015625, 4.6419677734375, 4.79364013671875, 4.9453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 25.0, 40.0, 45.0, 57.0, 87.0, 107.0, 179.0, 319.0, 509.0, 823.0, 1583.0, 4367.0, 18373.0, 112397.0, 539275.0, 306371.0, 49464.0, 8966.0, 2500.0, 1200.0, 634.0, 409.0, 275.0, 165.0, 101.0, 69.0, 46.0, 40.0, 24.0, 19.0, 15.0, 10.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.50830078125, -16.8291015625, -16.14990234375, -15.470703125, -14.79150390625, -14.1123046875, -13.43310546875, -12.75390625, -12.07470703125, -11.3955078125, -10.71630859375, -10.037109375, -9.35791015625, -8.6787109375, -7.99951171875, -7.3203125, -6.64111328125, -5.9619140625, -5.28271484375, -4.603515625, -3.92431640625, -3.2451171875, -2.56591796875, -1.88671875, -1.20751953125, -0.5283203125, 0.15087890625, 0.830078125, 1.50927734375, 2.1884765625, 2.86767578125, 3.546875, 4.22607421875, 4.9052734375, 5.58447265625, 6.263671875, 6.94287109375, 7.6220703125, 8.30126953125, 8.98046875, 9.65966796875, 10.3388671875, 11.01806640625, 11.697265625, 12.37646484375, 13.0556640625, 13.73486328125, 14.4140625, 15.09326171875, 15.7724609375, 16.45166015625, 17.130859375, 17.81005859375, 18.4892578125, 19.16845703125, 19.84765625, 20.52685546875, 21.2060546875, 21.88525390625, 22.564453125, 23.24365234375, 23.9228515625, 24.60205078125, 25.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 12.0, 7.0, 12.0, 7.0, 19.0, 32.0, 13.0, 23.0, 30.0, 34.0, 53.0, 48.0, 45.0, 43.0, 49.0, 46.0, 52.0, 52.0, 48.0, 46.0, 49.0, 41.0, 43.0, 34.0, 24.0, 17.0, 24.0, 14.0, 13.0, 15.0, 2.0, 9.0, 4.0, 8.0, 8.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.2216796875, -17.599609375, -16.9775390625, -16.35546875, -15.7333984375, -15.111328125, -14.4892578125, -13.8671875, -13.2451171875, -12.623046875, -12.0009765625, -11.37890625, -10.7568359375, -10.134765625, -9.5126953125, -8.890625, -8.2685546875, -7.646484375, -7.0244140625, -6.40234375, -5.7802734375, -5.158203125, -4.5361328125, -3.9140625, -3.2919921875, -2.669921875, -2.0478515625, -1.42578125, -0.8037109375, -0.181640625, 0.4404296875, 1.0625, 1.6845703125, 2.306640625, 2.9287109375, 3.55078125, 4.1728515625, 4.794921875, 5.4169921875, 6.0390625, 6.6611328125, 7.283203125, 7.9052734375, 8.52734375, 9.1494140625, 9.771484375, 10.3935546875, 11.015625, 11.6376953125, 12.259765625, 12.8818359375, 13.50390625, 14.1259765625, 14.748046875, 15.3701171875, 15.9921875, 16.6142578125, 17.236328125, 17.8583984375, 18.48046875, 19.1025390625, 19.724609375, 20.3466796875, 20.96875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 12.0, 21.0, 23.0, 52.0, 79.0, 160.0, 330.0, 954.0, 3389.0, 19033.0, 130057.0, 578949.0, 267062.0, 39552.0, 6460.0, 1466.0, 489.0, 220.0, 99.0, 58.0, 28.0, 12.0, 13.0, 9.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-10.2734375, -9.9154052734375, -9.557373046875, -9.1993408203125, -8.84130859375, -8.4832763671875, -8.125244140625, -7.7672119140625, -7.4091796875, -7.0511474609375, -6.693115234375, -6.3350830078125, -5.97705078125, -5.6190185546875, -5.260986328125, -4.9029541015625, -4.544921875, -4.1868896484375, -3.828857421875, -3.4708251953125, -3.11279296875, -2.7547607421875, -2.396728515625, -2.0386962890625, -1.6806640625, -1.3226318359375, -0.964599609375, -0.6065673828125, -0.24853515625, 0.1094970703125, 0.467529296875, 0.8255615234375, 1.18359375, 1.5416259765625, 1.899658203125, 2.2576904296875, 2.61572265625, 2.9737548828125, 3.331787109375, 3.6898193359375, 4.0478515625, 4.4058837890625, 4.763916015625, 5.1219482421875, 5.47998046875, 5.8380126953125, 6.196044921875, 6.5540771484375, 6.912109375, 7.2701416015625, 7.628173828125, 7.9862060546875, 8.34423828125, 8.7022705078125, 9.060302734375, 9.4183349609375, 9.7763671875, 10.1343994140625, 10.492431640625, 10.8504638671875, 11.20849609375, 11.5665283203125, 11.924560546875, 12.2825927734375, 12.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 5.0, 13.0, 8.0, 10.0, 18.0, 18.0, 20.0, 26.0, 30.0, 32.0, 44.0, 53.0, 59.0, 51.0, 83.0, 62.0, 76.0, 55.0, 49.0, 42.0, 35.0, 36.0, 18.0, 27.0, 29.0, 16.0, 18.0, 9.0, 10.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013256072998046875, -0.0012833178043365479, -0.0012410283088684082, -0.0011987388134002686, -0.001156449317932129, -0.0011141598224639893, -0.0010718703269958496, -0.00102958083152771, -0.0009872913360595703, -0.0009450018405914307, -0.000902712345123291, -0.0008604228496551514, -0.0008181333541870117, -0.0007758438587188721, -0.0007335543632507324, -0.0006912648677825928, -0.0006489753723144531, -0.0006066858768463135, -0.0005643963813781738, -0.0005221068859100342, -0.00047981739044189453, -0.0004375278949737549, -0.00039523839950561523, -0.0003529489040374756, -0.00031065940856933594, -0.0002683699131011963, -0.00022608041763305664, -0.000183790922164917, -0.00014150142669677734, -9.92119312286377e-05, -5.692243576049805e-05, -1.4632940292358398e-05, 2.765655517578125e-05, 6.99460506439209e-05, 0.00011223554611206055, 0.0001545250415802002, 0.00019681453704833984, 0.0002391040325164795, 0.00028139352798461914, 0.0003236830234527588, 0.00036597251892089844, 0.0004082620143890381, 0.00045055150985717773, 0.0004928410053253174, 0.000535130500793457, 0.0005774199962615967, 0.0006197094917297363, 0.000661998987197876, 0.0007042884826660156, 0.0007465779781341553, 0.0007888674736022949, 0.0008311569690704346, 0.0008734464645385742, 0.0009157359600067139, 0.0009580254554748535, 0.0010003149509429932, 0.0010426044464111328, 0.0010848939418792725, 0.0011271834373474121, 0.0011694729328155518, 0.0012117624282836914, 0.001254051923751831, 0.0012963414192199707, 0.0013386309146881104, 0.00138092041015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 9.0, 25.0, 36.0, 39.0, 49.0, 88.0, 138.0, 237.0, 372.0, 721.0, 1451.0, 3340.0, 11083.0, 47753.0, 199857.0, 490855.0, 220175.0, 52967.0, 12181.0, 3728.0, 1521.0, 746.0, 419.0, 276.0, 166.0, 108.0, 64.0, 61.0, 32.0, 19.0, 14.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7347412109375, -7.453857421875, -7.1729736328125, -6.89208984375, -6.6112060546875, -6.330322265625, -6.0494384765625, -5.7685546875, -5.4876708984375, -5.206787109375, -4.9259033203125, -4.64501953125, -4.3641357421875, -4.083251953125, -3.8023681640625, -3.521484375, -3.2406005859375, -2.959716796875, -2.6788330078125, -2.39794921875, -2.1170654296875, -1.836181640625, -1.5552978515625, -1.2744140625, -0.9935302734375, -0.712646484375, -0.4317626953125, -0.15087890625, 0.1300048828125, 0.410888671875, 0.6917724609375, 0.97265625, 1.2535400390625, 1.534423828125, 1.8153076171875, 2.09619140625, 2.3770751953125, 2.657958984375, 2.9388427734375, 3.2197265625, 3.5006103515625, 3.781494140625, 4.0623779296875, 4.34326171875, 4.6241455078125, 4.905029296875, 5.1859130859375, 5.466796875, 5.7476806640625, 6.028564453125, 6.3094482421875, 6.59033203125, 6.8712158203125, 7.152099609375, 7.4329833984375, 7.7138671875, 7.9947509765625, 8.275634765625, 8.5565185546875, 8.83740234375, 9.1182861328125, 9.399169921875, 9.6800537109375, 9.9609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 8.0, 9.0, 11.0, 24.0, 18.0, 24.0, 25.0, 33.0, 39.0, 38.0, 49.0, 53.0, 78.0, 80.0, 81.0, 68.0, 62.0, 45.0, 60.0, 43.0, 27.0, 21.0, 12.0, 19.0, 15.0, 12.0, 8.0, 8.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.1849365234375, -5.955810546875, -5.7266845703125, -5.49755859375, -5.2684326171875, -5.039306640625, -4.8101806640625, -4.5810546875, -4.3519287109375, -4.122802734375, -3.8936767578125, -3.66455078125, -3.4354248046875, -3.206298828125, -2.9771728515625, -2.748046875, -2.5189208984375, -2.289794921875, -2.0606689453125, -1.83154296875, -1.6024169921875, -1.373291015625, -1.1441650390625, -0.9150390625, -0.6859130859375, -0.456787109375, -0.2276611328125, 0.00146484375, 0.2305908203125, 0.459716796875, 0.6888427734375, 0.91796875, 1.1470947265625, 1.376220703125, 1.6053466796875, 1.83447265625, 2.0635986328125, 2.292724609375, 2.5218505859375, 2.7509765625, 2.9801025390625, 3.209228515625, 3.4383544921875, 3.66748046875, 3.8966064453125, 4.125732421875, 4.3548583984375, 4.583984375, 4.8131103515625, 5.042236328125, 5.2713623046875, 5.50048828125, 5.7296142578125, 5.958740234375, 6.1878662109375, 6.4169921875, 6.6461181640625, 6.875244140625, 7.1043701171875, 7.33349609375, 7.5626220703125, 7.791748046875, 8.0208740234375, 8.25]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 9.0, 27.0, 68.0, 162.0, 283.0, 259.0, 139.0, 44.0, 8.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.36935424804688, -74.14250946044922, -64.91566467285156, -55.688812255859375, -46.46196746826172, -37.23512268066406, -28.00827407836914, -18.78142547607422, -9.554580688476562, -0.32773399353027344, 8.899112701416016, 18.125959396362305, 27.352806091308594, 36.57965087890625, 45.80649948120117, 55.033348083496094, 64.26019287109375, 73.4870376586914, 82.71388244628906, 91.94073486328125, 101.1675796508789, 110.39442443847656, 119.62127685546875, 128.84811401367188, 138.07496643066406, 147.30181884765625, 156.52865600585938, 165.75550842285156, 174.98236083984375, 184.20919799804688, 193.43605041503906, 202.66290283203125, 211.88973999023438, 221.11659240722656, 230.3434295654297, 239.57028198242188, 248.797119140625, 258.02398681640625, 267.2508239746094, 276.4776611328125, 285.70452880859375, 294.9313659667969, 304.1582336425781, 313.38507080078125, 322.6119079589844, 331.8387451171875, 341.06561279296875, 350.2924499511719, 359.519287109375, 368.7461242675781, 377.9729919433594, 387.1998291015625, 396.4266662597656, 405.65350341796875, 414.88037109375, 424.1072082519531, 433.33404541015625, 442.5608825683594, 451.7877502441406, 461.01458740234375, 470.2414245605469, 479.46826171875, 488.69512939453125, 497.9219665527344, 507.1488342285156]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 5.0, 14.0, 13.0, 19.0, 26.0, 24.0, 26.0, 26.0, 34.0, 38.0, 41.0, 43.0, 53.0, 44.0, 52.0, 43.0, 44.0, 43.0, 51.0, 45.0, 38.0, 33.0, 34.0, 25.0, 33.0, 21.0, 16.0, 18.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-84.62775421142578, -81.8919677734375, -79.15618896484375, -76.42040252685547, -73.68462371826172, -70.94883728027344, -68.21305847167969, -65.4772720336914, -62.74148941040039, -60.005706787109375, -57.26992416381836, -54.534141540527344, -51.79835510253906, -49.06257629394531, -46.32678985595703, -43.591007232666016, -40.855224609375, -38.119441986083984, -35.38365936279297, -32.64787292480469, -29.912092208862305, -27.17630958557129, -24.44052505493164, -21.704742431640625, -18.96895980834961, -16.233177185058594, -13.497393608093262, -10.76161003112793, -8.025827407836914, -5.290044784545898, -2.55426025390625, 0.18152236938476562, 2.9173049926757812, 5.653088092803955, 8.388871192932129, 11.124654769897461, 13.860437393188477, 16.596220016479492, 19.33200454711914, 22.067787170410156, 24.803569793701172, 27.539352416992188, 30.275135040283203, 33.01091766357422, 35.7467041015625, 38.48248291015625, 41.21826934814453, 43.95405197143555, 46.68983459472656, 49.42561721801758, 52.161399841308594, 54.897186279296875, 57.632965087890625, 60.368751525878906, 63.10453414916992, 65.84031677246094, 68.57609558105469, 71.31188201904297, 74.04766082763672, 76.783447265625, 79.51922607421875, 82.25501251220703, 84.99079895019531, 87.72657775878906, 90.46236419677734]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 11.0, 16.0, 19.0, 23.0, 42.0, 48.0, 62.0, 86.0, 146.0, 222.0, 319.0, 472.0, 793.0, 1212.0, 1871.0, 3316.0, 6165.0, 12619.0, 30491.0, 95204.0, 3482194.0, 439447.0, 71242.0, 24686.0, 10606.0, 5264.0, 2906.0, 1669.0, 1106.0, 637.0, 425.0, 287.0, 203.0, 135.0, 83.0, 56.0, 56.0, 40.0, 23.0, 24.0, 9.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3515625, -11.95166015625, -11.5517578125, -11.15185546875, -10.751953125, -10.35205078125, -9.9521484375, -9.55224609375, -9.15234375, -8.75244140625, -8.3525390625, -7.95263671875, -7.552734375, -7.15283203125, -6.7529296875, -6.35302734375, -5.953125, -5.55322265625, -5.1533203125, -4.75341796875, -4.353515625, -3.95361328125, -3.5537109375, -3.15380859375, -2.75390625, -2.35400390625, -1.9541015625, -1.55419921875, -1.154296875, -0.75439453125, -0.3544921875, 0.04541015625, 0.4453125, 0.84521484375, 1.2451171875, 1.64501953125, 2.044921875, 2.44482421875, 2.8447265625, 3.24462890625, 3.64453125, 4.04443359375, 4.4443359375, 4.84423828125, 5.244140625, 5.64404296875, 6.0439453125, 6.44384765625, 6.84375, 7.24365234375, 7.6435546875, 8.04345703125, 8.443359375, 8.84326171875, 9.2431640625, 9.64306640625, 10.04296875, 10.44287109375, 10.8427734375, 11.24267578125, 11.642578125, 12.04248046875, 12.4423828125, 12.84228515625, 13.2421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 5.0, 12.0, 12.0, 20.0, 19.0, 33.0, 39.0, 47.0, 51.0, 44.0, 55.0, 65.0, 67.0, 60.0, 51.0, 71.0, 53.0, 57.0, 42.0, 43.0, 32.0, 23.0, 25.0, 12.0, 11.0, 3.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.2432861328125, -5.080322265625, -4.9173583984375, -4.75439453125, -4.5914306640625, -4.428466796875, -4.2655029296875, -4.1025390625, -3.9395751953125, -3.776611328125, -3.6136474609375, -3.45068359375, -3.2877197265625, -3.124755859375, -2.9617919921875, -2.798828125, -2.6358642578125, -2.472900390625, -2.3099365234375, -2.14697265625, -1.9840087890625, -1.821044921875, -1.6580810546875, -1.4951171875, -1.3321533203125, -1.169189453125, -1.0062255859375, -0.84326171875, -0.6802978515625, -0.517333984375, -0.3543701171875, -0.19140625, -0.0284423828125, 0.134521484375, 0.2974853515625, 0.46044921875, 0.6234130859375, 0.786376953125, 0.9493408203125, 1.1123046875, 1.2752685546875, 1.438232421875, 1.6011962890625, 1.76416015625, 1.9271240234375, 2.090087890625, 2.2530517578125, 2.416015625, 2.5789794921875, 2.741943359375, 2.9049072265625, 3.06787109375, 3.2308349609375, 3.393798828125, 3.5567626953125, 3.7197265625, 3.8826904296875, 4.045654296875, 4.2086181640625, 4.37158203125, 4.5345458984375, 4.697509765625, 4.8604736328125, 5.0234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 10.0, 7.0, 14.0, 26.0, 33.0, 61.0, 103.0, 200.0, 351.0, 855.0, 2501.0, 8676.0, 48014.0, 3388619.0, 695998.0, 37614.0, 7524.0, 2176.0, 823.0, 301.0, 149.0, 90.0, 40.0, 43.0, 21.0, 17.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.34912109375, -18.5732421875, -17.79736328125, -17.021484375, -16.24560546875, -15.4697265625, -14.69384765625, -13.91796875, -13.14208984375, -12.3662109375, -11.59033203125, -10.814453125, -10.03857421875, -9.2626953125, -8.48681640625, -7.7109375, -6.93505859375, -6.1591796875, -5.38330078125, -4.607421875, -3.83154296875, -3.0556640625, -2.27978515625, -1.50390625, -0.72802734375, 0.0478515625, 0.82373046875, 1.599609375, 2.37548828125, 3.1513671875, 3.92724609375, 4.703125, 5.47900390625, 6.2548828125, 7.03076171875, 7.806640625, 8.58251953125, 9.3583984375, 10.13427734375, 10.91015625, 11.68603515625, 12.4619140625, 13.23779296875, 14.013671875, 14.78955078125, 15.5654296875, 16.34130859375, 17.1171875, 17.89306640625, 18.6689453125, 19.44482421875, 20.220703125, 20.99658203125, 21.7724609375, 22.54833984375, 23.32421875, 24.10009765625, 24.8759765625, 25.65185546875, 26.427734375, 27.20361328125, 27.9794921875, 28.75537109375, 29.53125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 13.0, 12.0, 18.0, 33.0, 49.0, 87.0, 141.0, 302.0, 2610.0, 409.0, 146.0, 89.0, 43.0, 33.0, 15.0, 20.0, 14.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.41796875, -4.3092041015625, -4.200439453125, -4.0916748046875, -3.98291015625, -3.8741455078125, -3.765380859375, -3.6566162109375, -3.5478515625, -3.4390869140625, -3.330322265625, -3.2215576171875, -3.11279296875, -3.0040283203125, -2.895263671875, -2.7864990234375, -2.677734375, -2.5689697265625, -2.460205078125, -2.3514404296875, -2.24267578125, -2.1339111328125, -2.025146484375, -1.9163818359375, -1.8076171875, -1.6988525390625, -1.590087890625, -1.4813232421875, -1.37255859375, -1.2637939453125, -1.155029296875, -1.0462646484375, -0.9375, -0.8287353515625, -0.719970703125, -0.6112060546875, -0.50244140625, -0.3936767578125, -0.284912109375, -0.1761474609375, -0.0673828125, 0.0413818359375, 0.150146484375, 0.2589111328125, 0.36767578125, 0.4764404296875, 0.585205078125, 0.6939697265625, 0.802734375, 0.9114990234375, 1.020263671875, 1.1290283203125, 1.23779296875, 1.3465576171875, 1.455322265625, 1.5640869140625, 1.6728515625, 1.7816162109375, 1.890380859375, 1.9991455078125, 2.10791015625, 2.2166748046875, 2.325439453125, 2.4342041015625, 2.54296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 7.0, 16.0, 21.0, 46.0, 55.0, 81.0, 92.0, 124.0, 142.0, 114.0, 93.0, 73.0, 46.0, 36.0, 17.0, 10.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.40271759033203, -21.832439422607422, -21.262161254882812, -20.691883087158203, -20.121604919433594, -19.551326751708984, -18.981048583984375, -18.410770416259766, -17.840492248535156, -17.270214080810547, -16.699935913085938, -16.129657745361328, -15.559379577636719, -14.98910140991211, -14.4188232421875, -13.84854507446289, -13.278267860412598, -12.707989692687988, -12.137711524963379, -11.56743335723877, -10.99715518951416, -10.42687702178955, -9.856599807739258, -9.286321640014648, -8.716043472290039, -8.14576530456543, -7.57548713684082, -7.005208969116211, -6.434930801391602, -5.864652633666992, -5.294374942779541, -4.724096775054932, -4.153818130493164, -3.5835399627685547, -3.0132617950439453, -2.442983865737915, -1.8727056980133057, -1.3024275302886963, -0.732149600982666, -0.16187143325805664, 0.40840673446655273, 0.9786848425865173, 1.548962950706482, 2.1192409992218018, 2.689519166946411, 3.2597973346710205, 3.830075263977051, 4.40035343170166, 4.9706315994262695, 5.540909767150879, 6.111187934875488, 6.681466102600098, 7.251744270324707, 7.822022438049316, 8.39229965209961, 8.962577819824219, 9.532855987548828, 10.103134155273438, 10.673412322998047, 11.243690490722656, 11.813968658447266, 12.384246826171875, 12.954524993896484, 13.524803161621094, 14.095081329345703]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 10.0, 11.0, 10.0, 13.0, 14.0, 18.0, 21.0, 14.0, 23.0, 21.0, 32.0, 27.0, 32.0, 31.0, 39.0, 26.0, 47.0, 38.0, 40.0, 45.0, 40.0, 39.0, 22.0, 35.0, 40.0, 38.0, 34.0, 32.0, 34.0, 23.0, 26.0, 19.0, 15.0, 13.0, 16.0, 16.0, 7.0, 8.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1619720458984375, -5.936976432800293, -5.711980819702148, -5.486985206604004, -5.261989593505859, -5.036993980407715, -4.81199836730957, -4.587002754211426, -4.362007141113281, -4.137011528015137, -3.912015914916992, -3.6870203018188477, -3.462024688720703, -3.2370290756225586, -3.012033462524414, -2.7870378494262695, -2.562042236328125, -2.3370466232299805, -2.112051010131836, -1.8870553970336914, -1.6620597839355469, -1.4370641708374023, -1.2120685577392578, -0.9870729446411133, -0.7620773315429688, -0.5370817184448242, -0.3120861053466797, -0.08709049224853516, 0.13790512084960938, 0.3629007339477539, 0.5878963470458984, 0.812891960144043, 1.0378875732421875, 1.262883186340332, 1.4878787994384766, 1.712874412536621, 1.9378700256347656, 2.16286563873291, 2.3878612518310547, 2.612856864929199, 2.8378524780273438, 3.0628480911254883, 3.287843704223633, 3.5128393173217773, 3.737834930419922, 3.9628305435180664, 4.187826156616211, 4.4128217697143555, 4.6378173828125, 4.8628129959106445, 5.087808609008789, 5.312804222106934, 5.537799835205078, 5.762795448303223, 5.987791061401367, 6.212786674499512, 6.437782287597656, 6.662777900695801, 6.887773513793945, 7.11276912689209, 7.337764739990234, 7.562760353088379, 7.787755966186523, 8.012751579284668, 8.237747192382812]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 18.0, 31.0, 47.0, 73.0, 170.0, 309.0, 659.0, 1553.0, 4607.0, 14274.0, 45791.0, 135887.0, 303766.0, 317052.0, 149207.0, 50778.0, 16101.0, 5048.0, 1803.0, 723.0, 291.0, 151.0, 88.0, 47.0, 23.0, 16.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.6142578125, -14.197265625, -13.7802734375, -13.36328125, -12.9462890625, -12.529296875, -12.1123046875, -11.6953125, -11.2783203125, -10.861328125, -10.4443359375, -10.02734375, -9.6103515625, -9.193359375, -8.7763671875, -8.359375, -7.9423828125, -7.525390625, -7.1083984375, -6.69140625, -6.2744140625, -5.857421875, -5.4404296875, -5.0234375, -4.6064453125, -4.189453125, -3.7724609375, -3.35546875, -2.9384765625, -2.521484375, -2.1044921875, -1.6875, -1.2705078125, -0.853515625, -0.4365234375, -0.01953125, 0.3974609375, 0.814453125, 1.2314453125, 1.6484375, 2.0654296875, 2.482421875, 2.8994140625, 3.31640625, 3.7333984375, 4.150390625, 4.5673828125, 4.984375, 5.4013671875, 5.818359375, 6.2353515625, 6.65234375, 7.0693359375, 7.486328125, 7.9033203125, 8.3203125, 8.7373046875, 9.154296875, 9.5712890625, 9.98828125, 10.4052734375, 10.822265625, 11.2392578125, 11.65625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 13.0, 16.0, 23.0, 31.0, 36.0, 35.0, 43.0, 49.0, 49.0, 52.0, 61.0, 70.0, 50.0, 67.0, 56.0, 68.0, 50.0, 34.0, 29.0, 36.0, 33.0, 17.0, 17.0, 10.0, 13.0, 6.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.540771484375, -5.36669921875, -5.192626953125, -5.0185546875, -4.844482421875, -4.67041015625, -4.496337890625, -4.322265625, -4.148193359375, -3.97412109375, -3.800048828125, -3.6259765625, -3.451904296875, -3.27783203125, -3.103759765625, -2.9296875, -2.755615234375, -2.58154296875, -2.407470703125, -2.2333984375, -2.059326171875, -1.88525390625, -1.711181640625, -1.537109375, -1.363037109375, -1.18896484375, -1.014892578125, -0.8408203125, -0.666748046875, -0.49267578125, -0.318603515625, -0.14453125, 0.029541015625, 0.20361328125, 0.377685546875, 0.5517578125, 0.725830078125, 0.89990234375, 1.073974609375, 1.248046875, 1.422119140625, 1.59619140625, 1.770263671875, 1.9443359375, 2.118408203125, 2.29248046875, 2.466552734375, 2.640625, 2.814697265625, 2.98876953125, 3.162841796875, 3.3369140625, 3.510986328125, 3.68505859375, 3.859130859375, 4.033203125, 4.207275390625, 4.38134765625, 4.555419921875, 4.7294921875, 4.903564453125, 5.07763671875, 5.251708984375, 5.42578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 9.0, 21.0, 31.0, 40.0, 60.0, 90.0, 124.0, 173.0, 292.0, 426.0, 738.0, 1495.0, 4539.0, 26102.0, 226015.0, 640451.0, 126234.0, 15423.0, 3129.0, 1201.0, 704.0, 395.0, 276.0, 182.0, 119.0, 68.0, 44.0, 30.0, 30.0, 24.0, 16.0, 10.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-23.53125, -22.80419921875, -22.0771484375, -21.35009765625, -20.623046875, -19.89599609375, -19.1689453125, -18.44189453125, -17.71484375, -16.98779296875, -16.2607421875, -15.53369140625, -14.806640625, -14.07958984375, -13.3525390625, -12.62548828125, -11.8984375, -11.17138671875, -10.4443359375, -9.71728515625, -8.990234375, -8.26318359375, -7.5361328125, -6.80908203125, -6.08203125, -5.35498046875, -4.6279296875, -3.90087890625, -3.173828125, -2.44677734375, -1.7197265625, -0.99267578125, -0.265625, 0.46142578125, 1.1884765625, 1.91552734375, 2.642578125, 3.36962890625, 4.0966796875, 4.82373046875, 5.55078125, 6.27783203125, 7.0048828125, 7.73193359375, 8.458984375, 9.18603515625, 9.9130859375, 10.64013671875, 11.3671875, 12.09423828125, 12.8212890625, 13.54833984375, 14.275390625, 15.00244140625, 15.7294921875, 16.45654296875, 17.18359375, 17.91064453125, 18.6376953125, 19.36474609375, 20.091796875, 20.81884765625, 21.5458984375, 22.27294921875, 23.0]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 7.0, 8.0, 11.0, 7.0, 13.0, 13.0, 26.0, 22.0, 27.0, 30.0, 45.0, 27.0, 31.0, 40.0, 46.0, 47.0, 53.0, 57.0, 53.0, 57.0, 51.0, 42.0, 45.0, 35.0, 39.0, 21.0, 19.0, 36.0, 16.0, 18.0, 12.0, 10.0, 3.0, 4.0, 5.0, 3.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.4375, -24.696044921875, -23.95458984375, -23.213134765625, -22.4716796875, -21.730224609375, -20.98876953125, -20.247314453125, -19.505859375, -18.764404296875, -18.02294921875, -17.281494140625, -16.5400390625, -15.798583984375, -15.05712890625, -14.315673828125, -13.57421875, -12.832763671875, -12.09130859375, -11.349853515625, -10.6083984375, -9.866943359375, -9.12548828125, -8.384033203125, -7.642578125, -6.901123046875, -6.15966796875, -5.418212890625, -4.6767578125, -3.935302734375, -3.19384765625, -2.452392578125, -1.7109375, -0.969482421875, -0.22802734375, 0.513427734375, 1.2548828125, 1.996337890625, 2.73779296875, 3.479248046875, 4.220703125, 4.962158203125, 5.70361328125, 6.445068359375, 7.1865234375, 7.927978515625, 8.66943359375, 9.410888671875, 10.15234375, 10.893798828125, 11.63525390625, 12.376708984375, 13.1181640625, 13.859619140625, 14.60107421875, 15.342529296875, 16.083984375, 16.825439453125, 17.56689453125, 18.308349609375, 19.0498046875, 19.791259765625, 20.53271484375, 21.274169921875, 22.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 10.0, 12.0, 17.0, 32.0, 81.0, 132.0, 344.0, 973.0, 4357.0, 40227.0, 576901.0, 395627.0, 25239.0, 3206.0, 811.0, 287.0, 136.0, 62.0, 37.0, 24.0, 11.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8221435546875, -12.378662109375, -11.9351806640625, -11.49169921875, -11.0482177734375, -10.604736328125, -10.1612548828125, -9.7177734375, -9.2742919921875, -8.830810546875, -8.3873291015625, -7.94384765625, -7.5003662109375, -7.056884765625, -6.6134033203125, -6.169921875, -5.7264404296875, -5.282958984375, -4.8394775390625, -4.39599609375, -3.9525146484375, -3.509033203125, -3.0655517578125, -2.6220703125, -2.1785888671875, -1.735107421875, -1.2916259765625, -0.84814453125, -0.4046630859375, 0.038818359375, 0.4822998046875, 0.92578125, 1.3692626953125, 1.812744140625, 2.2562255859375, 2.69970703125, 3.1431884765625, 3.586669921875, 4.0301513671875, 4.4736328125, 4.9171142578125, 5.360595703125, 5.8040771484375, 6.24755859375, 6.6910400390625, 7.134521484375, 7.5780029296875, 8.021484375, 8.4649658203125, 8.908447265625, 9.3519287109375, 9.79541015625, 10.2388916015625, 10.682373046875, 11.1258544921875, 11.5693359375, 12.0128173828125, 12.456298828125, 12.8997802734375, 13.34326171875, 13.7867431640625, 14.230224609375, 14.6737060546875, 15.1171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 7.0, 10.0, 20.0, 23.0, 27.0, 34.0, 34.0, 51.0, 41.0, 47.0, 78.0, 59.0, 67.0, 66.0, 81.0, 60.0, 68.0, 34.0, 31.0, 34.0, 25.0, 19.0, 9.0, 13.0, 11.0, 10.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012292861938476562, -0.0011877268552780151, -0.001146167516708374, -0.001104608178138733, -0.0010630488395690918, -0.0010214895009994507, -0.0009799301624298096, -0.0009383708238601685, -0.0008968114852905273, -0.0008552521467208862, -0.0008136928081512451, -0.000772133469581604, -0.0007305741310119629, -0.0006890147924423218, -0.0006474554538726807, -0.0006058961153030396, -0.0005643367767333984, -0.0005227774381637573, -0.0004812180995941162, -0.0004396587610244751, -0.000398099422454834, -0.00035654008388519287, -0.00031498074531555176, -0.00027342140674591064, -0.00023186206817626953, -0.00019030272960662842, -0.0001487433910369873, -0.00010718405246734619, -6.562471389770508e-05, -2.4065375328063965e-05, 1.749396324157715e-05, 5.905330181121826e-05, 0.00010061264038085938, 0.0001421719789505005, 0.0001837313175201416, 0.00022529065608978271, 0.00026684999465942383, 0.00030840933322906494, 0.00034996867179870605, 0.00039152801036834717, 0.0004330873489379883, 0.0004746466875076294, 0.0005162060260772705, 0.0005577653646469116, 0.0005993247032165527, 0.0006408840417861938, 0.000682443380355835, 0.0007240027189254761, 0.0007655620574951172, 0.0008071213960647583, 0.0008486807346343994, 0.0008902400732040405, 0.0009317994117736816, 0.0009733587503433228, 0.0010149180889129639, 0.001056477427482605, 0.001098036766052246, 0.0011395961046218872, 0.0011811554431915283, 0.0012227147817611694, 0.0012642741203308105, 0.0013058334589004517, 0.0013473927974700928, 0.0013889521360397339, 0.001430511474609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 2.0, 13.0, 11.0, 21.0, 28.0, 44.0, 95.0, 193.0, 428.0, 1190.0, 4019.0, 33412.0, 579998.0, 402108.0, 21843.0, 3431.0, 984.0, 370.0, 172.0, 73.0, 41.0, 22.0, 19.0, 7.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0673828125, -14.580078125, -14.0927734375, -13.60546875, -13.1181640625, -12.630859375, -12.1435546875, -11.65625, -11.1689453125, -10.681640625, -10.1943359375, -9.70703125, -9.2197265625, -8.732421875, -8.2451171875, -7.7578125, -7.2705078125, -6.783203125, -6.2958984375, -5.80859375, -5.3212890625, -4.833984375, -4.3466796875, -3.859375, -3.3720703125, -2.884765625, -2.3974609375, -1.91015625, -1.4228515625, -0.935546875, -0.4482421875, 0.0390625, 0.5263671875, 1.013671875, 1.5009765625, 1.98828125, 2.4755859375, 2.962890625, 3.4501953125, 3.9375, 4.4248046875, 4.912109375, 5.3994140625, 5.88671875, 6.3740234375, 6.861328125, 7.3486328125, 7.8359375, 8.3232421875, 8.810546875, 9.2978515625, 9.78515625, 10.2724609375, 10.759765625, 11.2470703125, 11.734375, 12.2216796875, 12.708984375, 13.1962890625, 13.68359375, 14.1708984375, 14.658203125, 15.1455078125, 15.6328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 10.0, 20.0, 25.0, 33.0, 61.0, 81.0, 109.0, 162.0, 130.0, 109.0, 93.0, 63.0, 41.0, 26.0, 9.0, 9.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.4984130859375, -15.028076171875, -14.5577392578125, -14.08740234375, -13.6170654296875, -13.146728515625, -12.6763916015625, -12.2060546875, -11.7357177734375, -11.265380859375, -10.7950439453125, -10.32470703125, -9.8543701171875, -9.384033203125, -8.9136962890625, -8.443359375, -7.9730224609375, -7.502685546875, -7.0323486328125, -6.56201171875, -6.0916748046875, -5.621337890625, -5.1510009765625, -4.6806640625, -4.2103271484375, -3.739990234375, -3.2696533203125, -2.79931640625, -2.3289794921875, -1.858642578125, -1.3883056640625, -0.91796875, -0.4476318359375, 0.022705078125, 0.4930419921875, 0.96337890625, 1.4337158203125, 1.904052734375, 2.3743896484375, 2.8447265625, 3.3150634765625, 3.785400390625, 4.2557373046875, 4.72607421875, 5.1964111328125, 5.666748046875, 6.1370849609375, 6.607421875, 7.0777587890625, 7.548095703125, 8.0184326171875, 8.48876953125, 8.9591064453125, 9.429443359375, 9.8997802734375, 10.3701171875, 10.8404541015625, 11.310791015625, 11.7811279296875, 12.25146484375, 12.7218017578125, 13.192138671875, 13.6624755859375, 14.1328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 20.0, 30.0, 65.0, 136.0, 222.0, 194.0, 158.0, 95.0, 52.0, 15.0, 10.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.3706817626953, -207.46087646484375, -200.5510711669922, -193.6412811279297, -186.73147583007812, -179.82167053222656, -172.911865234375, -166.0020751953125, -159.09226989746094, -152.18246459960938, -145.2726593017578, -138.3628692626953, -131.45306396484375, -124.54325866699219, -117.63345336914062, -110.7236557006836, -103.81385040283203, -96.90404510498047, -89.99424743652344, -83.08444213867188, -76.17464447021484, -69.26483917236328, -62.355037689208984, -55.44523620605469, -48.53543472290039, -41.625633239746094, -34.7158317565918, -27.806028366088867, -20.89622688293457, -13.98642349243164, -7.076622009277344, -0.16682052612304688, 6.74298095703125, 13.652782440185547, 20.562583923339844, 27.472387313842773, 34.38218688964844, 41.2919921875, 48.2017936706543, 55.111595153808594, 62.02139663696289, 68.93119812011719, 75.84100341796875, 82.75080108642578, 89.66060638427734, 96.57040405273438, 103.48020935058594, 110.3900146484375, 117.29981231689453, 124.2096176147461, 131.11941528320312, 138.0292205810547, 144.93902587890625, 151.84881591796875, 158.7586212158203, 165.66842651367188, 172.57823181152344, 179.488037109375, 186.39784240722656, 193.30763244628906, 200.21743774414062, 207.1272430419922, 214.03704833984375, 220.94683837890625, 227.8566436767578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 6.0, 11.0, 11.0, 15.0, 11.0, 21.0, 21.0, 22.0, 23.0, 25.0, 26.0, 35.0, 33.0, 39.0, 34.0, 34.0, 44.0, 47.0, 44.0, 42.0, 44.0, 36.0, 30.0, 38.0, 41.0, 30.0, 25.0, 29.0, 23.0, 22.0, 14.0, 20.0, 17.0, 17.0, 10.0, 9.0, 9.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.09310913085938, -81.26773834228516, -78.44236755371094, -75.61700439453125, -72.79163360595703, -69.96626281738281, -67.14089965820312, -64.3155288696289, -61.49015808105469, -58.66478729248047, -55.839420318603516, -53.01405334472656, -50.188682556152344, -47.363311767578125, -44.53794479370117, -41.71257781982422, -38.88720703125, -36.06183624267578, -33.23646926879883, -30.411100387573242, -27.585731506347656, -24.76036262512207, -21.934993743896484, -19.1096248626709, -16.284255981445312, -13.458887100219727, -10.63351821899414, -7.808149337768555, -4.982780456542969, -2.157411575317383, 0.6679573059082031, 3.493326187133789, 6.318695068359375, 9.144063949584961, 11.969432830810547, 14.794801712036133, 17.62017059326172, 20.445539474487305, 23.27090835571289, 26.096277236938477, 28.921646118164062, 31.74701499938965, 34.572383880615234, 37.39775085449219, 40.223121643066406, 43.048492431640625, 45.87385940551758, 48.69922637939453, 51.52459716796875, 54.34996795654297, 57.17533493041992, 60.000701904296875, 62.826072692871094, 65.65144348144531, 68.476806640625, 71.30217742919922, 74.12754821777344, 76.95291900634766, 79.77828979492188, 82.60365295410156, 85.42902374267578, 88.25439453125, 91.07975769042969, 93.9051284790039, 96.73049926757812]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 7.0, 13.0, 17.0, 34.0, 51.0, 82.0, 147.0, 240.0, 474.0, 814.0, 1575.0, 3240.0, 6766.0, 16633.0, 48644.0, 248068.0, 3682112.0, 129377.0, 33181.0, 12343.0, 5115.0, 2513.0, 1307.0, 671.0, 374.0, 207.0, 106.0, 70.0, 35.0, 18.0, 20.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.412841796875, -11.98974609375, -11.566650390625, -11.1435546875, -10.720458984375, -10.29736328125, -9.874267578125, -9.451171875, -9.028076171875, -8.60498046875, -8.181884765625, -7.7587890625, -7.335693359375, -6.91259765625, -6.489501953125, -6.06640625, -5.643310546875, -5.22021484375, -4.797119140625, -4.3740234375, -3.950927734375, -3.52783203125, -3.104736328125, -2.681640625, -2.258544921875, -1.83544921875, -1.412353515625, -0.9892578125, -0.566162109375, -0.14306640625, 0.280029296875, 0.703125, 1.126220703125, 1.54931640625, 1.972412109375, 2.3955078125, 2.818603515625, 3.24169921875, 3.664794921875, 4.087890625, 4.510986328125, 4.93408203125, 5.357177734375, 5.7802734375, 6.203369140625, 6.62646484375, 7.049560546875, 7.47265625, 7.895751953125, 8.31884765625, 8.741943359375, 9.1650390625, 9.588134765625, 10.01123046875, 10.434326171875, 10.857421875, 11.280517578125, 11.70361328125, 12.126708984375, 12.5498046875, 12.972900390625, 13.39599609375, 13.819091796875, 14.2421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 18.0, 13.0, 16.0, 24.0, 33.0, 38.0, 42.0, 36.0, 58.0, 48.0, 53.0, 65.0, 58.0, 54.0, 61.0, 50.0, 45.0, 46.0, 43.0, 40.0, 34.0, 17.0, 28.0, 11.0, 13.0, 11.0, 8.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.27178955078125, -6.1060791015625, -5.94036865234375, -5.774658203125, -5.60894775390625, -5.4432373046875, -5.27752685546875, -5.11181640625, -4.94610595703125, -4.7803955078125, -4.61468505859375, -4.448974609375, -4.28326416015625, -4.1175537109375, -3.95184326171875, -3.7861328125, -3.62042236328125, -3.4547119140625, -3.28900146484375, -3.123291015625, -2.95758056640625, -2.7918701171875, -2.62615966796875, -2.46044921875, -2.29473876953125, -2.1290283203125, -1.96331787109375, -1.797607421875, -1.63189697265625, -1.4661865234375, -1.30047607421875, -1.134765625, -0.96905517578125, -0.8033447265625, -0.63763427734375, -0.471923828125, -0.30621337890625, -0.1405029296875, 0.02520751953125, 0.19091796875, 0.35662841796875, 0.5223388671875, 0.68804931640625, 0.853759765625, 1.01947021484375, 1.1851806640625, 1.35089111328125, 1.5166015625, 1.68231201171875, 1.8480224609375, 2.01373291015625, 2.179443359375, 2.34515380859375, 2.5108642578125, 2.67657470703125, 2.84228515625, 3.00799560546875, 3.1737060546875, 3.33941650390625, 3.505126953125, 3.67083740234375, 3.8365478515625, 4.00225830078125, 4.16796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 15.0, 17.0, 19.0, 29.0, 60.0, 58.0, 100.0, 210.0, 380.0, 747.0, 1474.0, 3675.0, 10129.0, 34229.0, 190010.0, 3672728.0, 224334.0, 38042.0, 11035.0, 3812.0, 1563.0, 721.0, 335.0, 216.0, 124.0, 80.0, 41.0, 22.0, 21.0, 15.0, 12.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.7279052734375, -14.229248046875, -13.7305908203125, -13.23193359375, -12.7332763671875, -12.234619140625, -11.7359619140625, -11.2373046875, -10.7386474609375, -10.239990234375, -9.7413330078125, -9.24267578125, -8.7440185546875, -8.245361328125, -7.7467041015625, -7.248046875, -6.7493896484375, -6.250732421875, -5.7520751953125, -5.25341796875, -4.7547607421875, -4.256103515625, -3.7574462890625, -3.2587890625, -2.7601318359375, -2.261474609375, -1.7628173828125, -1.26416015625, -0.7655029296875, -0.266845703125, 0.2318115234375, 0.73046875, 1.2291259765625, 1.727783203125, 2.2264404296875, 2.72509765625, 3.2237548828125, 3.722412109375, 4.2210693359375, 4.7197265625, 5.2183837890625, 5.717041015625, 6.2156982421875, 6.71435546875, 7.2130126953125, 7.711669921875, 8.2103271484375, 8.708984375, 9.2076416015625, 9.706298828125, 10.2049560546875, 10.70361328125, 11.2022705078125, 11.700927734375, 12.1995849609375, 12.6982421875, 13.1968994140625, 13.695556640625, 14.1942138671875, 14.69287109375, 15.1915283203125, 15.690185546875, 16.1888427734375, 16.6875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 18.0, 17.0, 28.0, 23.0, 47.0, 67.0, 135.0, 266.0, 1598.0, 1219.0, 232.0, 138.0, 85.0, 44.0, 43.0, 20.0, 15.0, 14.0, 9.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.986846923828125, -2.88385009765625, -2.780853271484375, -2.6778564453125, -2.574859619140625, -2.47186279296875, -2.368865966796875, -2.265869140625, -2.162872314453125, -2.05987548828125, -1.956878662109375, -1.8538818359375, -1.750885009765625, -1.64788818359375, -1.544891357421875, -1.44189453125, -1.338897705078125, -1.23590087890625, -1.132904052734375, -1.0299072265625, -0.926910400390625, -0.82391357421875, -0.720916748046875, -0.617919921875, -0.514923095703125, -0.41192626953125, -0.308929443359375, -0.2059326171875, -0.102935791015625, 6.103515625e-05, 0.103057861328125, 0.2060546875, 0.309051513671875, 0.41204833984375, 0.515045166015625, 0.6180419921875, 0.721038818359375, 0.82403564453125, 0.927032470703125, 1.030029296875, 1.133026123046875, 1.23602294921875, 1.339019775390625, 1.4420166015625, 1.545013427734375, 1.64801025390625, 1.751007080078125, 1.85400390625, 1.957000732421875, 2.05999755859375, 2.162994384765625, 2.2659912109375, 2.368988037109375, 2.47198486328125, 2.574981689453125, 2.677978515625, 2.780975341796875, 2.88397216796875, 2.986968994140625, 3.0899658203125, 3.192962646484375, 3.29595947265625, 3.398956298828125, 3.501953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 13.0, 24.0, 17.0, 30.0, 27.0, 48.0, 54.0, 65.0, 75.0, 75.0, 74.0, 78.0, 80.0, 64.0, 50.0, 46.0, 26.0, 30.0, 28.0, 20.0, 14.0, 9.0, 4.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.424139022827148, -13.043779373168945, -12.663419723510742, -12.283060073852539, -11.902700424194336, -11.522340774536133, -11.14198112487793, -10.761621475219727, -10.381261825561523, -10.00090217590332, -9.620542526245117, -9.240182876586914, -8.859823226928711, -8.479463577270508, -8.099103927612305, -7.718743801116943, -7.338383674621582, -6.958024024963379, -6.577664375305176, -6.197304725646973, -5.8169450759887695, -5.436585426330566, -5.056225299835205, -4.675865650177002, -4.295506000518799, -3.9151463508605957, -3.5347867012023926, -3.1544268131256104, -2.7740671634674072, -2.393707513809204, -2.013347625732422, -1.6329879760742188, -1.252629280090332, -0.8722695708274841, -0.49190986156463623, -0.11155009269714355, 0.26880955696105957, 0.6491692066192627, 1.029529094696045, 1.409888744354248, 1.7902483940124512, 2.1706080436706543, 2.5509676933288574, 2.9313275814056396, 3.3116872310638428, 3.692046880722046, 4.072406768798828, 4.452766418457031, 4.833126068115234, 5.2134857177734375, 5.593845367431641, 5.974205017089844, 6.354564666748047, 6.73492431640625, 7.115284442901611, 7.4956440925598145, 7.876003742218018, 8.256363868713379, 8.636723518371582, 9.017083168029785, 9.397442817687988, 9.777802467346191, 10.158162117004395, 10.538521766662598, 10.9188814163208]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 8.0, 15.0, 11.0, 9.0, 12.0, 24.0, 19.0, 27.0, 36.0, 32.0, 20.0, 28.0, 33.0, 47.0, 39.0, 41.0, 36.0, 51.0, 48.0, 37.0, 41.0, 37.0, 39.0, 32.0, 30.0, 34.0, 28.0, 31.0, 27.0, 18.0, 17.0, 8.0, 17.0, 15.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.556029319763184, -8.2909574508667, -8.025885581970215, -7.760814189910889, -7.4957427978515625, -7.230670928955078, -6.965599060058594, -6.700527191162109, -6.435455799102783, -6.170383930206299, -5.905312538146973, -5.640240669250488, -5.375168800354004, -5.110097408294678, -4.845025539398193, -4.579954147338867, -4.314882278442383, -4.049810409545898, -3.7847390174865723, -3.519667148590088, -3.2545955181121826, -2.9895238876342773, -2.724452018737793, -2.4593803882598877, -2.1943087577819824, -1.9292371273040771, -1.6641653776168823, -1.3990936279296875, -1.1340219974517822, -0.868950366973877, -0.6038786172866821, -0.3388068675994873, -0.07373428344726562, 0.19133740663528442, 0.4564090967178345, 0.7214807868003845, 0.9865524768829346, 1.2516241073608398, 1.5166958570480347, 1.7817676067352295, 2.0468392372131348, 2.31191086769104, 2.5769824981689453, 2.8420543670654297, 3.107125997543335, 3.3721976280212402, 3.6372694969177246, 3.90234112739563, 4.167412757873535, 4.4324846267700195, 4.697556018829346, 4.96262788772583, 5.227699279785156, 5.492771148681641, 5.757843017578125, 6.022914886474609, 6.2879862785339355, 6.55305814743042, 6.818129539489746, 7.0832014083862305, 7.348273277282715, 7.613344669342041, 7.878416538238525, 8.143487930297852, 8.408559799194336]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 7.0, 14.0, 17.0, 28.0, 34.0, 53.0, 75.0, 123.0, 155.0, 275.0, 445.0, 748.0, 1360.0, 2458.0, 4503.0, 9043.0, 17594.0, 34730.0, 67237.0, 122328.0, 187981.0, 213572.0, 168349.0, 103479.0, 55380.0, 28130.0, 14187.0, 7423.0, 3944.0, 2045.0, 1147.0, 670.0, 366.0, 213.0, 166.0, 93.0, 64.0, 40.0, 26.0, 14.0, 13.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.91796875, -6.7041015625, -6.490234375, -6.2763671875, -6.0625, -5.8486328125, -5.634765625, -5.4208984375, -5.20703125, -4.9931640625, -4.779296875, -4.5654296875, -4.3515625, -4.1376953125, -3.923828125, -3.7099609375, -3.49609375, -3.2822265625, -3.068359375, -2.8544921875, -2.640625, -2.4267578125, -2.212890625, -1.9990234375, -1.78515625, -1.5712890625, -1.357421875, -1.1435546875, -0.9296875, -0.7158203125, -0.501953125, -0.2880859375, -0.07421875, 0.1396484375, 0.353515625, 0.5673828125, 0.78125, 0.9951171875, 1.208984375, 1.4228515625, 1.63671875, 1.8505859375, 2.064453125, 2.2783203125, 2.4921875, 2.7060546875, 2.919921875, 3.1337890625, 3.34765625, 3.5615234375, 3.775390625, 3.9892578125, 4.203125, 4.4169921875, 4.630859375, 4.8447265625, 5.05859375, 5.2724609375, 5.486328125, 5.7001953125, 5.9140625, 6.1279296875, 6.341796875, 6.5556640625, 6.76953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 13.0, 21.0, 28.0, 28.0, 30.0, 31.0, 37.0, 44.0, 46.0, 45.0, 51.0, 66.0, 59.0, 51.0, 54.0, 35.0, 29.0, 52.0, 50.0, 48.0, 24.0, 21.0, 21.0, 15.0, 16.0, 10.0, 9.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.36810302734375, -5.2088623046875, -5.04962158203125, -4.890380859375, -4.73114013671875, -4.5718994140625, -4.41265869140625, -4.25341796875, -4.09417724609375, -3.9349365234375, -3.77569580078125, -3.616455078125, -3.45721435546875, -3.2979736328125, -3.13873291015625, -2.9794921875, -2.82025146484375, -2.6610107421875, -2.50177001953125, -2.342529296875, -2.18328857421875, -2.0240478515625, -1.86480712890625, -1.70556640625, -1.54632568359375, -1.3870849609375, -1.22784423828125, -1.068603515625, -0.90936279296875, -0.7501220703125, -0.59088134765625, -0.431640625, -0.27239990234375, -0.1131591796875, 0.04608154296875, 0.205322265625, 0.36456298828125, 0.5238037109375, 0.68304443359375, 0.84228515625, 1.00152587890625, 1.1607666015625, 1.32000732421875, 1.479248046875, 1.63848876953125, 1.7977294921875, 1.95697021484375, 2.1162109375, 2.27545166015625, 2.4346923828125, 2.59393310546875, 2.753173828125, 2.91241455078125, 3.0716552734375, 3.23089599609375, 3.39013671875, 3.54937744140625, 3.7086181640625, 3.86785888671875, 4.027099609375, 4.18634033203125, 4.3455810546875, 4.50482177734375, 4.6640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 19.0, 18.0, 28.0, 45.0, 61.0, 100.0, 184.0, 287.0, 595.0, 1036.0, 2470.0, 11650.0, 168349.0, 780380.0, 72353.0, 7054.0, 1894.0, 875.0, 454.0, 247.0, 154.0, 88.0, 63.0, 46.0, 25.0, 15.0, 11.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.33740234375, -25.4404296875, -24.54345703125, -23.646484375, -22.74951171875, -21.8525390625, -20.95556640625, -20.05859375, -19.16162109375, -18.2646484375, -17.36767578125, -16.470703125, -15.57373046875, -14.6767578125, -13.77978515625, -12.8828125, -11.98583984375, -11.0888671875, -10.19189453125, -9.294921875, -8.39794921875, -7.5009765625, -6.60400390625, -5.70703125, -4.81005859375, -3.9130859375, -3.01611328125, -2.119140625, -1.22216796875, -0.3251953125, 0.57177734375, 1.46875, 2.36572265625, 3.2626953125, 4.15966796875, 5.056640625, 5.95361328125, 6.8505859375, 7.74755859375, 8.64453125, 9.54150390625, 10.4384765625, 11.33544921875, 12.232421875, 13.12939453125, 14.0263671875, 14.92333984375, 15.8203125, 16.71728515625, 17.6142578125, 18.51123046875, 19.408203125, 20.30517578125, 21.2021484375, 22.09912109375, 22.99609375, 23.89306640625, 24.7900390625, 25.68701171875, 26.583984375, 27.48095703125, 28.3779296875, 29.27490234375, 30.171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 12.0, 8.0, 16.0, 21.0, 29.0, 33.0, 47.0, 58.0, 61.0, 65.0, 63.0, 68.0, 73.0, 74.0, 54.0, 48.0, 57.0, 36.0, 42.0, 29.0, 22.0, 16.0, 9.0, 14.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.4375, -34.452392578125, -33.46728515625, -32.482177734375, -31.4970703125, -30.511962890625, -29.52685546875, -28.541748046875, -27.556640625, -26.571533203125, -25.58642578125, -24.601318359375, -23.6162109375, -22.631103515625, -21.64599609375, -20.660888671875, -19.67578125, -18.690673828125, -17.70556640625, -16.720458984375, -15.7353515625, -14.750244140625, -13.76513671875, -12.780029296875, -11.794921875, -10.809814453125, -9.82470703125, -8.839599609375, -7.8544921875, -6.869384765625, -5.88427734375, -4.899169921875, -3.9140625, -2.928955078125, -1.94384765625, -0.958740234375, 0.0263671875, 1.011474609375, 1.99658203125, 2.981689453125, 3.966796875, 4.951904296875, 5.93701171875, 6.922119140625, 7.9072265625, 8.892333984375, 9.87744140625, 10.862548828125, 11.84765625, 12.832763671875, 13.81787109375, 14.802978515625, 15.7880859375, 16.773193359375, 17.75830078125, 18.743408203125, 19.728515625, 20.713623046875, 21.69873046875, 22.683837890625, 23.6689453125, 24.654052734375, 25.63916015625, 26.624267578125, 27.609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 6.0, 13.0, 15.0, 23.0, 30.0, 40.0, 53.0, 81.0, 136.0, 213.0, 358.0, 669.0, 1444.0, 3950.0, 14411.0, 81926.0, 565462.0, 322687.0, 42815.0, 9000.0, 2742.0, 1070.0, 524.0, 312.0, 182.0, 108.0, 71.0, 54.0, 38.0, 17.0, 24.0, 10.0, 16.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2939453125, -9.001953125, -8.7099609375, -8.41796875, -8.1259765625, -7.833984375, -7.5419921875, -7.25, -6.9580078125, -6.666015625, -6.3740234375, -6.08203125, -5.7900390625, -5.498046875, -5.2060546875, -4.9140625, -4.6220703125, -4.330078125, -4.0380859375, -3.74609375, -3.4541015625, -3.162109375, -2.8701171875, -2.578125, -2.2861328125, -1.994140625, -1.7021484375, -1.41015625, -1.1181640625, -0.826171875, -0.5341796875, -0.2421875, 0.0498046875, 0.341796875, 0.6337890625, 0.92578125, 1.2177734375, 1.509765625, 1.8017578125, 2.09375, 2.3857421875, 2.677734375, 2.9697265625, 3.26171875, 3.5537109375, 3.845703125, 4.1376953125, 4.4296875, 4.7216796875, 5.013671875, 5.3056640625, 5.59765625, 5.8896484375, 6.181640625, 6.4736328125, 6.765625, 7.0576171875, 7.349609375, 7.6416015625, 7.93359375, 8.2255859375, 8.517578125, 8.8095703125, 9.1015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 11.0, 18.0, 21.0, 28.0, 40.0, 41.0, 69.0, 80.0, 108.0, 116.0, 104.0, 75.0, 60.0, 53.0, 30.0, 27.0, 15.0, 15.0, 16.0, 10.0, 10.0, 4.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00179290771484375, -0.0017375648021697998, -0.0016822218894958496, -0.0016268789768218994, -0.0015715360641479492, -0.001516193151473999, -0.0014608502388000488, -0.0014055073261260986, -0.0013501644134521484, -0.0012948215007781982, -0.001239478588104248, -0.0011841356754302979, -0.0011287927627563477, -0.0010734498500823975, -0.0010181069374084473, -0.0009627640247344971, -0.0009074211120605469, -0.0008520781993865967, -0.0007967352867126465, -0.0007413923740386963, -0.0006860494613647461, -0.0006307065486907959, -0.0005753636360168457, -0.0005200207233428955, -0.0004646778106689453, -0.0004093348979949951, -0.0003539919853210449, -0.0002986490726470947, -0.00024330615997314453, -0.00018796324729919434, -0.00013262033462524414, -7.727742195129395e-05, -2.193450927734375e-05, 3.3408403396606445e-05, 8.875131607055664e-05, 0.00014409422874450684, 0.00019943714141845703, 0.0002547800540924072, 0.0003101229667663574, 0.0003654658794403076, 0.0004208087921142578, 0.000476151704788208, 0.0005314946174621582, 0.0005868375301361084, 0.0006421804428100586, 0.0006975233554840088, 0.000752866268157959, 0.0008082091808319092, 0.0008635520935058594, 0.0009188950061798096, 0.0009742379188537598, 0.00102958083152771, 0.0010849237442016602, 0.0011402666568756104, 0.0011956095695495605, 0.0012509524822235107, 0.001306295394897461, 0.0013616383075714111, 0.0014169812202453613, 0.0014723241329193115, 0.0015276670455932617, 0.001583009958267212, 0.0016383528709411621, 0.0016936957836151123, 0.0017490386962890625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 10.0, 14.0, 25.0, 36.0, 49.0, 82.0, 124.0, 227.0, 455.0, 976.0, 2626.0, 11552.0, 112069.0, 759626.0, 142230.0, 13330.0, 2915.0, 1120.0, 459.0, 237.0, 129.0, 98.0, 42.0, 32.0, 23.0, 13.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.3973388671875, -10.005615234375, -9.6138916015625, -9.22216796875, -8.8304443359375, -8.438720703125, -8.0469970703125, -7.6552734375, -7.2635498046875, -6.871826171875, -6.4801025390625, -6.08837890625, -5.6966552734375, -5.304931640625, -4.9132080078125, -4.521484375, -4.1297607421875, -3.738037109375, -3.3463134765625, -2.95458984375, -2.5628662109375, -2.171142578125, -1.7794189453125, -1.3876953125, -0.9959716796875, -0.604248046875, -0.2125244140625, 0.17919921875, 0.5709228515625, 0.962646484375, 1.3543701171875, 1.74609375, 2.1378173828125, 2.529541015625, 2.9212646484375, 3.31298828125, 3.7047119140625, 4.096435546875, 4.4881591796875, 4.8798828125, 5.2716064453125, 5.663330078125, 6.0550537109375, 6.44677734375, 6.8385009765625, 7.230224609375, 7.6219482421875, 8.013671875, 8.4053955078125, 8.797119140625, 9.1888427734375, 9.58056640625, 9.9722900390625, 10.364013671875, 10.7557373046875, 11.1474609375, 11.5391845703125, 11.930908203125, 12.3226318359375, 12.71435546875, 13.1060791015625, 13.497802734375, 13.8895263671875, 14.28125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 14.0, 9.0, 9.0, 16.0, 25.0, 31.0, 32.0, 50.0, 59.0, 61.0, 63.0, 92.0, 88.0, 90.0, 71.0, 63.0, 31.0, 39.0, 31.0, 22.0, 19.0, 14.0, 13.0, 4.0, 7.0, 4.0, 4.0, 6.0, 1.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.8497314453125, -6.613525390625, -6.3773193359375, -6.14111328125, -5.9049072265625, -5.668701171875, -5.4324951171875, -5.1962890625, -4.9600830078125, -4.723876953125, -4.4876708984375, -4.25146484375, -4.0152587890625, -3.779052734375, -3.5428466796875, -3.306640625, -3.0704345703125, -2.834228515625, -2.5980224609375, -2.36181640625, -2.1256103515625, -1.889404296875, -1.6531982421875, -1.4169921875, -1.1807861328125, -0.944580078125, -0.7083740234375, -0.47216796875, -0.2359619140625, 0.000244140625, 0.2364501953125, 0.47265625, 0.7088623046875, 0.945068359375, 1.1812744140625, 1.41748046875, 1.6536865234375, 1.889892578125, 2.1260986328125, 2.3623046875, 2.5985107421875, 2.834716796875, 3.0709228515625, 3.30712890625, 3.5433349609375, 3.779541015625, 4.0157470703125, 4.251953125, 4.4881591796875, 4.724365234375, 4.9605712890625, 5.19677734375, 5.4329833984375, 5.669189453125, 5.9053955078125, 6.1416015625, 6.3778076171875, 6.614013671875, 6.8502197265625, 7.08642578125, 7.3226318359375, 7.558837890625, 7.7950439453125, 8.03125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 20.0, 30.0, 58.0, 105.0, 104.0, 144.0, 134.0, 137.0, 94.0, 60.0, 39.0, 33.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-196.7230224609375, -192.2137908935547, -187.70455932617188, -183.19534301757812, -178.6861114501953, -174.1768798828125, -169.6676483154297, -165.15841674804688, -160.64920043945312, -156.1399688720703, -151.6307373046875, -147.12152099609375, -142.61228942871094, -138.10305786132812, -133.5938262939453, -129.0845947265625, -124.57537078857422, -120.0661392211914, -115.55691528320312, -111.04768371582031, -106.53845977783203, -102.02922821044922, -97.52000427246094, -93.01077270507812, -88.50154113769531, -83.9923095703125, -79.48308563232422, -74.9738540649414, -70.46463012695312, -65.95539855957031, -61.446170806884766, -56.93694305419922, -52.42771911621094, -47.91849136352539, -43.409263610839844, -38.90003204345703, -34.39080810546875, -29.88157844543457, -25.37234878540039, -20.863121032714844, -16.353893280029297, -11.84466552734375, -7.335436820983887, -2.8262081146240234, 1.6830196380615234, 6.19224739074707, 10.70147705078125, 15.210704803466797, 19.719932556152344, 24.22916030883789, 28.738388061523438, 33.24761962890625, 37.75684356689453, 42.266075134277344, 46.77530288696289, 51.28453063964844, 55.793758392333984, 60.30298614501953, 64.81221771240234, 69.32144165039062, 73.83067321777344, 78.33989715576172, 82.84912872314453, 87.35835266113281, 91.86758422851562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0, 10.0, 4.0, 13.0, 14.0, 12.0, 37.0, 24.0, 29.0, 31.0, 30.0, 38.0, 35.0, 47.0, 58.0, 66.0, 45.0, 51.0, 51.0, 47.0, 44.0, 44.0, 43.0, 42.0, 28.0, 29.0, 20.0, 21.0, 14.0, 16.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.01398468017578, -86.9566879272461, -83.89939880371094, -80.84210205078125, -77.7848129272461, -74.7275161743164, -71.67022705078125, -68.61293029785156, -65.5556411743164, -62.498348236083984, -59.44105529785156, -56.38376235961914, -53.32646942138672, -50.2691764831543, -47.211883544921875, -44.15458679199219, -41.097293853759766, -38.040000915527344, -34.98270797729492, -31.9254150390625, -28.868122100830078, -25.810829162597656, -22.7535343170166, -19.69624137878418, -16.638948440551758, -13.581655502319336, -10.524362564086914, -7.467068672180176, -4.409775733947754, -1.352482795715332, 1.7048110961914062, 4.762104034423828, 7.81939697265625, 10.876689910888672, 13.933982849121094, 16.991275787353516, 20.048568725585938, 23.10586166381836, 26.163156509399414, 29.220449447631836, 32.277740478515625, 35.33503341674805, 38.39232635498047, 41.44961929321289, 44.50691223144531, 47.564205169677734, 50.621498107910156, 53.678794860839844, 56.736087799072266, 59.79338073730469, 62.85067367553711, 65.90796661376953, 68.96526336669922, 72.02255249023438, 75.07984924316406, 78.13713836669922, 81.1944351196289, 84.2517318725586, 87.30902099609375, 90.36631774902344, 93.4236068725586, 96.48090362548828, 99.53819274902344, 102.59548950195312, 105.65277862548828]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 5.0, 11.0, 7.0, 25.0, 25.0, 38.0, 51.0, 66.0, 91.0, 119.0, 176.0, 242.0, 422.0, 721.0, 1152.0, 2021.0, 3906.0, 8345.0, 20223.0, 66590.0, 3746149.0, 271533.0, 43230.0, 15064.0, 6501.0, 3149.0, 1663.0, 991.0, 607.0, 363.0, 232.0, 183.0, 105.0, 74.0, 60.0, 43.0, 26.0, 19.0, 16.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.078125, -12.691650390625, -12.30517578125, -11.918701171875, -11.5322265625, -11.145751953125, -10.75927734375, -10.372802734375, -9.986328125, -9.599853515625, -9.21337890625, -8.826904296875, -8.4404296875, -8.053955078125, -7.66748046875, -7.281005859375, -6.89453125, -6.508056640625, -6.12158203125, -5.735107421875, -5.3486328125, -4.962158203125, -4.57568359375, -4.189208984375, -3.802734375, -3.416259765625, -3.02978515625, -2.643310546875, -2.2568359375, -1.870361328125, -1.48388671875, -1.097412109375, -0.7109375, -0.324462890625, 0.06201171875, 0.448486328125, 0.8349609375, 1.221435546875, 1.60791015625, 1.994384765625, 2.380859375, 2.767333984375, 3.15380859375, 3.540283203125, 3.9267578125, 4.313232421875, 4.69970703125, 5.086181640625, 5.47265625, 5.859130859375, 6.24560546875, 6.632080078125, 7.0185546875, 7.405029296875, 7.79150390625, 8.177978515625, 8.564453125, 8.950927734375, 9.33740234375, 9.723876953125, 10.1103515625, 10.496826171875, 10.88330078125, 11.269775390625, 11.65625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 10.0, 15.0, 15.0, 21.0, 26.0, 36.0, 35.0, 50.0, 48.0, 58.0, 70.0, 67.0, 66.0, 59.0, 60.0, 58.0, 53.0, 50.0, 37.0, 37.0, 19.0, 24.0, 15.0, 6.0, 16.0, 9.0, 11.0, 7.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.48046875, -7.2862548828125, -7.092041015625, -6.8978271484375, -6.70361328125, -6.5093994140625, -6.315185546875, -6.1209716796875, -5.9267578125, -5.7325439453125, -5.538330078125, -5.3441162109375, -5.14990234375, -4.9556884765625, -4.761474609375, -4.5672607421875, -4.373046875, -4.1788330078125, -3.984619140625, -3.7904052734375, -3.59619140625, -3.4019775390625, -3.207763671875, -3.0135498046875, -2.8193359375, -2.6251220703125, -2.430908203125, -2.2366943359375, -2.04248046875, -1.8482666015625, -1.654052734375, -1.4598388671875, -1.265625, -1.0714111328125, -0.877197265625, -0.6829833984375, -0.48876953125, -0.2945556640625, -0.100341796875, 0.0938720703125, 0.2880859375, 0.4822998046875, 0.676513671875, 0.8707275390625, 1.06494140625, 1.2591552734375, 1.453369140625, 1.6475830078125, 1.841796875, 2.0360107421875, 2.230224609375, 2.4244384765625, 2.61865234375, 2.8128662109375, 3.007080078125, 3.2012939453125, 3.3955078125, 3.5897216796875, 3.783935546875, 3.9781494140625, 4.17236328125, 4.3665771484375, 4.560791015625, 4.7550048828125, 4.94921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 12.0, 19.0, 45.0, 81.0, 142.0, 280.0, 557.0, 1094.0, 2286.0, 5497.0, 16683.0, 74912.0, 3689133.0, 345719.0, 39747.0, 10715.0, 3940.0, 1744.0, 802.0, 421.0, 205.0, 95.0, 61.0, 38.0, 26.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.157958984375, -13.68310546875, -13.208251953125, -12.7333984375, -12.258544921875, -11.78369140625, -11.308837890625, -10.833984375, -10.359130859375, -9.88427734375, -9.409423828125, -8.9345703125, -8.459716796875, -7.98486328125, -7.510009765625, -7.03515625, -6.560302734375, -6.08544921875, -5.610595703125, -5.1357421875, -4.660888671875, -4.18603515625, -3.711181640625, -3.236328125, -2.761474609375, -2.28662109375, -1.811767578125, -1.3369140625, -0.862060546875, -0.38720703125, 0.087646484375, 0.5625, 1.037353515625, 1.51220703125, 1.987060546875, 2.4619140625, 2.936767578125, 3.41162109375, 3.886474609375, 4.361328125, 4.836181640625, 5.31103515625, 5.785888671875, 6.2607421875, 6.735595703125, 7.21044921875, 7.685302734375, 8.16015625, 8.635009765625, 9.10986328125, 9.584716796875, 10.0595703125, 10.534423828125, 11.00927734375, 11.484130859375, 11.958984375, 12.433837890625, 12.90869140625, 13.383544921875, 13.8583984375, 14.333251953125, 14.80810546875, 15.282958984375, 15.7578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 2.0, 6.0, 8.0, 7.0, 22.0, 29.0, 49.0, 69.0, 89.0, 206.0, 2627.0, 542.0, 149.0, 84.0, 55.0, 33.0, 27.0, 13.0, 10.0, 11.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.59765625, -3.502655029296875, -3.40765380859375, -3.312652587890625, -3.2176513671875, -3.122650146484375, -3.02764892578125, -2.932647705078125, -2.837646484375, -2.742645263671875, -2.64764404296875, -2.552642822265625, -2.4576416015625, -2.362640380859375, -2.26763916015625, -2.172637939453125, -2.07763671875, -1.982635498046875, -1.88763427734375, -1.792633056640625, -1.6976318359375, -1.602630615234375, -1.50762939453125, -1.412628173828125, -1.317626953125, -1.222625732421875, -1.12762451171875, -1.032623291015625, -0.9376220703125, -0.842620849609375, -0.74761962890625, -0.652618408203125, -0.5576171875, -0.462615966796875, -0.36761474609375, -0.272613525390625, -0.1776123046875, -0.082611083984375, 0.01239013671875, 0.107391357421875, 0.202392578125, 0.297393798828125, 0.39239501953125, 0.487396240234375, 0.5823974609375, 0.677398681640625, 0.77239990234375, 0.867401123046875, 0.96240234375, 1.057403564453125, 1.15240478515625, 1.247406005859375, 1.3424072265625, 1.437408447265625, 1.53240966796875, 1.627410888671875, 1.722412109375, 1.817413330078125, 1.91241455078125, 2.007415771484375, 2.1024169921875, 2.197418212890625, 2.29241943359375, 2.387420654296875, 2.482421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 23.0, 39.0, 66.0, 86.0, 132.0, 139.0, 142.0, 120.0, 81.0, 65.0, 38.0, 20.0, 9.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.356361389160156, -21.773834228515625, -21.191307067871094, -20.608779907226562, -20.02625274658203, -19.4437255859375, -18.86119842529297, -18.278671264648438, -17.696144104003906, -17.113616943359375, -16.531089782714844, -15.948562622070312, -15.366035461425781, -14.78350830078125, -14.200980186462402, -13.618453025817871, -13.035924911499023, -12.453397750854492, -11.870870590209961, -11.28834342956543, -10.705816268920898, -10.123289108276367, -9.54076099395752, -8.958233833312988, -8.375706672668457, -7.793179512023926, -7.2106523513793945, -6.628124713897705, -6.045597553253174, -5.463070392608643, -4.880542755126953, -4.298015594482422, -3.715486526489258, -3.1329593658447266, -2.550431966781616, -1.9679046869277954, -1.3853774070739746, -0.8028502464294434, -0.220322847366333, 0.36220455169677734, 0.9447317123413086, 1.5272589921951294, 2.10978627204895, 2.6923136711120605, 3.274840831756592, 3.857367992401123, 4.4398956298828125, 5.022422790527344, 5.604949951171875, 6.187477111816406, 6.7700042724609375, 7.352531909942627, 7.935059070587158, 8.517585754394531, 9.100113868713379, 9.68264102935791, 10.265168190002441, 10.847695350646973, 11.430222511291504, 12.012749671936035, 12.595277786254883, 13.177804946899414, 13.760332107543945, 14.342859268188477, 14.925386428833008]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 2.0, 6.0, 5.0, 4.0, 7.0, 8.0, 6.0, 10.0, 19.0, 13.0, 16.0, 23.0, 21.0, 37.0, 28.0, 34.0, 32.0, 31.0, 38.0, 38.0, 42.0, 43.0, 40.0, 35.0, 37.0, 38.0, 38.0, 42.0, 40.0, 34.0, 28.0, 24.0, 35.0, 34.0, 12.0, 19.0, 18.0, 17.0, 9.0, 9.0, 6.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.941380500793457, -7.705964088439941, -7.470547676086426, -7.23513126373291, -6.9997148513793945, -6.764298439025879, -6.528882026672363, -6.293465614318848, -6.058049201965332, -5.822632789611816, -5.587216377258301, -5.351799964904785, -5.1163835525512695, -4.880967140197754, -4.645550727844238, -4.410134315490723, -4.174718379974365, -3.9393019676208496, -3.703885555267334, -3.4684691429138184, -3.2330527305603027, -2.997636318206787, -2.7622201442718506, -2.526803731918335, -2.2913873195648193, -2.0559709072113037, -1.820554494857788, -1.585138201713562, -1.3497217893600464, -1.1143053770065308, -0.8788890838623047, -0.6434726715087891, -0.40805578231811523, -0.172639399766922, 0.06277698278427124, 0.2981933355331421, 0.5336097478866577, 0.7690261602401733, 1.0044424533843994, 1.239858865737915, 1.4752752780914307, 1.7106916904449463, 1.946108102798462, 2.1815242767333984, 2.416940689086914, 2.6523571014404297, 2.8877735137939453, 3.123189926147461, 3.3586063385009766, 3.594022750854492, 3.829439163208008, 4.064855575561523, 4.300271987915039, 4.535688400268555, 4.77110481262207, 5.006521224975586, 5.241937637329102, 5.477354049682617, 5.712770462036133, 5.948186874389648, 6.183603286743164, 6.41901969909668, 6.654436111450195, 6.889852523803711, 7.125268459320068]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 12.0, 26.0, 18.0, 37.0, 52.0, 99.0, 149.0, 340.0, 639.0, 1326.0, 3334.0, 8982.0, 26626.0, 81042.0, 224408.0, 375750.0, 211532.0, 75483.0, 24591.0, 8310.0, 3164.0, 1239.0, 610.0, 297.0, 185.0, 98.0, 65.0, 34.0, 32.0, 19.0, 12.0, 12.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.470703125, -7.15234375, -6.833984375, -6.515625, -6.197265625, -5.87890625, -5.560546875, -5.2421875, -4.923828125, -4.60546875, -4.287109375, -3.96875, -3.650390625, -3.33203125, -3.013671875, -2.6953125, -2.376953125, -2.05859375, -1.740234375, -1.421875, -1.103515625, -0.78515625, -0.466796875, -0.1484375, 0.169921875, 0.48828125, 0.806640625, 1.125, 1.443359375, 1.76171875, 2.080078125, 2.3984375, 2.716796875, 3.03515625, 3.353515625, 3.671875, 3.990234375, 4.30859375, 4.626953125, 4.9453125, 5.263671875, 5.58203125, 5.900390625, 6.21875, 6.537109375, 6.85546875, 7.173828125, 7.4921875, 7.810546875, 8.12890625, 8.447265625, 8.765625, 9.083984375, 9.40234375, 9.720703125, 10.0390625, 10.357421875, 10.67578125, 10.994140625, 11.3125, 11.630859375, 11.94921875, 12.267578125, 12.5859375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 12.0, 7.0, 18.0, 18.0, 21.0, 37.0, 37.0, 33.0, 45.0, 41.0, 55.0, 62.0, 70.0, 67.0, 70.0, 51.0, 47.0, 59.0, 44.0, 34.0, 33.0, 22.0, 19.0, 26.0, 19.0, 7.0, 7.0, 10.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-8.0, -7.80706787109375, -7.6141357421875, -7.42120361328125, -7.228271484375, -7.03533935546875, -6.8424072265625, -6.64947509765625, -6.45654296875, -6.26361083984375, -6.0706787109375, -5.87774658203125, -5.684814453125, -5.49188232421875, -5.2989501953125, -5.10601806640625, -4.9130859375, -4.72015380859375, -4.5272216796875, -4.33428955078125, -4.141357421875, -3.94842529296875, -3.7554931640625, -3.56256103515625, -3.36962890625, -3.17669677734375, -2.9837646484375, -2.79083251953125, -2.597900390625, -2.40496826171875, -2.2120361328125, -2.01910400390625, -1.826171875, -1.63323974609375, -1.4403076171875, -1.24737548828125, -1.054443359375, -0.86151123046875, -0.6685791015625, -0.47564697265625, -0.28271484375, -0.08978271484375, 0.1031494140625, 0.29608154296875, 0.489013671875, 0.68194580078125, 0.8748779296875, 1.06781005859375, 1.2607421875, 1.45367431640625, 1.6466064453125, 1.83953857421875, 2.032470703125, 2.22540283203125, 2.4183349609375, 2.61126708984375, 2.80419921875, 2.99713134765625, 3.1900634765625, 3.38299560546875, 3.575927734375, 3.76885986328125, 3.9617919921875, 4.15472412109375, 4.34765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 4.0, 19.0, 13.0, 20.0, 30.0, 61.0, 73.0, 147.0, 262.0, 498.0, 882.0, 1928.0, 7959.0, 165320.0, 830248.0, 34227.0, 3961.0, 1378.0, 631.0, 382.0, 212.0, 94.0, 67.0, 41.0, 26.0, 10.0, 13.0, 12.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.75, -32.70458984375, -31.6591796875, -30.61376953125, -29.568359375, -28.52294921875, -27.4775390625, -26.43212890625, -25.38671875, -24.34130859375, -23.2958984375, -22.25048828125, -21.205078125, -20.15966796875, -19.1142578125, -18.06884765625, -17.0234375, -15.97802734375, -14.9326171875, -13.88720703125, -12.841796875, -11.79638671875, -10.7509765625, -9.70556640625, -8.66015625, -7.61474609375, -6.5693359375, -5.52392578125, -4.478515625, -3.43310546875, -2.3876953125, -1.34228515625, -0.296875, 0.74853515625, 1.7939453125, 2.83935546875, 3.884765625, 4.93017578125, 5.9755859375, 7.02099609375, 8.06640625, 9.11181640625, 10.1572265625, 11.20263671875, 12.248046875, 13.29345703125, 14.3388671875, 15.38427734375, 16.4296875, 17.47509765625, 18.5205078125, 19.56591796875, 20.611328125, 21.65673828125, 22.7021484375, 23.74755859375, 24.79296875, 25.83837890625, 26.8837890625, 27.92919921875, 28.974609375, 30.02001953125, 31.0654296875, 32.11083984375, 33.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 7.0, 15.0, 18.0, 28.0, 30.0, 50.0, 65.0, 61.0, 85.0, 100.0, 109.0, 103.0, 77.0, 68.0, 51.0, 31.0, 28.0, 27.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.34375, -58.6865234375, -57.029296875, -55.3720703125, -53.71484375, -52.0576171875, -50.400390625, -48.7431640625, -47.0859375, -45.4287109375, -43.771484375, -42.1142578125, -40.45703125, -38.7998046875, -37.142578125, -35.4853515625, -33.828125, -32.1708984375, -30.513671875, -28.8564453125, -27.19921875, -25.5419921875, -23.884765625, -22.2275390625, -20.5703125, -18.9130859375, -17.255859375, -15.5986328125, -13.94140625, -12.2841796875, -10.626953125, -8.9697265625, -7.3125, -5.6552734375, -3.998046875, -2.3408203125, -0.68359375, 0.9736328125, 2.630859375, 4.2880859375, 5.9453125, 7.6025390625, 9.259765625, 10.9169921875, 12.57421875, 14.2314453125, 15.888671875, 17.5458984375, 19.203125, 20.8603515625, 22.517578125, 24.1748046875, 25.83203125, 27.4892578125, 29.146484375, 30.8037109375, 32.4609375, 34.1181640625, 35.775390625, 37.4326171875, 39.08984375, 40.7470703125, 42.404296875, 44.0615234375, 45.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 11.0, 6.0, 7.0, 11.0, 13.0, 28.0, 35.0, 45.0, 59.0, 100.0, 177.0, 321.0, 637.0, 1883.0, 15324.0, 698892.0, 319424.0, 8868.0, 1491.0, 516.0, 247.0, 157.0, 95.0, 55.0, 38.0, 29.0, 19.0, 14.0, 9.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-19.84375, -19.275146484375, -18.70654296875, -18.137939453125, -17.5693359375, -17.000732421875, -16.43212890625, -15.863525390625, -15.294921875, -14.726318359375, -14.15771484375, -13.589111328125, -13.0205078125, -12.451904296875, -11.88330078125, -11.314697265625, -10.74609375, -10.177490234375, -9.60888671875, -9.040283203125, -8.4716796875, -7.903076171875, -7.33447265625, -6.765869140625, -6.197265625, -5.628662109375, -5.06005859375, -4.491455078125, -3.9228515625, -3.354248046875, -2.78564453125, -2.217041015625, -1.6484375, -1.079833984375, -0.51123046875, 0.057373046875, 0.6259765625, 1.194580078125, 1.76318359375, 2.331787109375, 2.900390625, 3.468994140625, 4.03759765625, 4.606201171875, 5.1748046875, 5.743408203125, 6.31201171875, 6.880615234375, 7.44921875, 8.017822265625, 8.58642578125, 9.155029296875, 9.7236328125, 10.292236328125, 10.86083984375, 11.429443359375, 11.998046875, 12.566650390625, 13.13525390625, 13.703857421875, 14.2724609375, 14.841064453125, 15.40966796875, 15.978271484375, 16.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 5.0, 5.0, 11.0, 16.0, 11.0, 22.0, 31.0, 31.0, 41.0, 49.0, 63.0, 82.0, 115.0, 100.0, 89.0, 62.0, 43.0, 45.0, 33.0, 33.0, 22.0, 15.0, 13.0, 13.0, 11.0, 8.0, 10.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011892318725585938, -0.0011435449123382568, -0.00109785795211792, -0.001052170991897583, -0.001006484031677246, -0.0009607970714569092, -0.0009151101112365723, -0.0008694231510162354, -0.0008237361907958984, -0.0007780492305755615, -0.0007323622703552246, -0.0006866753101348877, -0.0006409883499145508, -0.0005953013896942139, -0.000549614429473877, -0.00050392746925354, -0.0004582405090332031, -0.0004125535488128662, -0.0003668665885925293, -0.0003211796283721924, -0.00027549266815185547, -0.00022980570793151855, -0.00018411874771118164, -0.00013843178749084473, -9.274482727050781e-05, -4.70578670501709e-05, -1.3709068298339844e-06, 4.431605339050293e-05, 9.000301361083984e-05, 0.00013568997383117676, 0.00018137693405151367, 0.00022706389427185059, 0.0002727508544921875, 0.0003184378147125244, 0.00036412477493286133, 0.00040981173515319824, 0.00045549869537353516, 0.0005011856555938721, 0.000546872615814209, 0.0005925595760345459, 0.0006382465362548828, 0.0006839334964752197, 0.0007296204566955566, 0.0007753074169158936, 0.0008209943771362305, 0.0008666813373565674, 0.0009123682975769043, 0.0009580552577972412, 0.0010037422180175781, 0.001049429178237915, 0.001095116138458252, 0.0011408030986785889, 0.0011864900588989258, 0.0012321770191192627, 0.0012778639793395996, 0.0013235509395599365, 0.0013692378997802734, 0.0014149248600006104, 0.0014606118202209473, 0.0015062987804412842, 0.001551985740661621, 0.001597672700881958, 0.001643359661102295, 0.0016890466213226318, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 14.0, 13.0, 15.0, 23.0, 16.0, 43.0, 68.0, 89.0, 154.0, 224.0, 461.0, 876.0, 2029.0, 6517.0, 38160.0, 515571.0, 440702.0, 33778.0, 5899.0, 1892.0, 862.0, 411.0, 259.0, 137.0, 100.0, 56.0, 38.0, 26.0, 32.0, 17.0, 8.0, 9.0, 7.0, 7.0, 8.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-13.359375, -12.998046875, -12.63671875, -12.275390625, -11.9140625, -11.552734375, -11.19140625, -10.830078125, -10.46875, -10.107421875, -9.74609375, -9.384765625, -9.0234375, -8.662109375, -8.30078125, -7.939453125, -7.578125, -7.216796875, -6.85546875, -6.494140625, -6.1328125, -5.771484375, -5.41015625, -5.048828125, -4.6875, -4.326171875, -3.96484375, -3.603515625, -3.2421875, -2.880859375, -2.51953125, -2.158203125, -1.796875, -1.435546875, -1.07421875, -0.712890625, -0.3515625, 0.009765625, 0.37109375, 0.732421875, 1.09375, 1.455078125, 1.81640625, 2.177734375, 2.5390625, 2.900390625, 3.26171875, 3.623046875, 3.984375, 4.345703125, 4.70703125, 5.068359375, 5.4296875, 5.791015625, 6.15234375, 6.513671875, 6.875, 7.236328125, 7.59765625, 7.958984375, 8.3203125, 8.681640625, 9.04296875, 9.404296875, 9.765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 1.0, 7.0, 18.0, 17.0, 16.0, 21.0, 36.0, 63.0, 60.0, 100.0, 110.0, 103.0, 105.0, 92.0, 62.0, 42.0, 31.0, 26.0, 22.0, 10.0, 11.0, 10.0, 4.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.3856201171875, -11.044677734375, -10.7037353515625, -10.36279296875, -10.0218505859375, -9.680908203125, -9.3399658203125, -8.9990234375, -8.6580810546875, -8.317138671875, -7.9761962890625, -7.63525390625, -7.2943115234375, -6.953369140625, -6.6124267578125, -6.271484375, -5.9305419921875, -5.589599609375, -5.2486572265625, -4.90771484375, -4.5667724609375, -4.225830078125, -3.8848876953125, -3.5439453125, -3.2030029296875, -2.862060546875, -2.5211181640625, -2.18017578125, -1.8392333984375, -1.498291015625, -1.1573486328125, -0.81640625, -0.4754638671875, -0.134521484375, 0.2064208984375, 0.54736328125, 0.8883056640625, 1.229248046875, 1.5701904296875, 1.9111328125, 2.2520751953125, 2.593017578125, 2.9339599609375, 3.27490234375, 3.6158447265625, 3.956787109375, 4.2977294921875, 4.638671875, 4.9796142578125, 5.320556640625, 5.6614990234375, 6.00244140625, 6.3433837890625, 6.684326171875, 7.0252685546875, 7.3662109375, 7.7071533203125, 8.048095703125, 8.3890380859375, 8.72998046875, 9.0709228515625, 9.411865234375, 9.7528076171875, 10.09375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 53.0, 310.0, 431.0, 151.0, 27.0, 11.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-609.361083984375, -596.2040405273438, -583.0469970703125, -569.889892578125, -556.7328491210938, -543.5758056640625, -530.4187622070312, -517.2616577148438, -504.1046142578125, -490.94757080078125, -477.7904968261719, -464.6334533691406, -451.47637939453125, -438.3193359375, -425.1622619628906, -412.0052185058594, -398.84814453125, -385.69110107421875, -372.5340270996094, -359.3769836425781, -346.21990966796875, -333.0628662109375, -319.9057922363281, -306.7487487792969, -293.5917053222656, -280.4346618652344, -267.277587890625, -254.1205291748047, -240.96347045898438, -227.80642700195312, -214.64935302734375, -201.4923095703125, -188.33523559570312, -175.1781768798828, -162.0211181640625, -148.8640594482422, -135.70700073242188, -122.5499496459961, -109.39289093017578, -96.23583221435547, -83.07877349853516, -69.92171478271484, -56.76465606689453, -43.607601165771484, -30.450542449951172, -17.293487548828125, -4.1364288330078125, 9.0206298828125, 22.177688598632812, 35.334747314453125, 48.49180603027344, 61.648860931396484, 74.80592346191406, 87.96297454833984, 101.12003326416016, 114.27709197998047, 127.43415069580078, 140.59120178222656, 153.74826049804688, 166.9053192138672, 180.0623779296875, 193.2194366455078, 206.37649536132812, 219.53355407714844, 232.69061279296875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 11.0, 14.0, 17.0, 14.0, 22.0, 23.0, 30.0, 22.0, 29.0, 45.0, 46.0, 43.0, 46.0, 53.0, 49.0, 43.0, 44.0, 50.0, 46.0, 51.0, 50.0, 43.0, 35.0, 23.0, 19.0, 36.0, 18.0, 13.0, 14.0, 9.0, 10.0, 2.0, 6.0, 7.0, 1.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.31135559082031, -90.91300201416016, -87.51464080810547, -84.11628723144531, -80.71792602539062, -77.31957244873047, -73.92121887207031, -70.52285766601562, -67.12449645996094, -63.726139068603516, -60.327781677246094, -56.92942810058594, -53.53106689453125, -50.132713317871094, -46.73435592651367, -43.33599853515625, -39.937644958496094, -36.53928756713867, -33.14093017578125, -29.74257469177246, -26.34421730041504, -22.945859909057617, -19.547504425048828, -16.149147033691406, -12.750789642333984, -9.352432250976562, -5.954075813293457, -2.5557193756103516, 0.8426380157470703, 4.240995407104492, 7.639350891113281, 11.037708282470703, 14.436058044433594, 17.834415435791016, 21.232772827148438, 24.631128311157227, 28.02948570251465, 31.42784309387207, 34.82619857788086, 38.22455596923828, 41.6229133605957, 45.021270751953125, 48.41962814331055, 51.81798553466797, 55.216339111328125, 58.61470031738281, 62.01305389404297, 65.41140747070312, 68.80976867675781, 72.20812225341797, 75.60648345947266, 79.00483703613281, 82.4031982421875, 85.80155181884766, 89.19990539550781, 92.5982666015625, 95.99662780761719, 99.39498138427734, 102.79334259033203, 106.19169616699219, 109.59005737304688, 112.98841094970703, 116.38676452636719, 119.78512573242188, 123.18347930908203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 17.0, 28.0, 51.0, 57.0, 100.0, 149.0, 292.0, 527.0, 1095.0, 2422.0, 5955.0, 18319.0, 81078.0, 3380544.0, 620771.0, 58975.0, 14682.0, 4998.0, 2109.0, 967.0, 480.0, 284.0, 154.0, 89.0, 58.0, 27.0, 21.0, 8.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.1624755859375, -12.762451171875, -12.3624267578125, -11.96240234375, -11.5623779296875, -11.162353515625, -10.7623291015625, -10.3623046875, -9.9622802734375, -9.562255859375, -9.1622314453125, -8.76220703125, -8.3621826171875, -7.962158203125, -7.5621337890625, -7.162109375, -6.7620849609375, -6.362060546875, -5.9620361328125, -5.56201171875, -5.1619873046875, -4.761962890625, -4.3619384765625, -3.9619140625, -3.5618896484375, -3.161865234375, -2.7618408203125, -2.36181640625, -1.9617919921875, -1.561767578125, -1.1617431640625, -0.76171875, -0.3616943359375, 0.038330078125, 0.4383544921875, 0.83837890625, 1.2384033203125, 1.638427734375, 2.0384521484375, 2.4384765625, 2.8385009765625, 3.238525390625, 3.6385498046875, 4.03857421875, 4.4385986328125, 4.838623046875, 5.2386474609375, 5.638671875, 6.0386962890625, 6.438720703125, 6.8387451171875, 7.23876953125, 7.6387939453125, 8.038818359375, 8.4388427734375, 8.8388671875, 9.2388916015625, 9.638916015625, 10.0389404296875, 10.43896484375, 10.8389892578125, 11.239013671875, 11.6390380859375, 12.0390625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 8.0, 3.0, 7.0, 10.0, 9.0, 18.0, 29.0, 29.0, 33.0, 39.0, 38.0, 47.0, 61.0, 64.0, 71.0, 73.0, 47.0, 70.0, 49.0, 59.0, 42.0, 36.0, 37.0, 27.0, 20.0, 16.0, 16.0, 11.0, 3.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.46575927734375, -6.2674560546875, -6.06915283203125, -5.870849609375, -5.67254638671875, -5.4742431640625, -5.27593994140625, -5.07763671875, -4.87933349609375, -4.6810302734375, -4.48272705078125, -4.284423828125, -4.08612060546875, -3.8878173828125, -3.68951416015625, -3.4912109375, -3.29290771484375, -3.0946044921875, -2.89630126953125, -2.697998046875, -2.49969482421875, -2.3013916015625, -2.10308837890625, -1.90478515625, -1.70648193359375, -1.5081787109375, -1.30987548828125, -1.111572265625, -0.91326904296875, -0.7149658203125, -0.51666259765625, -0.318359375, -0.12005615234375, 0.0782470703125, 0.27655029296875, 0.474853515625, 0.67315673828125, 0.8714599609375, 1.06976318359375, 1.26806640625, 1.46636962890625, 1.6646728515625, 1.86297607421875, 2.061279296875, 2.25958251953125, 2.4578857421875, 2.65618896484375, 2.8544921875, 3.05279541015625, 3.2510986328125, 3.44940185546875, 3.647705078125, 3.84600830078125, 4.0443115234375, 4.24261474609375, 4.44091796875, 4.63922119140625, 4.8375244140625, 5.03582763671875, 5.234130859375, 5.43243408203125, 5.6307373046875, 5.82904052734375, 6.02734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 9.0, 9.0, 7.0, 17.0, 34.0, 32.0, 47.0, 66.0, 81.0, 119.0, 197.0, 330.0, 570.0, 1018.0, 2047.0, 4877.0, 13711.0, 49922.0, 330536.0, 3541395.0, 194328.0, 36403.0, 10718.0, 3934.0, 1724.0, 833.0, 485.0, 294.0, 161.0, 114.0, 79.0, 54.0, 35.0, 28.0, 20.0, 12.0, 11.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.7578125, -11.4158935546875, -11.073974609375, -10.7320556640625, -10.39013671875, -10.0482177734375, -9.706298828125, -9.3643798828125, -9.0224609375, -8.6805419921875, -8.338623046875, -7.9967041015625, -7.65478515625, -7.3128662109375, -6.970947265625, -6.6290283203125, -6.287109375, -5.9451904296875, -5.603271484375, -5.2613525390625, -4.91943359375, -4.5775146484375, -4.235595703125, -3.8936767578125, -3.5517578125, -3.2098388671875, -2.867919921875, -2.5260009765625, -2.18408203125, -1.8421630859375, -1.500244140625, -1.1583251953125, -0.81640625, -0.4744873046875, -0.132568359375, 0.2093505859375, 0.55126953125, 0.8931884765625, 1.235107421875, 1.5770263671875, 1.9189453125, 2.2608642578125, 2.602783203125, 2.9447021484375, 3.28662109375, 3.6285400390625, 3.970458984375, 4.3123779296875, 4.654296875, 4.9962158203125, 5.338134765625, 5.6800537109375, 6.02197265625, 6.3638916015625, 6.705810546875, 7.0477294921875, 7.3896484375, 7.7315673828125, 8.073486328125, 8.4154052734375, 8.75732421875, 9.0992431640625, 9.441162109375, 9.7830810546875, 10.125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 4.0, 4.0, 2.0, 6.0, 13.0, 15.0, 12.0, 20.0, 37.0, 64.0, 84.0, 161.0, 374.0, 1892.0, 739.0, 282.0, 132.0, 79.0, 45.0, 42.0, 20.0, 12.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.86529541015625, -4.7071533203125, -4.54901123046875, -4.390869140625, -4.23272705078125, -4.0745849609375, -3.91644287109375, -3.75830078125, -3.60015869140625, -3.4420166015625, -3.28387451171875, -3.125732421875, -2.96759033203125, -2.8094482421875, -2.65130615234375, -2.4931640625, -2.33502197265625, -2.1768798828125, -2.01873779296875, -1.860595703125, -1.70245361328125, -1.5443115234375, -1.38616943359375, -1.22802734375, -1.06988525390625, -0.9117431640625, -0.75360107421875, -0.595458984375, -0.43731689453125, -0.2791748046875, -0.12103271484375, 0.037109375, 0.19525146484375, 0.3533935546875, 0.51153564453125, 0.669677734375, 0.82781982421875, 0.9859619140625, 1.14410400390625, 1.30224609375, 1.46038818359375, 1.6185302734375, 1.77667236328125, 1.934814453125, 2.09295654296875, 2.2510986328125, 2.40924072265625, 2.5673828125, 2.72552490234375, 2.8836669921875, 3.04180908203125, 3.199951171875, 3.35809326171875, 3.5162353515625, 3.67437744140625, 3.83251953125, 3.99066162109375, 4.1488037109375, 4.30694580078125, 4.465087890625, 4.62322998046875, 4.7813720703125, 4.93951416015625, 5.09765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 8.0, 19.0, 32.0, 56.0, 93.0, 143.0, 171.0, 161.0, 121.0, 79.0, 45.0, 28.0, 10.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.189285278320312, -29.023456573486328, -27.85762596130371, -26.691795349121094, -25.52596664428711, -24.360137939453125, -23.194307327270508, -22.02847671508789, -20.862648010253906, -19.696819305419922, -18.530988693237305, -17.365158081054688, -16.199329376220703, -15.033499717712402, -13.867670059204102, -12.7018404006958, -11.5360107421875, -10.3701810836792, -9.204351425170898, -8.038521766662598, -6.872692108154297, -5.706862449645996, -4.541032791137695, -3.3752031326293945, -2.2093734741210938, -1.043543815612793, 0.12228584289550781, 1.2881155014038086, 2.4539451599121094, 3.61977481842041, 4.785604476928711, 5.951434135437012, 7.1172637939453125, 8.283093452453613, 9.448923110961914, 10.614752769470215, 11.780582427978516, 12.946412086486816, 14.112241744995117, 15.278071403503418, 16.44390106201172, 17.609729766845703, 18.77556037902832, 19.941390991210938, 21.107219696044922, 22.273048400878906, 23.438879013061523, 24.60470962524414, 25.770538330078125, 26.93636703491211, 28.102197647094727, 29.268028259277344, 30.433856964111328, 31.599685668945312, 32.76551818847656, 33.93134689331055, 35.09717559814453, 36.263004302978516, 37.4288330078125, 38.59466552734375, 39.760494232177734, 40.92632293701172, 42.09215545654297, 43.25798416137695, 44.42381286621094]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 3.0, 9.0, 9.0, 10.0, 12.0, 15.0, 17.0, 16.0, 21.0, 29.0, 23.0, 23.0, 38.0, 41.0, 42.0, 47.0, 38.0, 51.0, 49.0, 48.0, 41.0, 48.0, 38.0, 36.0, 44.0, 28.0, 37.0, 18.0, 27.0, 23.0, 17.0, 12.0, 21.0, 12.0, 11.0, 3.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.86805248260498, -15.43425464630127, -15.000456809997559, -14.566658973693848, -14.132862091064453, -13.699064254760742, -13.265266418457031, -12.83146858215332, -12.39767074584961, -11.963872909545898, -11.530075073242188, -11.096277236938477, -10.662479400634766, -10.228681564331055, -9.79488468170166, -9.36108684539795, -8.927289009094238, -8.493491172790527, -8.059693336486816, -7.625895977020264, -7.192098140716553, -6.758300304412842, -6.324502944946289, -5.890705108642578, -5.456907272338867, -5.023109436035156, -4.589311599731445, -4.155514240264893, -3.7217164039611816, -3.2879185676574707, -2.854120969772339, -2.420323371887207, -1.9865245819091797, -1.5527268648147583, -1.118929147720337, -0.6851314306259155, -0.25133371353149414, 0.1824641227722168, 0.6162617206573486, 1.0500593185424805, 1.4838571548461914, 1.9176548719406128, 2.351452589035034, 2.785250186920166, 3.219048023223877, 3.652845859527588, 4.086643218994141, 4.520441055297852, 4.9542388916015625, 5.388036727905273, 5.821834564208984, 6.255631923675537, 6.689429759979248, 7.123227596282959, 7.557024955749512, 7.990822792053223, 8.424620628356934, 8.858418464660645, 9.292216300964355, 9.726014137268066, 10.159811019897461, 10.593608856201172, 11.027406692504883, 11.461204528808594, 11.895002365112305]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 8.0, 13.0, 14.0, 25.0, 39.0, 87.0, 200.0, 411.0, 1093.0, 3343.0, 12296.0, 54078.0, 231076.0, 522627.0, 170588.0, 39300.0, 9207.0, 2650.0, 840.0, 321.0, 159.0, 81.0, 40.0, 24.0, 14.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.189208984375, -17.67529296875, -17.161376953125, -16.6474609375, -16.133544921875, -15.61962890625, -15.105712890625, -14.591796875, -14.077880859375, -13.56396484375, -13.050048828125, -12.5361328125, -12.022216796875, -11.50830078125, -10.994384765625, -10.48046875, -9.966552734375, -9.45263671875, -8.938720703125, -8.4248046875, -7.910888671875, -7.39697265625, -6.883056640625, -6.369140625, -5.855224609375, -5.34130859375, -4.827392578125, -4.3134765625, -3.799560546875, -3.28564453125, -2.771728515625, -2.2578125, -1.743896484375, -1.22998046875, -0.716064453125, -0.2021484375, 0.311767578125, 0.82568359375, 1.339599609375, 1.853515625, 2.367431640625, 2.88134765625, 3.395263671875, 3.9091796875, 4.423095703125, 4.93701171875, 5.450927734375, 5.96484375, 6.478759765625, 6.99267578125, 7.506591796875, 8.0205078125, 8.534423828125, 9.04833984375, 9.562255859375, 10.076171875, 10.590087890625, 11.10400390625, 11.617919921875, 12.1318359375, 12.645751953125, 13.15966796875, 13.673583984375, 14.1875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 21.0, 23.0, 25.0, 38.0, 34.0, 37.0, 46.0, 50.0, 58.0, 67.0, 66.0, 66.0, 57.0, 66.0, 54.0, 43.0, 50.0, 27.0, 36.0, 22.0, 20.0, 16.0, 15.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.56463623046875, -6.3597412109375, -6.15484619140625, -5.949951171875, -5.74505615234375, -5.5401611328125, -5.33526611328125, -5.13037109375, -4.92547607421875, -4.7205810546875, -4.51568603515625, -4.310791015625, -4.10589599609375, -3.9010009765625, -3.69610595703125, -3.4912109375, -3.28631591796875, -3.0814208984375, -2.87652587890625, -2.671630859375, -2.46673583984375, -2.2618408203125, -2.05694580078125, -1.85205078125, -1.64715576171875, -1.4422607421875, -1.23736572265625, -1.032470703125, -0.82757568359375, -0.6226806640625, -0.41778564453125, -0.212890625, -0.00799560546875, 0.1968994140625, 0.40179443359375, 0.606689453125, 0.81158447265625, 1.0164794921875, 1.22137451171875, 1.42626953125, 1.63116455078125, 1.8360595703125, 2.04095458984375, 2.245849609375, 2.45074462890625, 2.6556396484375, 2.86053466796875, 3.0654296875, 3.27032470703125, 3.4752197265625, 3.68011474609375, 3.885009765625, 4.08990478515625, 4.2947998046875, 4.49969482421875, 4.70458984375, 4.90948486328125, 5.1143798828125, 5.31927490234375, 5.524169921875, 5.72906494140625, 5.9339599609375, 6.13885498046875, 6.34375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 7.0, 8.0, 9.0, 12.0, 14.0, 24.0, 33.0, 34.0, 47.0, 75.0, 99.0, 180.0, 338.0, 586.0, 1309.0, 3581.0, 17951.0, 396338.0, 596699.0, 23920.0, 4152.0, 1483.0, 676.0, 380.0, 205.0, 115.0, 76.0, 51.0, 47.0, 20.0, 20.0, 19.0, 13.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.517822265625, -33.50439453125, -32.490966796875, -31.4775390625, -30.464111328125, -29.45068359375, -28.437255859375, -27.423828125, -26.410400390625, -25.39697265625, -24.383544921875, -23.3701171875, -22.356689453125, -21.34326171875, -20.329833984375, -19.31640625, -18.302978515625, -17.28955078125, -16.276123046875, -15.2626953125, -14.249267578125, -13.23583984375, -12.222412109375, -11.208984375, -10.195556640625, -9.18212890625, -8.168701171875, -7.1552734375, -6.141845703125, -5.12841796875, -4.114990234375, -3.1015625, -2.088134765625, -1.07470703125, -0.061279296875, 0.9521484375, 1.965576171875, 2.97900390625, 3.992431640625, 5.005859375, 6.019287109375, 7.03271484375, 8.046142578125, 9.0595703125, 10.072998046875, 11.08642578125, 12.099853515625, 13.11328125, 14.126708984375, 15.14013671875, 16.153564453125, 17.1669921875, 18.180419921875, 19.19384765625, 20.207275390625, 21.220703125, 22.234130859375, 23.24755859375, 24.260986328125, 25.2744140625, 26.287841796875, 27.30126953125, 28.314697265625, 29.328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 8.0, 8.0, 19.0, 34.0, 49.0, 65.0, 74.0, 97.0, 103.0, 93.0, 96.0, 88.0, 69.0, 57.0, 37.0, 26.0, 26.0, 10.0, 5.0, 9.0, 3.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.80322265625, -32.3564453125, -30.90966796875, -29.462890625, -28.01611328125, -26.5693359375, -25.12255859375, -23.67578125, -22.22900390625, -20.7822265625, -19.33544921875, -17.888671875, -16.44189453125, -14.9951171875, -13.54833984375, -12.1015625, -10.65478515625, -9.2080078125, -7.76123046875, -6.314453125, -4.86767578125, -3.4208984375, -1.97412109375, -0.52734375, 0.91943359375, 2.3662109375, 3.81298828125, 5.259765625, 6.70654296875, 8.1533203125, 9.60009765625, 11.046875, 12.49365234375, 13.9404296875, 15.38720703125, 16.833984375, 18.28076171875, 19.7275390625, 21.17431640625, 22.62109375, 24.06787109375, 25.5146484375, 26.96142578125, 28.408203125, 29.85498046875, 31.3017578125, 32.74853515625, 34.1953125, 35.64208984375, 37.0888671875, 38.53564453125, 39.982421875, 41.42919921875, 42.8759765625, 44.32275390625, 45.76953125, 47.21630859375, 48.6630859375, 50.10986328125, 51.556640625, 53.00341796875, 54.4501953125, 55.89697265625, 57.34375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 7.0, 11.0, 8.0, 14.0, 19.0, 32.0, 42.0, 48.0, 71.0, 95.0, 161.0, 285.0, 479.0, 846.0, 2268.0, 6788.0, 30944.0, 187334.0, 668714.0, 120530.0, 21137.0, 5104.0, 1734.0, 778.0, 394.0, 234.0, 112.0, 101.0, 54.0, 46.0, 37.0, 32.0, 20.0, 18.0, 19.0, 8.0, 5.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0625, -7.8280029296875, -7.593505859375, -7.3590087890625, -7.12451171875, -6.8900146484375, -6.655517578125, -6.4210205078125, -6.1865234375, -5.9520263671875, -5.717529296875, -5.4830322265625, -5.24853515625, -5.0140380859375, -4.779541015625, -4.5450439453125, -4.310546875, -4.0760498046875, -3.841552734375, -3.6070556640625, -3.37255859375, -3.1380615234375, -2.903564453125, -2.6690673828125, -2.4345703125, -2.2000732421875, -1.965576171875, -1.7310791015625, -1.49658203125, -1.2620849609375, -1.027587890625, -0.7930908203125, -0.55859375, -0.3240966796875, -0.089599609375, 0.1448974609375, 0.37939453125, 0.6138916015625, 0.848388671875, 1.0828857421875, 1.3173828125, 1.5518798828125, 1.786376953125, 2.0208740234375, 2.25537109375, 2.4898681640625, 2.724365234375, 2.9588623046875, 3.193359375, 3.4278564453125, 3.662353515625, 3.8968505859375, 4.13134765625, 4.3658447265625, 4.600341796875, 4.8348388671875, 5.0693359375, 5.3038330078125, 5.538330078125, 5.7728271484375, 6.00732421875, 6.2418212890625, 6.476318359375, 6.7108154296875, 6.9453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 6.0, 12.0, 7.0, 13.0, 7.0, 12.0, 19.0, 19.0, 15.0, 20.0, 26.0, 28.0, 35.0, 33.0, 31.0, 79.0, 111.0, 99.0, 81.0, 42.0, 37.0, 36.0, 39.0, 25.0, 21.0, 32.0, 17.0, 22.0, 11.0, 7.0, 12.0, 7.0, 0.0, 4.0, 5.0, 2.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0015230178833007812, -0.0014805346727371216, -0.001438051462173462, -0.0013955682516098022, -0.0013530850410461426, -0.001310601830482483, -0.0012681186199188232, -0.0012256354093551636, -0.001183152198791504, -0.0011406689882278442, -0.0010981857776641846, -0.001055702567100525, -0.0010132193565368652, -0.0009707361459732056, -0.0009282529354095459, -0.0008857697248458862, -0.0008432865142822266, -0.0008008033037185669, -0.0007583200931549072, -0.0007158368825912476, -0.0006733536720275879, -0.0006308704614639282, -0.0005883872509002686, -0.0005459040403366089, -0.0005034208297729492, -0.00046093761920928955, -0.0004184544086456299, -0.0003759711980819702, -0.00033348798751831055, -0.0002910047769546509, -0.0002485215663909912, -0.00020603835582733154, -0.00016355514526367188, -0.00012107193470001221, -7.858872413635254e-05, -3.610551357269287e-05, 6.377696990966797e-06, 4.8860907554626465e-05, 9.134411811828613e-05, 0.0001338273286819458, 0.00017631053924560547, 0.00021879374980926514, 0.0002612769603729248, 0.00030376017093658447, 0.00034624338150024414, 0.0003887265920639038, 0.0004312098026275635, 0.00047369301319122314, 0.0005161762237548828, 0.0005586594343185425, 0.0006011426448822021, 0.0006436258554458618, 0.0006861090660095215, 0.0007285922765731812, 0.0007710754871368408, 0.0008135586977005005, 0.0008560419082641602, 0.0008985251188278198, 0.0009410083293914795, 0.0009834915399551392, 0.0010259747505187988, 0.0010684579610824585, 0.0011109411716461182, 0.0011534243822097778, 0.0011959075927734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 24.0, 13.0, 26.0, 30.0, 44.0, 59.0, 116.0, 207.0, 359.0, 927.0, 2320.0, 8684.0, 65442.0, 807223.0, 143922.0, 13627.0, 3285.0, 1196.0, 465.0, 219.0, 129.0, 79.0, 41.0, 32.0, 26.0, 13.0, 11.0, 7.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.382080078125, -11.99072265625, -11.599365234375, -11.2080078125, -10.816650390625, -10.42529296875, -10.033935546875, -9.642578125, -9.251220703125, -8.85986328125, -8.468505859375, -8.0771484375, -7.685791015625, -7.29443359375, -6.903076171875, -6.51171875, -6.120361328125, -5.72900390625, -5.337646484375, -4.9462890625, -4.554931640625, -4.16357421875, -3.772216796875, -3.380859375, -2.989501953125, -2.59814453125, -2.206787109375, -1.8154296875, -1.424072265625, -1.03271484375, -0.641357421875, -0.25, 0.141357421875, 0.53271484375, 0.924072265625, 1.3154296875, 1.706787109375, 2.09814453125, 2.489501953125, 2.880859375, 3.272216796875, 3.66357421875, 4.054931640625, 4.4462890625, 4.837646484375, 5.22900390625, 5.620361328125, 6.01171875, 6.403076171875, 6.79443359375, 7.185791015625, 7.5771484375, 7.968505859375, 8.35986328125, 8.751220703125, 9.142578125, 9.533935546875, 9.92529296875, 10.316650390625, 10.7080078125, 11.099365234375, 11.49072265625, 11.882080078125, 12.2734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 14.0, 13.0, 12.0, 32.0, 47.0, 36.0, 62.0, 76.0, 96.0, 116.0, 106.0, 89.0, 68.0, 39.0, 40.0, 32.0, 17.0, 21.0, 12.0, 16.0, 9.0, 4.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.5078125, -9.24285888671875, -8.9779052734375, -8.71295166015625, -8.447998046875, -8.18304443359375, -7.9180908203125, -7.65313720703125, -7.38818359375, -7.12322998046875, -6.8582763671875, -6.59332275390625, -6.328369140625, -6.06341552734375, -5.7984619140625, -5.53350830078125, -5.2685546875, -5.00360107421875, -4.7386474609375, -4.47369384765625, -4.208740234375, -3.94378662109375, -3.6788330078125, -3.41387939453125, -3.14892578125, -2.88397216796875, -2.6190185546875, -2.35406494140625, -2.089111328125, -1.82415771484375, -1.5592041015625, -1.29425048828125, -1.029296875, -0.76434326171875, -0.4993896484375, -0.23443603515625, 0.030517578125, 0.29547119140625, 0.5604248046875, 0.82537841796875, 1.09033203125, 1.35528564453125, 1.6202392578125, 1.88519287109375, 2.150146484375, 2.41510009765625, 2.6800537109375, 2.94500732421875, 3.2099609375, 3.47491455078125, 3.7398681640625, 4.00482177734375, 4.269775390625, 4.53472900390625, 4.7996826171875, 5.06463623046875, 5.32958984375, 5.59454345703125, 5.8594970703125, 6.12445068359375, 6.389404296875, 6.65435791015625, 6.9193115234375, 7.18426513671875, 7.44921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 9.0, 16.0, 84.0, 273.0, 357.0, 201.0, 45.0, 11.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.8257751464844, -358.3690185546875, -346.9122314453125, -335.4554748535156, -323.99871826171875, -312.54193115234375, -301.0851745605469, -289.62841796875, -278.171630859375, -266.7148742675781, -255.2581024169922, -243.80133056640625, -232.34457397460938, -220.88780212402344, -209.4310302734375, -197.97427368164062, -186.51751708984375, -175.0607452392578, -163.60398864746094, -152.147216796875, -140.69046020507812, -129.2336883544922, -117.77691650390625, -106.32015228271484, -94.86338806152344, -83.40662384033203, -71.94985961914062, -60.49308776855469, -49.03632354736328, -37.579559326171875, -26.122787475585938, -14.666023254394531, -3.209228515625, 8.247537612915039, 19.704303741455078, 31.16107177734375, 42.617835998535156, 54.07460021972656, 65.5313720703125, 76.9881362915039, 88.44490051269531, 99.90166473388672, 111.35842895507812, 122.81520080566406, 134.27197265625, 145.72872924804688, 157.1855010986328, 168.64227294921875, 180.09902954101562, 191.55580139160156, 203.01255798339844, 214.46932983398438, 225.92608642578125, 237.3828582763672, 248.83963012695312, 260.29638671875, 271.753173828125, 283.2099304199219, 294.6667175292969, 306.12347412109375, 317.5802307128906, 329.0369873046875, 340.4937744140625, 351.9505310058594, 363.40728759765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 9.0, 10.0, 16.0, 18.0, 21.0, 23.0, 25.0, 32.0, 31.0, 32.0, 32.0, 46.0, 44.0, 61.0, 50.0, 45.0, 57.0, 50.0, 52.0, 40.0, 41.0, 31.0, 31.0, 35.0, 23.0, 18.0, 14.0, 18.0, 11.0, 12.0, 8.0, 15.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.42587280273438, -112.06140899658203, -108.69695281982422, -105.33248901367188, -101.96803283691406, -98.60356903076172, -95.23910522460938, -91.87464904785156, -88.51019287109375, -85.1457290649414, -81.7812728881836, -78.41680908203125, -75.05235290527344, -71.6878890991211, -68.32342529296875, -64.95896911621094, -61.594505310058594, -58.230045318603516, -54.86558532714844, -51.501121520996094, -48.13666534423828, -44.77220153808594, -41.40774154663086, -38.04328155517578, -34.6788215637207, -31.314361572265625, -27.949901580810547, -24.585439682006836, -21.220979690551758, -17.85651969909668, -14.492057800292969, -11.12759780883789, -7.7631378173828125, -4.398677349090576, -1.0342168807983398, 2.3302440643310547, 5.694704055786133, 9.059164047241211, 12.423625946044922, 15.7880859375, 19.152545928955078, 22.517005920410156, 25.881465911865234, 29.245927810668945, 32.610389709472656, 35.97484588623047, 39.33930969238281, 42.70376968383789, 46.06822967529297, 49.43268966674805, 52.797149658203125, 56.16161346435547, 59.52606964111328, 62.890533447265625, 66.25498962402344, 69.61945343017578, 72.98391723632812, 76.34838104248047, 79.71283721923828, 83.07730102539062, 86.44175720214844, 89.80622100830078, 93.17068481445312, 96.53514099121094, 99.89959716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 11.0, 17.0, 30.0, 49.0, 74.0, 153.0, 315.0, 795.0, 2179.0, 8142.0, 39648.0, 412697.0, 3287175.0, 392949.0, 38223.0, 8068.0, 2293.0, 788.0, 327.0, 149.0, 72.0, 48.0, 30.0, 14.0, 12.0, 10.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.6375732421875, -9.259521484375, -8.8814697265625, -8.50341796875, -8.1253662109375, -7.747314453125, -7.3692626953125, -6.9912109375, -6.6131591796875, -6.235107421875, -5.8570556640625, -5.47900390625, -5.1009521484375, -4.722900390625, -4.3448486328125, -3.966796875, -3.5887451171875, -3.210693359375, -2.8326416015625, -2.45458984375, -2.0765380859375, -1.698486328125, -1.3204345703125, -0.9423828125, -0.5643310546875, -0.186279296875, 0.1917724609375, 0.56982421875, 0.9478759765625, 1.325927734375, 1.7039794921875, 2.08203125, 2.4600830078125, 2.838134765625, 3.2161865234375, 3.59423828125, 3.9722900390625, 4.350341796875, 4.7283935546875, 5.1064453125, 5.4844970703125, 5.862548828125, 6.2406005859375, 6.61865234375, 6.9967041015625, 7.374755859375, 7.7528076171875, 8.130859375, 8.5089111328125, 8.886962890625, 9.2650146484375, 9.64306640625, 10.0211181640625, 10.399169921875, 10.7772216796875, 11.1552734375, 11.5333251953125, 11.911376953125, 12.2894287109375, 12.66748046875, 13.0455322265625, 13.423583984375, 13.8016357421875, 14.1796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 17.0, 23.0, 21.0, 18.0, 47.0, 50.0, 50.0, 52.0, 71.0, 85.0, 64.0, 66.0, 71.0, 76.0, 57.0, 47.0, 39.0, 39.0, 22.0, 22.0, 10.0, 15.0, 3.0, 7.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.84063720703125, -6.6187744140625, -6.39691162109375, -6.175048828125, -5.95318603515625, -5.7313232421875, -5.50946044921875, -5.28759765625, -5.06573486328125, -4.8438720703125, -4.62200927734375, -4.400146484375, -4.17828369140625, -3.9564208984375, -3.73455810546875, -3.5126953125, -3.29083251953125, -3.0689697265625, -2.84710693359375, -2.625244140625, -2.40338134765625, -2.1815185546875, -1.95965576171875, -1.73779296875, -1.51593017578125, -1.2940673828125, -1.07220458984375, -0.850341796875, -0.62847900390625, -0.4066162109375, -0.18475341796875, 0.037109375, 0.25897216796875, 0.4808349609375, 0.70269775390625, 0.924560546875, 1.14642333984375, 1.3682861328125, 1.59014892578125, 1.81201171875, 2.03387451171875, 2.2557373046875, 2.47760009765625, 2.699462890625, 2.92132568359375, 3.1431884765625, 3.36505126953125, 3.5869140625, 3.80877685546875, 4.0306396484375, 4.25250244140625, 4.474365234375, 4.69622802734375, 4.9180908203125, 5.13995361328125, 5.36181640625, 5.58367919921875, 5.8055419921875, 6.02740478515625, 6.249267578125, 6.47113037109375, 6.6929931640625, 6.91485595703125, 7.13671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 13.0, 22.0, 22.0, 30.0, 42.0, 62.0, 153.0, 304.0, 700.0, 1927.0, 6335.0, 27122.0, 196030.0, 2952091.0, 919750.0, 70347.0, 13513.0, 3649.0, 1201.0, 454.0, 219.0, 97.0, 51.0, 33.0, 21.0, 21.0, 12.0, 10.0, 6.0, 4.0, 5.0, 7.0, 0.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.4453125, -13.047119140625, -12.64892578125, -12.250732421875, -11.8525390625, -11.454345703125, -11.05615234375, -10.657958984375, -10.259765625, -9.861572265625, -9.46337890625, -9.065185546875, -8.6669921875, -8.268798828125, -7.87060546875, -7.472412109375, -7.07421875, -6.676025390625, -6.27783203125, -5.879638671875, -5.4814453125, -5.083251953125, -4.68505859375, -4.286865234375, -3.888671875, -3.490478515625, -3.09228515625, -2.694091796875, -2.2958984375, -1.897705078125, -1.49951171875, -1.101318359375, -0.703125, -0.304931640625, 0.09326171875, 0.491455078125, 0.8896484375, 1.287841796875, 1.68603515625, 2.084228515625, 2.482421875, 2.880615234375, 3.27880859375, 3.677001953125, 4.0751953125, 4.473388671875, 4.87158203125, 5.269775390625, 5.66796875, 6.066162109375, 6.46435546875, 6.862548828125, 7.2607421875, 7.658935546875, 8.05712890625, 8.455322265625, 8.853515625, 9.251708984375, 9.64990234375, 10.048095703125, 10.4462890625, 10.844482421875, 11.24267578125, 11.640869140625, 12.0390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 3.0, 9.0, 18.0, 30.0, 31.0, 55.0, 65.0, 107.0, 158.0, 243.0, 398.0, 625.0, 713.0, 552.0, 359.0, 261.0, 142.0, 100.0, 62.0, 35.0, 34.0, 15.0, 10.0, 8.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3671875, -13.0093994140625, -12.651611328125, -12.2938232421875, -11.93603515625, -11.5782470703125, -11.220458984375, -10.8626708984375, -10.5048828125, -10.1470947265625, -9.789306640625, -9.4315185546875, -9.07373046875, -8.7159423828125, -8.358154296875, -8.0003662109375, -7.642578125, -7.2847900390625, -6.927001953125, -6.5692138671875, -6.21142578125, -5.8536376953125, -5.495849609375, -5.1380615234375, -4.7802734375, -4.4224853515625, -4.064697265625, -3.7069091796875, -3.34912109375, -2.9913330078125, -2.633544921875, -2.2757568359375, -1.91796875, -1.5601806640625, -1.202392578125, -0.8446044921875, -0.48681640625, -0.1290283203125, 0.228759765625, 0.5865478515625, 0.9443359375, 1.3021240234375, 1.659912109375, 2.0177001953125, 2.37548828125, 2.7332763671875, 3.091064453125, 3.4488525390625, 3.806640625, 4.1644287109375, 4.522216796875, 4.8800048828125, 5.23779296875, 5.5955810546875, 5.953369140625, 6.3111572265625, 6.6689453125, 7.0267333984375, 7.384521484375, 7.7423095703125, 8.10009765625, 8.4578857421875, 8.815673828125, 9.1734619140625, 9.53125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 13.0, 26.0, 44.0, 61.0, 108.0, 156.0, 155.0, 146.0, 103.0, 76.0, 45.0, 23.0, 10.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.26039123535156, -76.82545471191406, -73.39051055908203, -69.95556640625, -66.5206298828125, -63.085689544677734, -59.65074920654297, -56.2158088684082, -52.78086853027344, -49.34592819213867, -45.910987854003906, -42.47604751586914, -39.041107177734375, -35.60616683959961, -32.171226501464844, -28.736286163330078, -25.301345825195312, -21.866405487060547, -18.43146514892578, -14.996524810791016, -11.56158447265625, -8.126644134521484, -4.691703796386719, -1.2567634582519531, 2.1781768798828125, 5.613117218017578, 9.048057556152344, 12.48299789428711, 15.917938232421875, 19.35287857055664, 22.787818908691406, 26.222759246826172, 29.657699584960938, 33.0926399230957, 36.52758026123047, 39.962520599365234, 43.3974609375, 46.832401275634766, 50.26734161376953, 53.7022819519043, 57.13722229003906, 60.57216262817383, 64.0071029663086, 67.44204711914062, 70.87698364257812, 74.31192016601562, 77.74686431884766, 81.18180847167969, 84.61674499511719, 88.05168151855469, 91.48662567138672, 94.92156982421875, 98.35650634765625, 101.79144287109375, 105.22638702392578, 108.66133117675781, 112.09626770019531, 115.53120422363281, 118.96614837646484, 122.40109252929688, 125.83602905273438, 129.27096557617188, 132.70590209960938, 136.14085388183594, 139.57579040527344]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 3.0, 10.0, 6.0, 12.0, 7.0, 13.0, 19.0, 16.0, 19.0, 18.0, 32.0, 28.0, 28.0, 37.0, 37.0, 46.0, 42.0, 36.0, 44.0, 48.0, 49.0, 45.0, 36.0, 46.0, 50.0, 40.0, 31.0, 37.0, 35.0, 28.0, 25.0, 12.0, 13.0, 9.0, 11.0, 10.0, 8.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-49.0355224609375, -47.66252899169922, -46.28953552246094, -44.91653823852539, -43.54354476928711, -42.17055130004883, -40.79755401611328, -39.424560546875, -38.05156707763672, -36.67857360839844, -35.305580139160156, -33.93258285522461, -32.55958938598633, -31.186595916748047, -29.813600540161133, -28.44060516357422, -27.067611694335938, -25.694618225097656, -24.321622848510742, -22.948627471923828, -21.575634002685547, -20.202640533447266, -18.82964515686035, -17.456649780273438, -16.083656311035156, -14.710661888122559, -13.337667465209961, -11.964673042297363, -10.591678619384766, -9.218684196472168, -7.84568977355957, -6.472695350646973, -5.099700927734375, -3.7267065048217773, -2.3537120819091797, -0.980717658996582, 0.3922767639160156, 1.7652711868286133, 3.138265609741211, 4.511260032653809, 5.884254455566406, 7.257248878479004, 8.630243301391602, 10.0032377243042, 11.376232147216797, 12.749226570129395, 14.122220993041992, 15.49521541595459, 16.868209838867188, 18.24120330810547, 19.614198684692383, 20.987194061279297, 22.360187530517578, 23.73318099975586, 25.106176376342773, 26.479171752929688, 27.85216522216797, 29.22515869140625, 30.598154067993164, 31.971149444580078, 33.34414291381836, 34.71713638305664, 36.09013366699219, 37.46312713623047, 38.83612060546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 13.0, 8.0, 19.0, 31.0, 60.0, 75.0, 160.0, 301.0, 560.0, 1225.0, 2622.0, 6502.0, 18666.0, 60053.0, 228104.0, 506938.0, 156426.0, 43684.0, 13867.0, 4999.0, 2106.0, 1039.0, 489.0, 246.0, 144.0, 80.0, 40.0, 33.0, 15.0, 10.0, 5.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.37548828125, -11.9541015625, -11.53271484375, -11.111328125, -10.68994140625, -10.2685546875, -9.84716796875, -9.42578125, -9.00439453125, -8.5830078125, -8.16162109375, -7.740234375, -7.31884765625, -6.8974609375, -6.47607421875, -6.0546875, -5.63330078125, -5.2119140625, -4.79052734375, -4.369140625, -3.94775390625, -3.5263671875, -3.10498046875, -2.68359375, -2.26220703125, -1.8408203125, -1.41943359375, -0.998046875, -0.57666015625, -0.1552734375, 0.26611328125, 0.6875, 1.10888671875, 1.5302734375, 1.95166015625, 2.373046875, 2.79443359375, 3.2158203125, 3.63720703125, 4.05859375, 4.47998046875, 4.9013671875, 5.32275390625, 5.744140625, 6.16552734375, 6.5869140625, 7.00830078125, 7.4296875, 7.85107421875, 8.2724609375, 8.69384765625, 9.115234375, 9.53662109375, 9.9580078125, 10.37939453125, 10.80078125, 11.22216796875, 11.6435546875, 12.06494140625, 12.486328125, 12.90771484375, 13.3291015625, 13.75048828125, 14.171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 8.0, 10.0, 16.0, 14.0, 29.0, 42.0, 48.0, 65.0, 58.0, 69.0, 49.0, 77.0, 92.0, 74.0, 77.0, 49.0, 54.0, 38.0, 31.0, 33.0, 18.0, 17.0, 10.0, 11.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.128173828125, -7.88916015625, -7.650146484375, -7.4111328125, -7.172119140625, -6.93310546875, -6.694091796875, -6.455078125, -6.216064453125, -5.97705078125, -5.738037109375, -5.4990234375, -5.260009765625, -5.02099609375, -4.781982421875, -4.54296875, -4.303955078125, -4.06494140625, -3.825927734375, -3.5869140625, -3.347900390625, -3.10888671875, -2.869873046875, -2.630859375, -2.391845703125, -2.15283203125, -1.913818359375, -1.6748046875, -1.435791015625, -1.19677734375, -0.957763671875, -0.71875, -0.479736328125, -0.24072265625, -0.001708984375, 0.2373046875, 0.476318359375, 0.71533203125, 0.954345703125, 1.193359375, 1.432373046875, 1.67138671875, 1.910400390625, 2.1494140625, 2.388427734375, 2.62744140625, 2.866455078125, 3.10546875, 3.344482421875, 3.58349609375, 3.822509765625, 4.0615234375, 4.300537109375, 4.53955078125, 4.778564453125, 5.017578125, 5.256591796875, 5.49560546875, 5.734619140625, 5.9736328125, 6.212646484375, 6.45166015625, 6.690673828125, 6.9296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 8.0, 14.0, 27.0, 34.0, 62.0, 60.0, 118.0, 178.0, 340.0, 611.0, 1400.0, 4338.0, 28146.0, 807777.0, 189169.0, 11393.0, 2703.0, 1020.0, 459.0, 248.0, 129.0, 91.0, 62.0, 39.0, 36.0, 21.0, 16.0, 8.0, 2.0, 9.0, 2.0, 1.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28125, -33.130859375, -31.98046875, -30.830078125, -29.6796875, -28.529296875, -27.37890625, -26.228515625, -25.078125, -23.927734375, -22.77734375, -21.626953125, -20.4765625, -19.326171875, -18.17578125, -17.025390625, -15.875, -14.724609375, -13.57421875, -12.423828125, -11.2734375, -10.123046875, -8.97265625, -7.822265625, -6.671875, -5.521484375, -4.37109375, -3.220703125, -2.0703125, -0.919921875, 0.23046875, 1.380859375, 2.53125, 3.681640625, 4.83203125, 5.982421875, 7.1328125, 8.283203125, 9.43359375, 10.583984375, 11.734375, 12.884765625, 14.03515625, 15.185546875, 16.3359375, 17.486328125, 18.63671875, 19.787109375, 20.9375, 22.087890625, 23.23828125, 24.388671875, 25.5390625, 26.689453125, 27.83984375, 28.990234375, 30.140625, 31.291015625, 32.44140625, 33.591796875, 34.7421875, 35.892578125, 37.04296875, 38.193359375, 39.34375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 13.0, 11.0, 15.0, 24.0, 27.0, 39.0, 48.0, 42.0, 74.0, 90.0, 91.0, 91.0, 77.0, 85.0, 67.0, 56.0, 35.0, 32.0, 19.0, 10.0, 6.0, 4.0, 6.0, 2.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.46875, -33.2509765625, -32.033203125, -30.8154296875, -29.59765625, -28.3798828125, -27.162109375, -25.9443359375, -24.7265625, -23.5087890625, -22.291015625, -21.0732421875, -19.85546875, -18.6376953125, -17.419921875, -16.2021484375, -14.984375, -13.7666015625, -12.548828125, -11.3310546875, -10.11328125, -8.8955078125, -7.677734375, -6.4599609375, -5.2421875, -4.0244140625, -2.806640625, -1.5888671875, -0.37109375, 0.8466796875, 2.064453125, 3.2822265625, 4.5, 5.7177734375, 6.935546875, 8.1533203125, 9.37109375, 10.5888671875, 11.806640625, 13.0244140625, 14.2421875, 15.4599609375, 16.677734375, 17.8955078125, 19.11328125, 20.3310546875, 21.548828125, 22.7666015625, 23.984375, 25.2021484375, 26.419921875, 27.6376953125, 28.85546875, 30.0732421875, 31.291015625, 32.5087890625, 33.7265625, 34.9443359375, 36.162109375, 37.3798828125, 38.59765625, 39.8154296875, 41.033203125, 42.2509765625, 43.46875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 12.0, 16.0, 15.0, 10.0, 24.0, 34.0, 45.0, 99.0, 145.0, 243.0, 603.0, 1717.0, 9626.0, 172810.0, 835672.0, 22869.0, 2968.0, 804.0, 355.0, 173.0, 87.0, 62.0, 43.0, 28.0, 15.0, 26.0, 7.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.2978515625, -16.705078125, -16.1123046875, -15.51953125, -14.9267578125, -14.333984375, -13.7412109375, -13.1484375, -12.5556640625, -11.962890625, -11.3701171875, -10.77734375, -10.1845703125, -9.591796875, -8.9990234375, -8.40625, -7.8134765625, -7.220703125, -6.6279296875, -6.03515625, -5.4423828125, -4.849609375, -4.2568359375, -3.6640625, -3.0712890625, -2.478515625, -1.8857421875, -1.29296875, -0.7001953125, -0.107421875, 0.4853515625, 1.078125, 1.6708984375, 2.263671875, 2.8564453125, 3.44921875, 4.0419921875, 4.634765625, 5.2275390625, 5.8203125, 6.4130859375, 7.005859375, 7.5986328125, 8.19140625, 8.7841796875, 9.376953125, 9.9697265625, 10.5625, 11.1552734375, 11.748046875, 12.3408203125, 12.93359375, 13.5263671875, 14.119140625, 14.7119140625, 15.3046875, 15.8974609375, 16.490234375, 17.0830078125, 17.67578125, 18.2685546875, 18.861328125, 19.4541015625, 20.046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 13.0, 15.0, 13.0, 23.0, 43.0, 51.0, 76.0, 174.0, 213.0, 124.0, 58.0, 37.0, 25.0, 22.0, 20.0, 18.0, 14.0, 5.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031757354736328125, -0.0030856430530548096, -0.0029955506324768066, -0.0029054582118988037, -0.0028153657913208008, -0.002725273370742798, -0.002635180950164795, -0.002545088529586792, -0.002454996109008789, -0.002364903688430786, -0.002274811267852783, -0.0021847188472747803, -0.0020946264266967773, -0.0020045340061187744, -0.0019144415855407715, -0.0018243491649627686, -0.0017342567443847656, -0.0016441643238067627, -0.0015540719032287598, -0.0014639794826507568, -0.001373887062072754, -0.001283794641494751, -0.001193702220916748, -0.0011036098003387451, -0.0010135173797607422, -0.0009234249591827393, -0.0008333325386047363, -0.0007432401180267334, -0.0006531476974487305, -0.0005630552768707275, -0.0004729628562927246, -0.0003828704357147217, -0.00029277801513671875, -0.00020268559455871582, -0.00011259317398071289, -2.250075340270996e-05, 6.759166717529297e-05, 0.0001576840877532959, 0.00024777650833129883, 0.00033786892890930176, 0.0004279613494873047, 0.0005180537700653076, 0.0006081461906433105, 0.0006982386112213135, 0.0007883310317993164, 0.0008784234523773193, 0.0009685158729553223, 0.0010586082935333252, 0.0011487007141113281, 0.001238793134689331, 0.001328885555267334, 0.001418977975845337, 0.0015090703964233398, 0.0015991628170013428, 0.0016892552375793457, 0.0017793476581573486, 0.0018694400787353516, 0.0019595324993133545, 0.0020496249198913574, 0.0021397173404693604, 0.0022298097610473633, 0.002319902181625366, 0.002409994602203369, 0.002500087022781372, 0.002590179443359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 13.0, 16.0, 20.0, 46.0, 45.0, 61.0, 108.0, 142.0, 274.0, 451.0, 1002.0, 2324.0, 7116.0, 30545.0, 697677.0, 277595.0, 21705.0, 5494.0, 1917.0, 922.0, 399.0, 205.0, 153.0, 99.0, 65.0, 45.0, 29.0, 22.0, 15.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.1953125, -16.65625, -16.1171875, -15.578125, -15.0390625, -14.5, -13.9609375, -13.421875, -12.8828125, -12.34375, -11.8046875, -11.265625, -10.7265625, -10.1875, -9.6484375, -9.109375, -8.5703125, -8.03125, -7.4921875, -6.953125, -6.4140625, -5.875, -5.3359375, -4.796875, -4.2578125, -3.71875, -3.1796875, -2.640625, -2.1015625, -1.5625, -1.0234375, -0.484375, 0.0546875, 0.59375, 1.1328125, 1.671875, 2.2109375, 2.75, 3.2890625, 3.828125, 4.3671875, 4.90625, 5.4453125, 5.984375, 6.5234375, 7.0625, 7.6015625, 8.140625, 8.6796875, 9.21875, 9.7578125, 10.296875, 10.8359375, 11.375, 11.9140625, 12.453125, 12.9921875, 13.53125, 14.0703125, 14.609375, 15.1484375, 15.6875, 16.2265625, 16.765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 7.0, 19.0, 16.0, 32.0, 59.0, 100.0, 160.0, 221.0, 146.0, 80.0, 38.0, 25.0, 16.0, 16.0, 9.0, 10.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.7159423828125, -17.197509765625, -16.6790771484375, -16.16064453125, -15.6422119140625, -15.123779296875, -14.6053466796875, -14.0869140625, -13.5684814453125, -13.050048828125, -12.5316162109375, -12.01318359375, -11.4947509765625, -10.976318359375, -10.4578857421875, -9.939453125, -9.4210205078125, -8.902587890625, -8.3841552734375, -7.86572265625, -7.3472900390625, -6.828857421875, -6.3104248046875, -5.7919921875, -5.2735595703125, -4.755126953125, -4.2366943359375, -3.71826171875, -3.1998291015625, -2.681396484375, -2.1629638671875, -1.64453125, -1.1260986328125, -0.607666015625, -0.0892333984375, 0.42919921875, 0.9476318359375, 1.466064453125, 1.9844970703125, 2.5029296875, 3.0213623046875, 3.539794921875, 4.0582275390625, 4.57666015625, 5.0950927734375, 5.613525390625, 6.1319580078125, 6.650390625, 7.1688232421875, 7.687255859375, 8.2056884765625, 8.72412109375, 9.2425537109375, 9.760986328125, 10.2794189453125, 10.7978515625, 11.3162841796875, 11.834716796875, 12.3531494140625, 12.87158203125, 13.3900146484375, 13.908447265625, 14.4268798828125, 14.9453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 10.0, 24.0, 77.0, 167.0, 308.0, 203.0, 118.0, 50.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.7328338623047, -156.73707580566406, -148.74131774902344, -140.7455596923828, -132.74981689453125, -124.7540512084961, -116.75830078125, -108.76254272460938, -100.76678466796875, -92.77102661132812, -84.7752685546875, -76.7795181274414, -68.78376007080078, -60.788002014160156, -52.7922477722168, -44.79649353027344, -36.80073547363281, -28.80497932434082, -20.809223175048828, -12.813467025756836, -4.817710876464844, 3.1780471801757812, 11.17380142211914, 19.1695556640625, 27.165313720703125, 35.16107177734375, 43.15682601928711, 51.15258026123047, 59.148338317871094, 67.14409637451172, 75.13984680175781, 83.13560485839844, 91.13134765625, 99.12710571289062, 107.12286376953125, 115.11861419677734, 123.11437225341797, 131.11013793945312, 139.1058807373047, 147.1016387939453, 155.09739685058594, 163.09315490722656, 171.0889129638672, 179.0846710205078, 187.08041381835938, 195.076171875, 203.07192993164062, 211.06768798828125, 219.06344604492188, 227.0592041015625, 235.05496215820312, 243.05072021484375, 251.04647827148438, 259.042236328125, 267.0379943847656, 275.03375244140625, 283.02947998046875, 291.0252380371094, 299.02099609375, 307.0167541503906, 315.01251220703125, 323.0082702636719, 331.0040283203125, 338.999755859375, 346.99554443359375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 12.0, 11.0, 18.0, 19.0, 19.0, 25.0, 29.0, 42.0, 46.0, 53.0, 53.0, 61.0, 78.0, 66.0, 62.0, 61.0, 54.0, 52.0, 41.0, 38.0, 26.0, 26.0, 20.0, 20.0, 13.0, 14.0, 13.0, 8.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.6919937133789, -92.19994354248047, -88.70789337158203, -85.2158432006836, -81.72379302978516, -78.23174285888672, -74.73970031738281, -71.24765014648438, -67.75559997558594, -64.2635498046875, -60.77149963378906, -57.279449462890625, -53.78739929199219, -50.29534912109375, -46.80330276489258, -43.31125259399414, -39.81919860839844, -36.3271484375, -32.83509826660156, -29.343050003051758, -25.85099983215332, -22.358949661254883, -18.866901397705078, -15.37485122680664, -11.882801055908203, -8.390750885009766, -4.8987016677856445, -1.4066524505615234, 2.085397720336914, 5.577447891235352, 9.069496154785156, 12.561546325683594, 16.0535888671875, 19.545639038085938, 23.037689208984375, 26.52973747253418, 30.021787643432617, 33.51383972167969, 37.00588607788086, 40.4979362487793, 43.989986419677734, 47.48203659057617, 50.97408676147461, 54.46613311767578, 57.95818328857422, 61.450233459472656, 64.9422836303711, 68.43433380126953, 71.92638397216797, 75.4184341430664, 78.91048431396484, 82.40253448486328, 85.89458465576172, 89.38663482666016, 92.87867736816406, 96.3707275390625, 99.86277770996094, 103.35482788085938, 106.84687805175781, 110.33892822265625, 113.83097839355469, 117.32302856445312, 120.81507873535156, 124.30712890625, 127.79917907714844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 9.0, 9.0, 25.0, 36.0, 48.0, 59.0, 106.0, 183.0, 315.0, 790.0, 5425.0, 529010.0, 3641297.0, 14667.0, 1391.0, 396.0, 182.0, 114.0, 68.0, 53.0, 33.0, 14.0, 9.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.921875, -30.92919921875, -29.9365234375, -28.94384765625, -27.951171875, -26.95849609375, -25.9658203125, -24.97314453125, -23.98046875, -22.98779296875, -21.9951171875, -21.00244140625, -20.009765625, -19.01708984375, -18.0244140625, -17.03173828125, -16.0390625, -15.04638671875, -14.0537109375, -13.06103515625, -12.068359375, -11.07568359375, -10.0830078125, -9.09033203125, -8.09765625, -7.10498046875, -6.1123046875, -5.11962890625, -4.126953125, -3.13427734375, -2.1416015625, -1.14892578125, -0.15625, 0.83642578125, 1.8291015625, 2.82177734375, 3.814453125, 4.80712890625, 5.7998046875, 6.79248046875, 7.78515625, 8.77783203125, 9.7705078125, 10.76318359375, 11.755859375, 12.74853515625, 13.7412109375, 14.73388671875, 15.7265625, 16.71923828125, 17.7119140625, 18.70458984375, 19.697265625, 20.68994140625, 21.6826171875, 22.67529296875, 23.66796875, 24.66064453125, 25.6533203125, 26.64599609375, 27.638671875, 28.63134765625, 29.6240234375, 30.61669921875, 31.609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 26.0, 26.0, 26.0, 53.0, 43.0, 72.0, 65.0, 99.0, 92.0, 80.0, 65.0, 83.0, 61.0, 38.0, 32.0, 33.0, 22.0, 17.0, 15.0, 7.0, 9.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8458251953125, -7.582275390625, -7.3187255859375, -7.05517578125, -6.7916259765625, -6.528076171875, -6.2645263671875, -6.0009765625, -5.7374267578125, -5.473876953125, -5.2103271484375, -4.94677734375, -4.6832275390625, -4.419677734375, -4.1561279296875, -3.892578125, -3.6290283203125, -3.365478515625, -3.1019287109375, -2.83837890625, -2.5748291015625, -2.311279296875, -2.0477294921875, -1.7841796875, -1.5206298828125, -1.257080078125, -0.9935302734375, -0.72998046875, -0.4664306640625, -0.202880859375, 0.0606689453125, 0.32421875, 0.5877685546875, 0.851318359375, 1.1148681640625, 1.37841796875, 1.6419677734375, 1.905517578125, 2.1690673828125, 2.4326171875, 2.6961669921875, 2.959716796875, 3.2232666015625, 3.48681640625, 3.7503662109375, 4.013916015625, 4.2774658203125, 4.541015625, 4.8045654296875, 5.068115234375, 5.3316650390625, 5.59521484375, 5.8587646484375, 6.122314453125, 6.3858642578125, 6.6494140625, 6.9129638671875, 7.176513671875, 7.4400634765625, 7.70361328125, 7.9671630859375, 8.230712890625, 8.4942626953125, 8.7578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 15.0, 17.0, 34.0, 69.0, 135.0, 265.0, 494.0, 1065.0, 2766.0, 8404.0, 32048.0, 201777.0, 2262665.0, 1512579.0, 135012.0, 25204.0, 7257.0, 2530.0, 976.0, 435.0, 219.0, 129.0, 58.0, 54.0, 26.0, 20.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.9847412109375, -11.641357421875, -11.2979736328125, -10.95458984375, -10.6112060546875, -10.267822265625, -9.9244384765625, -9.5810546875, -9.2376708984375, -8.894287109375, -8.5509033203125, -8.20751953125, -7.8641357421875, -7.520751953125, -7.1773681640625, -6.833984375, -6.4906005859375, -6.147216796875, -5.8038330078125, -5.46044921875, -5.1170654296875, -4.773681640625, -4.4302978515625, -4.0869140625, -3.7435302734375, -3.400146484375, -3.0567626953125, -2.71337890625, -2.3699951171875, -2.026611328125, -1.6832275390625, -1.33984375, -0.9964599609375, -0.653076171875, -0.3096923828125, 0.03369140625, 0.3770751953125, 0.720458984375, 1.0638427734375, 1.4072265625, 1.7506103515625, 2.093994140625, 2.4373779296875, 2.78076171875, 3.1241455078125, 3.467529296875, 3.8109130859375, 4.154296875, 4.4976806640625, 4.841064453125, 5.1844482421875, 5.52783203125, 5.8712158203125, 6.214599609375, 6.5579833984375, 6.9013671875, 7.2447509765625, 7.588134765625, 7.9315185546875, 8.27490234375, 8.6182861328125, 8.961669921875, 9.3050537109375, 9.6484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 10.0, 9.0, 15.0, 28.0, 53.0, 42.0, 136.0, 187.0, 248.0, 384.0, 547.0, 662.0, 551.0, 394.0, 275.0, 180.0, 104.0, 71.0, 41.0, 33.0, 23.0, 19.0, 10.0, 12.0, 11.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8004150390625, -8.468017578125, -8.1356201171875, -7.80322265625, -7.4708251953125, -7.138427734375, -6.8060302734375, -6.4736328125, -6.1412353515625, -5.808837890625, -5.4764404296875, -5.14404296875, -4.8116455078125, -4.479248046875, -4.1468505859375, -3.814453125, -3.4820556640625, -3.149658203125, -2.8172607421875, -2.48486328125, -2.1524658203125, -1.820068359375, -1.4876708984375, -1.1552734375, -0.8228759765625, -0.490478515625, -0.1580810546875, 0.17431640625, 0.5067138671875, 0.839111328125, 1.1715087890625, 1.50390625, 1.8363037109375, 2.168701171875, 2.5010986328125, 2.83349609375, 3.1658935546875, 3.498291015625, 3.8306884765625, 4.1630859375, 4.4954833984375, 4.827880859375, 5.1602783203125, 5.49267578125, 5.8250732421875, 6.157470703125, 6.4898681640625, 6.822265625, 7.1546630859375, 7.487060546875, 7.8194580078125, 8.15185546875, 8.4842529296875, 8.816650390625, 9.1490478515625, 9.4814453125, 9.8138427734375, 10.146240234375, 10.4786376953125, 10.81103515625, 11.1434326171875, 11.475830078125, 11.8082275390625, 12.140625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 8.0, 8.0, 10.0, 32.0, 95.0, 159.0, 218.0, 221.0, 139.0, 55.0, 25.0, 13.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.59634399414062, -109.3470458984375, -105.09774780273438, -100.84845733642578, -96.59915924072266, -92.34986114501953, -88.10057067871094, -83.85127258300781, -79.60197448730469, -75.35267639160156, -71.10337829589844, -66.85408782958984, -62.60478973388672, -58.355491638183594, -54.106197357177734, -49.856903076171875, -45.60760498046875, -41.358306884765625, -37.109012603759766, -32.859718322753906, -28.61042022705078, -24.36112403869629, -20.111827850341797, -15.862531661987305, -11.613235473632812, -7.36393928527832, -3.114643096923828, 1.134653091430664, 5.383949279785156, 9.633245468139648, 13.88254165649414, 18.131837844848633, 22.381118774414062, 26.630414962768555, 30.879711151123047, 35.129005432128906, 39.37830352783203, 43.627601623535156, 47.876895904541016, 52.126190185546875, 56.37548828125, 60.624786376953125, 64.87408447265625, 69.12337493896484, 73.37267303466797, 77.6219711303711, 81.87126159667969, 86.12055969238281, 90.36985778808594, 94.61915588378906, 98.86845397949219, 103.11774444580078, 107.3670425415039, 111.61634063720703, 115.86563110351562, 120.11492919921875, 124.36422729492188, 128.613525390625, 132.86282348632812, 137.11212158203125, 141.36141967773438, 145.61070251464844, 149.86000061035156, 154.1092987060547, 158.3585968017578]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 10.0, 22.0, 21.0, 20.0, 36.0, 33.0, 35.0, 32.0, 40.0, 51.0, 56.0, 54.0, 50.0, 70.0, 47.0, 56.0, 50.0, 43.0, 37.0, 40.0, 28.0, 30.0, 18.0, 20.0, 17.0, 11.0, 13.0, 11.0, 10.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.51289367675781, -53.9188117980957, -52.32473373413086, -50.73065185546875, -49.136573791503906, -47.5424919128418, -45.94841003417969, -44.354331970214844, -42.760250091552734, -41.166168212890625, -39.57209014892578, -37.97800827026367, -36.38393020629883, -34.78984832763672, -33.195770263671875, -31.601688385009766, -30.00760841369629, -28.413528442382812, -26.819448471069336, -25.22536849975586, -23.63128662109375, -22.037206649780273, -20.443126678466797, -18.849044799804688, -17.254966735839844, -15.660886764526367, -14.066805839538574, -12.472725868225098, -10.878644943237305, -9.284564971923828, -7.690485000610352, -6.096404075622559, -4.502323150634766, -2.908242702484131, -1.3141624927520752, 0.27991771697998047, 1.8739981651306152, 3.46807861328125, 5.062158584594727, 6.6562395095825195, 8.250319480895996, 9.844399452209473, 11.438480377197266, 13.032560348510742, 14.626640319824219, 16.220722198486328, 17.814800262451172, 19.40888214111328, 21.002962112426758, 22.597042083740234, 24.19112205505371, 25.785202026367188, 27.379283905029297, 28.973363876342773, 30.56744384765625, 32.16152572631836, 33.7556037902832, 35.34968566894531, 36.943763732910156, 38.537845611572266, 40.13192367553711, 41.72600555419922, 43.32008361816406, 44.91416549682617, 46.50824737548828]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 13.0, 10.0, 15.0, 24.0, 24.0, 30.0, 43.0, 66.0, 124.0, 198.0, 322.0, 606.0, 1201.0, 2575.0, 6418.0, 17184.0, 52053.0, 198953.0, 518808.0, 175842.0, 47328.0, 15834.0, 5987.0, 2464.0, 1076.0, 550.0, 298.0, 172.0, 99.0, 75.0, 41.0, 34.0, 20.0, 18.0, 14.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.6949462890625, -14.280517578125, -13.8660888671875, -13.45166015625, -13.0372314453125, -12.622802734375, -12.2083740234375, -11.7939453125, -11.3795166015625, -10.965087890625, -10.5506591796875, -10.13623046875, -9.7218017578125, -9.307373046875, -8.8929443359375, -8.478515625, -8.0640869140625, -7.649658203125, -7.2352294921875, -6.82080078125, -6.4063720703125, -5.991943359375, -5.5775146484375, -5.1630859375, -4.7486572265625, -4.334228515625, -3.9197998046875, -3.50537109375, -3.0909423828125, -2.676513671875, -2.2620849609375, -1.84765625, -1.4332275390625, -1.018798828125, -0.6043701171875, -0.18994140625, 0.2244873046875, 0.638916015625, 1.0533447265625, 1.4677734375, 1.8822021484375, 2.296630859375, 2.7110595703125, 3.12548828125, 3.5399169921875, 3.954345703125, 4.3687744140625, 4.783203125, 5.1976318359375, 5.612060546875, 6.0264892578125, 6.44091796875, 6.8553466796875, 7.269775390625, 7.6842041015625, 8.0986328125, 8.5130615234375, 8.927490234375, 9.3419189453125, 9.75634765625, 10.1707763671875, 10.585205078125, 10.9996337890625, 11.4140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 13.0, 10.0, 17.0, 16.0, 17.0, 36.0, 29.0, 46.0, 46.0, 63.0, 47.0, 61.0, 62.0, 68.0, 65.0, 59.0, 58.0, 56.0, 39.0, 32.0, 22.0, 19.0, 18.0, 14.0, 18.0, 7.0, 6.0, 11.0, 13.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.94921875, -7.74578857421875, -7.5423583984375, -7.33892822265625, -7.135498046875, -6.93206787109375, -6.7286376953125, -6.52520751953125, -6.32177734375, -6.11834716796875, -5.9149169921875, -5.71148681640625, -5.508056640625, -5.30462646484375, -5.1011962890625, -4.89776611328125, -4.6943359375, -4.49090576171875, -4.2874755859375, -4.08404541015625, -3.880615234375, -3.67718505859375, -3.4737548828125, -3.27032470703125, -3.06689453125, -2.86346435546875, -2.6600341796875, -2.45660400390625, -2.253173828125, -2.04974365234375, -1.8463134765625, -1.64288330078125, -1.439453125, -1.23602294921875, -1.0325927734375, -0.82916259765625, -0.625732421875, -0.42230224609375, -0.2188720703125, -0.01544189453125, 0.18798828125, 0.39141845703125, 0.5948486328125, 0.79827880859375, 1.001708984375, 1.20513916015625, 1.4085693359375, 1.61199951171875, 1.8154296875, 2.01885986328125, 2.2222900390625, 2.42572021484375, 2.629150390625, 2.83258056640625, 3.0360107421875, 3.23944091796875, 3.44287109375, 3.64630126953125, 3.8497314453125, 4.05316162109375, 4.256591796875, 4.46002197265625, 4.6634521484375, 4.86688232421875, 5.0703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 13.0, 14.0, 18.0, 26.0, 47.0, 69.0, 107.0, 211.0, 403.0, 813.0, 1857.0, 5785.0, 25838.0, 222328.0, 710396.0, 64290.0, 10928.0, 3063.0, 1115.0, 559.0, 245.0, 158.0, 86.0, 53.0, 36.0, 21.0, 19.0, 15.0, 10.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.765625, -18.982421875, -18.19921875, -17.416015625, -16.6328125, -15.849609375, -15.06640625, -14.283203125, -13.5, -12.716796875, -11.93359375, -11.150390625, -10.3671875, -9.583984375, -8.80078125, -8.017578125, -7.234375, -6.451171875, -5.66796875, -4.884765625, -4.1015625, -3.318359375, -2.53515625, -1.751953125, -0.96875, -0.185546875, 0.59765625, 1.380859375, 2.1640625, 2.947265625, 3.73046875, 4.513671875, 5.296875, 6.080078125, 6.86328125, 7.646484375, 8.4296875, 9.212890625, 9.99609375, 10.779296875, 11.5625, 12.345703125, 13.12890625, 13.912109375, 14.6953125, 15.478515625, 16.26171875, 17.044921875, 17.828125, 18.611328125, 19.39453125, 20.177734375, 20.9609375, 21.744140625, 22.52734375, 23.310546875, 24.09375, 24.876953125, 25.66015625, 26.443359375, 27.2265625, 28.009765625, 28.79296875, 29.576171875, 30.359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 6.0, 8.0, 17.0, 17.0, 24.0, 35.0, 39.0, 48.0, 69.0, 59.0, 77.0, 82.0, 70.0, 63.0, 81.0, 64.0, 69.0, 40.0, 35.0, 31.0, 20.0, 6.0, 12.0, 11.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.853515625, -36.64453125, -35.435546875, -34.2265625, -33.017578125, -31.80859375, -30.599609375, -29.390625, -28.181640625, -26.97265625, -25.763671875, -24.5546875, -23.345703125, -22.13671875, -20.927734375, -19.71875, -18.509765625, -17.30078125, -16.091796875, -14.8828125, -13.673828125, -12.46484375, -11.255859375, -10.046875, -8.837890625, -7.62890625, -6.419921875, -5.2109375, -4.001953125, -2.79296875, -1.583984375, -0.375, 0.833984375, 2.04296875, 3.251953125, 4.4609375, 5.669921875, 6.87890625, 8.087890625, 9.296875, 10.505859375, 11.71484375, 12.923828125, 14.1328125, 15.341796875, 16.55078125, 17.759765625, 18.96875, 20.177734375, 21.38671875, 22.595703125, 23.8046875, 25.013671875, 26.22265625, 27.431640625, 28.640625, 29.849609375, 31.05859375, 32.267578125, 33.4765625, 34.685546875, 35.89453125, 37.103515625, 38.3125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 18.0, 25.0, 22.0, 39.0, 44.0, 76.0, 148.0, 378.0, 1030.0, 4948.0, 72386.0, 936819.0, 28135.0, 3034.0, 768.0, 306.0, 136.0, 85.0, 50.0, 34.0, 12.0, 15.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.3125, -26.493896484375, -25.67529296875, -24.856689453125, -24.0380859375, -23.219482421875, -22.40087890625, -21.582275390625, -20.763671875, -19.945068359375, -19.12646484375, -18.307861328125, -17.4892578125, -16.670654296875, -15.85205078125, -15.033447265625, -14.21484375, -13.396240234375, -12.57763671875, -11.759033203125, -10.9404296875, -10.121826171875, -9.30322265625, -8.484619140625, -7.666015625, -6.847412109375, -6.02880859375, -5.210205078125, -4.3916015625, -3.572998046875, -2.75439453125, -1.935791015625, -1.1171875, -0.298583984375, 0.52001953125, 1.338623046875, 2.1572265625, 2.975830078125, 3.79443359375, 4.613037109375, 5.431640625, 6.250244140625, 7.06884765625, 7.887451171875, 8.7060546875, 9.524658203125, 10.34326171875, 11.161865234375, 11.98046875, 12.799072265625, 13.61767578125, 14.436279296875, 15.2548828125, 16.073486328125, 16.89208984375, 17.710693359375, 18.529296875, 19.347900390625, 20.16650390625, 20.985107421875, 21.8037109375, 22.622314453125, 23.44091796875, 24.259521484375, 25.078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 1.0, 6.0, 9.0, 4.0, 5.0, 4.0, 10.0, 13.0, 32.0, 30.0, 58.0, 77.0, 172.0, 188.0, 143.0, 72.0, 45.0, 36.0, 29.0, 16.0, 10.0, 8.0, 7.0, 2.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002471923828125, -0.002378016710281372, -0.002284109592437744, -0.002190202474594116, -0.0020962953567504883, -0.0020023882389068604, -0.0019084811210632324, -0.0018145740032196045, -0.0017206668853759766, -0.0016267597675323486, -0.0015328526496887207, -0.0014389455318450928, -0.0013450384140014648, -0.001251131296157837, -0.001157224178314209, -0.001063317060470581, -0.0009694099426269531, -0.0008755028247833252, -0.0007815957069396973, -0.0006876885890960693, -0.0005937814712524414, -0.0004998743534088135, -0.00040596723556518555, -0.0003120601177215576, -0.0002181529998779297, -0.00012424588203430176, -3.0338764190673828e-05, 6.35683536529541e-05, 0.00015747547149658203, 0.00025138258934020996, 0.0003452897071838379, 0.0004391968250274658, 0.0005331039428710938, 0.0006270110607147217, 0.0007209181785583496, 0.0008148252964019775, 0.0009087324142456055, 0.0010026395320892334, 0.0010965466499328613, 0.0011904537677764893, 0.0012843608856201172, 0.0013782680034637451, 0.001472175121307373, 0.001566082239151001, 0.001659989356994629, 0.0017538964748382568, 0.0018478035926818848, 0.0019417107105255127, 0.0020356178283691406, 0.0021295249462127686, 0.0022234320640563965, 0.0023173391819000244, 0.0024112462997436523, 0.0025051534175872803, 0.002599060535430908, 0.002692967653274536, 0.002786874771118164, 0.002880781888961792, 0.00297468900680542, 0.003068596124649048, 0.0031625032424926758, 0.0032564103603363037, 0.0033503174781799316, 0.0034442245960235596, 0.0035381317138671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 3.0, 18.0, 23.0, 31.0, 35.0, 76.0, 140.0, 291.0, 556.0, 1307.0, 3371.0, 12111.0, 147460.0, 845143.0, 28540.0, 5811.0, 1977.0, 847.0, 352.0, 208.0, 84.0, 54.0, 35.0, 23.0, 17.0, 13.0, 2.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.484375, -18.81787109375, -18.1513671875, -17.48486328125, -16.818359375, -16.15185546875, -15.4853515625, -14.81884765625, -14.15234375, -13.48583984375, -12.8193359375, -12.15283203125, -11.486328125, -10.81982421875, -10.1533203125, -9.48681640625, -8.8203125, -8.15380859375, -7.4873046875, -6.82080078125, -6.154296875, -5.48779296875, -4.8212890625, -4.15478515625, -3.48828125, -2.82177734375, -2.1552734375, -1.48876953125, -0.822265625, -0.15576171875, 0.5107421875, 1.17724609375, 1.84375, 2.51025390625, 3.1767578125, 3.84326171875, 4.509765625, 5.17626953125, 5.8427734375, 6.50927734375, 7.17578125, 7.84228515625, 8.5087890625, 9.17529296875, 9.841796875, 10.50830078125, 11.1748046875, 11.84130859375, 12.5078125, 13.17431640625, 13.8408203125, 14.50732421875, 15.173828125, 15.84033203125, 16.5068359375, 17.17333984375, 17.83984375, 18.50634765625, 19.1728515625, 19.83935546875, 20.505859375, 21.17236328125, 21.8388671875, 22.50537109375, 23.171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 15.0, 13.0, 20.0, 55.0, 50.0, 95.0, 113.0, 175.0, 135.0, 110.0, 77.0, 32.0, 32.0, 8.0, 11.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.3172607421875, -12.884521484375, -12.4517822265625, -12.01904296875, -11.5863037109375, -11.153564453125, -10.7208251953125, -10.2880859375, -9.8553466796875, -9.422607421875, -8.9898681640625, -8.55712890625, -8.1243896484375, -7.691650390625, -7.2589111328125, -6.826171875, -6.3934326171875, -5.960693359375, -5.5279541015625, -5.09521484375, -4.6624755859375, -4.229736328125, -3.7969970703125, -3.3642578125, -2.9315185546875, -2.498779296875, -2.0660400390625, -1.63330078125, -1.2005615234375, -0.767822265625, -0.3350830078125, 0.09765625, 0.5303955078125, 0.963134765625, 1.3958740234375, 1.82861328125, 2.2613525390625, 2.694091796875, 3.1268310546875, 3.5595703125, 3.9923095703125, 4.425048828125, 4.8577880859375, 5.29052734375, 5.7232666015625, 6.156005859375, 6.5887451171875, 7.021484375, 7.4542236328125, 7.886962890625, 8.3197021484375, 8.75244140625, 9.1851806640625, 9.617919921875, 10.0506591796875, 10.4833984375, 10.9161376953125, 11.348876953125, 11.7816162109375, 12.21435546875, 12.6470947265625, 13.079833984375, 13.5125732421875, 13.9453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 35.0, 117.0, 258.0, 353.0, 155.0, 37.0, 17.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-297.60223388671875, -288.0688171386719, -278.535400390625, -269.0019836425781, -259.46856689453125, -249.93515014648438, -240.40174865722656, -230.8683319091797, -221.3349151611328, -211.80149841308594, -202.26808166503906, -192.7346649169922, -183.20126342773438, -173.6678466796875, -164.13442993164062, -154.60101318359375, -145.06759643554688, -135.5341796875, -126.00076293945312, -116.46735382080078, -106.9339370727539, -97.40052032470703, -87.86711120605469, -78.33369445800781, -68.80027770996094, -59.26686096191406, -49.73344802856445, -40.200035095214844, -30.66661834716797, -21.133201599121094, -11.599788665771484, -2.066375732421875, 7.467010498046875, 17.000425338745117, 26.53384017944336, 36.06725311279297, 45.600669860839844, 55.13408660888672, 64.66749572753906, 74.20091247558594, 83.73432922363281, 93.26774597167969, 102.80116271972656, 112.3345718383789, 121.86798858642578, 131.40139770507812, 140.934814453125, 150.46823120117188, 160.00164794921875, 169.53506469726562, 179.0684814453125, 188.60189819335938, 198.13531494140625, 207.66873168945312, 217.20213317871094, 226.7355499267578, 236.2689666748047, 245.80238342285156, 255.33580017089844, 264.86920166015625, 274.4026184082031, 283.93603515625, 293.4694519042969, 303.00286865234375, 312.5362854003906]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 13.0, 8.0, 13.0, 51.0, 38.0, 48.0, 59.0, 81.0, 74.0, 111.0, 118.0, 84.0, 70.0, 55.0, 38.0, 48.0, 26.0, 23.0, 9.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-264.48590087890625, -258.87890625, -253.2719268798828, -247.66493225097656, -242.0579376220703, -236.45095825195312, -230.84396362304688, -225.23696899414062, -219.62998962402344, -214.0229949951172, -208.416015625, -202.80902099609375, -197.2020263671875, -191.5950469970703, -185.98805236816406, -180.38107299804688, -174.77407836914062, -169.16708374023438, -163.5601043701172, -157.95310974121094, -152.3461151123047, -146.7391357421875, -141.13214111328125, -135.525146484375, -129.91815185546875, -124.31116485595703, -118.70417022705078, -113.09718322753906, -107.49019622802734, -101.88320922851562, -96.27621459960938, -90.66922760009766, -85.0622329711914, -79.45524597167969, -73.84825134277344, -68.24126434326172, -62.63427734375, -57.027286529541016, -51.42029571533203, -45.81330871582031, -40.20631790161133, -34.599327087402344, -28.992340087890625, -23.38534927368164, -17.77836036682129, -12.171371459960938, -6.564380645751953, -0.9573936462402344, 4.64959716796875, 10.256586074829102, 15.86357593536377, 21.470565795898438, 27.07755470275879, 32.68454360961914, 38.291534423828125, 43.898521423339844, 49.50551223754883, 55.11250305175781, 60.71949005126953, 66.32647705078125, 71.9334716796875, 77.54045867919922, 83.14744567871094, 88.75444030761719, 94.3614273071289]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 2.0, 6.0, 9.0, 13.0, 11.0, 16.0, 22.0, 29.0, 26.0, 47.0, 59.0, 63.0, 93.0, 134.0, 190.0, 261.0, 561.0, 1254.0, 4110.0, 25301.0, 460080.0, 3427704.0, 246400.0, 19985.0, 4670.0, 1815.0, 774.0, 325.0, 134.0, 66.0, 48.0, 24.0, 10.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0], "bins": [-22.90625, -22.40185546875, -21.8974609375, -21.39306640625, -20.888671875, -20.38427734375, -19.8798828125, -19.37548828125, -18.87109375, -18.36669921875, -17.8623046875, -17.35791015625, -16.853515625, -16.34912109375, -15.8447265625, -15.34033203125, -14.8359375, -14.33154296875, -13.8271484375, -13.32275390625, -12.818359375, -12.31396484375, -11.8095703125, -11.30517578125, -10.80078125, -10.29638671875, -9.7919921875, -9.28759765625, -8.783203125, -8.27880859375, -7.7744140625, -7.27001953125, -6.765625, -6.26123046875, -5.7568359375, -5.25244140625, -4.748046875, -4.24365234375, -3.7392578125, -3.23486328125, -2.73046875, -2.22607421875, -1.7216796875, -1.21728515625, -0.712890625, -0.20849609375, 0.2958984375, 0.80029296875, 1.3046875, 1.80908203125, 2.3134765625, 2.81787109375, 3.322265625, 3.82666015625, 4.3310546875, 4.83544921875, 5.33984375, 5.84423828125, 6.3486328125, 6.85302734375, 7.357421875, 7.86181640625, 8.3662109375, 8.87060546875, 9.375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 9.0, 23.0, 52.0, 105.0, 162.0, 161.0, 181.0, 122.0, 92.0, 45.0, 32.0, 14.0, 3.0, 6.0], "bins": [-31.515625, -30.9515380859375, -30.387451171875, -29.8233642578125, -29.25927734375, -28.6951904296875, -28.131103515625, -27.5670166015625, -27.0029296875, -26.4388427734375, -25.874755859375, -25.3106689453125, -24.74658203125, -24.1824951171875, -23.618408203125, -23.0543212890625, -22.490234375, -21.9261474609375, -21.362060546875, -20.7979736328125, -20.23388671875, -19.6697998046875, -19.105712890625, -18.5416259765625, -17.9775390625, -17.4134521484375, -16.849365234375, -16.2852783203125, -15.72119140625, -15.1571044921875, -14.593017578125, -14.0289306640625, -13.46484375, -12.9007568359375, -12.336669921875, -11.7725830078125, -11.20849609375, -10.6444091796875, -10.080322265625, -9.5162353515625, -8.9521484375, -8.3880615234375, -7.823974609375, -7.2598876953125, -6.69580078125, -6.1317138671875, -5.567626953125, -5.0035400390625, -4.439453125, -3.8753662109375, -3.311279296875, -2.7471923828125, -2.18310546875, -1.6190185546875, -1.054931640625, -0.4908447265625, 0.0732421875, 0.6373291015625, 1.201416015625, 1.7655029296875, 2.32958984375, 2.8936767578125, 3.457763671875, 4.0218505859375, 4.5859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 10.0, 16.0, 27.0, 27.0, 42.0, 55.0, 90.0, 164.0, 315.0, 890.0, 2966.0, 13385.0, 94721.0, 1488504.0, 2404728.0, 158357.0, 22367.0, 4904.0, 1393.0, 534.0, 272.0, 113.0, 101.0, 81.0, 51.0, 35.0, 19.0, 26.0, 20.0, 13.0, 11.0, 13.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.1015625, -13.633056640625, -13.16455078125, -12.696044921875, -12.2275390625, -11.759033203125, -11.29052734375, -10.822021484375, -10.353515625, -9.885009765625, -9.41650390625, -8.947998046875, -8.4794921875, -8.010986328125, -7.54248046875, -7.073974609375, -6.60546875, -6.136962890625, -5.66845703125, -5.199951171875, -4.7314453125, -4.262939453125, -3.79443359375, -3.325927734375, -2.857421875, -2.388916015625, -1.92041015625, -1.451904296875, -0.9833984375, -0.514892578125, -0.04638671875, 0.422119140625, 0.890625, 1.359130859375, 1.82763671875, 2.296142578125, 2.7646484375, 3.233154296875, 3.70166015625, 4.170166015625, 4.638671875, 5.107177734375, 5.57568359375, 6.044189453125, 6.5126953125, 6.981201171875, 7.44970703125, 7.918212890625, 8.38671875, 8.855224609375, 9.32373046875, 9.792236328125, 10.2607421875, 10.729248046875, 11.19775390625, 11.666259765625, 12.134765625, 12.603271484375, 13.07177734375, 13.540283203125, 14.0087890625, 14.477294921875, 14.94580078125, 15.414306640625, 15.8828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 11.0, 12.0, 29.0, 33.0, 69.0, 80.0, 120.0, 220.0, 285.0, 371.0, 550.0, 604.0, 488.0, 358.0, 230.0, 178.0, 120.0, 82.0, 61.0, 48.0, 33.0, 20.0, 15.0, 7.0, 8.0, 12.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.815185546875, -9.39599609375, -8.976806640625, -8.5576171875, -8.138427734375, -7.71923828125, -7.300048828125, -6.880859375, -6.461669921875, -6.04248046875, -5.623291015625, -5.2041015625, -4.784912109375, -4.36572265625, -3.946533203125, -3.52734375, -3.108154296875, -2.68896484375, -2.269775390625, -1.8505859375, -1.431396484375, -1.01220703125, -0.593017578125, -0.173828125, 0.245361328125, 0.66455078125, 1.083740234375, 1.5029296875, 1.922119140625, 2.34130859375, 2.760498046875, 3.1796875, 3.598876953125, 4.01806640625, 4.437255859375, 4.8564453125, 5.275634765625, 5.69482421875, 6.114013671875, 6.533203125, 6.952392578125, 7.37158203125, 7.790771484375, 8.2099609375, 8.629150390625, 9.04833984375, 9.467529296875, 9.88671875, 10.305908203125, 10.72509765625, 11.144287109375, 11.5634765625, 11.982666015625, 12.40185546875, 12.821044921875, 13.240234375, 13.659423828125, 14.07861328125, 14.497802734375, 14.9169921875, 15.336181640625, 15.75537109375, 16.174560546875, 16.59375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 12.0, 32.0, 66.0, 153.0, 204.0, 210.0, 139.0, 96.0, 34.0, 20.0, 10.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.64988708496094, -181.1382293701172, -174.62655639648438, -168.11489868164062, -161.60324096679688, -155.09156799316406, -148.5799102783203, -142.0682373046875, -135.55657958984375, -129.044921875, -122.53324890136719, -116.02159118652344, -109.50992584228516, -102.99826049804688, -96.48660278320312, -89.97493743896484, -83.46327209472656, -76.95160675048828, -70.43994140625, -63.92828369140625, -57.41661834716797, -50.90495300292969, -44.39329147338867, -37.881629943847656, -31.369964599609375, -24.858301162719727, -18.346637725830078, -11.83497428894043, -5.323310852050781, 1.1883544921875, 7.700016021728516, 14.211677551269531, 20.72332763671875, 27.2349910736084, 33.74665451049805, 40.25831604003906, 46.769981384277344, 53.281646728515625, 59.79330825805664, 66.30496978759766, 72.81663513183594, 79.32830047607422, 85.8399658203125, 92.35162353515625, 98.86328887939453, 105.37495422363281, 111.88661193847656, 118.39827728271484, 124.90994262695312, 131.42160034179688, 137.9332733154297, 144.44493103027344, 150.95660400390625, 157.46826171875, 163.97991943359375, 170.4915771484375, 177.0032501220703, 183.51490783691406, 190.02658081054688, 196.53823852539062, 203.04989624023438, 209.5615692138672, 216.07322692871094, 222.58489990234375, 229.0965576171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 23.0, 25.0, 46.0, 56.0, 99.0, 111.0, 111.0, 119.0, 109.0, 88.0, 74.0, 65.0, 32.0, 29.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.91571044921875, -124.40957641601562, -118.9034423828125, -113.39730834960938, -107.89118194580078, -102.38504791259766, -96.87891387939453, -91.37278747558594, -85.86665344238281, -80.36051940917969, -74.85438537597656, -69.34825134277344, -63.842124938964844, -58.33599090576172, -52.829856872558594, -47.323726654052734, -41.817588806152344, -36.31145477294922, -30.80532455444336, -25.299190521240234, -19.793058395385742, -14.28692626953125, -8.780792236328125, -3.2746620178222656, 2.2314720153808594, 7.73760461807251, 13.24373722076416, 18.74987030029297, 24.25600242614746, 29.762134552001953, 35.26826858520508, 40.77439880371094, 46.28053283691406, 51.78666687011719, 57.29279708862305, 62.79893112182617, 68.30506134033203, 73.81119537353516, 79.31732940673828, 84.82345581054688, 90.32958984375, 95.83572387695312, 101.34185791015625, 106.84799194335938, 112.35411834716797, 117.8602523803711, 123.36638641357422, 128.8725128173828, 134.378662109375, 139.88479614257812, 145.39093017578125, 150.89706420898438, 156.4031982421875, 161.90933227539062, 167.41546630859375, 172.9215850830078, 178.42771911621094, 183.93385314941406, 189.4399871826172, 194.9461212158203, 200.45225524902344, 205.9583740234375, 211.46450805664062, 216.97064208984375, 222.47677612304688]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 8.0, 13.0, 11.0, 13.0, 30.0, 30.0, 49.0, 70.0, 106.0, 146.0, 270.0, 499.0, 959.0, 2380.0, 7296.0, 29643.0, 134500.0, 525074.0, 270205.0, 57476.0, 13158.0, 3655.0, 1348.0, 609.0, 356.0, 220.0, 140.0, 75.0, 52.0, 42.0, 34.0, 28.0, 12.0, 16.0, 6.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.3511962890625, -12.788330078125, -12.2254638671875, -11.66259765625, -11.0997314453125, -10.536865234375, -9.9739990234375, -9.4111328125, -8.8482666015625, -8.285400390625, -7.7225341796875, -7.15966796875, -6.5968017578125, -6.033935546875, -5.4710693359375, -4.908203125, -4.3453369140625, -3.782470703125, -3.2196044921875, -2.65673828125, -2.0938720703125, -1.531005859375, -0.9681396484375, -0.4052734375, 0.1575927734375, 0.720458984375, 1.2833251953125, 1.84619140625, 2.4090576171875, 2.971923828125, 3.5347900390625, 4.09765625, 4.6605224609375, 5.223388671875, 5.7862548828125, 6.34912109375, 6.9119873046875, 7.474853515625, 8.0377197265625, 8.6005859375, 9.1634521484375, 9.726318359375, 10.2891845703125, 10.85205078125, 11.4149169921875, 11.977783203125, 12.5406494140625, 13.103515625, 13.6663818359375, 14.229248046875, 14.7921142578125, 15.35498046875, 15.9178466796875, 16.480712890625, 17.0435791015625, 17.6064453125, 18.1693115234375, 18.732177734375, 19.2950439453125, 19.85791015625, 20.4207763671875, 20.983642578125, 21.5465087890625, 22.109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 14.0, 15.0, 12.0, 36.0, 27.0, 47.0, 39.0, 65.0, 64.0, 89.0, 71.0, 93.0, 73.0, 65.0, 69.0, 62.0, 46.0, 29.0, 29.0, 25.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.924072265625, -10.64501953125, -10.365966796875, -10.0869140625, -9.807861328125, -9.52880859375, -9.249755859375, -8.970703125, -8.691650390625, -8.41259765625, -8.133544921875, -7.8544921875, -7.575439453125, -7.29638671875, -7.017333984375, -6.73828125, -6.459228515625, -6.18017578125, -5.901123046875, -5.6220703125, -5.343017578125, -5.06396484375, -4.784912109375, -4.505859375, -4.226806640625, -3.94775390625, -3.668701171875, -3.3896484375, -3.110595703125, -2.83154296875, -2.552490234375, -2.2734375, -1.994384765625, -1.71533203125, -1.436279296875, -1.1572265625, -0.878173828125, -0.59912109375, -0.320068359375, -0.041015625, 0.238037109375, 0.51708984375, 0.796142578125, 1.0751953125, 1.354248046875, 1.63330078125, 1.912353515625, 2.19140625, 2.470458984375, 2.74951171875, 3.028564453125, 3.3076171875, 3.586669921875, 3.86572265625, 4.144775390625, 4.423828125, 4.702880859375, 4.98193359375, 5.260986328125, 5.5400390625, 5.819091796875, 6.09814453125, 6.377197265625, 6.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 8.0, 8.0, 14.0, 17.0, 27.0, 48.0, 77.0, 148.0, 249.0, 482.0, 1025.0, 2529.0, 8839.0, 99918.0, 868641.0, 55788.0, 6807.0, 2088.0, 867.0, 400.0, 229.0, 138.0, 68.0, 46.0, 26.0, 21.0, 9.0, 14.0, 9.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.90625, -46.55322265625, -45.2001953125, -43.84716796875, -42.494140625, -41.14111328125, -39.7880859375, -38.43505859375, -37.08203125, -35.72900390625, -34.3759765625, -33.02294921875, -31.669921875, -30.31689453125, -28.9638671875, -27.61083984375, -26.2578125, -24.90478515625, -23.5517578125, -22.19873046875, -20.845703125, -19.49267578125, -18.1396484375, -16.78662109375, -15.43359375, -14.08056640625, -12.7275390625, -11.37451171875, -10.021484375, -8.66845703125, -7.3154296875, -5.96240234375, -4.609375, -3.25634765625, -1.9033203125, -0.55029296875, 0.802734375, 2.15576171875, 3.5087890625, 4.86181640625, 6.21484375, 7.56787109375, 8.9208984375, 10.27392578125, 11.626953125, 12.97998046875, 14.3330078125, 15.68603515625, 17.0390625, 18.39208984375, 19.7451171875, 21.09814453125, 22.451171875, 23.80419921875, 25.1572265625, 26.51025390625, 27.86328125, 29.21630859375, 30.5693359375, 31.92236328125, 33.275390625, 34.62841796875, 35.9814453125, 37.33447265625, 38.6875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 10.0, 11.0, 19.0, 23.0, 28.0, 30.0, 48.0, 43.0, 49.0, 45.0, 57.0, 53.0, 68.0, 71.0, 68.0, 59.0, 42.0, 46.0, 37.0, 37.0, 28.0, 19.0, 26.0, 14.0, 9.0, 3.0, 4.0, 6.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-35.59375, -34.560302734375, -33.52685546875, -32.493408203125, -31.4599609375, -30.426513671875, -29.39306640625, -28.359619140625, -27.326171875, -26.292724609375, -25.25927734375, -24.225830078125, -23.1923828125, -22.158935546875, -21.12548828125, -20.092041015625, -19.05859375, -18.025146484375, -16.99169921875, -15.958251953125, -14.9248046875, -13.891357421875, -12.85791015625, -11.824462890625, -10.791015625, -9.757568359375, -8.72412109375, -7.690673828125, -6.6572265625, -5.623779296875, -4.59033203125, -3.556884765625, -2.5234375, -1.489990234375, -0.45654296875, 0.576904296875, 1.6103515625, 2.643798828125, 3.67724609375, 4.710693359375, 5.744140625, 6.777587890625, 7.81103515625, 8.844482421875, 9.8779296875, 10.911376953125, 11.94482421875, 12.978271484375, 14.01171875, 15.045166015625, 16.07861328125, 17.112060546875, 18.1455078125, 19.178955078125, 20.21240234375, 21.245849609375, 22.279296875, 23.312744140625, 24.34619140625, 25.379638671875, 26.4130859375, 27.446533203125, 28.47998046875, 29.513427734375, 30.546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 3.0, 4.0, 8.0, 13.0, 15.0, 14.0, 27.0, 48.0, 59.0, 81.0, 110.0, 223.0, 400.0, 726.0, 1689.0, 4581.0, 16483.0, 104224.0, 819144.0, 79643.0, 13786.0, 4046.0, 1502.0, 687.0, 416.0, 196.0, 128.0, 88.0, 51.0, 35.0, 38.0, 29.0, 13.0, 4.0, 10.0, 6.0, 2.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.59375, -17.067626953125, -16.54150390625, -16.015380859375, -15.4892578125, -14.963134765625, -14.43701171875, -13.910888671875, -13.384765625, -12.858642578125, -12.33251953125, -11.806396484375, -11.2802734375, -10.754150390625, -10.22802734375, -9.701904296875, -9.17578125, -8.649658203125, -8.12353515625, -7.597412109375, -7.0712890625, -6.545166015625, -6.01904296875, -5.492919921875, -4.966796875, -4.440673828125, -3.91455078125, -3.388427734375, -2.8623046875, -2.336181640625, -1.81005859375, -1.283935546875, -0.7578125, -0.231689453125, 0.29443359375, 0.820556640625, 1.3466796875, 1.872802734375, 2.39892578125, 2.925048828125, 3.451171875, 3.977294921875, 4.50341796875, 5.029541015625, 5.5556640625, 6.081787109375, 6.60791015625, 7.134033203125, 7.66015625, 8.186279296875, 8.71240234375, 9.238525390625, 9.7646484375, 10.290771484375, 10.81689453125, 11.343017578125, 11.869140625, 12.395263671875, 12.92138671875, 13.447509765625, 13.9736328125, 14.499755859375, 15.02587890625, 15.552001953125, 16.078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 3.0, 5.0, 11.0, 10.0, 13.0, 18.0, 20.0, 29.0, 34.0, 32.0, 56.0, 76.0, 118.0, 197.0, 91.0, 58.0, 46.0, 28.0, 32.0, 20.0, 14.0, 9.0, 12.0, 3.0, 4.0, 5.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030059814453125, -0.002906888723373413, -0.002807796001434326, -0.0027087032794952393, -0.0026096105575561523, -0.0025105178356170654, -0.0024114251136779785, -0.0023123323917388916, -0.0022132396697998047, -0.0021141469478607178, -0.002015054225921631, -0.001915961503982544, -0.001816868782043457, -0.0017177760601043701, -0.0016186833381652832, -0.0015195906162261963, -0.0014204978942871094, -0.0013214051723480225, -0.0012223124504089355, -0.0011232197284698486, -0.0010241270065307617, -0.0009250342845916748, -0.0008259415626525879, -0.000726848840713501, -0.0006277561187744141, -0.0005286633968353271, -0.00042957067489624023, -0.0003304779529571533, -0.0002313852310180664, -0.0001322925090789795, -3.319978713989258e-05, 6.589293479919434e-05, 0.00016498565673828125, 0.00026407837867736816, 0.0003631711006164551, 0.000462263822555542, 0.0005613565444946289, 0.0006604492664337158, 0.0007595419883728027, 0.0008586347103118896, 0.0009577274322509766, 0.0010568201541900635, 0.0011559128761291504, 0.0012550055980682373, 0.0013540983200073242, 0.0014531910419464111, 0.001552283763885498, 0.001651376485824585, 0.0017504692077636719, 0.0018495619297027588, 0.0019486546516418457, 0.0020477473735809326, 0.0021468400955200195, 0.0022459328174591064, 0.0023450255393981934, 0.0024441182613372803, 0.002543210983276367, 0.002642303705215454, 0.002741396427154541, 0.002840489149093628, 0.002939581871032715, 0.0030386745929718018, 0.0031377673149108887, 0.0032368600368499756, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 6.0, 8.0, 14.0, 20.0, 27.0, 35.0, 57.0, 70.0, 101.0, 162.0, 346.0, 559.0, 1205.0, 3334.0, 11407.0, 66124.0, 878067.0, 69215.0, 11759.0, 3389.0, 1257.0, 563.0, 329.0, 181.0, 109.0, 79.0, 36.0, 22.0, 19.0, 23.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.9375, -28.205078125, -27.47265625, -26.740234375, -26.0078125, -25.275390625, -24.54296875, -23.810546875, -23.078125, -22.345703125, -21.61328125, -20.880859375, -20.1484375, -19.416015625, -18.68359375, -17.951171875, -17.21875, -16.486328125, -15.75390625, -15.021484375, -14.2890625, -13.556640625, -12.82421875, -12.091796875, -11.359375, -10.626953125, -9.89453125, -9.162109375, -8.4296875, -7.697265625, -6.96484375, -6.232421875, -5.5, -4.767578125, -4.03515625, -3.302734375, -2.5703125, -1.837890625, -1.10546875, -0.373046875, 0.359375, 1.091796875, 1.82421875, 2.556640625, 3.2890625, 4.021484375, 4.75390625, 5.486328125, 6.21875, 6.951171875, 7.68359375, 8.416015625, 9.1484375, 9.880859375, 10.61328125, 11.345703125, 12.078125, 12.810546875, 13.54296875, 14.275390625, 15.0078125, 15.740234375, 16.47265625, 17.205078125, 17.9375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 10.0, 10.0, 11.0, 12.0, 17.0, 13.0, 25.0, 45.0, 63.0, 84.0, 149.0, 158.0, 137.0, 64.0, 53.0, 35.0, 26.0, 17.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -16.020263671875, -15.52490234375, -15.029541015625, -14.5341796875, -14.038818359375, -13.54345703125, -13.048095703125, -12.552734375, -12.057373046875, -11.56201171875, -11.066650390625, -10.5712890625, -10.075927734375, -9.58056640625, -9.085205078125, -8.58984375, -8.094482421875, -7.59912109375, -7.103759765625, -6.6083984375, -6.113037109375, -5.61767578125, -5.122314453125, -4.626953125, -4.131591796875, -3.63623046875, -3.140869140625, -2.6455078125, -2.150146484375, -1.65478515625, -1.159423828125, -0.6640625, -0.168701171875, 0.32666015625, 0.822021484375, 1.3173828125, 1.812744140625, 2.30810546875, 2.803466796875, 3.298828125, 3.794189453125, 4.28955078125, 4.784912109375, 5.2802734375, 5.775634765625, 6.27099609375, 6.766357421875, 7.26171875, 7.757080078125, 8.25244140625, 8.747802734375, 9.2431640625, 9.738525390625, 10.23388671875, 10.729248046875, 11.224609375, 11.719970703125, 12.21533203125, 12.710693359375, 13.2060546875, 13.701416015625, 14.19677734375, 14.692138671875, 15.1875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 18.0, 37.0, 82.0, 204.0, 311.0, 192.0, 80.0, 30.0, 17.0, 9.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.33547973632812, -226.72068786621094, -217.10589599609375, -207.49110412597656, -197.87631225585938, -188.26153564453125, -178.64674377441406, -169.03195190429688, -159.4171600341797, -149.8023681640625, -140.1875762939453, -130.57278442382812, -120.95800018310547, -111.34320831298828, -101.72842407226562, -92.11363220214844, -82.49884033203125, -72.88404846191406, -63.26926040649414, -53.65447235107422, -44.03968048095703, -34.424888610839844, -24.810100555419922, -15.1953125, -5.5805206298828125, 4.034269332885742, 13.649059295654297, 23.26384925842285, 32.878639221191406, 42.493431091308594, 52.108219146728516, 61.72300720214844, 71.33782958984375, 80.95262145996094, 90.56741333007812, 100.18219757080078, 109.79698944091797, 119.41178131103516, 129.0265655517578, 138.641357421875, 148.2561492919922, 157.87094116210938, 167.48573303222656, 177.10052490234375, 186.71530151367188, 196.33010864257812, 205.94488525390625, 215.55967712402344, 225.17446899414062, 234.7892608642578, 244.404052734375, 254.0188446044922, 263.6336364746094, 273.2484130859375, 282.86322021484375, 292.4779968261719, 302.0927734375, 311.7075500488281, 321.3223571777344, 330.9371337890625, 340.55194091796875, 350.1667175292969, 359.7815246582031, 369.39630126953125, 379.0111083984375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 3.0, 9.0, 16.0, 9.0, 10.0, 13.0, 15.0, 17.0, 16.0, 15.0, 31.0, 15.0, 34.0, 22.0, 26.0, 36.0, 34.0, 43.0, 48.0, 52.0, 66.0, 54.0, 52.0, 38.0, 29.0, 31.0, 40.0, 19.0, 31.0, 21.0, 20.0, 17.0, 16.0, 22.0, 14.0, 9.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.78917694091797, -91.79435729980469, -88.7995376586914, -85.80471801757812, -82.80989074707031, -79.81507110595703, -76.82025146484375, -73.82543182373047, -70.83061218261719, -67.8357925415039, -64.84097290039062, -61.84614944458008, -58.8513298034668, -55.856510162353516, -52.86168670654297, -49.86686706542969, -46.872047424316406, -43.877227783203125, -40.882408142089844, -37.8875846862793, -34.892765045166016, -31.897945404052734, -28.90312385559082, -25.908302307128906, -22.913482666015625, -19.918663024902344, -16.92384147644043, -13.929020881652832, -10.934200286865234, -7.939379692077637, -4.944559097290039, -1.949737548828125, 1.0450897216796875, 4.039910316467285, 7.034730911254883, 10.02955150604248, 13.024372100830078, 16.01919174194336, 19.014013290405273, 22.008834838867188, 25.00365447998047, 27.99847412109375, 30.993295669555664, 33.98811721801758, 36.98293685913086, 39.97775650024414, 42.97257995605469, 45.96739959716797, 48.96221923828125, 51.95703887939453, 54.95185852050781, 57.94668197631836, 60.94150161743164, 63.93632125854492, 66.93114471435547, 69.92596435546875, 72.92078399658203, 75.91560363769531, 78.9104232788086, 81.90524291992188, 84.90007019042969, 87.89488983154297, 90.88970947265625, 93.88452911376953, 96.87934875488281]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 2.0, 8.0, 18.0, 24.0, 39.0, 43.0, 68.0, 79.0, 137.0, 235.0, 462.0, 1070.0, 3230.0, 22021.0, 1274756.0, 2847376.0, 37428.0, 4860.0, 1349.0, 536.0, 205.0, 124.0, 65.0, 45.0, 28.0, 20.0, 12.0, 10.0, 3.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.578125, -30.79052734375, -30.0029296875, -29.21533203125, -28.427734375, -27.64013671875, -26.8525390625, -26.06494140625, -25.27734375, -24.48974609375, -23.7021484375, -22.91455078125, -22.126953125, -21.33935546875, -20.5517578125, -19.76416015625, -18.9765625, -18.18896484375, -17.4013671875, -16.61376953125, -15.826171875, -15.03857421875, -14.2509765625, -13.46337890625, -12.67578125, -11.88818359375, -11.1005859375, -10.31298828125, -9.525390625, -8.73779296875, -7.9501953125, -7.16259765625, -6.375, -5.58740234375, -4.7998046875, -4.01220703125, -3.224609375, -2.43701171875, -1.6494140625, -0.86181640625, -0.07421875, 0.71337890625, 1.5009765625, 2.28857421875, 3.076171875, 3.86376953125, 4.6513671875, 5.43896484375, 6.2265625, 7.01416015625, 7.8017578125, 8.58935546875, 9.376953125, 10.16455078125, 10.9521484375, 11.73974609375, 12.52734375, 13.31494140625, 14.1025390625, 14.89013671875, 15.677734375, 16.46533203125, 17.2529296875, 18.04052734375, 18.828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 13.0, 12.0, 34.0, 33.0, 54.0, 76.0, 88.0, 100.0, 107.0, 106.0, 93.0, 92.0, 48.0, 46.0, 30.0, 27.0, 20.0, 13.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.78369140625, -12.4267578125, -12.06982421875, -11.712890625, -11.35595703125, -10.9990234375, -10.64208984375, -10.28515625, -9.92822265625, -9.5712890625, -9.21435546875, -8.857421875, -8.50048828125, -8.1435546875, -7.78662109375, -7.4296875, -7.07275390625, -6.7158203125, -6.35888671875, -6.001953125, -5.64501953125, -5.2880859375, -4.93115234375, -4.57421875, -4.21728515625, -3.8603515625, -3.50341796875, -3.146484375, -2.78955078125, -2.4326171875, -2.07568359375, -1.71875, -1.36181640625, -1.0048828125, -0.64794921875, -0.291015625, 0.06591796875, 0.4228515625, 0.77978515625, 1.13671875, 1.49365234375, 1.8505859375, 2.20751953125, 2.564453125, 2.92138671875, 3.2783203125, 3.63525390625, 3.9921875, 4.34912109375, 4.7060546875, 5.06298828125, 5.419921875, 5.77685546875, 6.1337890625, 6.49072265625, 6.84765625, 7.20458984375, 7.5615234375, 7.91845703125, 8.275390625, 8.63232421875, 8.9892578125, 9.34619140625, 9.703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 6.0, 17.0, 19.0, 39.0, 81.0, 136.0, 301.0, 824.0, 3884.0, 331397.0, 3842517.0, 12757.0, 1323.0, 436.0, 205.0, 123.0, 77.0, 56.0, 38.0, 19.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.1875, -34.62744140625, -33.0673828125, -31.50732421875, -29.947265625, -28.38720703125, -26.8271484375, -25.26708984375, -23.70703125, -22.14697265625, -20.5869140625, -19.02685546875, -17.466796875, -15.90673828125, -14.3466796875, -12.78662109375, -11.2265625, -9.66650390625, -8.1064453125, -6.54638671875, -4.986328125, -3.42626953125, -1.8662109375, -0.30615234375, 1.25390625, 2.81396484375, 4.3740234375, 5.93408203125, 7.494140625, 9.05419921875, 10.6142578125, 12.17431640625, 13.734375, 15.29443359375, 16.8544921875, 18.41455078125, 19.974609375, 21.53466796875, 23.0947265625, 24.65478515625, 26.21484375, 27.77490234375, 29.3349609375, 30.89501953125, 32.455078125, 34.01513671875, 35.5751953125, 37.13525390625, 38.6953125, 40.25537109375, 41.8154296875, 43.37548828125, 44.935546875, 46.49560546875, 48.0556640625, 49.61572265625, 51.17578125, 52.73583984375, 54.2958984375, 55.85595703125, 57.416015625, 58.97607421875, 60.5361328125, 62.09619140625, 63.65625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 17.0, 20.0, 45.0, 112.0, 332.0, 949.0, 1441.0, 709.0, 266.0, 107.0, 37.0, 19.0, 15.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -17.714111328125, -16.63134765625, -15.548583984375, -14.4658203125, -13.383056640625, -12.30029296875, -11.217529296875, -10.134765625, -9.052001953125, -7.96923828125, -6.886474609375, -5.8037109375, -4.720947265625, -3.63818359375, -2.555419921875, -1.47265625, -0.389892578125, 0.69287109375, 1.775634765625, 2.8583984375, 3.941162109375, 5.02392578125, 6.106689453125, 7.189453125, 8.272216796875, 9.35498046875, 10.437744140625, 11.5205078125, 12.603271484375, 13.68603515625, 14.768798828125, 15.8515625, 16.934326171875, 18.01708984375, 19.099853515625, 20.1826171875, 21.265380859375, 22.34814453125, 23.430908203125, 24.513671875, 25.596435546875, 26.67919921875, 27.761962890625, 28.8447265625, 29.927490234375, 31.01025390625, 32.093017578125, 33.17578125, 34.258544921875, 35.34130859375, 36.424072265625, 37.5068359375, 38.589599609375, 39.67236328125, 40.755126953125, 41.837890625, 42.920654296875, 44.00341796875, 45.086181640625, 46.1689453125, 47.251708984375, 48.33447265625, 49.417236328125, 50.5]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 37.0, 126.0, 301.0, 318.0, 122.0, 45.0, 23.0, 9.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-426.604248046875, -415.3379211425781, -404.07159423828125, -392.8052978515625, -381.5389709472656, -370.27264404296875, -359.0063171386719, -347.739990234375, -336.47369384765625, -325.2073669433594, -313.9410400390625, -302.67474365234375, -291.4084167480469, -280.14208984375, -268.8757629394531, -257.60943603515625, -246.34312438964844, -235.07679748535156, -223.81048583984375, -212.54415893554688, -201.27784729003906, -190.0115203857422, -178.74520874023438, -167.4788818359375, -156.21255493164062, -144.94622802734375, -133.67991638183594, -122.41358947753906, -111.14727783203125, -99.88095092773438, -88.61463165283203, -77.34831237792969, -66.08200073242188, -54.81568145751953, -43.54936218261719, -32.28303909301758, -21.016719818115234, -9.75040054321289, 1.5159225463867188, 12.782241821289062, 24.048561096191406, 35.31488037109375, 46.581199645996094, 57.8475227355957, 69.11384582519531, 80.38015747070312, 91.646484375, 102.91280364990234, 114.17912292480469, 125.44544219970703, 136.71176147460938, 147.97808837890625, 159.24440002441406, 170.51072692871094, 181.77703857421875, 193.04336547851562, 204.3096923828125, 215.57601928710938, 226.8423309326172, 238.10865783691406, 249.37496948242188, 260.64129638671875, 271.9076232910156, 283.1739501953125, 294.44024658203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 12.0, 11.0, 12.0, 11.0, 28.0, 25.0, 38.0, 34.0, 52.0, 69.0, 49.0, 60.0, 79.0, 47.0, 62.0, 72.0, 65.0, 55.0, 49.0, 43.0, 30.0, 30.0, 12.0, 11.0, 13.0, 10.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.90958404541016, -68.54634857177734, -65.18312072753906, -61.81988525390625, -58.4566535949707, -55.093421936035156, -51.730186462402344, -48.3669548034668, -45.00372314453125, -41.6404914855957, -38.277259826660156, -34.914024353027344, -31.550792694091797, -28.18756103515625, -24.82432746887207, -21.46109390258789, -18.097862243652344, -14.73462963104248, -11.371397018432617, -8.008164405822754, -4.644931793212891, -1.2817001342773438, 2.081533432006836, 5.444766998291016, 8.807998657226562, 12.171231269836426, 15.534463882446289, 18.89769744873047, 22.260929107666016, 25.624160766601562, 28.987394332885742, 32.35062789916992, 35.7138671875, 39.07709884643555, 42.440330505371094, 45.803565979003906, 49.16679763793945, 52.530029296875, 55.89326477050781, 59.25649642944336, 62.619728088378906, 65.98296356201172, 69.34619140625, 72.70942687988281, 76.07266235351562, 79.4358901977539, 82.79912567138672, 86.162353515625, 89.52558898925781, 92.88882446289062, 96.2520523071289, 99.61528778076172, 102.978515625, 106.34175109863281, 109.70498657226562, 113.06822204589844, 116.43144989013672, 119.79468536376953, 123.15791320800781, 126.52114868164062, 129.88438415527344, 133.24761962890625, 136.61083984375, 139.9740753173828, 143.33731079101562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 12.0, 14.0, 17.0, 24.0, 41.0, 57.0, 94.0, 156.0, 285.0, 555.0, 1358.0, 4615.0, 23578.0, 215561.0, 701864.0, 83843.0, 11688.0, 2727.0, 980.0, 427.0, 248.0, 134.0, 83.0, 64.0, 32.0, 30.0, 13.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.7587890625, -25.845703125, -24.9326171875, -24.01953125, -23.1064453125, -22.193359375, -21.2802734375, -20.3671875, -19.4541015625, -18.541015625, -17.6279296875, -16.71484375, -15.8017578125, -14.888671875, -13.9755859375, -13.0625, -12.1494140625, -11.236328125, -10.3232421875, -9.41015625, -8.4970703125, -7.583984375, -6.6708984375, -5.7578125, -4.8447265625, -3.931640625, -3.0185546875, -2.10546875, -1.1923828125, -0.279296875, 0.6337890625, 1.546875, 2.4599609375, 3.373046875, 4.2861328125, 5.19921875, 6.1123046875, 7.025390625, 7.9384765625, 8.8515625, 9.7646484375, 10.677734375, 11.5908203125, 12.50390625, 13.4169921875, 14.330078125, 15.2431640625, 16.15625, 17.0693359375, 17.982421875, 18.8955078125, 19.80859375, 20.7216796875, 21.634765625, 22.5478515625, 23.4609375, 24.3740234375, 25.287109375, 26.2001953125, 27.11328125, 28.0263671875, 28.939453125, 29.8525390625, 30.765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 11.0, 20.0, 20.0, 18.0, 46.0, 47.0, 52.0, 63.0, 72.0, 66.0, 93.0, 62.0, 77.0, 71.0, 51.0, 57.0, 35.0, 30.0, 33.0, 17.0, 13.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.65576171875, -6.3662109375, -6.07666015625, -5.787109375, -5.49755859375, -5.2080078125, -4.91845703125, -4.62890625, -4.33935546875, -4.0498046875, -3.76025390625, -3.470703125, -3.18115234375, -2.8916015625, -2.60205078125, -2.3125, -2.02294921875, -1.7333984375, -1.44384765625, -1.154296875, -0.86474609375, -0.5751953125, -0.28564453125, 0.00390625, 0.29345703125, 0.5830078125, 0.87255859375, 1.162109375, 1.45166015625, 1.7412109375, 2.03076171875, 2.3203125, 2.60986328125, 2.8994140625, 3.18896484375, 3.478515625, 3.76806640625, 4.0576171875, 4.34716796875, 4.63671875, 4.92626953125, 5.2158203125, 5.50537109375, 5.794921875, 6.08447265625, 6.3740234375, 6.66357421875, 6.953125, 7.24267578125, 7.5322265625, 7.82177734375, 8.111328125, 8.40087890625, 8.6904296875, 8.97998046875, 9.26953125, 9.55908203125, 9.8486328125, 10.13818359375, 10.427734375, 10.71728515625, 11.0068359375, 11.29638671875, 11.5859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 8.0, 6.0, 12.0, 19.0, 26.0, 32.0, 76.0, 109.0, 162.0, 309.0, 682.0, 1645.0, 5477.0, 34524.0, 831680.0, 156626.0, 12129.0, 2879.0, 1090.0, 428.0, 250.0, 148.0, 90.0, 43.0, 36.0, 23.0, 14.0, 14.0, 3.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.23095703125, -47.6806640625, -46.13037109375, -44.580078125, -43.02978515625, -41.4794921875, -39.92919921875, -38.37890625, -36.82861328125, -35.2783203125, -33.72802734375, -32.177734375, -30.62744140625, -29.0771484375, -27.52685546875, -25.9765625, -24.42626953125, -22.8759765625, -21.32568359375, -19.775390625, -18.22509765625, -16.6748046875, -15.12451171875, -13.57421875, -12.02392578125, -10.4736328125, -8.92333984375, -7.373046875, -5.82275390625, -4.2724609375, -2.72216796875, -1.171875, 0.37841796875, 1.9287109375, 3.47900390625, 5.029296875, 6.57958984375, 8.1298828125, 9.68017578125, 11.23046875, 12.78076171875, 14.3310546875, 15.88134765625, 17.431640625, 18.98193359375, 20.5322265625, 22.08251953125, 23.6328125, 25.18310546875, 26.7333984375, 28.28369140625, 29.833984375, 31.38427734375, 32.9345703125, 34.48486328125, 36.03515625, 37.58544921875, 39.1357421875, 40.68603515625, 42.236328125, 43.78662109375, 45.3369140625, 46.88720703125, 48.4375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 14.0, 15.0, 12.0, 14.0, 36.0, 52.0, 49.0, 51.0, 60.0, 60.0, 74.0, 88.0, 72.0, 75.0, 51.0, 61.0, 38.0, 43.0, 26.0, 25.0, 25.0, 17.0, 13.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.30908203125, -46.0244140625, -44.73974609375, -43.455078125, -42.17041015625, -40.8857421875, -39.60107421875, -38.31640625, -37.03173828125, -35.7470703125, -34.46240234375, -33.177734375, -31.89306640625, -30.6083984375, -29.32373046875, -28.0390625, -26.75439453125, -25.4697265625, -24.18505859375, -22.900390625, -21.61572265625, -20.3310546875, -19.04638671875, -17.76171875, -16.47705078125, -15.1923828125, -13.90771484375, -12.623046875, -11.33837890625, -10.0537109375, -8.76904296875, -7.484375, -6.19970703125, -4.9150390625, -3.63037109375, -2.345703125, -1.06103515625, 0.2236328125, 1.50830078125, 2.79296875, 4.07763671875, 5.3623046875, 6.64697265625, 7.931640625, 9.21630859375, 10.5009765625, 11.78564453125, 13.0703125, 14.35498046875, 15.6396484375, 16.92431640625, 18.208984375, 19.49365234375, 20.7783203125, 22.06298828125, 23.34765625, 24.63232421875, 25.9169921875, 27.20166015625, 28.486328125, 29.77099609375, 31.0556640625, 32.34033203125, 33.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 9.0, 7.0, 8.0, 14.0, 26.0, 28.0, 44.0, 67.0, 131.0, 200.0, 404.0, 1008.0, 2713.0, 10626.0, 55241.0, 840549.0, 113169.0, 17600.0, 4131.0, 1343.0, 564.0, 253.0, 156.0, 106.0, 47.0, 25.0, 18.0, 16.0, 20.0, 6.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.88427734375, -21.2529296875, -20.62158203125, -19.990234375, -19.35888671875, -18.7275390625, -18.09619140625, -17.46484375, -16.83349609375, -16.2021484375, -15.57080078125, -14.939453125, -14.30810546875, -13.6767578125, -13.04541015625, -12.4140625, -11.78271484375, -11.1513671875, -10.52001953125, -9.888671875, -9.25732421875, -8.6259765625, -7.99462890625, -7.36328125, -6.73193359375, -6.1005859375, -5.46923828125, -4.837890625, -4.20654296875, -3.5751953125, -2.94384765625, -2.3125, -1.68115234375, -1.0498046875, -0.41845703125, 0.212890625, 0.84423828125, 1.4755859375, 2.10693359375, 2.73828125, 3.36962890625, 4.0009765625, 4.63232421875, 5.263671875, 5.89501953125, 6.5263671875, 7.15771484375, 7.7890625, 8.42041015625, 9.0517578125, 9.68310546875, 10.314453125, 10.94580078125, 11.5771484375, 12.20849609375, 12.83984375, 13.47119140625, 14.1025390625, 14.73388671875, 15.365234375, 15.99658203125, 16.6279296875, 17.25927734375, 17.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 7.0, 12.0, 18.0, 26.0, 38.0, 46.0, 137.0, 244.0, 183.0, 80.0, 43.0, 33.0, 20.0, 12.0, 16.0, 9.0, 9.0, 10.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004852294921875, -0.004694581031799316, -0.004536867141723633, -0.004379153251647949, -0.004221439361572266, -0.004063725471496582, -0.0039060115814208984, -0.003748297691345215, -0.0035905838012695312, -0.0034328699111938477, -0.003275156021118164, -0.0031174421310424805, -0.002959728240966797, -0.0028020143508911133, -0.0026443004608154297, -0.002486586570739746, -0.0023288726806640625, -0.002171158790588379, -0.0020134449005126953, -0.0018557310104370117, -0.0016980171203613281, -0.0015403032302856445, -0.001382589340209961, -0.0012248754501342773, -0.0010671615600585938, -0.0009094476699829102, -0.0007517337799072266, -0.000594019889831543, -0.0004363059997558594, -0.0002785921096801758, -0.00012087821960449219, 3.6835670471191406e-05, 0.000194549560546875, 0.0003522634506225586, 0.0005099773406982422, 0.0006676912307739258, 0.0008254051208496094, 0.000983119010925293, 0.0011408329010009766, 0.0012985467910766602, 0.0014562606811523438, 0.0016139745712280273, 0.001771688461303711, 0.0019294023513793945, 0.002087116241455078, 0.0022448301315307617, 0.0024025440216064453, 0.002560257911682129, 0.0027179718017578125, 0.002875685691833496, 0.0030333995819091797, 0.0031911134719848633, 0.003348827362060547, 0.0035065412521362305, 0.003664255142211914, 0.0038219690322875977, 0.003979682922363281, 0.004137396812438965, 0.0042951107025146484, 0.004452824592590332, 0.004610538482666016, 0.004768252372741699, 0.004925966262817383, 0.005083680152893066, 0.00524139404296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 8.0, 6.0, 4.0, 4.0, 11.0, 7.0, 14.0, 16.0, 32.0, 41.0, 63.0, 102.0, 147.0, 258.0, 440.0, 799.0, 1624.0, 4139.0, 12372.0, 44256.0, 653687.0, 280087.0, 33911.0, 10057.0, 3404.0, 1385.0, 681.0, 372.0, 194.0, 145.0, 98.0, 62.0, 37.0, 25.0, 15.0, 22.0, 7.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1043701171875, -11.575927734375, -11.0474853515625, -10.51904296875, -9.9906005859375, -9.462158203125, -8.9337158203125, -8.4052734375, -7.8768310546875, -7.348388671875, -6.8199462890625, -6.29150390625, -5.7630615234375, -5.234619140625, -4.7061767578125, -4.177734375, -3.6492919921875, -3.120849609375, -2.5924072265625, -2.06396484375, -1.5355224609375, -1.007080078125, -0.4786376953125, 0.0498046875, 0.5782470703125, 1.106689453125, 1.6351318359375, 2.16357421875, 2.6920166015625, 3.220458984375, 3.7489013671875, 4.27734375, 4.8057861328125, 5.334228515625, 5.8626708984375, 6.39111328125, 6.9195556640625, 7.447998046875, 7.9764404296875, 8.5048828125, 9.0333251953125, 9.561767578125, 10.0902099609375, 10.61865234375, 11.1470947265625, 11.675537109375, 12.2039794921875, 12.732421875, 13.2608642578125, 13.789306640625, 14.3177490234375, 14.84619140625, 15.3746337890625, 15.903076171875, 16.4315185546875, 16.9599609375, 17.4884033203125, 18.016845703125, 18.5452880859375, 19.07373046875, 19.6021728515625, 20.130615234375, 20.6590576171875, 21.1875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 10.0, 5.0, 8.0, 12.0, 11.0, 10.0, 17.0, 18.0, 18.0, 28.0, 38.0, 60.0, 81.0, 117.0, 142.0, 124.0, 82.0, 51.0, 42.0, 29.0, 16.0, 17.0, 11.0, 3.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.4375, -14.0418701171875, -13.646240234375, -13.2506103515625, -12.85498046875, -12.4593505859375, -12.063720703125, -11.6680908203125, -11.2724609375, -10.8768310546875, -10.481201171875, -10.0855712890625, -9.68994140625, -9.2943115234375, -8.898681640625, -8.5030517578125, -8.107421875, -7.7117919921875, -7.316162109375, -6.9205322265625, -6.52490234375, -6.1292724609375, -5.733642578125, -5.3380126953125, -4.9423828125, -4.5467529296875, -4.151123046875, -3.7554931640625, -3.35986328125, -2.9642333984375, -2.568603515625, -2.1729736328125, -1.77734375, -1.3817138671875, -0.986083984375, -0.5904541015625, -0.19482421875, 0.2008056640625, 0.596435546875, 0.9920654296875, 1.3876953125, 1.7833251953125, 2.178955078125, 2.5745849609375, 2.97021484375, 3.3658447265625, 3.761474609375, 4.1571044921875, 4.552734375, 4.9483642578125, 5.343994140625, 5.7396240234375, 6.13525390625, 6.5308837890625, 6.926513671875, 7.3221435546875, 7.7177734375, 8.1134033203125, 8.509033203125, 8.9046630859375, 9.30029296875, 9.6959228515625, 10.091552734375, 10.4871826171875, 10.8828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 21.0, 56.0, 188.0, 428.0, 191.0, 56.0, 17.0, 11.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-454.3094482421875, -441.15740966796875, -428.00537109375, -414.85333251953125, -401.7012939453125, -388.54925537109375, -375.397216796875, -362.24517822265625, -349.0931396484375, -335.94110107421875, -322.7890625, -309.63702392578125, -296.4849853515625, -283.33294677734375, -270.180908203125, -257.02886962890625, -243.87680053710938, -230.72476196289062, -217.57272338867188, -204.42068481445312, -191.26864624023438, -178.11660766601562, -164.9645538330078, -151.81251525878906, -138.6604766845703, -125.50843811035156, -112.35639953613281, -99.20435333251953, -86.05231475830078, -72.90027618408203, -59.74822998046875, -46.59619140625, -33.44415283203125, -20.292112350463867, -7.140071868896484, 6.011970520019531, 19.16400909423828, 32.31604766845703, 45.46809387207031, 58.62013244628906, 71.77217102050781, 84.92420959472656, 98.07624816894531, 111.2282943725586, 124.38033294677734, 137.53237915039062, 150.68441772460938, 163.83645629882812, 176.98849487304688, 190.14053344726562, 203.29257202148438, 216.44461059570312, 229.59664916992188, 242.74868774414062, 255.90074157714844, 269.05279541015625, 282.204833984375, 295.35687255859375, 308.5089111328125, 321.66094970703125, 334.81298828125, 347.96502685546875, 361.1170654296875, 374.26910400390625, 387.421142578125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 3.0, 10.0, 9.0, 16.0, 18.0, 15.0, 22.0, 27.0, 35.0, 24.0, 42.0, 43.0, 53.0, 63.0, 87.0, 73.0, 70.0, 62.0, 42.0, 45.0, 37.0, 33.0, 30.0, 18.0, 29.0, 15.0, 11.0, 11.0, 19.0, 10.0, 3.0, 5.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.85374450683594, -149.58627319335938, -145.31878662109375, -141.0513153076172, -136.78384399414062, -132.51637268066406, -128.2489013671875, -123.98141479492188, -119.71394348144531, -115.44647216796875, -111.17899322509766, -106.91151428222656, -102.64404296875, -98.37657165527344, -94.10909271240234, -89.84161376953125, -85.57414245605469, -81.30667114257812, -77.03919219970703, -72.77171325683594, -68.50424194335938, -64.23677062988281, -59.96929168701172, -55.70181655883789, -51.43434143066406, -47.166866302490234, -42.899391174316406, -38.63191604614258, -34.36444091796875, -30.096965789794922, -25.829490661621094, -21.562015533447266, -17.29454803466797, -13.02707290649414, -8.759597778320312, -4.492122650146484, -0.22464752197265625, 4.042827606201172, 8.310302734375, 12.577777862548828, 16.845252990722656, 21.112728118896484, 25.380203247070312, 29.64767837524414, 33.91515350341797, 38.1826286315918, 42.450103759765625, 46.71757888793945, 50.98505401611328, 55.25252914428711, 59.52000427246094, 63.787479400634766, 68.0549545288086, 72.32243347167969, 76.58990478515625, 80.85737609863281, 85.1248550415039, 89.392333984375, 93.65980529785156, 97.92727661132812, 102.19475555419922, 106.46223449707031, 110.72970581054688, 114.99717712402344, 119.26465606689453]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 11.0, 15.0, 13.0, 28.0, 32.0, 60.0, 78.0, 123.0, 212.0, 384.0, 830.0, 1973.0, 6722.0, 49776.0, 3128045.0, 974278.0, 24343.0, 4528.0, 1528.0, 596.0, 293.0, 161.0, 70.0, 59.0, 30.0, 20.0, 17.0, 13.0, 8.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.74462890625, -19.9423828125, -19.14013671875, -18.337890625, -17.53564453125, -16.7333984375, -15.93115234375, -15.12890625, -14.32666015625, -13.5244140625, -12.72216796875, -11.919921875, -11.11767578125, -10.3154296875, -9.51318359375, -8.7109375, -7.90869140625, -7.1064453125, -6.30419921875, -5.501953125, -4.69970703125, -3.8974609375, -3.09521484375, -2.29296875, -1.49072265625, -0.6884765625, 0.11376953125, 0.916015625, 1.71826171875, 2.5205078125, 3.32275390625, 4.125, 4.92724609375, 5.7294921875, 6.53173828125, 7.333984375, 8.13623046875, 8.9384765625, 9.74072265625, 10.54296875, 11.34521484375, 12.1474609375, 12.94970703125, 13.751953125, 14.55419921875, 15.3564453125, 16.15869140625, 16.9609375, 17.76318359375, 18.5654296875, 19.36767578125, 20.169921875, 20.97216796875, 21.7744140625, 22.57666015625, 23.37890625, 24.18115234375, 24.9833984375, 25.78564453125, 26.587890625, 27.39013671875, 28.1923828125, 28.99462890625, 29.796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 8.0, 13.0, 17.0, 19.0, 39.0, 46.0, 59.0, 73.0, 67.0, 89.0, 84.0, 87.0, 88.0, 70.0, 58.0, 46.0, 45.0, 34.0, 15.0, 10.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.36181640625, -10.0126953125, -9.66357421875, -9.314453125, -8.96533203125, -8.6162109375, -8.26708984375, -7.91796875, -7.56884765625, -7.2197265625, -6.87060546875, -6.521484375, -6.17236328125, -5.8232421875, -5.47412109375, -5.125, -4.77587890625, -4.4267578125, -4.07763671875, -3.728515625, -3.37939453125, -3.0302734375, -2.68115234375, -2.33203125, -1.98291015625, -1.6337890625, -1.28466796875, -0.935546875, -0.58642578125, -0.2373046875, 0.11181640625, 0.4609375, 0.81005859375, 1.1591796875, 1.50830078125, 1.857421875, 2.20654296875, 2.5556640625, 2.90478515625, 3.25390625, 3.60302734375, 3.9521484375, 4.30126953125, 4.650390625, 4.99951171875, 5.3486328125, 5.69775390625, 6.046875, 6.39599609375, 6.7451171875, 7.09423828125, 7.443359375, 7.79248046875, 8.1416015625, 8.49072265625, 8.83984375, 9.18896484375, 9.5380859375, 9.88720703125, 10.236328125, 10.58544921875, 10.9345703125, 11.28369140625, 11.6328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 11.0, 15.0, 32.0, 55.0, 95.0, 147.0, 300.0, 1337.0, 4086133.0, 105079.0, 728.0, 178.0, 78.0, 40.0, 23.0, 14.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.625, -210.75390625, -204.8828125, -199.01171875, -193.140625, -187.26953125, -181.3984375, -175.52734375, -169.65625, -163.78515625, -157.9140625, -152.04296875, -146.171875, -140.30078125, -134.4296875, -128.55859375, -122.6875, -116.81640625, -110.9453125, -105.07421875, -99.203125, -93.33203125, -87.4609375, -81.58984375, -75.71875, -69.84765625, -63.9765625, -58.10546875, -52.234375, -46.36328125, -40.4921875, -34.62109375, -28.75, -22.87890625, -17.0078125, -11.13671875, -5.265625, 0.60546875, 6.4765625, 12.34765625, 18.21875, 24.08984375, 29.9609375, 35.83203125, 41.703125, 47.57421875, 53.4453125, 59.31640625, 65.1875, 71.05859375, 76.9296875, 82.80078125, 88.671875, 94.54296875, 100.4140625, 106.28515625, 112.15625, 118.02734375, 123.8984375, 129.76953125, 135.640625, 141.51171875, 147.3828125, 153.25390625, 159.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 29.0, 133.0, 1262.0, 2331.0, 254.0, 50.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.75, -129.224853515625, -126.69970703125, -124.174560546875, -121.6494140625, -119.124267578125, -116.59912109375, -114.073974609375, -111.548828125, -109.023681640625, -106.49853515625, -103.973388671875, -101.4482421875, -98.923095703125, -96.39794921875, -93.872802734375, -91.34765625, -88.822509765625, -86.29736328125, -83.772216796875, -81.2470703125, -78.721923828125, -76.19677734375, -73.671630859375, -71.146484375, -68.621337890625, -66.09619140625, -63.571044921875, -61.0458984375, -58.520751953125, -55.99560546875, -53.470458984375, -50.9453125, -48.420166015625, -45.89501953125, -43.369873046875, -40.8447265625, -38.319580078125, -35.79443359375, -33.269287109375, -30.744140625, -28.218994140625, -25.69384765625, -23.168701171875, -20.6435546875, -18.118408203125, -15.59326171875, -13.068115234375, -10.54296875, -8.017822265625, -5.49267578125, -2.967529296875, -0.4423828125, 2.082763671875, 4.60791015625, 7.133056640625, 9.658203125, 12.183349609375, 14.70849609375, 17.233642578125, 19.7587890625, 22.283935546875, 24.80908203125, 27.334228515625, 29.859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 30.0, 90.0, 292.0, 401.0, 114.0, 35.0, 7.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.7481079101562, -574.734130859375, -555.7200927734375, -536.7061157226562, -517.692138671875, -498.6781311035156, -479.66412353515625, -460.650146484375, -441.63616943359375, -422.6221618652344, -403.6081848144531, -384.59417724609375, -365.5802001953125, -346.5661926269531, -327.55218505859375, -308.5382080078125, -289.5242004394531, -270.51019287109375, -251.4962158203125, -232.48220825195312, -213.46823120117188, -194.4542236328125, -175.4402313232422, -156.42623901367188, -137.41224670410156, -118.39825439453125, -99.38426208496094, -80.3702621459961, -61.35626983642578, -42.34227752685547, -23.328277587890625, -4.3142852783203125, 14.69970703125, 33.71369934082031, 52.72769546508789, 71.74169158935547, 90.75568389892578, 109.7696762084961, 128.78367614746094, 147.79766845703125, 166.81166076660156, 185.82565307617188, 204.8396453857422, 223.8536376953125, 242.86764526367188, 261.8816223144531, 280.8956298828125, 299.90960693359375, 318.9236145019531, 337.9376220703125, 356.95159912109375, 375.9656066894531, 394.9795837402344, 413.99359130859375, 433.007568359375, 452.0215759277344, 471.03558349609375, 490.0495910644531, 509.0635681152344, 528.0775756835938, 547.091552734375, 566.1055297851562, 585.1195678710938, 604.133544921875, 623.1475219726562]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 11.0, 19.0, 22.0, 35.0, 38.0, 40.0, 37.0, 70.0, 62.0, 52.0, 77.0, 57.0, 87.0, 59.0, 58.0, 53.0, 42.0, 39.0, 31.0, 17.0, 24.0, 18.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-215.36094665527344, -210.1773681640625, -204.9937744140625, -199.81019592285156, -194.62661743164062, -189.4430389404297, -184.25946044921875, -179.07586669921875, -173.8922882080078, -168.70870971679688, -163.52511596679688, -158.34153747558594, -153.157958984375, -147.97438049316406, -142.79080200195312, -137.60720825195312, -132.4236297607422, -127.24005126953125, -122.05646514892578, -116.87287902832031, -111.68930053710938, -106.50572204589844, -101.32213592529297, -96.1385498046875, -90.95497131347656, -85.77139282226562, -80.58780670166016, -75.40422058105469, -70.22064208984375, -65.03706359863281, -59.853477478027344, -54.66989517211914, -49.48631286621094, -44.302730560302734, -39.11914825439453, -33.93556594848633, -28.751983642578125, -23.568401336669922, -18.38481903076172, -13.201236724853516, -8.017654418945312, -2.8340721130371094, 2.3495101928710938, 7.533092498779297, 12.7166748046875, 17.900257110595703, 23.083839416503906, 28.26742172241211, 33.45100402832031, 38.634586334228516, 43.81816864013672, 49.00175094604492, 54.185333251953125, 59.36891555786133, 64.55249786376953, 69.736083984375, 74.91966247558594, 80.10324096679688, 85.28682708740234, 90.47041320800781, 95.65399169921875, 100.83757019042969, 106.02115631103516, 111.20474243164062, 116.38832092285156]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 8.0, 12.0, 18.0, 31.0, 37.0, 39.0, 84.0, 145.0, 232.0, 499.0, 1265.0, 3824.0, 16142.0, 103006.0, 671583.0, 215536.0, 27231.0, 5767.0, 1716.0, 663.0, 297.0, 159.0, 75.0, 44.0, 28.0, 24.0, 17.0, 19.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.75, -21.927490234375, -21.10498046875, -20.282470703125, -19.4599609375, -18.637451171875, -17.81494140625, -16.992431640625, -16.169921875, -15.347412109375, -14.52490234375, -13.702392578125, -12.8798828125, -12.057373046875, -11.23486328125, -10.412353515625, -9.58984375, -8.767333984375, -7.94482421875, -7.122314453125, -6.2998046875, -5.477294921875, -4.65478515625, -3.832275390625, -3.009765625, -2.187255859375, -1.36474609375, -0.542236328125, 0.2802734375, 1.102783203125, 1.92529296875, 2.747802734375, 3.5703125, 4.392822265625, 5.21533203125, 6.037841796875, 6.8603515625, 7.682861328125, 8.50537109375, 9.327880859375, 10.150390625, 10.972900390625, 11.79541015625, 12.617919921875, 13.4404296875, 14.262939453125, 15.08544921875, 15.907958984375, 16.73046875, 17.552978515625, 18.37548828125, 19.197998046875, 20.0205078125, 20.843017578125, 21.66552734375, 22.488037109375, 23.310546875, 24.133056640625, 24.95556640625, 25.778076171875, 26.6005859375, 27.423095703125, 28.24560546875, 29.068115234375, 29.890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 3.0, 9.0, 13.0, 8.0, 20.0, 18.0, 27.0, 27.0, 27.0, 45.0, 49.0, 60.0, 65.0, 65.0, 63.0, 65.0, 48.0, 51.0, 58.0, 50.0, 45.0, 31.0, 22.0, 22.0, 25.0, 18.0, 14.0, 17.0, 10.0, 7.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.3458251953125, -11.011962890625, -10.6781005859375, -10.34423828125, -10.0103759765625, -9.676513671875, -9.3426513671875, -9.0087890625, -8.6749267578125, -8.341064453125, -8.0072021484375, -7.67333984375, -7.3394775390625, -7.005615234375, -6.6717529296875, -6.337890625, -6.0040283203125, -5.670166015625, -5.3363037109375, -5.00244140625, -4.6685791015625, -4.334716796875, -4.0008544921875, -3.6669921875, -3.3331298828125, -2.999267578125, -2.6654052734375, -2.33154296875, -1.9976806640625, -1.663818359375, -1.3299560546875, -0.99609375, -0.6622314453125, -0.328369140625, 0.0054931640625, 0.33935546875, 0.6732177734375, 1.007080078125, 1.3409423828125, 1.6748046875, 2.0086669921875, 2.342529296875, 2.6763916015625, 3.01025390625, 3.3441162109375, 3.677978515625, 4.0118408203125, 4.345703125, 4.6795654296875, 5.013427734375, 5.3472900390625, 5.68115234375, 6.0150146484375, 6.348876953125, 6.6827392578125, 7.0166015625, 7.3504638671875, 7.684326171875, 8.0181884765625, 8.35205078125, 8.6859130859375, 9.019775390625, 9.3536376953125, 9.6875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 1.0, 9.0, 8.0, 14.0, 31.0, 50.0, 82.0, 175.0, 504.0, 1740.0, 9554.0, 100718.0, 854254.0, 71659.0, 7471.0, 1472.0, 435.0, 173.0, 92.0, 35.0, 19.0, 20.0, 11.0, 8.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.8173828125, -44.447265625, -43.0771484375, -41.70703125, -40.3369140625, -38.966796875, -37.5966796875, -36.2265625, -34.8564453125, -33.486328125, -32.1162109375, -30.74609375, -29.3759765625, -28.005859375, -26.6357421875, -25.265625, -23.8955078125, -22.525390625, -21.1552734375, -19.78515625, -18.4150390625, -17.044921875, -15.6748046875, -14.3046875, -12.9345703125, -11.564453125, -10.1943359375, -8.82421875, -7.4541015625, -6.083984375, -4.7138671875, -3.34375, -1.9736328125, -0.603515625, 0.7666015625, 2.13671875, 3.5068359375, 4.876953125, 6.2470703125, 7.6171875, 8.9873046875, 10.357421875, 11.7275390625, 13.09765625, 14.4677734375, 15.837890625, 17.2080078125, 18.578125, 19.9482421875, 21.318359375, 22.6884765625, 24.05859375, 25.4287109375, 26.798828125, 28.1689453125, 29.5390625, 30.9091796875, 32.279296875, 33.6494140625, 35.01953125, 36.3896484375, 37.759765625, 39.1298828125, 40.5]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 4.0, 6.0, 10.0, 13.0, 12.0, 20.0, 20.0, 33.0, 33.0, 44.0, 54.0, 52.0, 52.0, 58.0, 60.0, 59.0, 68.0, 58.0, 54.0, 47.0, 36.0, 38.0, 32.0, 29.0, 17.0, 19.0, 15.0, 8.0, 3.0, 10.0, 3.0, 7.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.09375, -47.64697265625, -46.2001953125, -44.75341796875, -43.306640625, -41.85986328125, -40.4130859375, -38.96630859375, -37.51953125, -36.07275390625, -34.6259765625, -33.17919921875, -31.732421875, -30.28564453125, -28.8388671875, -27.39208984375, -25.9453125, -24.49853515625, -23.0517578125, -21.60498046875, -20.158203125, -18.71142578125, -17.2646484375, -15.81787109375, -14.37109375, -12.92431640625, -11.4775390625, -10.03076171875, -8.583984375, -7.13720703125, -5.6904296875, -4.24365234375, -2.796875, -1.35009765625, 0.0966796875, 1.54345703125, 2.990234375, 4.43701171875, 5.8837890625, 7.33056640625, 8.77734375, 10.22412109375, 11.6708984375, 13.11767578125, 14.564453125, 16.01123046875, 17.4580078125, 18.90478515625, 20.3515625, 21.79833984375, 23.2451171875, 24.69189453125, 26.138671875, 27.58544921875, 29.0322265625, 30.47900390625, 31.92578125, 33.37255859375, 34.8193359375, 36.26611328125, 37.712890625, 39.15966796875, 40.6064453125, 42.05322265625, 43.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 12.0, 14.0, 27.0, 20.0, 54.0, 100.0, 195.0, 469.0, 1324.0, 4853.0, 20867.0, 167931.0, 770089.0, 66960.0, 11164.0, 2879.0, 901.0, 366.0, 134.0, 58.0, 34.0, 22.0, 12.0, 13.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.7578125, -11.4248046875, -11.091796875, -10.7587890625, -10.42578125, -10.0927734375, -9.759765625, -9.4267578125, -9.09375, -8.7607421875, -8.427734375, -8.0947265625, -7.76171875, -7.4287109375, -7.095703125, -6.7626953125, -6.4296875, -6.0966796875, -5.763671875, -5.4306640625, -5.09765625, -4.7646484375, -4.431640625, -4.0986328125, -3.765625, -3.4326171875, -3.099609375, -2.7666015625, -2.43359375, -2.1005859375, -1.767578125, -1.4345703125, -1.1015625, -0.7685546875, -0.435546875, -0.1025390625, 0.23046875, 0.5634765625, 0.896484375, 1.2294921875, 1.5625, 1.8955078125, 2.228515625, 2.5615234375, 2.89453125, 3.2275390625, 3.560546875, 3.8935546875, 4.2265625, 4.5595703125, 4.892578125, 5.2255859375, 5.55859375, 5.8916015625, 6.224609375, 6.5576171875, 6.890625, 7.2236328125, 7.556640625, 7.8896484375, 8.22265625, 8.5556640625, 8.888671875, 9.2216796875, 9.5546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 7.0, 13.0, 15.0, 21.0, 21.0, 58.0, 82.0, 96.0, 137.0, 127.0, 117.0, 89.0, 54.0, 29.0, 26.0, 14.0, 15.0, 13.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00228118896484375, -0.0022122561931610107, -0.0021433234214782715, -0.0020743906497955322, -0.002005457878112793, -0.0019365251064300537, -0.0018675923347473145, -0.0017986595630645752, -0.001729726791381836, -0.0016607940196990967, -0.0015918612480163574, -0.0015229284763336182, -0.001453995704650879, -0.0013850629329681396, -0.0013161301612854004, -0.0012471973896026611, -0.0011782646179199219, -0.0011093318462371826, -0.0010403990745544434, -0.0009714663028717041, -0.0009025335311889648, -0.0008336007595062256, -0.0007646679878234863, -0.0006957352161407471, -0.0006268024444580078, -0.0005578696727752686, -0.0004889369010925293, -0.00042000412940979004, -0.0003510713577270508, -0.0002821385860443115, -0.00021320581436157227, -0.000144273042678833, -7.534027099609375e-05, -6.407499313354492e-06, 6.252527236938477e-05, 0.00013145804405212402, 0.00020039081573486328, 0.00026932358741760254, 0.0003382563591003418, 0.00040718913078308105, 0.0004761219024658203, 0.0005450546741485596, 0.0006139874458312988, 0.0006829202175140381, 0.0007518529891967773, 0.0008207857608795166, 0.0008897185325622559, 0.0009586513042449951, 0.0010275840759277344, 0.0010965168476104736, 0.0011654496192932129, 0.0012343823909759521, 0.0013033151626586914, 0.0013722479343414307, 0.00144118070602417, 0.0015101134777069092, 0.0015790462493896484, 0.0016479790210723877, 0.001716911792755127, 0.0017858445644378662, 0.0018547773361206055, 0.0019237101078033447, 0.001992642879486084, 0.0020615756511688232, 0.0021305084228515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 9.0, 3.0, 7.0, 11.0, 13.0, 20.0, 42.0, 81.0, 165.0, 336.0, 815.0, 2202.0, 6805.0, 29013.0, 247367.0, 689884.0, 55578.0, 10970.0, 3241.0, 1109.0, 465.0, 185.0, 83.0, 51.0, 35.0, 19.0, 14.0, 8.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5, -12.1446533203125, -11.789306640625, -11.4339599609375, -11.07861328125, -10.7232666015625, -10.367919921875, -10.0125732421875, -9.6572265625, -9.3018798828125, -8.946533203125, -8.5911865234375, -8.23583984375, -7.8804931640625, -7.525146484375, -7.1697998046875, -6.814453125, -6.4591064453125, -6.103759765625, -5.7484130859375, -5.39306640625, -5.0377197265625, -4.682373046875, -4.3270263671875, -3.9716796875, -3.6163330078125, -3.260986328125, -2.9056396484375, -2.55029296875, -2.1949462890625, -1.839599609375, -1.4842529296875, -1.12890625, -0.7735595703125, -0.418212890625, -0.0628662109375, 0.29248046875, 0.6478271484375, 1.003173828125, 1.3585205078125, 1.7138671875, 2.0692138671875, 2.424560546875, 2.7799072265625, 3.13525390625, 3.4906005859375, 3.845947265625, 4.2012939453125, 4.556640625, 4.9119873046875, 5.267333984375, 5.6226806640625, 5.97802734375, 6.3333740234375, 6.688720703125, 7.0440673828125, 7.3994140625, 7.7547607421875, 8.110107421875, 8.4654541015625, 8.82080078125, 9.1761474609375, 9.531494140625, 9.8868408203125, 10.2421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 8.0, 3.0, 8.0, 3.0, 6.0, 6.0, 22.0, 27.0, 23.0, 28.0, 42.0, 49.0, 68.0, 97.0, 97.0, 118.0, 85.0, 78.0, 57.0, 48.0, 31.0, 20.0, 17.0, 10.0, 6.0, 12.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 9.0, 10.0, 16.0, 23.0, 48.0, 84.0, 159.0, 301.0, 157.0, 86.0, 45.0, 21.0, 13.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.7222900390625, -292.5058898925781, -285.28948974609375, -278.0730895996094, -270.856689453125, -263.6402893066406, -256.42388916015625, -249.20750427246094, -241.99110412597656, -234.7747039794922, -227.5583038330078, -220.34190368652344, -213.12551879882812, -205.90911865234375, -198.69271850585938, -191.476318359375, -184.25991821289062, -177.04351806640625, -169.82711791992188, -162.6107177734375, -155.39431762695312, -148.17791748046875, -140.96153259277344, -133.74513244628906, -126.52873229980469, -119.31233215332031, -112.09593200683594, -104.8795394897461, -97.66313934326172, -90.44673919677734, -83.2303466796875, -76.01394653320312, -68.79754638671875, -61.581146240234375, -54.364749908447266, -47.148353576660156, -39.93195343017578, -32.715553283691406, -25.499156951904297, -18.282760620117188, -11.066360473632812, -3.8499622344970703, 3.366436004638672, 10.582834243774414, 17.799232482910156, 25.01563262939453, 32.23202896118164, 39.44842529296875, 46.664825439453125, 53.8812255859375, 61.09762191772461, 68.31401824951172, 75.5304183959961, 82.74681854248047, 89.96321105957031, 97.17961120605469, 104.39601135253906, 111.61241149902344, 118.82881164550781, 126.04520416259766, 133.2615966796875, 140.47799682617188, 147.69439697265625, 154.91079711914062, 162.127197265625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 5.0, 1.0, 7.0, 7.0, 15.0, 8.0, 11.0, 13.0, 19.0, 18.0, 22.0, 23.0, 26.0, 24.0, 33.0, 43.0, 48.0, 80.0, 95.0, 91.0, 54.0, 41.0, 33.0, 37.0, 34.0, 25.0, 22.0, 34.0, 18.0, 18.0, 9.0, 13.0, 15.0, 13.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.39007568359375, -166.42596435546875, -160.46185302734375, -154.4977569580078, -148.5336456298828, -142.5695343017578, -136.60543823242188, -130.64132690429688, -124.67721557617188, -118.71310424804688, -112.7490005493164, -106.78489685058594, -100.82078552246094, -94.85667419433594, -88.89257049560547, -82.928466796875, -76.96435546875, -71.000244140625, -65.03614044189453, -59.0720329284668, -53.10792541503906, -47.14381790161133, -41.179710388183594, -35.21560287475586, -29.251495361328125, -23.28738784790039, -17.323280334472656, -11.359172821044922, -5.3950653076171875, 0.5690422058105469, 6.533149719238281, 12.497257232666016, 18.46136474609375, 24.425472259521484, 30.38957977294922, 36.35368728637695, 42.31779479980469, 48.28190231323242, 54.246009826660156, 60.21011734008789, 66.17422485351562, 72.13833618164062, 78.1024398803711, 84.06654357910156, 90.03065490722656, 95.99476623535156, 101.95886993408203, 107.9229736328125, 113.8870849609375, 119.8511962890625, 125.81529998779297, 131.77940368652344, 137.74351501464844, 143.70762634277344, 149.67172241210938, 155.63583374023438, 161.59994506835938, 167.56405639648438, 173.52816772460938, 179.4922637939453, 185.4563751220703, 191.4204864501953, 197.38458251953125, 203.34869384765625, 209.31280517578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 10.0, 15.0, 14.0, 23.0, 36.0, 48.0, 72.0, 113.0, 160.0, 241.0, 465.0, 800.0, 1650.0, 3840.0, 12809.0, 94839.0, 2188692.0, 1795372.0, 77642.0, 10957.0, 3382.0, 1416.0, 751.0, 361.0, 181.0, 135.0, 95.0, 56.0, 31.0, 25.0, 14.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.484375, -21.9610595703125, -21.437744140625, -20.9144287109375, -20.39111328125, -19.8677978515625, -19.344482421875, -18.8211669921875, -18.2978515625, -17.7745361328125, -17.251220703125, -16.7279052734375, -16.20458984375, -15.6812744140625, -15.157958984375, -14.6346435546875, -14.111328125, -13.5880126953125, -13.064697265625, -12.5413818359375, -12.01806640625, -11.4947509765625, -10.971435546875, -10.4481201171875, -9.9248046875, -9.4014892578125, -8.878173828125, -8.3548583984375, -7.83154296875, -7.3082275390625, -6.784912109375, -6.2615966796875, -5.73828125, -5.2149658203125, -4.691650390625, -4.1683349609375, -3.64501953125, -3.1217041015625, -2.598388671875, -2.0750732421875, -1.5517578125, -1.0284423828125, -0.505126953125, 0.0181884765625, 0.54150390625, 1.0648193359375, 1.588134765625, 2.1114501953125, 2.634765625, 3.1580810546875, 3.681396484375, 4.2047119140625, 4.72802734375, 5.2513427734375, 5.774658203125, 6.2979736328125, 6.8212890625, 7.3446044921875, 7.867919921875, 8.3912353515625, 8.91455078125, 9.4378662109375, 9.961181640625, 10.4844970703125, 11.0078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 12.0, 18.0, 30.0, 14.0, 26.0, 28.0, 29.0, 40.0, 41.0, 63.0, 58.0, 56.0, 54.0, 69.0, 63.0, 48.0, 45.0, 48.0, 42.0, 41.0, 26.0, 27.0, 17.0, 22.0, 11.0, 10.0, 10.0, 8.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -6.91192626953125, -6.6246337890625, -6.33734130859375, -6.050048828125, -5.76275634765625, -5.4754638671875, -5.18817138671875, -4.90087890625, -4.61358642578125, -4.3262939453125, -4.03900146484375, -3.751708984375, -3.46441650390625, -3.1771240234375, -2.88983154296875, -2.6025390625, -2.31524658203125, -2.0279541015625, -1.74066162109375, -1.453369140625, -1.16607666015625, -0.8787841796875, -0.59149169921875, -0.30419921875, -0.01690673828125, 0.2703857421875, 0.55767822265625, 0.844970703125, 1.13226318359375, 1.4195556640625, 1.70684814453125, 1.994140625, 2.28143310546875, 2.5687255859375, 2.85601806640625, 3.143310546875, 3.43060302734375, 3.7178955078125, 4.00518798828125, 4.29248046875, 4.57977294921875, 4.8670654296875, 5.15435791015625, 5.441650390625, 5.72894287109375, 6.0162353515625, 6.30352783203125, 6.5908203125, 6.87811279296875, 7.1654052734375, 7.45269775390625, 7.739990234375, 8.02728271484375, 8.3145751953125, 8.60186767578125, 8.88916015625, 9.17645263671875, 9.4637451171875, 9.75103759765625, 10.038330078125, 10.32562255859375, 10.6129150390625, 10.90020751953125, 11.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 19.0, 29.0, 74.0, 143.0, 388.0, 1333.0, 12638.0, 4115811.0, 60902.0, 2096.0, 492.0, 189.0, 82.0, 35.0, 20.0, 14.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.125, -73.0185546875, -70.912109375, -68.8056640625, -66.69921875, -64.5927734375, -62.486328125, -60.3798828125, -58.2734375, -56.1669921875, -54.060546875, -51.9541015625, -49.84765625, -47.7412109375, -45.634765625, -43.5283203125, -41.421875, -39.3154296875, -37.208984375, -35.1025390625, -32.99609375, -30.8896484375, -28.783203125, -26.6767578125, -24.5703125, -22.4638671875, -20.357421875, -18.2509765625, -16.14453125, -14.0380859375, -11.931640625, -9.8251953125, -7.71875, -5.6123046875, -3.505859375, -1.3994140625, 0.70703125, 2.8134765625, 4.919921875, 7.0263671875, 9.1328125, 11.2392578125, 13.345703125, 15.4521484375, 17.55859375, 19.6650390625, 21.771484375, 23.8779296875, 25.984375, 28.0908203125, 30.197265625, 32.3037109375, 34.41015625, 36.5166015625, 38.623046875, 40.7294921875, 42.8359375, 44.9423828125, 47.048828125, 49.1552734375, 51.26171875, 53.3681640625, 55.474609375, 57.5810546875, 59.6875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 14.0, 8.0, 26.0, 22.0, 64.0, 132.0, 289.0, 702.0, 1184.0, 897.0, 390.0, 172.0, 69.0, 29.0, 30.0, 14.0, 9.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.5625, -35.7255859375, -34.888671875, -34.0517578125, -33.21484375, -32.3779296875, -31.541015625, -30.7041015625, -29.8671875, -29.0302734375, -28.193359375, -27.3564453125, -26.51953125, -25.6826171875, -24.845703125, -24.0087890625, -23.171875, -22.3349609375, -21.498046875, -20.6611328125, -19.82421875, -18.9873046875, -18.150390625, -17.3134765625, -16.4765625, -15.6396484375, -14.802734375, -13.9658203125, -13.12890625, -12.2919921875, -11.455078125, -10.6181640625, -9.78125, -8.9443359375, -8.107421875, -7.2705078125, -6.43359375, -5.5966796875, -4.759765625, -3.9228515625, -3.0859375, -2.2490234375, -1.412109375, -0.5751953125, 0.26171875, 1.0986328125, 1.935546875, 2.7724609375, 3.609375, 4.4462890625, 5.283203125, 6.1201171875, 6.95703125, 7.7939453125, 8.630859375, 9.4677734375, 10.3046875, 11.1416015625, 11.978515625, 12.8154296875, 13.65234375, 14.4892578125, 15.326171875, 16.1630859375, 17.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 18.0, 37.0, 95.0, 238.0, 283.0, 182.0, 95.0, 31.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.3249816894531, -413.2271423339844, -404.1292724609375, -395.03143310546875, -385.93359375, -376.83575439453125, -367.7379150390625, -358.6400451660156, -349.5422058105469, -340.4443664550781, -331.34649658203125, -322.2486572265625, -313.15081787109375, -304.052978515625, -294.95513916015625, -285.8572692871094, -276.7594299316406, -267.6615905761719, -258.563720703125, -249.46588134765625, -240.3680419921875, -231.27020263671875, -222.17234802246094, -213.07449340820312, -203.97665405273438, -194.87881469726562, -185.7809600830078, -176.68310546875, -167.58526611328125, -158.4874267578125, -149.3895721435547, -140.29171752929688, -131.19386291503906, -122.09601593017578, -112.9981689453125, -103.90032196044922, -94.80247497558594, -85.70462799072266, -76.60678100585938, -67.5089340209961, -58.41108703613281, -49.31324005126953, -40.21539306640625, -31.11754608154297, -22.019699096679688, -12.921852111816406, -3.824005126953125, 5.273841857910156, 14.371688842773438, 23.46953582763672, 32.5673828125, 41.66522979736328, 50.76307678222656, 59.860923767089844, 68.95877075195312, 78.0566177368164, 87.15446472167969, 96.25231170654297, 105.35015869140625, 114.44800567626953, 123.54585266113281, 132.64370727539062, 141.74154663085938, 150.83938598632812, 159.93724060058594]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 13.0, 23.0, 25.0, 26.0, 30.0, 36.0, 49.0, 62.0, 61.0, 63.0, 61.0, 59.0, 66.0, 71.0, 67.0, 55.0, 59.0, 45.0, 33.0, 28.0, 16.0, 14.0, 8.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.92166137695312, -100.23426818847656, -96.54688262939453, -92.85948944091797, -89.17210388183594, -85.48471069335938, -81.79731750488281, -78.10993194580078, -74.42253875732422, -70.73514556884766, -67.04776000976562, -63.36036682128906, -59.672977447509766, -55.98558807373047, -52.29819869995117, -48.610809326171875, -44.92341995239258, -41.23603057861328, -37.548641204833984, -33.86125183105469, -30.173858642578125, -26.486469268798828, -22.79907989501953, -19.1116886138916, -15.424299240112305, -11.736908912658691, -8.049518585205078, -4.362129211425781, -0.674738883972168, 3.0126514434814453, 6.700040817260742, 10.387432098388672, 14.074821472167969, 17.762210845947266, 21.449602127075195, 25.136991500854492, 28.824382781982422, 32.51177215576172, 36.199161529541016, 39.88655090332031, 43.573944091796875, 47.26133346557617, 50.94872283935547, 54.63611602783203, 58.32350540161133, 62.010894775390625, 65.69828796386719, 69.38567352294922, 73.07305908203125, 76.76045227050781, 80.44783782958984, 84.1352310180664, 87.82261657714844, 91.510009765625, 95.19740295410156, 98.8847885131836, 102.57218170166016, 106.25957489013672, 109.94696044921875, 113.63435363769531, 117.32173919677734, 121.0091323852539, 124.69651794433594, 128.3839111328125, 132.07130432128906]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 9.0, 12.0, 20.0, 22.0, 55.0, 75.0, 170.0, 310.0, 672.0, 1785.0, 5972.0, 26538.0, 177879.0, 660630.0, 143695.0, 22575.0, 5161.0, 1648.0, 625.0, 300.0, 159.0, 80.0, 54.0, 29.0, 27.0, 7.0, 11.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-27.140625, -26.48583984375, -25.8310546875, -25.17626953125, -24.521484375, -23.86669921875, -23.2119140625, -22.55712890625, -21.90234375, -21.24755859375, -20.5927734375, -19.93798828125, -19.283203125, -18.62841796875, -17.9736328125, -17.31884765625, -16.6640625, -16.00927734375, -15.3544921875, -14.69970703125, -14.044921875, -13.39013671875, -12.7353515625, -12.08056640625, -11.42578125, -10.77099609375, -10.1162109375, -9.46142578125, -8.806640625, -8.15185546875, -7.4970703125, -6.84228515625, -6.1875, -5.53271484375, -4.8779296875, -4.22314453125, -3.568359375, -2.91357421875, -2.2587890625, -1.60400390625, -0.94921875, -0.29443359375, 0.3603515625, 1.01513671875, 1.669921875, 2.32470703125, 2.9794921875, 3.63427734375, 4.2890625, 4.94384765625, 5.5986328125, 6.25341796875, 6.908203125, 7.56298828125, 8.2177734375, 8.87255859375, 9.52734375, 10.18212890625, 10.8369140625, 11.49169921875, 12.146484375, 12.80126953125, 13.4560546875, 14.11083984375, 14.765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 12.0, 11.0, 14.0, 24.0, 24.0, 22.0, 39.0, 43.0, 65.0, 63.0, 66.0, 72.0, 76.0, 56.0, 70.0, 62.0, 53.0, 51.0, 36.0, 27.0, 15.0, 19.0, 21.0, 14.0, 8.0, 12.0, 5.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.79296875, -10.4296875, -10.06640625, -9.703125, -9.33984375, -8.9765625, -8.61328125, -8.25, -7.88671875, -7.5234375, -7.16015625, -6.796875, -6.43359375, -6.0703125, -5.70703125, -5.34375, -4.98046875, -4.6171875, -4.25390625, -3.890625, -3.52734375, -3.1640625, -2.80078125, -2.4375, -2.07421875, -1.7109375, -1.34765625, -0.984375, -0.62109375, -0.2578125, 0.10546875, 0.46875, 0.83203125, 1.1953125, 1.55859375, 1.921875, 2.28515625, 2.6484375, 3.01171875, 3.375, 3.73828125, 4.1015625, 4.46484375, 4.828125, 5.19140625, 5.5546875, 5.91796875, 6.28125, 6.64453125, 7.0078125, 7.37109375, 7.734375, 8.09765625, 8.4609375, 8.82421875, 9.1875, 9.55078125, 9.9140625, 10.27734375, 10.640625, 11.00390625, 11.3671875, 11.73046875, 12.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 11.0, 19.0, 22.0, 20.0, 30.0, 31.0, 69.0, 106.0, 153.0, 220.0, 408.0, 747.0, 1816.0, 4838.0, 16274.0, 75992.0, 646081.0, 245828.0, 39946.0, 9848.0, 3265.0, 1278.0, 556.0, 324.0, 199.0, 138.0, 81.0, 59.0, 46.0, 26.0, 23.0, 15.0, 12.0, 12.0, 11.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.453125, -18.800537109375, -18.14794921875, -17.495361328125, -16.8427734375, -16.190185546875, -15.53759765625, -14.885009765625, -14.232421875, -13.579833984375, -12.92724609375, -12.274658203125, -11.6220703125, -10.969482421875, -10.31689453125, -9.664306640625, -9.01171875, -8.359130859375, -7.70654296875, -7.053955078125, -6.4013671875, -5.748779296875, -5.09619140625, -4.443603515625, -3.791015625, -3.138427734375, -2.48583984375, -1.833251953125, -1.1806640625, -0.528076171875, 0.12451171875, 0.777099609375, 1.4296875, 2.082275390625, 2.73486328125, 3.387451171875, 4.0400390625, 4.692626953125, 5.34521484375, 5.997802734375, 6.650390625, 7.302978515625, 7.95556640625, 8.608154296875, 9.2607421875, 9.913330078125, 10.56591796875, 11.218505859375, 11.87109375, 12.523681640625, 13.17626953125, 13.828857421875, 14.4814453125, 15.134033203125, 15.78662109375, 16.439208984375, 17.091796875, 17.744384765625, 18.39697265625, 19.049560546875, 19.7021484375, 20.354736328125, 21.00732421875, 21.659912109375, 22.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 9.0, 7.0, 10.0, 16.0, 17.0, 24.0, 35.0, 38.0, 35.0, 44.0, 39.0, 63.0, 78.0, 67.0, 75.0, 49.0, 63.0, 49.0, 52.0, 35.0, 27.0, 19.0, 22.0, 19.0, 21.0, 14.0, 13.0, 14.0, 4.0, 4.0, 6.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.52783203125, -40.2431640625, -38.95849609375, -37.673828125, -36.38916015625, -35.1044921875, -33.81982421875, -32.53515625, -31.25048828125, -29.9658203125, -28.68115234375, -27.396484375, -26.11181640625, -24.8271484375, -23.54248046875, -22.2578125, -20.97314453125, -19.6884765625, -18.40380859375, -17.119140625, -15.83447265625, -14.5498046875, -13.26513671875, -11.98046875, -10.69580078125, -9.4111328125, -8.12646484375, -6.841796875, -5.55712890625, -4.2724609375, -2.98779296875, -1.703125, -0.41845703125, 0.8662109375, 2.15087890625, 3.435546875, 4.72021484375, 6.0048828125, 7.28955078125, 8.57421875, 9.85888671875, 11.1435546875, 12.42822265625, 13.712890625, 14.99755859375, 16.2822265625, 17.56689453125, 18.8515625, 20.13623046875, 21.4208984375, 22.70556640625, 23.990234375, 25.27490234375, 26.5595703125, 27.84423828125, 29.12890625, 30.41357421875, 31.6982421875, 32.98291015625, 34.267578125, 35.55224609375, 36.8369140625, 38.12158203125, 39.40625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 12.0, 16.0, 19.0, 22.0, 43.0, 60.0, 119.0, 224.0, 478.0, 1284.0, 4397.0, 20152.0, 149027.0, 798105.0, 59628.0, 10613.0, 2753.0, 858.0, 328.0, 172.0, 84.0, 46.0, 25.0, 26.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.9453125, -10.643798828125, -10.34228515625, -10.040771484375, -9.7392578125, -9.437744140625, -9.13623046875, -8.834716796875, -8.533203125, -8.231689453125, -7.93017578125, -7.628662109375, -7.3271484375, -7.025634765625, -6.72412109375, -6.422607421875, -6.12109375, -5.819580078125, -5.51806640625, -5.216552734375, -4.9150390625, -4.613525390625, -4.31201171875, -4.010498046875, -3.708984375, -3.407470703125, -3.10595703125, -2.804443359375, -2.5029296875, -2.201416015625, -1.89990234375, -1.598388671875, -1.296875, -0.995361328125, -0.69384765625, -0.392333984375, -0.0908203125, 0.210693359375, 0.51220703125, 0.813720703125, 1.115234375, 1.416748046875, 1.71826171875, 2.019775390625, 2.3212890625, 2.622802734375, 2.92431640625, 3.225830078125, 3.52734375, 3.828857421875, 4.13037109375, 4.431884765625, 4.7333984375, 5.034912109375, 5.33642578125, 5.637939453125, 5.939453125, 6.240966796875, 6.54248046875, 6.843994140625, 7.1455078125, 7.447021484375, 7.74853515625, 8.050048828125, 8.3515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 8.0, 2.0, 3.0, 5.0, 10.0, 8.0, 13.0, 14.0, 15.0, 23.0, 38.0, 45.0, 100.0, 91.0, 124.0, 141.0, 84.0, 71.0, 41.0, 33.0, 30.0, 19.0, 23.0, 19.0, 8.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018568038940429688, -0.001801997423171997, -0.0017471909523010254, -0.0016923844814300537, -0.001637578010559082, -0.0015827715396881104, -0.0015279650688171387, -0.001473158597946167, -0.0014183521270751953, -0.0013635456562042236, -0.001308739185333252, -0.0012539327144622803, -0.0011991262435913086, -0.001144319772720337, -0.0010895133018493652, -0.0010347068309783936, -0.0009799003601074219, -0.0009250938892364502, -0.0008702874183654785, -0.0008154809474945068, -0.0007606744766235352, -0.0007058680057525635, -0.0006510615348815918, -0.0005962550640106201, -0.0005414485931396484, -0.00048664212226867676, -0.0004318356513977051, -0.0003770291805267334, -0.0003222227096557617, -0.00026741623878479004, -0.00021260976791381836, -0.00015780329704284668, -0.000102996826171875, -4.819035530090332e-05, 6.616115570068359e-06, 6.142258644104004e-05, 0.00011622905731201172, 0.0001710355281829834, 0.00022584199905395508, 0.00028064846992492676, 0.00033545494079589844, 0.0003902614116668701, 0.0004450678825378418, 0.0004998743534088135, 0.0005546808242797852, 0.0006094872951507568, 0.0006642937660217285, 0.0007191002368927002, 0.0007739067077636719, 0.0008287131786346436, 0.0008835196495056152, 0.0009383261203765869, 0.0009931325912475586, 0.0010479390621185303, 0.001102745532989502, 0.0011575520038604736, 0.0012123584747314453, 0.001267164945602417, 0.0013219714164733887, 0.0013767778873443604, 0.001431584358215332, 0.0014863908290863037, 0.0015411972999572754, 0.001596003770828247, 0.0016508102416992188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 22.0, 33.0, 50.0, 67.0, 100.0, 168.0, 355.0, 706.0, 1746.0, 4476.0, 15302.0, 71248.0, 768506.0, 149556.0, 25080.0, 6898.0, 2310.0, 960.0, 428.0, 206.0, 123.0, 67.0, 40.0, 28.0, 23.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0546875, -10.76885986328125, -10.4830322265625, -10.19720458984375, -9.911376953125, -9.62554931640625, -9.3397216796875, -9.05389404296875, -8.76806640625, -8.48223876953125, -8.1964111328125, -7.91058349609375, -7.624755859375, -7.33892822265625, -7.0531005859375, -6.76727294921875, -6.4814453125, -6.19561767578125, -5.9097900390625, -5.62396240234375, -5.338134765625, -5.05230712890625, -4.7664794921875, -4.48065185546875, -4.19482421875, -3.90899658203125, -3.6231689453125, -3.33734130859375, -3.051513671875, -2.76568603515625, -2.4798583984375, -2.19403076171875, -1.908203125, -1.62237548828125, -1.3365478515625, -1.05072021484375, -0.764892578125, -0.47906494140625, -0.1932373046875, 0.09259033203125, 0.37841796875, 0.66424560546875, 0.9500732421875, 1.23590087890625, 1.521728515625, 1.80755615234375, 2.0933837890625, 2.37921142578125, 2.6650390625, 2.95086669921875, 3.2366943359375, 3.52252197265625, 3.808349609375, 4.09417724609375, 4.3800048828125, 4.66583251953125, 4.95166015625, 5.23748779296875, 5.5233154296875, 5.80914306640625, 6.094970703125, 6.38079833984375, 6.6666259765625, 6.95245361328125, 7.23828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 4.0, 8.0, 11.0, 5.0, 14.0, 15.0, 17.0, 11.0, 17.0, 30.0, 30.0, 36.0, 59.0, 73.0, 85.0, 96.0, 99.0, 69.0, 75.0, 43.0, 42.0, 29.0, 23.0, 22.0, 18.0, 6.0, 14.0, 6.0, 4.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6015625, -5.42083740234375, -5.2401123046875, -5.05938720703125, -4.878662109375, -4.69793701171875, -4.5172119140625, -4.33648681640625, -4.15576171875, -3.97503662109375, -3.7943115234375, -3.61358642578125, -3.432861328125, -3.25213623046875, -3.0714111328125, -2.89068603515625, -2.7099609375, -2.52923583984375, -2.3485107421875, -2.16778564453125, -1.987060546875, -1.80633544921875, -1.6256103515625, -1.44488525390625, -1.26416015625, -1.08343505859375, -0.9027099609375, -0.72198486328125, -0.541259765625, -0.36053466796875, -0.1798095703125, 0.00091552734375, 0.181640625, 0.36236572265625, 0.5430908203125, 0.72381591796875, 0.904541015625, 1.08526611328125, 1.2659912109375, 1.44671630859375, 1.62744140625, 1.80816650390625, 1.9888916015625, 2.16961669921875, 2.350341796875, 2.53106689453125, 2.7117919921875, 2.89251708984375, 3.0732421875, 3.25396728515625, 3.4346923828125, 3.61541748046875, 3.796142578125, 3.97686767578125, 4.1575927734375, 4.33831787109375, 4.51904296875, 4.69976806640625, 4.8804931640625, 5.06121826171875, 5.241943359375, 5.42266845703125, 5.6033935546875, 5.78411865234375, 5.96484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 12.0, 28.0, 54.0, 135.0, 360.0, 223.0, 95.0, 43.0, 19.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.0602264404297, -130.32791137695312, -122.59558868408203, -114.86326599121094, -107.13095092773438, -99.39862823486328, -91.66630554199219, -83.93399047851562, -76.20166778564453, -68.46934509277344, -60.737030029296875, -53.00470733642578, -45.27238845825195, -37.540069580078125, -29.80774688720703, -22.075428009033203, -14.343109130859375, -6.6107892990112305, 1.121530532836914, 8.853851318359375, 16.586170196533203, 24.31848907470703, 32.050811767578125, 39.78313064575195, 47.51544952392578, 55.24776840209961, 62.98008728027344, 70.71240997314453, 78.44473266601562, 86.17704772949219, 93.90937042236328, 101.64169311523438, 109.37399291992188, 117.10631561279297, 124.83863067626953, 132.57095336914062, 140.3032684326172, 148.03558349609375, 155.76791381835938, 163.50022888183594, 171.2325439453125, 178.96485900878906, 186.6971893310547, 194.42950439453125, 202.1618194580078, 209.89413452148438, 217.62646484375, 225.35877990722656, 233.0911102294922, 240.82342529296875, 248.55575561523438, 256.2880859375, 264.0203857421875, 271.7527160644531, 279.48504638671875, 287.21734619140625, 294.9496765136719, 302.6820068359375, 310.414306640625, 318.1466369628906, 325.87896728515625, 333.61126708984375, 341.3435974121094, 349.075927734375, 356.8082275390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 5.0, 13.0, 16.0, 17.0, 11.0, 16.0, 22.0, 22.0, 42.0, 27.0, 28.0, 44.0, 43.0, 61.0, 116.0, 88.0, 69.0, 53.0, 44.0, 39.0, 27.0, 32.0, 26.0, 34.0, 18.0, 12.0, 18.0, 8.0, 8.0, 4.0, 4.0, 5.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-172.89117431640625, -168.11264038085938, -163.3341064453125, -158.55555725097656, -153.7770233154297, -148.9984893798828, -144.21995544433594, -139.44142150878906, -134.66287231445312, -129.88433837890625, -125.10579681396484, -120.32726287841797, -115.54872131347656, -110.77018737792969, -105.99165344238281, -101.21311950683594, -96.43458557128906, -91.65605163574219, -86.87751007080078, -82.0989761352539, -77.3204345703125, -72.54190063476562, -67.76336669921875, -62.98482894897461, -58.20629119873047, -53.42775344848633, -48.64921569824219, -43.87068176269531, -39.09214401245117, -34.31360626220703, -29.535070419311523, -24.756534576416016, -19.977996826171875, -15.19946002960205, -10.420923233032227, -5.642386436462402, -0.8638496398925781, 3.9146881103515625, 8.69322395324707, 13.471759796142578, 18.25029754638672, 23.02883529663086, 27.807371139526367, 32.585906982421875, 37.364444732666016, 42.142982482910156, 46.92151641845703, 51.70005416870117, 56.47859191894531, 61.25712966918945, 66.0356674194336, 70.81420135498047, 75.59274291992188, 80.37127685546875, 85.14981079101562, 89.9283447265625, 94.7068862915039, 99.48542022705078, 104.26396179199219, 109.04249572753906, 113.82102966308594, 118.59957122802734, 123.37810516357422, 128.15664672851562, 132.9351806640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 10.0, 15.0, 17.0, 24.0, 42.0, 50.0, 78.0, 89.0, 148.0, 228.0, 323.0, 522.0, 905.0, 1650.0, 3522.0, 9584.0, 41263.0, 445361.0, 3083767.0, 538955.0, 48515.0, 10578.0, 4064.0, 1906.0, 999.0, 581.0, 396.0, 210.0, 145.0, 94.0, 72.0, 45.0, 31.0, 20.0, 14.0, 13.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.84375, -14.373046875, -13.90234375, -13.431640625, -12.9609375, -12.490234375, -12.01953125, -11.548828125, -11.078125, -10.607421875, -10.13671875, -9.666015625, -9.1953125, -8.724609375, -8.25390625, -7.783203125, -7.3125, -6.841796875, -6.37109375, -5.900390625, -5.4296875, -4.958984375, -4.48828125, -4.017578125, -3.546875, -3.076171875, -2.60546875, -2.134765625, -1.6640625, -1.193359375, -0.72265625, -0.251953125, 0.21875, 0.689453125, 1.16015625, 1.630859375, 2.1015625, 2.572265625, 3.04296875, 3.513671875, 3.984375, 4.455078125, 4.92578125, 5.396484375, 5.8671875, 6.337890625, 6.80859375, 7.279296875, 7.75, 8.220703125, 8.69140625, 9.162109375, 9.6328125, 10.103515625, 10.57421875, 11.044921875, 11.515625, 11.986328125, 12.45703125, 12.927734375, 13.3984375, 13.869140625, 14.33984375, 14.810546875, 15.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 5.0, 12.0, 23.0, 34.0, 25.0, 45.0, 48.0, 75.0, 65.0, 67.0, 74.0, 66.0, 89.0, 52.0, 70.0, 55.0, 37.0, 26.0, 31.0, 22.0, 26.0, 19.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5303955078125, -14.138916015625, -13.7474365234375, -13.35595703125, -12.9644775390625, -12.572998046875, -12.1815185546875, -11.7900390625, -11.3985595703125, -11.007080078125, -10.6156005859375, -10.22412109375, -9.8326416015625, -9.441162109375, -9.0496826171875, -8.658203125, -8.2667236328125, -7.875244140625, -7.4837646484375, -7.09228515625, -6.7008056640625, -6.309326171875, -5.9178466796875, -5.5263671875, -5.1348876953125, -4.743408203125, -4.3519287109375, -3.96044921875, -3.5689697265625, -3.177490234375, -2.7860107421875, -2.39453125, -2.0030517578125, -1.611572265625, -1.2200927734375, -0.82861328125, -0.4371337890625, -0.045654296875, 0.3458251953125, 0.7373046875, 1.1287841796875, 1.520263671875, 1.9117431640625, 2.30322265625, 2.6947021484375, 3.086181640625, 3.4776611328125, 3.869140625, 4.2606201171875, 4.652099609375, 5.0435791015625, 5.43505859375, 5.8265380859375, 6.218017578125, 6.6094970703125, 7.0009765625, 7.3924560546875, 7.783935546875, 8.1754150390625, 8.56689453125, 8.9583740234375, 9.349853515625, 9.7413330078125, 10.1328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 16.0, 32.0, 76.0, 185.0, 387.0, 990.0, 4189256.0, 2556.0, 455.0, 186.0, 87.0, 30.0, 17.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.5, -280.62109375, -272.7421875, -264.86328125, -256.984375, -249.10546875, -241.2265625, -233.34765625, -225.46875, -217.58984375, -209.7109375, -201.83203125, -193.953125, -186.07421875, -178.1953125, -170.31640625, -162.4375, -154.55859375, -146.6796875, -138.80078125, -130.921875, -123.04296875, -115.1640625, -107.28515625, -99.40625, -91.52734375, -83.6484375, -75.76953125, -67.890625, -60.01171875, -52.1328125, -44.25390625, -36.375, -28.49609375, -20.6171875, -12.73828125, -4.859375, 3.01953125, 10.8984375, 18.77734375, 26.65625, 34.53515625, 42.4140625, 50.29296875, 58.171875, 66.05078125, 73.9296875, 81.80859375, 89.6875, 97.56640625, 105.4453125, 113.32421875, 121.203125, 129.08203125, 136.9609375, 144.83984375, 152.71875, 160.59765625, 168.4765625, 176.35546875, 184.234375, 192.11328125, 199.9921875, 207.87109375, 215.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 41.0, 377.0, 3223.0, 392.0, 33.0, 14.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -137.0654296875, -133.505859375, -129.9462890625, -126.38671875, -122.8271484375, -119.267578125, -115.7080078125, -112.1484375, -108.5888671875, -105.029296875, -101.4697265625, -97.91015625, -94.3505859375, -90.791015625, -87.2314453125, -83.671875, -80.1123046875, -76.552734375, -72.9931640625, -69.43359375, -65.8740234375, -62.314453125, -58.7548828125, -55.1953125, -51.6357421875, -48.076171875, -44.5166015625, -40.95703125, -37.3974609375, -33.837890625, -30.2783203125, -26.71875, -23.1591796875, -19.599609375, -16.0400390625, -12.48046875, -8.9208984375, -5.361328125, -1.8017578125, 1.7578125, 5.3173828125, 8.876953125, 12.4365234375, 15.99609375, 19.5556640625, 23.115234375, 26.6748046875, 30.234375, 33.7939453125, 37.353515625, 40.9130859375, 44.47265625, 48.0322265625, 51.591796875, 55.1513671875, 58.7109375, 62.2705078125, 65.830078125, 69.3896484375, 72.94921875, 76.5087890625, 80.068359375, 83.6279296875, 87.1875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 13.0, 43.0, 94.0, 210.0, 346.0, 174.0, 69.0, 26.0, 9.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.0595703125, -505.5362854003906, -493.0130310058594, -480.48974609375, -467.96649169921875, -455.4432067871094, -442.919921875, -430.39666748046875, -417.8733825683594, -405.35009765625, -392.82684326171875, -380.3035583496094, -367.7802734375, -355.25701904296875, -342.7337341308594, -330.21044921875, -317.68719482421875, -305.1639099121094, -292.6406555175781, -280.11737060546875, -267.5941162109375, -255.07083129882812, -242.54754638671875, -230.02427673339844, -217.50100708007812, -204.9777374267578, -192.4544677734375, -179.93118286132812, -167.4079132080078, -154.8846435546875, -142.36135864257812, -129.8380889892578, -117.3148193359375, -104.79154968261719, -92.26827239990234, -79.7449951171875, -67.22172546386719, -54.69845199584961, -42.17517852783203, -29.651901245117188, -17.128631591796875, -4.605358123779297, 7.917915344238281, 20.44118881225586, 32.96446228027344, 45.487735748291016, 58.011009216308594, 70.53428649902344, 83.05755615234375, 95.58082580566406, 108.1041030883789, 120.62738037109375, 133.15065002441406, 145.67391967773438, 158.19720458984375, 170.72047424316406, 183.24374389648438, 195.7670135498047, 208.290283203125, 220.81356811523438, 233.3368377685547, 245.860107421875, 258.3833923339844, 270.90667724609375, 283.429931640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 11.0, 10.0, 10.0, 12.0, 17.0, 18.0, 33.0, 30.0, 31.0, 38.0, 40.0, 51.0, 49.0, 53.0, 47.0, 52.0, 46.0, 49.0, 41.0, 44.0, 41.0, 41.0, 44.0, 31.0, 24.0, 21.0, 23.0, 11.0, 10.0, 13.0, 18.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.17119598388672, -85.4741439819336, -81.77708435058594, -78.08003234863281, -74.38298034667969, -70.68592834472656, -66.9888687133789, -63.29181671142578, -59.59476089477539, -55.897705078125, -52.200653076171875, -48.503597259521484, -44.806541442871094, -41.10948944091797, -37.41243362426758, -33.71537780761719, -30.018325805664062, -26.321271896362305, -22.624217987060547, -18.927162170410156, -15.230108261108398, -11.53305435180664, -7.83599853515625, -4.138944625854492, -0.4418907165527344, 3.2551636695861816, 6.952218055725098, 10.649272918701172, 14.34632682800293, 18.043380737304688, 21.740436553955078, 25.437490463256836, 29.134552001953125, 32.831607818603516, 36.52865982055664, 40.22571563720703, 43.922767639160156, 47.61982345581055, 51.31687927246094, 55.01393127441406, 58.71098709106445, 62.408042907714844, 66.10509490966797, 69.80215454101562, 73.49920654296875, 77.19625854492188, 80.893310546875, 84.59037017822266, 88.28742218017578, 91.9844741821289, 95.68153381347656, 99.37858581542969, 103.07563781738281, 106.77268981933594, 110.4697494506836, 114.16680145263672, 117.86386108398438, 121.5609130859375, 125.25797271728516, 128.95501708984375, 132.65208435058594, 136.34913635253906, 140.0461883544922, 143.7432403564453, 147.44029235839844]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 13.0, 10.0, 16.0, 16.0, 26.0, 52.0, 83.0, 144.0, 236.0, 469.0, 845.0, 1809.0, 4215.0, 11686.0, 40976.0, 212993.0, 596536.0, 134247.0, 28806.0, 8789.0, 3375.0, 1533.0, 745.0, 420.0, 193.0, 132.0, 74.0, 45.0, 34.0, 14.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.832763671875, -23.11865234375, -22.404541015625, -21.6904296875, -20.976318359375, -20.26220703125, -19.548095703125, -18.833984375, -18.119873046875, -17.40576171875, -16.691650390625, -15.9775390625, -15.263427734375, -14.54931640625, -13.835205078125, -13.12109375, -12.406982421875, -11.69287109375, -10.978759765625, -10.2646484375, -9.550537109375, -8.83642578125, -8.122314453125, -7.408203125, -6.694091796875, -5.97998046875, -5.265869140625, -4.5517578125, -3.837646484375, -3.12353515625, -2.409423828125, -1.6953125, -0.981201171875, -0.26708984375, 0.447021484375, 1.1611328125, 1.875244140625, 2.58935546875, 3.303466796875, 4.017578125, 4.731689453125, 5.44580078125, 6.159912109375, 6.8740234375, 7.588134765625, 8.30224609375, 9.016357421875, 9.73046875, 10.444580078125, 11.15869140625, 11.872802734375, 12.5869140625, 13.301025390625, 14.01513671875, 14.729248046875, 15.443359375, 16.157470703125, 16.87158203125, 17.585693359375, 18.2998046875, 19.013916015625, 19.72802734375, 20.442138671875, 21.15625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 4.0, 0.0, 3.0, 10.0, 7.0, 8.0, 14.0, 23.0, 9.0, 23.0, 22.0, 34.0, 32.0, 36.0, 30.0, 49.0, 60.0, 78.0, 52.0, 51.0, 61.0, 48.0, 43.0, 47.0, 57.0, 34.0, 25.0, 23.0, 23.0, 21.0, 21.0, 11.0, 11.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.078125, -10.7435302734375, -10.408935546875, -10.0743408203125, -9.73974609375, -9.4051513671875, -9.070556640625, -8.7359619140625, -8.4013671875, -8.0667724609375, -7.732177734375, -7.3975830078125, -7.06298828125, -6.7283935546875, -6.393798828125, -6.0592041015625, -5.724609375, -5.3900146484375, -5.055419921875, -4.7208251953125, -4.38623046875, -4.0516357421875, -3.717041015625, -3.3824462890625, -3.0478515625, -2.7132568359375, -2.378662109375, -2.0440673828125, -1.70947265625, -1.3748779296875, -1.040283203125, -0.7056884765625, -0.37109375, -0.0364990234375, 0.298095703125, 0.6326904296875, 0.96728515625, 1.3018798828125, 1.636474609375, 1.9710693359375, 2.3056640625, 2.6402587890625, 2.974853515625, 3.3094482421875, 3.64404296875, 3.9786376953125, 4.313232421875, 4.6478271484375, 4.982421875, 5.3170166015625, 5.651611328125, 5.9862060546875, 6.32080078125, 6.6553955078125, 6.989990234375, 7.3245849609375, 7.6591796875, 7.9937744140625, 8.328369140625, 8.6629638671875, 8.99755859375, 9.3321533203125, 9.666748046875, 10.0013427734375, 10.3359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 8.0, 6.0, 15.0, 18.0, 32.0, 43.0, 68.0, 97.0, 179.0, 326.0, 721.0, 1952.0, 8018.0, 75017.0, 885070.0, 65956.0, 7572.0, 1944.0, 699.0, 314.0, 160.0, 105.0, 67.0, 46.0, 30.0, 16.0, 18.0, 9.0, 10.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.1875, -45.81884765625, -44.4501953125, -43.08154296875, -41.712890625, -40.34423828125, -38.9755859375, -37.60693359375, -36.23828125, -34.86962890625, -33.5009765625, -32.13232421875, -30.763671875, -29.39501953125, -28.0263671875, -26.65771484375, -25.2890625, -23.92041015625, -22.5517578125, -21.18310546875, -19.814453125, -18.44580078125, -17.0771484375, -15.70849609375, -14.33984375, -12.97119140625, -11.6025390625, -10.23388671875, -8.865234375, -7.49658203125, -6.1279296875, -4.75927734375, -3.390625, -2.02197265625, -0.6533203125, 0.71533203125, 2.083984375, 3.45263671875, 4.8212890625, 6.18994140625, 7.55859375, 8.92724609375, 10.2958984375, 11.66455078125, 13.033203125, 14.40185546875, 15.7705078125, 17.13916015625, 18.5078125, 19.87646484375, 21.2451171875, 22.61376953125, 23.982421875, 25.35107421875, 26.7197265625, 28.08837890625, 29.45703125, 30.82568359375, 32.1943359375, 33.56298828125, 34.931640625, 36.30029296875, 37.6689453125, 39.03759765625, 40.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 7.0, 9.0, 9.0, 12.0, 29.0, 20.0, 38.0, 31.0, 59.0, 63.0, 65.0, 83.0, 57.0, 69.0, 58.0, 66.0, 61.0, 48.0, 55.0, 33.0, 32.0, 18.0, 19.0, 16.0, 10.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -52.01513671875, -50.2802734375, -48.54541015625, -46.810546875, -45.07568359375, -43.3408203125, -41.60595703125, -39.87109375, -38.13623046875, -36.4013671875, -34.66650390625, -32.931640625, -31.19677734375, -29.4619140625, -27.72705078125, -25.9921875, -24.25732421875, -22.5224609375, -20.78759765625, -19.052734375, -17.31787109375, -15.5830078125, -13.84814453125, -12.11328125, -10.37841796875, -8.6435546875, -6.90869140625, -5.173828125, -3.43896484375, -1.7041015625, 0.03076171875, 1.765625, 3.50048828125, 5.2353515625, 6.97021484375, 8.705078125, 10.43994140625, 12.1748046875, 13.90966796875, 15.64453125, 17.37939453125, 19.1142578125, 20.84912109375, 22.583984375, 24.31884765625, 26.0537109375, 27.78857421875, 29.5234375, 31.25830078125, 32.9931640625, 34.72802734375, 36.462890625, 38.19775390625, 39.9326171875, 41.66748046875, 43.40234375, 45.13720703125, 46.8720703125, 48.60693359375, 50.341796875, 52.07666015625, 53.8115234375, 55.54638671875, 57.28125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 5.0, 13.0, 13.0, 24.0, 35.0, 63.0, 73.0, 130.0, 226.0, 352.0, 701.0, 1302.0, 3317.0, 10928.0, 70430.0, 889336.0, 56502.0, 9401.0, 2889.0, 1261.0, 617.0, 325.0, 211.0, 123.0, 75.0, 47.0, 27.0, 36.0, 17.0, 14.0, 12.0, 5.0, 10.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.52099609375, -17.8701171875, -17.21923828125, -16.568359375, -15.91748046875, -15.2666015625, -14.61572265625, -13.96484375, -13.31396484375, -12.6630859375, -12.01220703125, -11.361328125, -10.71044921875, -10.0595703125, -9.40869140625, -8.7578125, -8.10693359375, -7.4560546875, -6.80517578125, -6.154296875, -5.50341796875, -4.8525390625, -4.20166015625, -3.55078125, -2.89990234375, -2.2490234375, -1.59814453125, -0.947265625, -0.29638671875, 0.3544921875, 1.00537109375, 1.65625, 2.30712890625, 2.9580078125, 3.60888671875, 4.259765625, 4.91064453125, 5.5615234375, 6.21240234375, 6.86328125, 7.51416015625, 8.1650390625, 8.81591796875, 9.466796875, 10.11767578125, 10.7685546875, 11.41943359375, 12.0703125, 12.72119140625, 13.3720703125, 14.02294921875, 14.673828125, 15.32470703125, 15.9755859375, 16.62646484375, 17.27734375, 17.92822265625, 18.5791015625, 19.22998046875, 19.880859375, 20.53173828125, 21.1826171875, 21.83349609375, 22.484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 7.0, 14.0, 18.0, 32.0, 65.0, 124.0, 233.0, 220.0, 89.0, 53.0, 37.0, 21.0, 14.0, 17.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.004871368408203125, -0.0046836137771606445, -0.004495859146118164, -0.004308104515075684, -0.004120349884033203, -0.003932595252990723, -0.003744840621948242, -0.0035570859909057617, -0.0033693313598632812, -0.0031815767288208008, -0.0029938220977783203, -0.00280606746673584, -0.0026183128356933594, -0.002430558204650879, -0.0022428035736083984, -0.002055048942565918, -0.0018672943115234375, -0.001679539680480957, -0.0014917850494384766, -0.001304030418395996, -0.0011162757873535156, -0.0009285211563110352, -0.0007407665252685547, -0.0005530118942260742, -0.00036525726318359375, -0.00017750263214111328, 1.0251998901367188e-05, 0.00019800662994384766, 0.0003857612609863281, 0.0005735158920288086, 0.0007612705230712891, 0.0009490251541137695, 0.00113677978515625, 0.0013245344161987305, 0.001512289047241211, 0.0017000436782836914, 0.0018877983093261719, 0.0020755529403686523, 0.002263307571411133, 0.0024510622024536133, 0.0026388168334960938, 0.0028265714645385742, 0.0030143260955810547, 0.003202080726623535, 0.0033898353576660156, 0.003577589988708496, 0.0037653446197509766, 0.003953099250793457, 0.0041408538818359375, 0.004328608512878418, 0.0045163631439208984, 0.004704117774963379, 0.004891872406005859, 0.00507962703704834, 0.00526738166809082, 0.005455136299133301, 0.005642890930175781, 0.005830645561218262, 0.006018400192260742, 0.006206154823303223, 0.006393909454345703, 0.006581664085388184, 0.006769418716430664, 0.0069571733474731445, 0.007144927978515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 13.0, 9.0, 9.0, 20.0, 30.0, 56.0, 54.0, 122.0, 218.0, 428.0, 950.0, 2720.0, 8929.0, 43075.0, 818992.0, 146894.0, 18292.0, 4760.0, 1526.0, 650.0, 301.0, 179.0, 114.0, 65.0, 45.0, 24.0, 15.0, 13.0, 15.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.265869140625, -15.71923828125, -15.172607421875, -14.6259765625, -14.079345703125, -13.53271484375, -12.986083984375, -12.439453125, -11.892822265625, -11.34619140625, -10.799560546875, -10.2529296875, -9.706298828125, -9.15966796875, -8.613037109375, -8.06640625, -7.519775390625, -6.97314453125, -6.426513671875, -5.8798828125, -5.333251953125, -4.78662109375, -4.239990234375, -3.693359375, -3.146728515625, -2.60009765625, -2.053466796875, -1.5068359375, -0.960205078125, -0.41357421875, 0.133056640625, 0.6796875, 1.226318359375, 1.77294921875, 2.319580078125, 2.8662109375, 3.412841796875, 3.95947265625, 4.506103515625, 5.052734375, 5.599365234375, 6.14599609375, 6.692626953125, 7.2392578125, 7.785888671875, 8.33251953125, 8.879150390625, 9.42578125, 9.972412109375, 10.51904296875, 11.065673828125, 11.6123046875, 12.158935546875, 12.70556640625, 13.252197265625, 13.798828125, 14.345458984375, 14.89208984375, 15.438720703125, 15.9853515625, 16.531982421875, 17.07861328125, 17.625244140625, 18.171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 5.0, 8.0, 18.0, 11.0, 5.0, 18.0, 22.0, 23.0, 36.0, 56.0, 74.0, 102.0, 119.0, 117.0, 81.0, 66.0, 54.0, 36.0, 20.0, 20.0, 13.0, 12.0, 12.0, 12.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.125, -8.774169921875, -8.42333984375, -8.072509765625, -7.7216796875, -7.370849609375, -7.02001953125, -6.669189453125, -6.318359375, -5.967529296875, -5.61669921875, -5.265869140625, -4.9150390625, -4.564208984375, -4.21337890625, -3.862548828125, -3.51171875, -3.160888671875, -2.81005859375, -2.459228515625, -2.1083984375, -1.757568359375, -1.40673828125, -1.055908203125, -0.705078125, -0.354248046875, -0.00341796875, 0.347412109375, 0.6982421875, 1.049072265625, 1.39990234375, 1.750732421875, 2.1015625, 2.452392578125, 2.80322265625, 3.154052734375, 3.5048828125, 3.855712890625, 4.20654296875, 4.557373046875, 4.908203125, 5.259033203125, 5.60986328125, 5.960693359375, 6.3115234375, 6.662353515625, 7.01318359375, 7.364013671875, 7.71484375, 8.065673828125, 8.41650390625, 8.767333984375, 9.1181640625, 9.468994140625, 9.81982421875, 10.170654296875, 10.521484375, 10.872314453125, 11.22314453125, 11.573974609375, 11.9248046875, 12.275634765625, 12.62646484375, 12.977294921875, 13.328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 11.0, 120.0, 677.0, 142.0, 34.0, 13.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-572.6337890625, -539.8124389648438, -506.99102783203125, -474.169677734375, -441.3482971191406, -408.52691650390625, -375.70556640625, -342.8841857910156, -310.06280517578125, -277.2414245605469, -244.42005920410156, -211.59869384765625, -178.77731323242188, -145.9559326171875, -113.13456726074219, -80.31320190429688, -47.4918212890625, -14.670448303222656, 18.150924682617188, 50.97229766845703, 83.79367065429688, 116.61505126953125, 149.43641662597656, 182.25778198242188, 215.07916259765625, 247.90054321289062, 280.721923828125, 313.54327392578125, 346.3646545410156, 379.18603515625, 412.00738525390625, 444.8287658691406, 477.6502685546875, 510.4716491699219, 543.2930297851562, 576.1143798828125, 608.935791015625, 641.7571411132812, 674.5784912109375, 707.39990234375, 740.2212524414062, 773.0426025390625, 805.864013671875, 838.6853637695312, 871.5067138671875, 904.328125, 937.1494750976562, 969.9708251953125, 1002.792236328125, 1035.6136474609375, 1068.4349365234375, 1101.25634765625, 1134.0777587890625, 1166.899169921875, 1199.720458984375, 1232.5418701171875, 1265.36328125, 1298.1846923828125, 1331.0059814453125, 1363.827392578125, 1396.6488037109375, 1429.47021484375, 1462.29150390625, 1495.1129150390625, 1527.9342041015625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 12.0, 17.0, 9.0, 14.0, 15.0, 19.0, 21.0, 20.0, 28.0, 24.0, 31.0, 41.0, 63.0, 95.0, 147.0, 94.0, 49.0, 32.0, 24.0, 31.0, 32.0, 16.0, 17.0, 23.0, 23.0, 13.0, 18.0, 9.0, 14.0, 10.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.44381713867188, -187.4773712158203, -181.5109405517578, -175.54449462890625, -169.57806396484375, -163.6116180419922, -157.64517211914062, -151.67874145507812, -145.71229553222656, -139.745849609375, -133.7794189453125, -127.81297302246094, -121.8465347290039, -115.88009643554688, -109.91365051269531, -103.94721221923828, -97.98077392578125, -92.01433563232422, -86.04789733886719, -80.08145141601562, -74.1150131225586, -68.14857482910156, -62.182132720947266, -56.21569061279297, -50.24925231933594, -44.282814025878906, -38.31637191772461, -32.34992980957031, -26.38349151611328, -20.417051315307617, -14.450611114501953, -8.484169006347656, -2.5177154541015625, 3.4487247467041016, 9.415164947509766, 15.38160514831543, 21.348045349121094, 27.314485549926758, 33.28092575073242, 39.24736785888672, 45.21380615234375, 51.18024444580078, 57.14668655395508, 63.113128662109375, 69.0795669555664, 75.04600524902344, 81.012451171875, 86.97888946533203, 92.94532775878906, 98.9117660522461, 104.87820434570312, 110.84465026855469, 116.81108856201172, 122.77752685546875, 128.7439727783203, 134.71041870117188, 140.67684936523438, 146.64329528808594, 152.60972595214844, 158.576171875, 164.5426025390625, 170.50904846191406, 176.47549438476562, 182.44192504882812, 188.4083709716797]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 36.0, 56.0, 85.0, 203.0, 346.0, 723.0, 1692.0, 5161.0, 23533.0, 440905.0, 3484168.0, 214387.0, 16712.0, 3899.0, 1332.0, 503.0, 256.0, 110.0, 67.0, 53.0, 24.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.5, -45.2890625, -44.078125, -42.8671875, -41.65625, -40.4453125, -39.234375, -38.0234375, -36.8125, -35.6015625, -34.390625, -33.1796875, -31.96875, -30.7578125, -29.546875, -28.3359375, -27.125, -25.9140625, -24.703125, -23.4921875, -22.28125, -21.0703125, -19.859375, -18.6484375, -17.4375, -16.2265625, -15.015625, -13.8046875, -12.59375, -11.3828125, -10.171875, -8.9609375, -7.75, -6.5390625, -5.328125, -4.1171875, -2.90625, -1.6953125, -0.484375, 0.7265625, 1.9375, 3.1484375, 4.359375, 5.5703125, 6.78125, 7.9921875, 9.203125, 10.4140625, 11.625, 12.8359375, 14.046875, 15.2578125, 16.46875, 17.6796875, 18.890625, 20.1015625, 21.3125, 22.5234375, 23.734375, 24.9453125, 26.15625, 27.3671875, 28.578125, 29.7890625, 31.0]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 11.0, 10.0, 15.0, 12.0, 18.0, 17.0, 26.0, 18.0, 31.0, 30.0, 33.0, 49.0, 42.0, 42.0, 38.0, 55.0, 56.0, 52.0, 54.0, 45.0, 41.0, 41.0, 38.0, 31.0, 24.0, 18.0, 33.0, 23.0, 20.0, 11.0, 14.0, 11.0, 7.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6171875, -9.3333740234375, -9.049560546875, -8.7657470703125, -8.48193359375, -8.1981201171875, -7.914306640625, -7.6304931640625, -7.3466796875, -7.0628662109375, -6.779052734375, -6.4952392578125, -6.21142578125, -5.9276123046875, -5.643798828125, -5.3599853515625, -5.076171875, -4.7923583984375, -4.508544921875, -4.2247314453125, -3.94091796875, -3.6571044921875, -3.373291015625, -3.0894775390625, -2.8056640625, -2.5218505859375, -2.238037109375, -1.9542236328125, -1.67041015625, -1.3865966796875, -1.102783203125, -0.8189697265625, -0.53515625, -0.2513427734375, 0.032470703125, 0.3162841796875, 0.60009765625, 0.8839111328125, 1.167724609375, 1.4515380859375, 1.7353515625, 2.0191650390625, 2.302978515625, 2.5867919921875, 2.87060546875, 3.1544189453125, 3.438232421875, 3.7220458984375, 4.005859375, 4.2896728515625, 4.573486328125, 4.8572998046875, 5.14111328125, 5.4249267578125, 5.708740234375, 5.9925537109375, 6.2763671875, 6.5601806640625, 6.843994140625, 7.1278076171875, 7.41162109375, 7.6954345703125, 7.979248046875, 8.2630615234375, 8.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 14.0, 14.0, 37.0, 69.0, 170.0, 566.0, 3195.0, 3884979.0, 302017.0, 2361.0, 528.0, 172.0, 90.0, 28.0, 15.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.875, -215.697265625, -209.51953125, -203.341796875, -197.1640625, -190.986328125, -184.80859375, -178.630859375, -172.453125, -166.275390625, -160.09765625, -153.919921875, -147.7421875, -141.564453125, -135.38671875, -129.208984375, -123.03125, -116.853515625, -110.67578125, -104.498046875, -98.3203125, -92.142578125, -85.96484375, -79.787109375, -73.609375, -67.431640625, -61.25390625, -55.076171875, -48.8984375, -42.720703125, -36.54296875, -30.365234375, -24.1875, -18.009765625, -11.83203125, -5.654296875, 0.5234375, 6.701171875, 12.87890625, 19.056640625, 25.234375, 31.412109375, 37.58984375, 43.767578125, 49.9453125, 56.123046875, 62.30078125, 68.478515625, 74.65625, 80.833984375, 87.01171875, 93.189453125, 99.3671875, 105.544921875, 111.72265625, 117.900390625, 124.078125, 130.255859375, 136.43359375, 142.611328125, 148.7890625, 154.966796875, 161.14453125, 167.322265625, 173.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 29.0, 53.0, 129.0, 258.0, 586.0, 1213.0, 972.0, 452.0, 199.0, 72.0, 38.0, 25.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.150390625, -31.05078125, -28.951171875, -26.8515625, -24.751953125, -22.65234375, -20.552734375, -18.453125, -16.353515625, -14.25390625, -12.154296875, -10.0546875, -7.955078125, -5.85546875, -3.755859375, -1.65625, 0.443359375, 2.54296875, 4.642578125, 6.7421875, 8.841796875, 10.94140625, 13.041015625, 15.140625, 17.240234375, 19.33984375, 21.439453125, 23.5390625, 25.638671875, 27.73828125, 29.837890625, 31.9375, 34.037109375, 36.13671875, 38.236328125, 40.3359375, 42.435546875, 44.53515625, 46.634765625, 48.734375, 50.833984375, 52.93359375, 55.033203125, 57.1328125, 59.232421875, 61.33203125, 63.431640625, 65.53125, 67.630859375, 69.73046875, 71.830078125, 73.9296875, 76.029296875, 78.12890625, 80.228515625, 82.328125, 84.427734375, 86.52734375, 88.626953125, 90.7265625, 92.826171875, 94.92578125, 97.025390625, 99.125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 14.0, 15.0, 37.0, 106.0, 253.0, 265.0, 160.0, 57.0, 38.0, 18.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.15667724609375, -412.7328796386719, -393.3091125488281, -373.88531494140625, -354.4615478515625, -335.0377502441406, -315.61395263671875, -296.190185546875, -276.7663879394531, -257.34259033203125, -237.9188232421875, -218.49502563476562, -199.0712432861328, -179.6474609375, -160.22366333007812, -140.7998809814453, -121.3760986328125, -101.95231628417969, -82.52852630615234, -63.104740142822266, -43.68095397949219, -24.257171630859375, -4.833381652832031, 14.590408325195312, 34.014190673828125, 53.4379768371582, 72.86176300048828, 92.28555297851562, 111.70933532714844, 131.13311767578125, 150.55691528320312, 169.98069763183594, 189.404541015625, 208.8283233642578, 228.25210571289062, 247.6759033203125, 267.09967041015625, 286.5234680175781, 305.947265625, 325.37103271484375, 344.7948303222656, 364.2186279296875, 383.64239501953125, 403.0661926269531, 422.489990234375, 441.91375732421875, 461.3375549316406, 480.7613525390625, 500.18511962890625, 519.60888671875, 539.03271484375, 558.4564819335938, 577.8802490234375, 597.3040771484375, 616.7278442382812, 636.151611328125, 655.575439453125, 674.9992065429688, 694.4230346679688, 713.8468017578125, 733.2705688476562, 752.6943359375, 772.1181640625, 791.5419311523438, 810.9656982421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 12.0, 14.0, 15.0, 14.0, 22.0, 21.0, 21.0, 26.0, 42.0, 57.0, 56.0, 66.0, 67.0, 74.0, 93.0, 77.0, 58.0, 52.0, 48.0, 35.0, 29.0, 23.0, 10.0, 17.0, 8.0, 9.0, 6.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-321.7721862792969, -313.84332275390625, -305.91448974609375, -297.9856262207031, -290.0567626953125, -282.1279296875, -274.1990661621094, -266.2702331542969, -258.34136962890625, -250.4125213623047, -242.48367309570312, -234.5548095703125, -226.62596130371094, -218.69711303710938, -210.76824951171875, -202.8394012451172, -194.91055297851562, -186.98170471191406, -179.0528564453125, -171.12399291992188, -163.1951446533203, -155.26629638671875, -147.33743286132812, -139.40858459472656, -131.479736328125, -123.55088806152344, -115.62203216552734, -107.69317626953125, -99.76432800292969, -91.83547973632812, -83.90662384033203, -75.97776794433594, -68.04891967773438, -60.12006759643555, -52.19121551513672, -44.26236343383789, -36.33351135253906, -28.404659271240234, -20.475807189941406, -12.546955108642578, -4.61810302734375, 3.310749053955078, 11.239601135253906, 19.168453216552734, 27.097305297851562, 35.02615737915039, 42.95500946044922, 50.88386154174805, 58.812713623046875, 66.74156188964844, 74.67041778564453, 82.59927368164062, 90.52812194824219, 98.45697021484375, 106.38582611083984, 114.31468200683594, 122.2435302734375, 130.17237854003906, 138.10122680664062, 146.03009033203125, 153.9589385986328, 161.88778686523438, 169.816650390625, 177.74549865722656, 185.67434692382812]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 16.0, 16.0, 36.0, 50.0, 79.0, 158.0, 302.0, 620.0, 1539.0, 4420.0, 17360.0, 126827.0, 786811.0, 90033.0, 13876.0, 3862.0, 1353.0, 568.0, 268.0, 134.0, 70.0, 48.0, 35.0, 21.0, 11.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.53125, -38.41552734375, -37.2998046875, -36.18408203125, -35.068359375, -33.95263671875, -32.8369140625, -31.72119140625, -30.60546875, -29.48974609375, -28.3740234375, -27.25830078125, -26.142578125, -25.02685546875, -23.9111328125, -22.79541015625, -21.6796875, -20.56396484375, -19.4482421875, -18.33251953125, -17.216796875, -16.10107421875, -14.9853515625, -13.86962890625, -12.75390625, -11.63818359375, -10.5224609375, -9.40673828125, -8.291015625, -7.17529296875, -6.0595703125, -4.94384765625, -3.828125, -2.71240234375, -1.5966796875, -0.48095703125, 0.634765625, 1.75048828125, 2.8662109375, 3.98193359375, 5.09765625, 6.21337890625, 7.3291015625, 8.44482421875, 9.560546875, 10.67626953125, 11.7919921875, 12.90771484375, 14.0234375, 15.13916015625, 16.2548828125, 17.37060546875, 18.486328125, 19.60205078125, 20.7177734375, 21.83349609375, 22.94921875, 24.06494140625, 25.1806640625, 26.29638671875, 27.412109375, 28.52783203125, 29.6435546875, 30.75927734375, 31.875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 20.0, 21.0, 22.0, 38.0, 57.0, 82.0, 80.0, 72.0, 94.0, 104.0, 85.0, 77.0, 57.0, 55.0, 29.0, 28.0, 17.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0625, -22.33203125, -21.6015625, -20.87109375, -20.140625, -19.41015625, -18.6796875, -17.94921875, -17.21875, -16.48828125, -15.7578125, -15.02734375, -14.296875, -13.56640625, -12.8359375, -12.10546875, -11.375, -10.64453125, -9.9140625, -9.18359375, -8.453125, -7.72265625, -6.9921875, -6.26171875, -5.53125, -4.80078125, -4.0703125, -3.33984375, -2.609375, -1.87890625, -1.1484375, -0.41796875, 0.3125, 1.04296875, 1.7734375, 2.50390625, 3.234375, 3.96484375, 4.6953125, 5.42578125, 6.15625, 6.88671875, 7.6171875, 8.34765625, 9.078125, 9.80859375, 10.5390625, 11.26953125, 12.0, 12.73046875, 13.4609375, 14.19140625, 14.921875, 15.65234375, 16.3828125, 17.11328125, 17.84375, 18.57421875, 19.3046875, 20.03515625, 20.765625, 21.49609375, 22.2265625, 22.95703125, 23.6875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 18.0, 18.0, 34.0, 57.0, 118.0, 280.0, 738.0, 4148.0, 166671.0, 867474.0, 7221.0, 1062.0, 318.0, 152.0, 86.0, 39.0, 42.0, 26.0, 14.0, 11.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.125, -63.21533203125, -61.3056640625, -59.39599609375, -57.486328125, -55.57666015625, -53.6669921875, -51.75732421875, -49.84765625, -47.93798828125, -46.0283203125, -44.11865234375, -42.208984375, -40.29931640625, -38.3896484375, -36.47998046875, -34.5703125, -32.66064453125, -30.7509765625, -28.84130859375, -26.931640625, -25.02197265625, -23.1123046875, -21.20263671875, -19.29296875, -17.38330078125, -15.4736328125, -13.56396484375, -11.654296875, -9.74462890625, -7.8349609375, -5.92529296875, -4.015625, -2.10595703125, -0.1962890625, 1.71337890625, 3.623046875, 5.53271484375, 7.4423828125, 9.35205078125, 11.26171875, 13.17138671875, 15.0810546875, 16.99072265625, 18.900390625, 20.81005859375, 22.7197265625, 24.62939453125, 26.5390625, 28.44873046875, 30.3583984375, 32.26806640625, 34.177734375, 36.08740234375, 37.9970703125, 39.90673828125, 41.81640625, 43.72607421875, 45.6357421875, 47.54541015625, 49.455078125, 51.36474609375, 53.2744140625, 55.18408203125, 57.09375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 7.0, 9.0, 11.0, 16.0, 30.0, 24.0, 33.0, 48.0, 48.0, 52.0, 85.0, 94.0, 91.0, 75.0, 58.0, 62.0, 47.0, 31.0, 25.0, 17.0, 22.0, 23.0, 19.0, 8.0, 14.0, 3.0, 7.0, 8.0, 2.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -62.36474609375, -60.4794921875, -58.59423828125, -56.708984375, -54.82373046875, -52.9384765625, -51.05322265625, -49.16796875, -47.28271484375, -45.3974609375, -43.51220703125, -41.626953125, -39.74169921875, -37.8564453125, -35.97119140625, -34.0859375, -32.20068359375, -30.3154296875, -28.43017578125, -26.544921875, -24.65966796875, -22.7744140625, -20.88916015625, -19.00390625, -17.11865234375, -15.2333984375, -13.34814453125, -11.462890625, -9.57763671875, -7.6923828125, -5.80712890625, -3.921875, -2.03662109375, -0.1513671875, 1.73388671875, 3.619140625, 5.50439453125, 7.3896484375, 9.27490234375, 11.16015625, 13.04541015625, 14.9306640625, 16.81591796875, 18.701171875, 20.58642578125, 22.4716796875, 24.35693359375, 26.2421875, 28.12744140625, 30.0126953125, 31.89794921875, 33.783203125, 35.66845703125, 37.5537109375, 39.43896484375, 41.32421875, 43.20947265625, 45.0947265625, 46.97998046875, 48.865234375, 50.75048828125, 52.6357421875, 54.52099609375, 56.40625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 4.0, 3.0, 4.0, 10.0, 8.0, 5.0, 6.0, 12.0, 19.0, 25.0, 49.0, 88.0, 196.0, 399.0, 900.0, 2960.0, 13844.0, 330772.0, 679985.0, 14512.0, 3013.0, 897.0, 357.0, 218.0, 98.0, 58.0, 34.0, 30.0, 12.0, 10.0, 11.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.01165771484375, -6.7069091796875, -6.40216064453125, -6.097412109375, -5.79266357421875, -5.4879150390625, -5.18316650390625, -4.87841796875, -4.57366943359375, -4.2689208984375, -3.96417236328125, -3.659423828125, -3.35467529296875, -3.0499267578125, -2.74517822265625, -2.4404296875, -2.13568115234375, -1.8309326171875, -1.52618408203125, -1.221435546875, -0.91668701171875, -0.6119384765625, -0.30718994140625, -0.00244140625, 0.30230712890625, 0.6070556640625, 0.91180419921875, 1.216552734375, 1.52130126953125, 1.8260498046875, 2.13079833984375, 2.435546875, 2.74029541015625, 3.0450439453125, 3.34979248046875, 3.654541015625, 3.95928955078125, 4.2640380859375, 4.56878662109375, 4.87353515625, 5.17828369140625, 5.4830322265625, 5.78778076171875, 6.092529296875, 6.39727783203125, 6.7020263671875, 7.00677490234375, 7.3115234375, 7.61627197265625, 7.9210205078125, 8.22576904296875, 8.530517578125, 8.83526611328125, 9.1400146484375, 9.44476318359375, 9.74951171875, 10.05426025390625, 10.3590087890625, 10.66375732421875, 10.968505859375, 11.27325439453125, 11.5780029296875, 11.88275146484375, 12.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 12.0, 21.0, 24.0, 50.0, 105.0, 243.0, 274.0, 101.0, 53.0, 37.0, 19.0, 16.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00452423095703125, -0.004405617713928223, -0.004287004470825195, -0.004168391227722168, -0.004049777984619141, -0.003931164741516113, -0.003812551498413086, -0.0036939382553100586, -0.0035753250122070312, -0.003456711769104004, -0.0033380985260009766, -0.0032194852828979492, -0.003100872039794922, -0.0029822587966918945, -0.002863645553588867, -0.00274503231048584, -0.0026264190673828125, -0.002507805824279785, -0.002389192581176758, -0.0022705793380737305, -0.002151966094970703, -0.0020333528518676758, -0.0019147396087646484, -0.001796126365661621, -0.0016775131225585938, -0.0015588998794555664, -0.001440286636352539, -0.0013216733932495117, -0.0012030601501464844, -0.001084446907043457, -0.0009658336639404297, -0.0008472204208374023, -0.000728607177734375, -0.0006099939346313477, -0.0004913806915283203, -0.00037276744842529297, -0.0002541542053222656, -0.00013554096221923828, -1.6927719116210938e-05, 0.0001016855239868164, 0.00022029876708984375, 0.0003389120101928711, 0.00045752525329589844, 0.0005761384963989258, 0.0006947517395019531, 0.0008133649826049805, 0.0009319782257080078, 0.0010505914688110352, 0.0011692047119140625, 0.0012878179550170898, 0.0014064311981201172, 0.0015250444412231445, 0.0016436576843261719, 0.0017622709274291992, 0.0018808841705322266, 0.001999497413635254, 0.0021181106567382812, 0.0022367238998413086, 0.002355337142944336, 0.0024739503860473633, 0.0025925636291503906, 0.002711176872253418, 0.0028297901153564453, 0.0029484033584594727, 0.0030670166015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 13.0, 10.0, 19.0, 28.0, 51.0, 81.0, 132.0, 243.0, 507.0, 1102.0, 2558.0, 7880.0, 48011.0, 936325.0, 39649.0, 7290.0, 2474.0, 1059.0, 498.0, 258.0, 141.0, 67.0, 39.0, 26.0, 14.0, 14.0, 15.0, 8.0, 10.0, 5.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9412841796875, -10.593505859375, -10.2457275390625, -9.89794921875, -9.5501708984375, -9.202392578125, -8.8546142578125, -8.5068359375, -8.1590576171875, -7.811279296875, -7.4635009765625, -7.11572265625, -6.7679443359375, -6.420166015625, -6.0723876953125, -5.724609375, -5.3768310546875, -5.029052734375, -4.6812744140625, -4.33349609375, -3.9857177734375, -3.637939453125, -3.2901611328125, -2.9423828125, -2.5946044921875, -2.246826171875, -1.8990478515625, -1.55126953125, -1.2034912109375, -0.855712890625, -0.5079345703125, -0.16015625, 0.1876220703125, 0.535400390625, 0.8831787109375, 1.23095703125, 1.5787353515625, 1.926513671875, 2.2742919921875, 2.6220703125, 2.9698486328125, 3.317626953125, 3.6654052734375, 4.01318359375, 4.3609619140625, 4.708740234375, 5.0565185546875, 5.404296875, 5.7520751953125, 6.099853515625, 6.4476318359375, 6.79541015625, 7.1431884765625, 7.490966796875, 7.8387451171875, 8.1865234375, 8.5343017578125, 8.882080078125, 9.2298583984375, 9.57763671875, 9.9254150390625, 10.273193359375, 10.6209716796875, 10.96875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 7.0, 10.0, 10.0, 13.0, 16.0, 26.0, 34.0, 67.0, 98.0, 150.0, 151.0, 109.0, 78.0, 57.0, 32.0, 24.0, 15.0, 14.0, 10.0, 8.0, 8.0, 8.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15625, -5.946044921875, -5.73583984375, -5.525634765625, -5.3154296875, -5.105224609375, -4.89501953125, -4.684814453125, -4.474609375, -4.264404296875, -4.05419921875, -3.843994140625, -3.6337890625, -3.423583984375, -3.21337890625, -3.003173828125, -2.79296875, -2.582763671875, -2.37255859375, -2.162353515625, -1.9521484375, -1.741943359375, -1.53173828125, -1.321533203125, -1.111328125, -0.901123046875, -0.69091796875, -0.480712890625, -0.2705078125, -0.060302734375, 0.14990234375, 0.360107421875, 0.5703125, 0.780517578125, 0.99072265625, 1.200927734375, 1.4111328125, 1.621337890625, 1.83154296875, 2.041748046875, 2.251953125, 2.462158203125, 2.67236328125, 2.882568359375, 3.0927734375, 3.302978515625, 3.51318359375, 3.723388671875, 3.93359375, 4.143798828125, 4.35400390625, 4.564208984375, 4.7744140625, 4.984619140625, 5.19482421875, 5.405029296875, 5.615234375, 5.825439453125, 6.03564453125, 6.245849609375, 6.4560546875, 6.666259765625, 6.87646484375, 7.086669921875, 7.296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 17.0, 104.0, 566.0, 201.0, 59.0, 21.0, 15.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.60238647460938, -142.18923950195312, -125.77609252929688, -109.36295318603516, -92.9498062133789, -76.53665924072266, -60.12351989746094, -43.71037292480469, -27.297225952148438, -10.88408088684082, 5.529064178466797, 21.94220733642578, 38.35535430908203, 54.76850128173828, 71.181640625, 87.59478759765625, 104.0079345703125, 120.42108154296875, 136.834228515625, 153.24737548828125, 169.6605224609375, 186.07366943359375, 202.48680114746094, 218.8999481201172, 235.31309509277344, 251.7262420654297, 268.1393737792969, 284.5525207519531, 300.9656677246094, 317.3788146972656, 333.7919616699219, 350.2051086425781, 366.61822509765625, 383.0313720703125, 399.44451904296875, 415.857666015625, 432.27081298828125, 448.6839599609375, 465.09710693359375, 481.51025390625, 497.92340087890625, 514.3365478515625, 530.7496948242188, 547.162841796875, 563.5759887695312, 579.9891357421875, 596.4022827148438, 612.8154296875, 629.228515625, 645.6416625976562, 662.0548095703125, 678.4679565429688, 694.881103515625, 711.2942504882812, 727.7073974609375, 744.1205444335938, 760.53369140625, 776.9468383789062, 793.3599853515625, 809.7731323242188, 826.186279296875, 842.5994262695312, 859.0125732421875, 875.4257202148438, 891.8388671875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 5.0, 2.0, 10.0, 10.0, 13.0, 15.0, 21.0, 20.0, 9.0, 29.0, 105.0, 97.0, 74.0, 46.0, 62.0, 108.0, 118.0, 41.0, 22.0, 24.0, 21.0, 18.0, 19.0, 13.0, 21.0, 5.0, 13.0, 4.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-181.88784790039062, -176.7776336669922, -171.66741943359375, -166.5572052001953, -161.44699096679688, -156.33677673339844, -151.2265625, -146.11634826660156, -141.00613403320312, -135.8959197998047, -130.78570556640625, -125.67549133300781, -120.56527709960938, -115.45506286621094, -110.3448486328125, -105.23463439941406, -100.12442779541016, -95.01421356201172, -89.90399932861328, -84.79378509521484, -79.6835708618164, -74.57335662841797, -69.46315002441406, -64.35293579101562, -59.24271774291992, -54.132503509521484, -49.02228927612305, -43.912078857421875, -38.80186462402344, -33.691650390625, -28.581436157226562, -23.471221923828125, -18.361007690429688, -13.25079345703125, -8.140580177307129, -3.030366897583008, 2.0798473358154297, 7.190061569213867, 12.300273895263672, 17.41048812866211, 22.520702362060547, 27.630916595458984, 32.74113082885742, 37.851341247558594, 42.96155548095703, 48.07176971435547, 53.181983947753906, 58.292198181152344, 63.40241241455078, 68.51262664794922, 73.62284088134766, 78.7330551147461, 83.84326934814453, 88.95348358154297, 94.06369018554688, 99.17390441894531, 104.28411865234375, 109.39433288574219, 114.50454711914062, 119.61476135253906, 124.7249755859375, 129.83518981933594, 134.94540405273438, 140.0556182861328, 145.16583251953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 14.0, 13.0, 32.0, 32.0, 54.0, 60.0, 88.0, 326.0, 119.0, 75.0, 55.0, 39.0, 34.0, 20.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -23.94482421875, -23.1083984375, -22.27197265625, -21.435546875, -20.59912109375, -19.7626953125, -18.92626953125, -18.08984375, -17.25341796875, -16.4169921875, -15.58056640625, -14.744140625, -13.90771484375, -13.0712890625, -12.23486328125, -11.3984375, -10.56201171875, -9.7255859375, -8.88916015625, -8.052734375, -7.21630859375, -6.3798828125, -5.54345703125, -4.70703125, -3.87060546875, -3.0341796875, -2.19775390625, -1.361328125, -0.52490234375, 0.3115234375, 1.14794921875, 1.984375, 2.82080078125, 3.6572265625, 4.49365234375, 5.330078125, 6.16650390625, 7.0029296875, 7.83935546875, 8.67578125, 9.51220703125, 10.3486328125, 11.18505859375, 12.021484375, 12.85791015625, 13.6943359375, 14.53076171875, 15.3671875, 16.20361328125, 17.0400390625, 17.87646484375, 18.712890625, 19.54931640625, 20.3857421875, 21.22216796875, 22.05859375, 22.89501953125, 23.7314453125, 24.56787109375, 25.404296875, 26.24072265625, 27.0771484375, 27.91357421875, 28.75]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 6.0, 12.0, 9.0, 7.0, 18.0, 30.0, 40.0, 68.0, 130.0, 403.0, 1817.0, 243606.0, 8139432.0, 2196.0, 451.0, 164.0, 79.0, 24.0, 33.0, 31.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.75706481933594, -241.95896911621094, -234.16085815429688, -226.36276245117188, -218.5646514892578, -210.7665557861328, -202.96844482421875, -195.17034912109375, -187.3722381591797, -179.5741424560547, -171.77603149414062, -163.97793579101562, -156.17982482910156, -148.38172912597656, -140.5836181640625, -132.7855224609375, -124.98741912841797, -117.18931579589844, -109.3912124633789, -101.59310913085938, -93.79500579833984, -85.99690246582031, -78.19880676269531, -70.40069580078125, -62.602596282958984, -54.80449295043945, -47.00638961791992, -39.208290100097656, -31.410184860229492, -23.612083435058594, -15.813980102539062, -8.015876770019531, -0.2177734375, 7.580329418182373, 15.378432273864746, 23.17653465270996, 30.974637985229492, 38.77273941040039, 46.57084274291992, 54.36894607543945, 62.167049407958984, 69.96514892578125, 77.76325225830078, 85.56135559082031, 93.35945892333984, 101.15756225585938, 108.9556655883789, 116.75376892089844, 124.55187225341797, 132.3499755859375, 140.1480712890625, 147.94618225097656, 155.74427795410156, 163.54238891601562, 171.34048461914062, 179.1385955810547, 186.9366912841797, 194.7347869873047, 202.53289794921875, 210.33099365234375, 218.1291046142578, 225.9272003173828, 233.72531127929688, 241.52340698242188, 249.32151794433594]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-248.71612548828125, -240.24270629882812, -231.76930236816406, -223.2958984375, -214.82247924804688, -206.34906005859375, -197.8756561279297, -189.40225219726562, -180.9288330078125, -172.45541381835938, -163.9820098876953, -155.50860595703125, -147.03518676757812, -138.561767578125, -130.08836364746094, -121.61495208740234, -113.14154052734375, -104.66812896728516, -96.19471740722656, -87.72130584716797, -79.24789428710938, -70.77448272705078, -62.30107116699219, -53.827659606933594, -45.354248046875, -36.880836486816406, -28.407424926757812, -19.93401336669922, -11.460601806640625, -2.9871902465820312, 5.4862213134765625, 13.959632873535156, 22.433013916015625, 30.90642547607422, 39.37983703613281, 47.853248596191406, 56.32666015625, 64.8000717163086, 73.27348327636719, 81.74689483642578, 90.22030639648438, 98.69371795654297, 107.16712951660156, 115.64054107666016, 124.11395263671875, 132.58737182617188, 141.06077575683594, 149.5341796875, 158.00759887695312, 166.48101806640625, 174.9544219970703, 183.42782592773438, 191.9012451171875, 200.37466430664062, 208.8480682373047, 217.32147216796875, 225.79489135742188, 234.268310546875, 242.74171447753906, 251.21511840820312, 259.68853759765625, 268.1619567871094, 276.6353759765625, 285.1087646484375, 293.5821838378906]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 8.0, 12.0, 4.0, 12.0, 17.0, 16.0, 22.0, 22.0, 18.0, 28.0, 41.0, 27.0, 64.0, 58.0, 68.0, 62.0, 53.0, 63.0, 61.0, 47.0, 40.0, 42.0, 34.0, 28.0, 34.0, 20.0, 21.0, 12.0, 14.0, 9.0, 15.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.734375, -7.5419921875, -7.349609375, -7.1572265625, -6.96484375, -6.7724609375, -6.580078125, -6.3876953125, -6.1953125, -6.0029296875, -5.810546875, -5.6181640625, -5.42578125, -5.2333984375, -5.041015625, -4.8486328125, -4.65625, -4.4638671875, -4.271484375, -4.0791015625, -3.88671875, -3.6943359375, -3.501953125, -3.3095703125, -3.1171875, -2.9248046875, -2.732421875, -2.5400390625, -2.34765625, -2.1552734375, -1.962890625, -1.7705078125, -1.578125, -1.3857421875, -1.193359375, -1.0009765625, -0.80859375, -0.6162109375, -0.423828125, -0.2314453125, -0.0390625, 0.1533203125, 0.345703125, 0.5380859375, 0.73046875, 0.9228515625, 1.115234375, 1.3076171875, 1.5, 1.6923828125, 1.884765625, 2.0771484375, 2.26953125, 2.4619140625, 2.654296875, 2.8466796875, 3.0390625, 3.2314453125, 3.423828125, 3.6162109375, 3.80859375, 4.0009765625, 4.193359375, 4.3857421875, 4.578125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 4.0, 11.0, 9.0, 26.0, 29.0, 52.0, 78.0, 160.0, 272.0, 437.0, 776.0, 1500.0, 3262.0, 7860.0, 22523.0, 73059.0, 204190.0, 142578.0, 43141.0, 14016.0, 5315.0, 2440.0, 1107.0, 577.0, 303.0, 208.0, 115.0, 73.0, 36.0, 26.0, 14.0, 16.0, 9.0, 7.0, 7.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-90.6875, -87.7412109375, -84.794921875, -81.8486328125, -78.90234375, -75.9560546875, -73.009765625, -70.0634765625, -67.1171875, -64.1708984375, -61.224609375, -58.2783203125, -55.33203125, -52.3857421875, -49.439453125, -46.4931640625, -43.546875, -40.6005859375, -37.654296875, -34.7080078125, -31.76171875, -28.8154296875, -25.869140625, -22.9228515625, -19.9765625, -17.0302734375, -14.083984375, -11.1376953125, -8.19140625, -5.2451171875, -2.298828125, 0.6474609375, 3.59375, 6.5400390625, 9.486328125, 12.4326171875, 15.37890625, 18.3251953125, 21.271484375, 24.2177734375, 27.1640625, 30.1103515625, 33.056640625, 36.0029296875, 38.94921875, 41.8955078125, 44.841796875, 47.7880859375, 50.734375, 53.6806640625, 56.626953125, 59.5732421875, 62.51953125, 65.4658203125, 68.412109375, 71.3583984375, 74.3046875, 77.2509765625, 80.197265625, 83.1435546875, 86.08984375, 89.0361328125, 91.982421875, 94.9287109375, 97.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 6.0, 7.0, 7.0, 7.0, 12.0, 17.0, 22.0, 31.0, 40.0, 69.0, 72.0, 68.0, 97.0, 94.0, 100.0, 82.0, 67.0, 47.0, 34.0, 19.0, 28.0, 18.0, 10.0, 11.0, 7.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-23.515625, -22.8997802734375, -22.283935546875, -21.6680908203125, -21.05224609375, -20.4364013671875, -19.820556640625, -19.2047119140625, -18.5888671875, -17.9730224609375, -17.357177734375, -16.7413330078125, -16.12548828125, -15.5096435546875, -14.893798828125, -14.2779541015625, -13.662109375, -13.0462646484375, -12.430419921875, -11.8145751953125, -11.19873046875, -10.5828857421875, -9.967041015625, -9.3511962890625, -8.7353515625, -8.1195068359375, -7.503662109375, -6.8878173828125, -6.27197265625, -5.6561279296875, -5.040283203125, -4.4244384765625, -3.80859375, -3.1927490234375, -2.576904296875, -1.9610595703125, -1.34521484375, -0.7293701171875, -0.113525390625, 0.5023193359375, 1.1181640625, 1.7340087890625, 2.349853515625, 2.9656982421875, 3.58154296875, 4.1973876953125, 4.813232421875, 5.4290771484375, 6.044921875, 6.6607666015625, 7.276611328125, 7.8924560546875, 8.50830078125, 9.1241455078125, 9.739990234375, 10.3558349609375, 10.9716796875, 11.5875244140625, 12.203369140625, 12.8192138671875, 13.43505859375, 14.0509033203125, 14.666748046875, 15.2825927734375, 15.8984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 9.0, 32.0, 60.0, 101.0, 131.0, 64.0, 32.0, 17.0, 14.0, 10.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-309.65032958984375, -303.609375, -297.56842041015625, -291.5274658203125, -285.48651123046875, -279.445556640625, -273.40460205078125, -267.3636474609375, -261.32269287109375, -255.28173828125, -249.24078369140625, -243.1998291015625, -237.15887451171875, -231.11793518066406, -225.0769805908203, -219.03602600097656, -212.99508666992188, -206.95413208007812, -200.91317749023438, -194.87222290039062, -188.83126831054688, -182.7903289794922, -176.74937438964844, -170.7084197998047, -164.66746520996094, -158.6265106201172, -152.58555603027344, -146.5446014404297, -140.503662109375, -134.46270751953125, -128.4217529296875, -122.38079833984375, -116.33984375, -110.29888916015625, -104.2579345703125, -98.21698760986328, -92.17603302001953, -86.13507843017578, -80.09413146972656, -74.05317687988281, -68.01222229003906, -61.97126770019531, -55.93031692504883, -49.889366149902344, -43.848411560058594, -37.807456970214844, -31.76650619506836, -25.725555419921875, -19.684600830078125, -13.643648147583008, -7.602695465087891, -1.5617427825927734, 4.479209899902344, 10.520162582397461, 16.561115264892578, 22.602066040039062, 28.643020629882812, 34.68397521972656, 40.72492599487305, 46.76587677001953, 52.80683135986328, 58.84778594970703, 64.88873291015625, 70.9296875, 76.97064208984375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 2.0, 8.0, 12.0, 22.0, 27.0, 50.0, 52.0, 85.0, 67.0, 39.0, 35.0, 24.0, 17.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-187.84454345703125, -183.61148071289062, -179.37843322753906, -175.14537048339844, -170.91232299804688, -166.67926025390625, -162.4462127685547, -158.21315002441406, -153.9801025390625, -149.74703979492188, -145.5139923095703, -141.2809295654297, -137.04788208007812, -132.8148193359375, -128.58177185058594, -124.34870910644531, -120.11564636230469, -115.8825912475586, -111.6495361328125, -107.4164810180664, -103.18342590332031, -98.95036315917969, -94.7173080444336, -90.4842529296875, -86.2511978149414, -82.01814270019531, -77.78508758544922, -73.55203247070312, -69.3189697265625, -65.08592224121094, -60.85285949707031, -56.61980438232422, -52.386749267578125, -48.15369415283203, -43.92063903808594, -39.68758010864258, -35.454524993896484, -31.22146987915039, -26.988412857055664, -22.755355834960938, -18.522300720214844, -14.289244651794434, -10.056188583374023, -5.823132514953613, -1.5900764465332031, 2.6429786682128906, 6.876035690307617, 11.109092712402344, 15.342147827148438, 19.57520294189453, 23.808259963989258, 28.041316986083984, 32.27437210083008, 36.50742721557617, 40.74048614501953, 44.973541259765625, 49.20659637451172, 53.43965148925781, 57.672706604003906, 61.905765533447266, 66.13882446289062, 70.37187194824219, 74.60493469238281, 78.8379898071289, 83.071044921875]}, "eval/loss": 3.480835437774658, "eval/wer": 0.7460729869099564, "eval/runtime": 649.7344, "eval/samples_per_second": 4.066, "eval/steps_per_second": 0.509} \ No newline at end of file +{"train/loss": 1.5259, "train/learning_rate": 2.2961971830985914e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 35889, "_timestamp": 1648177233, "_step": 6003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 10.0, 24.0, 21.0, 26.0, 34.0, 36.0, 31.0, 33.0, 36.0, 44.0, 44.0, 43.0, 57.0, 59.0, 71.0, 49.0, 54.0, 48.0, 52.0, 43.0, 36.0, 27.0, 27.0, 17.0, 11.0, 11.0, 13.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5392951965332, -45.22349548339844, -43.90769958496094, -42.59189987182617, -41.276100158691406, -39.96030044555664, -38.644500732421875, -37.328704833984375, -36.01290512084961, -34.697105407714844, -33.381309509277344, -32.06550979614258, -30.749710083007812, -29.433910369873047, -28.118112564086914, -26.80231475830078, -25.486515045166016, -24.17071533203125, -22.854917526245117, -21.539119720458984, -20.22332000732422, -18.907520294189453, -17.59172248840332, -16.275924682617188, -14.960124969482422, -13.644326210021973, -12.328527450561523, -11.012728691101074, -9.696929931640625, -8.381131172180176, -7.065332412719727, -5.749533653259277, -4.4337310791015625, -3.1179323196411133, -1.802133560180664, -0.48633480072021484, 0.8294639587402344, 2.1452627182006836, 3.461061477661133, 4.776860237121582, 6.092658996582031, 7.4084577560424805, 8.72425651550293, 10.040055274963379, 11.355854034423828, 12.671652793884277, 13.987451553344727, 15.303250312805176, 16.619049072265625, 17.93484878540039, 19.250646591186523, 20.566444396972656, 21.882244110107422, 23.198043823242188, 24.51384162902832, 25.829639434814453, 27.14543914794922, 28.461238861083984, 29.777036666870117, 31.09283447265625, 32.408634185791016, 33.72443389892578, 35.04022979736328, 36.35602951049805, 37.67182922363281]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 10.0, 8.0, 9.0, 13.0, 11.0, 13.0, 24.0, 18.0, 18.0, 28.0, 32.0, 24.0, 27.0, 34.0, 29.0, 37.0, 32.0, 31.0, 41.0, 36.0, 35.0, 37.0, 44.0, 35.0, 36.0, 30.0, 24.0, 32.0, 38.0, 27.0, 17.0, 21.0, 15.0, 19.0, 21.0, 17.0, 16.0, 8.0, 14.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.92849349975586, -34.91211700439453, -33.89574432373047, -32.87936782836914, -31.862993240356445, -30.84661865234375, -29.830244064331055, -28.81386947631836, -27.79749298095703, -26.781118392944336, -25.76474380493164, -24.748367309570312, -23.731992721557617, -22.715618133544922, -21.699243545532227, -20.68286895751953, -19.666494369506836, -18.65011978149414, -17.633745193481445, -16.61737060546875, -15.600994110107422, -14.584619522094727, -13.568244934082031, -12.551870346069336, -11.535494804382324, -10.519120216369629, -9.502744674682617, -8.486370086669922, -7.469995021820068, -6.453619956970215, -5.4372453689575195, -4.420870304107666, -3.4044952392578125, -2.388120174407959, -1.3717453479766846, -0.35537052154541016, 0.6610045433044434, 1.6773796081542969, 2.693754196166992, 3.7101292610168457, 4.726504325866699, 5.742879390716553, 6.759254455566406, 7.775629043579102, 8.792003631591797, 9.808379173278809, 10.824753761291504, 11.841129302978516, 12.857503890991211, 13.873878479003906, 14.890254020690918, 15.906628608703613, 16.923004150390625, 17.93937873840332, 18.955753326416016, 19.97212791442871, 20.988502502441406, 22.0048770904541, 23.021251678466797, 24.037628173828125, 25.05400276184082, 26.070377349853516, 27.08675193786621, 28.103126525878906, 29.119503021240234]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 13.0, 23.0, 28.0, 39.0, 68.0, 87.0, 151.0, 199.0, 392.0, 600.0, 971.0, 1564.0, 2549.0, 4282.0, 7320.0, 12767.0, 21970.0, 38543.0, 67608.0, 118559.0, 210006.0, 359328.0, 564308.0, 735761.0, 717348.0, 535014.0, 337380.0, 197141.0, 111849.0, 63421.0, 35742.0, 20374.0, 11778.0, 6864.0, 3986.0, 2525.0, 1416.0, 814.0, 528.0, 347.0, 214.0, 123.0, 101.0, 55.0, 36.0, 29.0, 17.0, 10.0, 13.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-37.28125, -36.076171875, -34.87109375, -33.666015625, -32.4609375, -31.255859375, -30.05078125, -28.845703125, -27.640625, -26.435546875, -25.23046875, -24.025390625, -22.8203125, -21.615234375, -20.41015625, -19.205078125, -18.0, -16.794921875, -15.58984375, -14.384765625, -13.1796875, -11.974609375, -10.76953125, -9.564453125, -8.359375, -7.154296875, -5.94921875, -4.744140625, -3.5390625, -2.333984375, -1.12890625, 0.076171875, 1.28125, 2.486328125, 3.69140625, 4.896484375, 6.1015625, 7.306640625, 8.51171875, 9.716796875, 10.921875, 12.126953125, 13.33203125, 14.537109375, 15.7421875, 16.947265625, 18.15234375, 19.357421875, 20.5625, 21.767578125, 22.97265625, 24.177734375, 25.3828125, 26.587890625, 27.79296875, 28.998046875, 30.203125, 31.408203125, 32.61328125, 33.818359375, 35.0234375, 36.228515625, 37.43359375, 38.638671875, 39.84375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 11.0, 8.0, 8.0, 17.0, 15.0, 14.0, 27.0, 33.0, 23.0, 31.0, 29.0, 40.0, 38.0, 31.0, 30.0, 49.0, 48.0, 42.0, 48.0, 42.0, 42.0, 46.0, 38.0, 34.0, 38.0, 31.0, 28.0, 38.0, 24.0, 11.0, 15.0, 13.0, 18.0, 9.0, 6.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.578125, -28.610107421875, -27.64208984375, -26.674072265625, -25.7060546875, -24.738037109375, -23.77001953125, -22.802001953125, -21.833984375, -20.865966796875, -19.89794921875, -18.929931640625, -17.9619140625, -16.993896484375, -16.02587890625, -15.057861328125, -14.08984375, -13.121826171875, -12.15380859375, -11.185791015625, -10.2177734375, -9.249755859375, -8.28173828125, -7.313720703125, -6.345703125, -5.377685546875, -4.40966796875, -3.441650390625, -2.4736328125, -1.505615234375, -0.53759765625, 0.430419921875, 1.3984375, 2.366455078125, 3.33447265625, 4.302490234375, 5.2705078125, 6.238525390625, 7.20654296875, 8.174560546875, 9.142578125, 10.110595703125, 11.07861328125, 12.046630859375, 13.0146484375, 13.982666015625, 14.95068359375, 15.918701171875, 16.88671875, 17.854736328125, 18.82275390625, 19.790771484375, 20.7587890625, 21.726806640625, 22.69482421875, 23.662841796875, 24.630859375, 25.598876953125, 26.56689453125, 27.534912109375, 28.5029296875, 29.470947265625, 30.43896484375, 31.406982421875, 32.375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 16.0, 25.0, 38.0, 54.0, 88.0, 147.0, 237.0, 375.0, 583.0, 858.0, 1350.0, 2068.0, 3396.0, 5438.0, 8509.0, 14069.0, 22561.0, 35748.0, 57695.0, 90357.0, 139314.0, 208792.0, 301956.0, 410187.0, 508323.0, 549811.0, 510077.0, 412971.0, 306665.0, 212500.0, 141608.0, 91777.0, 58671.0, 36714.0, 22986.0, 14406.0, 8989.0, 5503.0, 3438.0, 2149.0, 1416.0, 847.0, 588.0, 345.0, 242.0, 137.0, 108.0, 49.0, 31.0, 16.0, 18.0, 13.0, 9.0, 2.0, 2.0, 6.0], "bins": [-28.59375, -27.74072265625, -26.8876953125, -26.03466796875, -25.181640625, -24.32861328125, -23.4755859375, -22.62255859375, -21.76953125, -20.91650390625, -20.0634765625, -19.21044921875, -18.357421875, -17.50439453125, -16.6513671875, -15.79833984375, -14.9453125, -14.09228515625, -13.2392578125, -12.38623046875, -11.533203125, -10.68017578125, -9.8271484375, -8.97412109375, -8.12109375, -7.26806640625, -6.4150390625, -5.56201171875, -4.708984375, -3.85595703125, -3.0029296875, -2.14990234375, -1.296875, -0.44384765625, 0.4091796875, 1.26220703125, 2.115234375, 2.96826171875, 3.8212890625, 4.67431640625, 5.52734375, 6.38037109375, 7.2333984375, 8.08642578125, 8.939453125, 9.79248046875, 10.6455078125, 11.49853515625, 12.3515625, 13.20458984375, 14.0576171875, 14.91064453125, 15.763671875, 16.61669921875, 17.4697265625, 18.32275390625, 19.17578125, 20.02880859375, 20.8818359375, 21.73486328125, 22.587890625, 23.44091796875, 24.2939453125, 25.14697265625, 26.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 17.0, 23.0, 27.0, 22.0, 31.0, 38.0, 68.0, 75.0, 75.0, 89.0, 105.0, 133.0, 168.0, 166.0, 183.0, 215.0, 194.0, 205.0, 232.0, 235.0, 205.0, 182.0, 231.0, 186.0, 146.0, 140.0, 99.0, 93.0, 96.0, 71.0, 38.0, 53.0, 40.0, 37.0, 30.0, 19.0, 18.0, 20.0, 15.0, 10.0, 7.0, 2.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.609375, -12.203857421875, -11.79833984375, -11.392822265625, -10.9873046875, -10.581787109375, -10.17626953125, -9.770751953125, -9.365234375, -8.959716796875, -8.55419921875, -8.148681640625, -7.7431640625, -7.337646484375, -6.93212890625, -6.526611328125, -6.12109375, -5.715576171875, -5.31005859375, -4.904541015625, -4.4990234375, -4.093505859375, -3.68798828125, -3.282470703125, -2.876953125, -2.471435546875, -2.06591796875, -1.660400390625, -1.2548828125, -0.849365234375, -0.44384765625, -0.038330078125, 0.3671875, 0.772705078125, 1.17822265625, 1.583740234375, 1.9892578125, 2.394775390625, 2.80029296875, 3.205810546875, 3.611328125, 4.016845703125, 4.42236328125, 4.827880859375, 5.2333984375, 5.638916015625, 6.04443359375, 6.449951171875, 6.85546875, 7.260986328125, 7.66650390625, 8.072021484375, 8.4775390625, 8.883056640625, 9.28857421875, 9.694091796875, 10.099609375, 10.505126953125, 10.91064453125, 11.316162109375, 11.7216796875, 12.127197265625, 12.53271484375, 12.938232421875, 13.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 17.0, 5.0, 16.0, 21.0, 10.0, 31.0, 21.0, 28.0, 34.0, 32.0, 52.0, 46.0, 51.0, 55.0, 57.0, 55.0, 46.0, 56.0, 49.0, 46.0, 30.0, 29.0, 47.0, 26.0, 26.0, 21.0, 20.0, 11.0, 8.0, 8.0, 11.0, 4.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.374835968017578, -28.21469497680664, -27.054553985595703, -25.894411087036133, -24.734270095825195, -23.574129104614258, -22.413986206054688, -21.25384521484375, -20.093704223632812, -18.933563232421875, -17.773422241210938, -16.613279342651367, -15.45313835144043, -14.292997360229492, -13.132855415344238, -11.972713470458984, -10.812572479248047, -9.65243148803711, -8.492289543151855, -7.33214807510376, -6.172006607055664, -5.011865139007568, -3.8517236709594727, -2.6915817260742188, -1.5314407348632812, -0.37129926681518555, 0.7888422012329102, 1.9489836692810059, 3.1091251373291016, 4.269266605377197, 5.429408073425293, 6.589550018310547, 7.749687194824219, 8.909828186035156, 10.06997013092041, 11.230112075805664, 12.390253067016602, 13.550394058227539, 14.710536003112793, 15.870677947998047, 17.030818939208984, 18.190959930419922, 19.35110092163086, 20.51124382019043, 21.671384811401367, 22.831525802612305, 23.991668701171875, 25.151809692382812, 26.31195068359375, 27.472091674804688, 28.632232666015625, 29.792375564575195, 30.952516555786133, 32.1126594543457, 33.27280044555664, 34.43294143676758, 35.593082427978516, 36.75322341918945, 37.91336441040039, 39.07350540161133, 40.23365020751953, 41.39379119873047, 42.553932189941406, 43.714073181152344, 44.87421417236328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 13.0, 18.0, 11.0, 16.0, 13.0, 16.0, 12.0, 19.0, 33.0, 26.0, 26.0, 23.0, 27.0, 37.0, 37.0, 37.0, 32.0, 32.0, 56.0, 31.0, 32.0, 42.0, 40.0, 34.0, 28.0, 36.0, 31.0, 21.0, 25.0, 20.0, 24.0, 30.0, 12.0, 18.0, 18.0, 5.0, 11.0, 8.0, 5.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.3676700592041, -26.449026107788086, -25.530384063720703, -24.611740112304688, -23.693098068237305, -22.77445411682129, -21.855812072753906, -20.93716812133789, -20.018524169921875, -19.09988021850586, -18.181238174438477, -17.26259422302246, -16.343952178955078, -15.425308227539062, -14.506665229797363, -13.588022232055664, -12.669379234313965, -11.750736236572266, -10.832093238830566, -9.913450241088867, -8.994806289672852, -8.076163291931152, -7.157520294189453, -6.238876819610596, -5.3202338218688965, -4.401590824127197, -3.48294734954834, -2.5643043518066406, -1.6456611156463623, -0.727017879486084, 0.19162511825561523, 1.1102685928344727, 2.028911590576172, 2.94755482673645, 3.8661980628967285, 4.784841060638428, 5.703484535217285, 6.622127532958984, 7.540770530700684, 8.459413528442383, 9.378057479858398, 10.296700477600098, 11.215343475341797, 12.133987426757812, 13.052630424499512, 13.971273422241211, 14.88991641998291, 15.80855941772461, 16.727203369140625, 17.64584732055664, 18.564489364624023, 19.48313331604004, 20.401775360107422, 21.320419311523438, 22.239063262939453, 23.157705307006836, 24.07634735107422, 24.994991302490234, 25.913633346557617, 26.832277297973633, 27.750919342041016, 28.66956329345703, 29.588207244873047, 30.50684928894043, 31.425493240356445]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 16.0, 18.0, 30.0, 37.0, 61.0, 95.0, 133.0, 185.0, 319.0, 417.0, 681.0, 1029.0, 1475.0, 2118.0, 3288.0, 5091.0, 7640.0, 11643.0, 16941.0, 25128.0, 36685.0, 53279.0, 74233.0, 98616.0, 119604.0, 128697.0, 120111.0, 98979.0, 74500.0, 53425.0, 37122.0, 25280.0, 17120.0, 11449.0, 7471.0, 5285.0, 3457.0, 2270.0, 1536.0, 1021.0, 668.0, 452.0, 308.0, 208.0, 155.0, 86.0, 64.0, 47.0, 15.0, 27.0, 17.0, 6.0, 9.0, 2.0, 6.0, 0.0, 2.0, 3.0], "bins": [-25.65625, -24.842041015625, -24.02783203125, -23.213623046875, -22.3994140625, -21.585205078125, -20.77099609375, -19.956787109375, -19.142578125, -18.328369140625, -17.51416015625, -16.699951171875, -15.8857421875, -15.071533203125, -14.25732421875, -13.443115234375, -12.62890625, -11.814697265625, -11.00048828125, -10.186279296875, -9.3720703125, -8.557861328125, -7.74365234375, -6.929443359375, -6.115234375, -5.301025390625, -4.48681640625, -3.672607421875, -2.8583984375, -2.044189453125, -1.22998046875, -0.415771484375, 0.3984375, 1.212646484375, 2.02685546875, 2.841064453125, 3.6552734375, 4.469482421875, 5.28369140625, 6.097900390625, 6.912109375, 7.726318359375, 8.54052734375, 9.354736328125, 10.1689453125, 10.983154296875, 11.79736328125, 12.611572265625, 13.42578125, 14.239990234375, 15.05419921875, 15.868408203125, 16.6826171875, 17.496826171875, 18.31103515625, 19.125244140625, 19.939453125, 20.753662109375, 21.56787109375, 22.382080078125, 23.1962890625, 24.010498046875, 24.82470703125, 25.638916015625, 26.453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 5.0, 9.0, 11.0, 15.0, 16.0, 12.0, 16.0, 14.0, 27.0, 33.0, 23.0, 26.0, 29.0, 33.0, 29.0, 34.0, 42.0, 38.0, 49.0, 31.0, 45.0, 32.0, 34.0, 36.0, 38.0, 24.0, 31.0, 36.0, 30.0, 24.0, 24.0, 19.0, 14.0, 18.0, 15.0, 19.0, 16.0, 11.0, 7.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.0625, -27.177978515625, -26.29345703125, -25.408935546875, -24.5244140625, -23.639892578125, -22.75537109375, -21.870849609375, -20.986328125, -20.101806640625, -19.21728515625, -18.332763671875, -17.4482421875, -16.563720703125, -15.67919921875, -14.794677734375, -13.91015625, -13.025634765625, -12.14111328125, -11.256591796875, -10.3720703125, -9.487548828125, -8.60302734375, -7.718505859375, -6.833984375, -5.949462890625, -5.06494140625, -4.180419921875, -3.2958984375, -2.411376953125, -1.52685546875, -0.642333984375, 0.2421875, 1.126708984375, 2.01123046875, 2.895751953125, 3.7802734375, 4.664794921875, 5.54931640625, 6.433837890625, 7.318359375, 8.202880859375, 9.08740234375, 9.971923828125, 10.8564453125, 11.740966796875, 12.62548828125, 13.510009765625, 14.39453125, 15.279052734375, 16.16357421875, 17.048095703125, 17.9326171875, 18.817138671875, 19.70166015625, 20.586181640625, 21.470703125, 22.355224609375, 23.23974609375, 24.124267578125, 25.0087890625, 25.893310546875, 26.77783203125, 27.662353515625, 28.546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 13.0, 25.0, 36.0, 65.0, 89.0, 145.0, 214.0, 307.0, 448.0, 745.0, 1208.0, 2043.0, 3748.0, 6715.0, 12500.0, 25142.0, 51449.0, 105246.0, 194818.0, 252996.0, 188883.0, 100853.0, 49291.0, 24197.0, 12158.0, 6384.0, 3509.0, 2032.0, 1201.0, 743.0, 457.0, 279.0, 188.0, 138.0, 64.0, 59.0, 31.0, 35.0, 19.0, 12.0, 12.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0, -41.5888671875, -40.177734375, -38.7666015625, -37.35546875, -35.9443359375, -34.533203125, -33.1220703125, -31.7109375, -30.2998046875, -28.888671875, -27.4775390625, -26.06640625, -24.6552734375, -23.244140625, -21.8330078125, -20.421875, -19.0107421875, -17.599609375, -16.1884765625, -14.77734375, -13.3662109375, -11.955078125, -10.5439453125, -9.1328125, -7.7216796875, -6.310546875, -4.8994140625, -3.48828125, -2.0771484375, -0.666015625, 0.7451171875, 2.15625, 3.5673828125, 4.978515625, 6.3896484375, 7.80078125, 9.2119140625, 10.623046875, 12.0341796875, 13.4453125, 14.8564453125, 16.267578125, 17.6787109375, 19.08984375, 20.5009765625, 21.912109375, 23.3232421875, 24.734375, 26.1455078125, 27.556640625, 28.9677734375, 30.37890625, 31.7900390625, 33.201171875, 34.6123046875, 36.0234375, 37.4345703125, 38.845703125, 40.2568359375, 41.66796875, 43.0791015625, 44.490234375, 45.9013671875, 47.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 6.0, 13.0, 18.0, 17.0, 20.0, 26.0, 22.0, 26.0, 33.0, 26.0, 33.0, 31.0, 28.0, 47.0, 43.0, 50.0, 47.0, 45.0, 42.0, 47.0, 46.0, 28.0, 38.0, 37.0, 27.0, 25.0, 24.0, 21.0, 21.0, 19.0, 13.0, 16.0, 7.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-24.375, -23.670654296875, -22.96630859375, -22.261962890625, -21.5576171875, -20.853271484375, -20.14892578125, -19.444580078125, -18.740234375, -18.035888671875, -17.33154296875, -16.627197265625, -15.9228515625, -15.218505859375, -14.51416015625, -13.809814453125, -13.10546875, -12.401123046875, -11.69677734375, -10.992431640625, -10.2880859375, -9.583740234375, -8.87939453125, -8.175048828125, -7.470703125, -6.766357421875, -6.06201171875, -5.357666015625, -4.6533203125, -3.948974609375, -3.24462890625, -2.540283203125, -1.8359375, -1.131591796875, -0.42724609375, 0.277099609375, 0.9814453125, 1.685791015625, 2.39013671875, 3.094482421875, 3.798828125, 4.503173828125, 5.20751953125, 5.911865234375, 6.6162109375, 7.320556640625, 8.02490234375, 8.729248046875, 9.43359375, 10.137939453125, 10.84228515625, 11.546630859375, 12.2509765625, 12.955322265625, 13.65966796875, 14.364013671875, 15.068359375, 15.772705078125, 16.47705078125, 17.181396484375, 17.8857421875, 18.590087890625, 19.29443359375, 19.998779296875, 20.703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 18.0, 23.0, 24.0, 29.0, 49.0, 69.0, 87.0, 141.0, 167.0, 284.0, 365.0, 551.0, 923.0, 1576.0, 2689.0, 5016.0, 9736.0, 20406.0, 48030.0, 114481.0, 241595.0, 295467.0, 171140.0, 73998.0, 31391.0, 14216.0, 7054.0, 3631.0, 2024.0, 1202.0, 731.0, 442.0, 295.0, 213.0, 161.0, 98.0, 62.0, 55.0, 31.0, 26.0, 15.0, 10.0, 6.0, 9.0, 1.0, 1.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.71875, -20.0556640625, -19.392578125, -18.7294921875, -18.06640625, -17.4033203125, -16.740234375, -16.0771484375, -15.4140625, -14.7509765625, -14.087890625, -13.4248046875, -12.76171875, -12.0986328125, -11.435546875, -10.7724609375, -10.109375, -9.4462890625, -8.783203125, -8.1201171875, -7.45703125, -6.7939453125, -6.130859375, -5.4677734375, -4.8046875, -4.1416015625, -3.478515625, -2.8154296875, -2.15234375, -1.4892578125, -0.826171875, -0.1630859375, 0.5, 1.1630859375, 1.826171875, 2.4892578125, 3.15234375, 3.8154296875, 4.478515625, 5.1416015625, 5.8046875, 6.4677734375, 7.130859375, 7.7939453125, 8.45703125, 9.1201171875, 9.783203125, 10.4462890625, 11.109375, 11.7724609375, 12.435546875, 13.0986328125, 13.76171875, 14.4248046875, 15.087890625, 15.7509765625, 16.4140625, 17.0771484375, 17.740234375, 18.4033203125, 19.06640625, 19.7294921875, 20.392578125, 21.0556640625, 21.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 7.0, 15.0, 11.0, 23.0, 28.0, 45.0, 74.0, 68.0, 102.0, 125.0, 98.0, 106.0, 97.0, 58.0, 32.0, 28.0, 27.0, 10.0, 10.0, 11.0, 4.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038852691650390625, -0.0037883222103118896, -0.003691375255584717, -0.003594428300857544, -0.003497481346130371, -0.0034005343914031982, -0.0033035874366760254, -0.0032066404819488525, -0.0031096935272216797, -0.003012746572494507, -0.002915799617767334, -0.002818852663040161, -0.0027219057083129883, -0.0026249587535858154, -0.0025280117988586426, -0.0024310648441314697, -0.002334117889404297, -0.002237170934677124, -0.002140223979949951, -0.0020432770252227783, -0.0019463300704956055, -0.0018493831157684326, -0.0017524361610412598, -0.001655489206314087, -0.001558542251586914, -0.0014615952968597412, -0.0013646483421325684, -0.0012677013874053955, -0.0011707544326782227, -0.0010738074779510498, -0.000976860523223877, -0.0008799135684967041, -0.0007829666137695312, -0.0006860196590423584, -0.0005890727043151855, -0.0004921257495880127, -0.00039517879486083984, -0.000298231840133667, -0.00020128488540649414, -0.00010433793067932129, -7.3909759521484375e-06, 8.955597877502441e-05, 0.00018650293350219727, 0.0002834498882293701, 0.00038039684295654297, 0.0004773437976837158, 0.0005742907524108887, 0.0006712377071380615, 0.0007681846618652344, 0.0008651316165924072, 0.0009620785713195801, 0.001059025526046753, 0.0011559724807739258, 0.0012529194355010986, 0.0013498663902282715, 0.0014468133449554443, 0.0015437602996826172, 0.00164070725440979, 0.0017376542091369629, 0.0018346011638641357, 0.0019315481185913086, 0.0020284950733184814, 0.0021254420280456543, 0.002222388982772827, 0.0023193359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 6.0, 10.0, 12.0, 18.0, 25.0, 38.0, 48.0, 52.0, 73.0, 102.0, 144.0, 172.0, 257.0, 353.0, 499.0, 722.0, 1144.0, 1989.0, 3318.0, 7076.0, 16613.0, 45369.0, 130809.0, 299046.0, 311374.0, 143995.0, 49906.0, 18224.0, 7645.0, 3665.0, 1966.0, 1183.0, 781.0, 499.0, 368.0, 291.0, 210.0, 139.0, 105.0, 77.0, 55.0, 46.0, 41.0, 23.0, 16.0, 11.0, 11.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.57666015625, -30.5595703125, -29.54248046875, -28.525390625, -27.50830078125, -26.4912109375, -25.47412109375, -24.45703125, -23.43994140625, -22.4228515625, -21.40576171875, -20.388671875, -19.37158203125, -18.3544921875, -17.33740234375, -16.3203125, -15.30322265625, -14.2861328125, -13.26904296875, -12.251953125, -11.23486328125, -10.2177734375, -9.20068359375, -8.18359375, -7.16650390625, -6.1494140625, -5.13232421875, -4.115234375, -3.09814453125, -2.0810546875, -1.06396484375, -0.046875, 0.97021484375, 1.9873046875, 3.00439453125, 4.021484375, 5.03857421875, 6.0556640625, 7.07275390625, 8.08984375, 9.10693359375, 10.1240234375, 11.14111328125, 12.158203125, 13.17529296875, 14.1923828125, 15.20947265625, 16.2265625, 17.24365234375, 18.2607421875, 19.27783203125, 20.294921875, 21.31201171875, 22.3291015625, 23.34619140625, 24.36328125, 25.38037109375, 26.3974609375, 27.41455078125, 28.431640625, 29.44873046875, 30.4658203125, 31.48291015625, 32.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 18.0, 19.0, 19.0, 25.0, 42.0, 37.0, 63.0, 63.0, 82.0, 66.0, 82.0, 90.0, 70.0, 54.0, 55.0, 49.0, 35.0, 30.0, 19.0, 19.0, 16.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.9921875, -9.7281494140625, -9.464111328125, -9.2000732421875, -8.93603515625, -8.6719970703125, -8.407958984375, -8.1439208984375, -7.8798828125, -7.6158447265625, -7.351806640625, -7.0877685546875, -6.82373046875, -6.5596923828125, -6.295654296875, -6.0316162109375, -5.767578125, -5.5035400390625, -5.239501953125, -4.9754638671875, -4.71142578125, -4.4473876953125, -4.183349609375, -3.9193115234375, -3.6552734375, -3.3912353515625, -3.127197265625, -2.8631591796875, -2.59912109375, -2.3350830078125, -2.071044921875, -1.8070068359375, -1.54296875, -1.2789306640625, -1.014892578125, -0.7508544921875, -0.48681640625, -0.2227783203125, 0.041259765625, 0.3052978515625, 0.5693359375, 0.8333740234375, 1.097412109375, 1.3614501953125, 1.62548828125, 1.8895263671875, 2.153564453125, 2.4176025390625, 2.681640625, 2.9456787109375, 3.209716796875, 3.4737548828125, 3.73779296875, 4.0018310546875, 4.265869140625, 4.5299072265625, 4.7939453125, 5.0579833984375, 5.322021484375, 5.5860595703125, 5.85009765625, 6.1141357421875, 6.378173828125, 6.6422119140625, 6.90625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 11.0, 20.0, 21.0, 8.0, 19.0, 32.0, 24.0, 38.0, 39.0, 47.0, 42.0, 50.0, 48.0, 41.0, 44.0, 44.0, 59.0, 47.0, 42.0, 38.0, 48.0, 36.0, 31.0, 26.0, 13.0, 17.0, 18.0, 17.0, 12.0, 6.0, 8.0, 10.0, 1.0, 4.0, 2.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.283079147338867, -24.300622940063477, -23.31816864013672, -22.335712432861328, -21.35325813293457, -20.37080192565918, -19.388347625732422, -18.40589141845703, -17.42343521118164, -16.44097900390625, -15.458524703979492, -14.476068496704102, -13.493614196777344, -12.511157989501953, -11.528702735900879, -10.546247482299805, -9.563793182373047, -8.581337928771973, -7.598882675170898, -6.616426944732666, -5.633971691131592, -4.651516437530518, -3.669060707092285, -2.686605453491211, -1.7041501998901367, -0.721694827079773, 0.2607605457305908, 1.2432160377502441, 2.2256712913513184, 3.2081265449523926, 4.190582275390625, 5.173037528991699, 6.155494689941406, 7.1379499435424805, 8.120405197143555, 9.102861404418945, 10.085315704345703, 11.067771911621094, 12.050227165222168, 13.032682418823242, 14.015137672424316, 14.99759292602539, 15.980048179626465, 16.96250343322754, 17.94495964050293, 18.927413940429688, 19.909870147705078, 20.89232635498047, 21.874780654907227, 22.857236862182617, 23.839691162109375, 24.822147369384766, 25.804601669311523, 26.787057876586914, 27.769512176513672, 28.751968383789062, 29.734424591064453, 30.716880798339844, 31.6993350982666, 32.68178939819336, 33.66424560546875, 34.64670181274414, 35.62915802001953, 36.611610412597656, 37.59406661987305]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 4.0, 13.0, 12.0, 19.0, 13.0, 12.0, 17.0, 17.0, 22.0, 24.0, 21.0, 29.0, 30.0, 33.0, 31.0, 32.0, 39.0, 42.0, 35.0, 32.0, 40.0, 28.0, 34.0, 39.0, 33.0, 41.0, 33.0, 30.0, 25.0, 24.0, 29.0, 22.0, 18.0, 22.0, 19.0, 12.0, 11.0, 12.0, 7.0, 10.0, 7.0, 5.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.850452423095703, -25.021982192993164, -24.193513870239258, -23.36504364013672, -22.53657341003418, -21.70810317993164, -20.879634857177734, -20.051164627075195, -19.222694396972656, -18.394224166870117, -17.56575584411621, -16.737285614013672, -15.908815383911133, -15.08034610748291, -14.251876831054688, -13.423406600952148, -12.594938278198242, -11.76646900177002, -10.93799877166748, -10.109529495239258, -9.281059265136719, -8.452589988708496, -7.624120712280273, -6.795650959014893, -5.967181205749512, -5.138711452484131, -4.31024169921875, -3.4817724227905273, -2.6533026695251465, -1.8248329162597656, -0.996363639831543, -0.1678938865661621, 0.6605739593505859, 1.4890435934066772, 2.3175132274627686, 3.1459827423095703, 3.974452495574951, 4.802922248840332, 5.631391525268555, 6.4598612785339355, 7.288331031799316, 8.116800308227539, 8.945270538330078, 9.7737398147583, 10.602209091186523, 11.430679321289062, 12.259148597717285, 13.087617874145508, 13.916088104248047, 14.74455738067627, 15.573027610778809, 16.40149688720703, 17.22996711730957, 18.05843734741211, 18.886905670166016, 19.715375900268555, 20.543846130371094, 21.372316360473633, 22.20078468322754, 23.029254913330078, 23.857725143432617, 24.686195373535156, 25.514663696289062, 26.3431339263916, 27.171602249145508]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 10.0, 19.0, 27.0, 38.0, 64.0, 89.0, 127.0, 251.0, 330.0, 528.0, 821.0, 1159.0, 1707.0, 2570.0, 3790.0, 5431.0, 7866.0, 11250.0, 15431.0, 21491.0, 29120.0, 37803.0, 48086.0, 58686.0, 69031.0, 78148.0, 84296.0, 86133.0, 84709.0, 78717.0, 69985.0, 59467.0, 48607.0, 37916.0, 29726.0, 21985.0, 16158.0, 11637.0, 8118.0, 5473.0, 3868.0, 2646.0, 1771.0, 1213.0, 789.0, 492.0, 347.0, 185.0, 160.0, 110.0, 72.0, 46.0, 29.0, 11.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0], "bins": [-16.84375, -16.3095703125, -15.775390625, -15.2412109375, -14.70703125, -14.1728515625, -13.638671875, -13.1044921875, -12.5703125, -12.0361328125, -11.501953125, -10.9677734375, -10.43359375, -9.8994140625, -9.365234375, -8.8310546875, -8.296875, -7.7626953125, -7.228515625, -6.6943359375, -6.16015625, -5.6259765625, -5.091796875, -4.5576171875, -4.0234375, -3.4892578125, -2.955078125, -2.4208984375, -1.88671875, -1.3525390625, -0.818359375, -0.2841796875, 0.25, 0.7841796875, 1.318359375, 1.8525390625, 2.38671875, 2.9208984375, 3.455078125, 3.9892578125, 4.5234375, 5.0576171875, 5.591796875, 6.1259765625, 6.66015625, 7.1943359375, 7.728515625, 8.2626953125, 8.796875, 9.3310546875, 9.865234375, 10.3994140625, 10.93359375, 11.4677734375, 12.001953125, 12.5361328125, 13.0703125, 13.6044921875, 14.138671875, 14.6728515625, 15.20703125, 15.7412109375, 16.275390625, 16.8095703125, 17.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 4.0, 8.0, 16.0, 12.0, 15.0, 21.0, 11.0, 21.0, 22.0, 22.0, 42.0, 23.0, 30.0, 39.0, 44.0, 29.0, 46.0, 37.0, 42.0, 47.0, 30.0, 36.0, 41.0, 27.0, 40.0, 28.0, 36.0, 26.0, 25.0, 24.0, 23.0, 18.0, 17.0, 11.0, 7.0, 5.0, 9.0, 15.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.374267578125, -25.51416015625, -24.654052734375, -23.7939453125, -22.933837890625, -22.07373046875, -21.213623046875, -20.353515625, -19.493408203125, -18.63330078125, -17.773193359375, -16.9130859375, -16.052978515625, -15.19287109375, -14.332763671875, -13.47265625, -12.612548828125, -11.75244140625, -10.892333984375, -10.0322265625, -9.172119140625, -8.31201171875, -7.451904296875, -6.591796875, -5.731689453125, -4.87158203125, -4.011474609375, -3.1513671875, -2.291259765625, -1.43115234375, -0.571044921875, 0.2890625, 1.149169921875, 2.00927734375, 2.869384765625, 3.7294921875, 4.589599609375, 5.44970703125, 6.309814453125, 7.169921875, 8.030029296875, 8.89013671875, 9.750244140625, 10.6103515625, 11.470458984375, 12.33056640625, 13.190673828125, 14.05078125, 14.910888671875, 15.77099609375, 16.631103515625, 17.4912109375, 18.351318359375, 19.21142578125, 20.071533203125, 20.931640625, 21.791748046875, 22.65185546875, 23.511962890625, 24.3720703125, 25.232177734375, 26.09228515625, 26.952392578125, 27.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 5.0, 14.0, 20.0, 24.0, 45.0, 72.0, 101.0, 164.0, 294.0, 464.0, 800.0, 1287.0, 2121.0, 3585.0, 5805.0, 9744.0, 16390.0, 26561.0, 42116.0, 64327.0, 90918.0, 117595.0, 134175.0, 135826.0, 119205.0, 94217.0, 66931.0, 44521.0, 27834.0, 17406.0, 10539.0, 6174.0, 3755.0, 2148.0, 1284.0, 807.0, 459.0, 307.0, 174.0, 134.0, 87.0, 50.0, 27.0, 13.0, 15.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-36.53125, -35.45849609375, -34.3857421875, -33.31298828125, -32.240234375, -31.16748046875, -30.0947265625, -29.02197265625, -27.94921875, -26.87646484375, -25.8037109375, -24.73095703125, -23.658203125, -22.58544921875, -21.5126953125, -20.43994140625, -19.3671875, -18.29443359375, -17.2216796875, -16.14892578125, -15.076171875, -14.00341796875, -12.9306640625, -11.85791015625, -10.78515625, -9.71240234375, -8.6396484375, -7.56689453125, -6.494140625, -5.42138671875, -4.3486328125, -3.27587890625, -2.203125, -1.13037109375, -0.0576171875, 1.01513671875, 2.087890625, 3.16064453125, 4.2333984375, 5.30615234375, 6.37890625, 7.45166015625, 8.5244140625, 9.59716796875, 10.669921875, 11.74267578125, 12.8154296875, 13.88818359375, 14.9609375, 16.03369140625, 17.1064453125, 18.17919921875, 19.251953125, 20.32470703125, 21.3974609375, 22.47021484375, 23.54296875, 24.61572265625, 25.6884765625, 26.76123046875, 27.833984375, 28.90673828125, 29.9794921875, 31.05224609375, 32.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 9.0, 11.0, 15.0, 12.0, 14.0, 31.0, 21.0, 29.0, 21.0, 26.0, 39.0, 39.0, 25.0, 28.0, 38.0, 39.0, 40.0, 43.0, 37.0, 39.0, 39.0, 45.0, 29.0, 32.0, 33.0, 41.0, 18.0, 27.0, 31.0, 20.0, 17.0, 14.0, 10.0, 10.0, 12.0, 11.0, 6.0, 6.0, 5.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.625, -16.036865234375, -15.44873046875, -14.860595703125, -14.2724609375, -13.684326171875, -13.09619140625, -12.508056640625, -11.919921875, -11.331787109375, -10.74365234375, -10.155517578125, -9.5673828125, -8.979248046875, -8.39111328125, -7.802978515625, -7.21484375, -6.626708984375, -6.03857421875, -5.450439453125, -4.8623046875, -4.274169921875, -3.68603515625, -3.097900390625, -2.509765625, -1.921630859375, -1.33349609375, -0.745361328125, -0.1572265625, 0.430908203125, 1.01904296875, 1.607177734375, 2.1953125, 2.783447265625, 3.37158203125, 3.959716796875, 4.5478515625, 5.135986328125, 5.72412109375, 6.312255859375, 6.900390625, 7.488525390625, 8.07666015625, 8.664794921875, 9.2529296875, 9.841064453125, 10.42919921875, 11.017333984375, 11.60546875, 12.193603515625, 12.78173828125, 13.369873046875, 13.9580078125, 14.546142578125, 15.13427734375, 15.722412109375, 16.310546875, 16.898681640625, 17.48681640625, 18.074951171875, 18.6630859375, 19.251220703125, 19.83935546875, 20.427490234375, 21.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 8.0, 11.0, 21.0, 21.0, 36.0, 41.0, 51.0, 61.0, 110.0, 132.0, 251.0, 323.0, 489.0, 751.0, 1273.0, 2253.0, 3677.0, 6886.0, 12842.0, 23779.0, 44657.0, 78862.0, 125698.0, 170939.0, 182994.0, 152709.0, 103767.0, 61278.0, 34083.0, 18077.0, 9676.0, 5200.0, 2946.0, 1643.0, 955.0, 664.0, 415.0, 288.0, 188.0, 136.0, 89.0, 83.0, 50.0, 34.0, 37.0, 20.0, 21.0, 7.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.703125, -11.3616943359375, -11.020263671875, -10.6788330078125, -10.33740234375, -9.9959716796875, -9.654541015625, -9.3131103515625, -8.9716796875, -8.6302490234375, -8.288818359375, -7.9473876953125, -7.60595703125, -7.2645263671875, -6.923095703125, -6.5816650390625, -6.240234375, -5.8988037109375, -5.557373046875, -5.2159423828125, -4.87451171875, -4.5330810546875, -4.191650390625, -3.8502197265625, -3.5087890625, -3.1673583984375, -2.825927734375, -2.4844970703125, -2.14306640625, -1.8016357421875, -1.460205078125, -1.1187744140625, -0.77734375, -0.4359130859375, -0.094482421875, 0.2469482421875, 0.58837890625, 0.9298095703125, 1.271240234375, 1.6126708984375, 1.9541015625, 2.2955322265625, 2.636962890625, 2.9783935546875, 3.31982421875, 3.6612548828125, 4.002685546875, 4.3441162109375, 4.685546875, 5.0269775390625, 5.368408203125, 5.7098388671875, 6.05126953125, 6.3927001953125, 6.734130859375, 7.0755615234375, 7.4169921875, 7.7584228515625, 8.099853515625, 8.4412841796875, 8.78271484375, 9.1241455078125, 9.465576171875, 9.8070068359375, 10.1484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 6.0, 14.0, 13.0, 16.0, 37.0, 33.0, 33.0, 40.0, 54.0, 51.0, 46.0, 43.0, 70.0, 51.0, 61.0, 47.0, 49.0, 45.0, 49.0, 47.0, 31.0, 34.0, 18.0, 15.0, 13.0, 7.0, 4.0, 13.0, 4.0, 5.0, 3.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010766983032226562, -0.0010413676500320435, -0.0010060369968414307, -0.0009707063436508179, -0.0009353756904602051, -0.0009000450372695923, -0.0008647143840789795, -0.0008293837308883667, -0.0007940530776977539, -0.0007587224245071411, -0.0007233917713165283, -0.0006880611181259155, -0.0006527304649353027, -0.0006173998117446899, -0.0005820691585540771, -0.0005467385053634644, -0.0005114078521728516, -0.00047607719898223877, -0.000440746545791626, -0.0004054158926010132, -0.0003700852394104004, -0.0003347545862197876, -0.0002994239330291748, -0.000264093279838562, -0.00022876262664794922, -0.00019343197345733643, -0.00015810132026672363, -0.00012277066707611084, -8.744001388549805e-05, -5.2109360694885254e-05, -1.677870750427246e-05, 1.8551945686340332e-05, 5.3882598876953125e-05, 8.921325206756592e-05, 0.0001245439052581787, 0.0001598745584487915, 0.0001952052116394043, 0.0002305358648300171, 0.0002658665180206299, 0.0003011971712112427, 0.00033652782440185547, 0.00037185847759246826, 0.00040718913078308105, 0.00044251978397369385, 0.00047785043716430664, 0.0005131810903549194, 0.0005485117435455322, 0.000583842396736145, 0.0006191730499267578, 0.0006545037031173706, 0.0006898343563079834, 0.0007251650094985962, 0.000760495662689209, 0.0007958263158798218, 0.0008311569690704346, 0.0008664876222610474, 0.0009018182754516602, 0.000937148928642273, 0.0009724795818328857, 0.0010078102350234985, 0.0010431408882141113, 0.0010784715414047241, 0.001113802194595337, 0.0011491328477859497, 0.0011844635009765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 10.0, 8.0, 7.0, 16.0, 9.0, 42.0, 34.0, 61.0, 98.0, 127.0, 205.0, 309.0, 485.0, 821.0, 1236.0, 2076.0, 3387.0, 5562.0, 9408.0, 15933.0, 26581.0, 43793.0, 68496.0, 100745.0, 133191.0, 151173.0, 144463.0, 116712.0, 83793.0, 54233.0, 34315.0, 20465.0, 12295.0, 7108.0, 4309.0, 2689.0, 1575.0, 1009.0, 612.0, 406.0, 244.0, 164.0, 118.0, 71.0, 50.0, 34.0, 25.0, 22.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.3359375, -8.0556640625, -7.775390625, -7.4951171875, -7.21484375, -6.9345703125, -6.654296875, -6.3740234375, -6.09375, -5.8134765625, -5.533203125, -5.2529296875, -4.97265625, -4.6923828125, -4.412109375, -4.1318359375, -3.8515625, -3.5712890625, -3.291015625, -3.0107421875, -2.73046875, -2.4501953125, -2.169921875, -1.8896484375, -1.609375, -1.3291015625, -1.048828125, -0.7685546875, -0.48828125, -0.2080078125, 0.072265625, 0.3525390625, 0.6328125, 0.9130859375, 1.193359375, 1.4736328125, 1.75390625, 2.0341796875, 2.314453125, 2.5947265625, 2.875, 3.1552734375, 3.435546875, 3.7158203125, 3.99609375, 4.2763671875, 4.556640625, 4.8369140625, 5.1171875, 5.3974609375, 5.677734375, 5.9580078125, 6.23828125, 6.5185546875, 6.798828125, 7.0791015625, 7.359375, 7.6396484375, 7.919921875, 8.2001953125, 8.48046875, 8.7607421875, 9.041015625, 9.3212890625, 9.6015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 12.0, 19.0, 11.0, 14.0, 23.0, 15.0, 31.0, 23.0, 35.0, 27.0, 45.0, 44.0, 36.0, 45.0, 49.0, 52.0, 50.0, 54.0, 39.0, 51.0, 42.0, 38.0, 29.0, 34.0, 27.0, 16.0, 19.0, 20.0, 11.0, 8.0, 12.0, 10.0, 10.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.654296875, -3.551025390625, -3.44775390625, -3.344482421875, -3.2412109375, -3.137939453125, -3.03466796875, -2.931396484375, -2.828125, -2.724853515625, -2.62158203125, -2.518310546875, -2.4150390625, -2.311767578125, -2.20849609375, -2.105224609375, -2.001953125, -1.898681640625, -1.79541015625, -1.692138671875, -1.5888671875, -1.485595703125, -1.38232421875, -1.279052734375, -1.17578125, -1.072509765625, -0.96923828125, -0.865966796875, -0.7626953125, -0.659423828125, -0.55615234375, -0.452880859375, -0.349609375, -0.246337890625, -0.14306640625, -0.039794921875, 0.0634765625, 0.166748046875, 0.27001953125, 0.373291015625, 0.4765625, 0.579833984375, 0.68310546875, 0.786376953125, 0.8896484375, 0.992919921875, 1.09619140625, 1.199462890625, 1.302734375, 1.406005859375, 1.50927734375, 1.612548828125, 1.7158203125, 1.819091796875, 1.92236328125, 2.025634765625, 2.12890625, 2.232177734375, 2.33544921875, 2.438720703125, 2.5419921875, 2.645263671875, 2.74853515625, 2.851806640625, 2.955078125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 3.0, 7.0, 11.0, 6.0, 12.0, 16.0, 15.0, 16.0, 25.0, 19.0, 27.0, 30.0, 37.0, 23.0, 24.0, 38.0, 36.0, 54.0, 39.0, 30.0, 44.0, 38.0, 37.0, 50.0, 47.0, 34.0, 37.0, 19.0, 36.0, 26.0, 21.0, 11.0, 26.0, 19.0, 13.0, 10.0, 10.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.48256492614746, -24.663169860839844, -23.843772888183594, -23.024377822875977, -22.20498275756836, -21.38558578491211, -20.566190719604492, -19.746795654296875, -18.927398681640625, -18.108003616333008, -17.288606643676758, -16.46921157836914, -15.649816513061523, -14.83042049407959, -14.011024475097656, -13.191629409790039, -12.372234344482422, -11.552838325500488, -10.733443260192871, -9.914047241210938, -9.09465217590332, -8.275256156921387, -7.455860137939453, -6.636464595794678, -5.817069053649902, -4.997673511505127, -4.178277969360352, -3.358881950378418, -2.5394864082336426, -1.7200908660888672, -0.9006948471069336, -0.0812993049621582, 0.7380943298339844, 1.5574899911880493, 2.3768856525421143, 3.1962814331054688, 4.015676975250244, 4.8350725173950195, 5.654468536376953, 6.4738640785217285, 7.293259620666504, 8.112655639648438, 8.932050704956055, 9.751446723937988, 10.570842742919922, 11.390237808227539, 12.209633827209473, 13.029029846191406, 13.848424911499023, 14.667820930480957, 15.487215995788574, 16.306612014770508, 17.126007080078125, 17.945404052734375, 18.764799118041992, 19.58419418334961, 20.40359115600586, 21.222986221313477, 22.042383193969727, 22.861778259277344, 23.68117332458496, 24.500568389892578, 25.319965362548828, 26.139360427856445, 26.958755493164062]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 8.0, 5.0, 9.0, 8.0, 9.0, 11.0, 13.0, 24.0, 17.0, 22.0, 24.0, 17.0, 23.0, 35.0, 31.0, 36.0, 26.0, 40.0, 34.0, 29.0, 42.0, 30.0, 50.0, 41.0, 34.0, 28.0, 41.0, 26.0, 31.0, 26.0, 26.0, 23.0, 20.0, 18.0, 23.0, 13.0, 16.0, 19.0, 10.0, 11.0, 7.0, 10.0, 3.0, 6.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-28.986473083496094, -28.149890899658203, -27.313310623168945, -26.476728439331055, -25.640148162841797, -24.803565979003906, -23.96698570251465, -23.130403518676758, -22.2938232421875, -21.45724105834961, -20.62066078186035, -19.78407859802246, -18.947498321533203, -18.110916137695312, -17.274335861206055, -16.437753677368164, -15.60117244720459, -14.764591217041016, -13.928009986877441, -13.091428756713867, -12.254847526550293, -11.418266296386719, -10.581684112548828, -9.74510383605957, -8.90852165222168, -8.071940422058105, -7.235359191894531, -6.398777961730957, -5.562196731567383, -4.72561502456665, -3.889033794403076, -3.052452564239502, -2.215871810913086, -1.3792905807495117, -0.542709231376648, 0.2938721179962158, 1.13045334815979, 1.9670348167419434, 2.8036160469055176, 3.640197277069092, 4.476778507232666, 5.31335973739624, 6.1499409675598145, 6.986522674560547, 7.823103904724121, 8.659685134887695, 9.49626636505127, 10.332847595214844, 11.169428825378418, 12.006010055541992, 12.842591285705566, 13.67917251586914, 14.515753746032715, 15.352334976196289, 16.18891716003418, 17.025497436523438, 17.862079620361328, 18.69866180419922, 19.535242080688477, 20.371824264526367, 21.208404541015625, 22.044986724853516, 22.881567001342773, 23.718149185180664, 24.554729461669922]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 10.0, 9.0, 15.0, 14.0, 29.0, 48.0, 77.0, 122.0, 185.0, 301.0, 440.0, 738.0, 1171.0, 1878.0, 3175.0, 5356.0, 9113.0, 15545.0, 26916.0, 47192.0, 83154.0, 146068.0, 252576.0, 415651.0, 609087.0, 726383.0, 664824.0, 479148.0, 300086.0, 174449.0, 99493.0, 55493.0, 31645.0, 18015.0, 10537.0, 5959.0, 3636.0, 2171.0, 1366.0, 804.0, 482.0, 316.0, 202.0, 146.0, 98.0, 58.0, 40.0, 24.0, 18.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0], "bins": [-31.046875, -30.12451171875, -29.2021484375, -28.27978515625, -27.357421875, -26.43505859375, -25.5126953125, -24.59033203125, -23.66796875, -22.74560546875, -21.8232421875, -20.90087890625, -19.978515625, -19.05615234375, -18.1337890625, -17.21142578125, -16.2890625, -15.36669921875, -14.4443359375, -13.52197265625, -12.599609375, -11.67724609375, -10.7548828125, -9.83251953125, -8.91015625, -7.98779296875, -7.0654296875, -6.14306640625, -5.220703125, -4.29833984375, -3.3759765625, -2.45361328125, -1.53125, -0.60888671875, 0.3134765625, 1.23583984375, 2.158203125, 3.08056640625, 4.0029296875, 4.92529296875, 5.84765625, 6.77001953125, 7.6923828125, 8.61474609375, 9.537109375, 10.45947265625, 11.3818359375, 12.30419921875, 13.2265625, 14.14892578125, 15.0712890625, 15.99365234375, 16.916015625, 17.83837890625, 18.7607421875, 19.68310546875, 20.60546875, 21.52783203125, 22.4501953125, 23.37255859375, 24.294921875, 25.21728515625, 26.1396484375, 27.06201171875, 27.984375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 8.0, 7.0, 15.0, 12.0, 15.0, 23.0, 15.0, 20.0, 29.0, 32.0, 36.0, 31.0, 31.0, 33.0, 45.0, 40.0, 55.0, 36.0, 29.0, 32.0, 30.0, 46.0, 31.0, 43.0, 39.0, 25.0, 23.0, 30.0, 23.0, 19.0, 18.0, 15.0, 20.0, 7.0, 6.0, 7.0, 7.0, 15.0, 8.0, 8.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-23.078125, -22.40576171875, -21.7333984375, -21.06103515625, -20.388671875, -19.71630859375, -19.0439453125, -18.37158203125, -17.69921875, -17.02685546875, -16.3544921875, -15.68212890625, -15.009765625, -14.33740234375, -13.6650390625, -12.99267578125, -12.3203125, -11.64794921875, -10.9755859375, -10.30322265625, -9.630859375, -8.95849609375, -8.2861328125, -7.61376953125, -6.94140625, -6.26904296875, -5.5966796875, -4.92431640625, -4.251953125, -3.57958984375, -2.9072265625, -2.23486328125, -1.5625, -0.89013671875, -0.2177734375, 0.45458984375, 1.126953125, 1.79931640625, 2.4716796875, 3.14404296875, 3.81640625, 4.48876953125, 5.1611328125, 5.83349609375, 6.505859375, 7.17822265625, 7.8505859375, 8.52294921875, 9.1953125, 9.86767578125, 10.5400390625, 11.21240234375, 11.884765625, 12.55712890625, 13.2294921875, 13.90185546875, 14.57421875, 15.24658203125, 15.9189453125, 16.59130859375, 17.263671875, 17.93603515625, 18.6083984375, 19.28076171875, 19.953125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 22.0, 25.0, 44.0, 55.0, 134.0, 190.0, 317.0, 538.0, 886.0, 1609.0, 2766.0, 4702.0, 8186.0, 14239.0, 25060.0, 42432.0, 73552.0, 125123.0, 203678.0, 316730.0, 456324.0, 580987.0, 624757.0, 556222.0, 422077.0, 287297.0, 181404.0, 110530.0, 65267.0, 37887.0, 21654.0, 12615.0, 7147.0, 4119.0, 2331.0, 1401.0, 749.0, 467.0, 301.0, 164.0, 107.0, 65.0, 53.0, 28.0, 9.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-27.75, -26.918701171875, -26.08740234375, -25.256103515625, -24.4248046875, -23.593505859375, -22.76220703125, -21.930908203125, -21.099609375, -20.268310546875, -19.43701171875, -18.605712890625, -17.7744140625, -16.943115234375, -16.11181640625, -15.280517578125, -14.44921875, -13.617919921875, -12.78662109375, -11.955322265625, -11.1240234375, -10.292724609375, -9.46142578125, -8.630126953125, -7.798828125, -6.967529296875, -6.13623046875, -5.304931640625, -4.4736328125, -3.642333984375, -2.81103515625, -1.979736328125, -1.1484375, -0.317138671875, 0.51416015625, 1.345458984375, 2.1767578125, 3.008056640625, 3.83935546875, 4.670654296875, 5.501953125, 6.333251953125, 7.16455078125, 7.995849609375, 8.8271484375, 9.658447265625, 10.48974609375, 11.321044921875, 12.15234375, 12.983642578125, 13.81494140625, 14.646240234375, 15.4775390625, 16.308837890625, 17.14013671875, 17.971435546875, 18.802734375, 19.634033203125, 20.46533203125, 21.296630859375, 22.1279296875, 22.959228515625, 23.79052734375, 24.621826171875, 25.453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 7.0, 8.0, 12.0, 18.0, 16.0, 16.0, 47.0, 46.0, 48.0, 51.0, 74.0, 93.0, 109.0, 117.0, 144.0, 161.0, 164.0, 186.0, 196.0, 221.0, 223.0, 222.0, 197.0, 217.0, 204.0, 182.0, 154.0, 142.0, 114.0, 141.0, 86.0, 87.0, 80.0, 53.0, 39.0, 43.0, 47.0, 20.0, 23.0, 16.0, 10.0, 8.0, 7.0, 5.0, 7.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-9.9453125, -9.609619140625, -9.27392578125, -8.938232421875, -8.6025390625, -8.266845703125, -7.93115234375, -7.595458984375, -7.259765625, -6.924072265625, -6.58837890625, -6.252685546875, -5.9169921875, -5.581298828125, -5.24560546875, -4.909912109375, -4.57421875, -4.238525390625, -3.90283203125, -3.567138671875, -3.2314453125, -2.895751953125, -2.56005859375, -2.224365234375, -1.888671875, -1.552978515625, -1.21728515625, -0.881591796875, -0.5458984375, -0.210205078125, 0.12548828125, 0.461181640625, 0.796875, 1.132568359375, 1.46826171875, 1.803955078125, 2.1396484375, 2.475341796875, 2.81103515625, 3.146728515625, 3.482421875, 3.818115234375, 4.15380859375, 4.489501953125, 4.8251953125, 5.160888671875, 5.49658203125, 5.832275390625, 6.16796875, 6.503662109375, 6.83935546875, 7.175048828125, 7.5107421875, 7.846435546875, 8.18212890625, 8.517822265625, 8.853515625, 9.189208984375, 9.52490234375, 9.860595703125, 10.1962890625, 10.531982421875, 10.86767578125, 11.203369140625, 11.5390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 9.0, 21.0, 23.0, 16.0, 19.0, 30.0, 24.0, 38.0, 43.0, 40.0, 49.0, 24.0, 48.0, 42.0, 46.0, 38.0, 41.0, 34.0, 47.0, 37.0, 45.0, 41.0, 21.0, 35.0, 27.0, 25.0, 18.0, 16.0, 17.0, 12.0, 9.0, 9.0, 13.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.804954528808594, -24.957992553710938, -24.11103057861328, -23.264068603515625, -22.41710662841797, -21.570144653320312, -20.723182678222656, -19.876220703125, -19.029258728027344, -18.182296752929688, -17.33533477783203, -16.488372802734375, -15.641410827636719, -14.794448852539062, -13.94748592376709, -13.100523948669434, -12.253561019897461, -11.406599044799805, -10.559637069702148, -9.712675094604492, -8.865713119506836, -8.01875114440918, -7.171788215637207, -6.324826240539551, -5.4778642654418945, -4.630902290344238, -3.783940076828003, -2.9369778633117676, -2.0900158882141113, -1.243053913116455, -0.3960914611816406, 0.4508705139160156, 1.2978324890136719, 2.144794464111328, 2.9917566776275635, 3.838718891143799, 4.685680866241455, 5.532642841339111, 6.379605293273926, 7.226567268371582, 8.073529243469238, 8.920491218566895, 9.76745319366455, 10.614416122436523, 11.46137809753418, 12.308340072631836, 13.155302047729492, 14.002264022827148, 14.849225997924805, 15.696187973022461, 16.543149948120117, 17.390111923217773, 18.23707389831543, 19.084035873413086, 19.930999755859375, 20.77796173095703, 21.624923706054688, 22.471885681152344, 23.31884765625, 24.165809631347656, 25.012771606445312, 25.85973358154297, 26.706695556640625, 27.55365753173828, 28.400619506835938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 4.0, 10.0, 6.0, 12.0, 12.0, 22.0, 21.0, 30.0, 23.0, 24.0, 22.0, 27.0, 21.0, 25.0, 34.0, 49.0, 35.0, 43.0, 39.0, 51.0, 39.0, 42.0, 24.0, 36.0, 32.0, 41.0, 28.0, 23.0, 23.0, 28.0, 21.0, 20.0, 22.0, 12.0, 18.0, 11.0, 10.0, 12.0, 9.0, 5.0, 4.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.896869659423828, -22.094961166381836, -21.293052673339844, -20.491146087646484, -19.689237594604492, -18.8873291015625, -18.085420608520508, -17.283512115478516, -16.481605529785156, -15.679697036743164, -14.877789497375488, -14.075881004333496, -13.27397346496582, -12.472064971923828, -11.670156478881836, -10.868247985839844, -10.066339492797852, -9.26443099975586, -8.462523460388184, -7.660614967346191, -6.858706951141357, -6.056798934936523, -5.254890441894531, -4.452982425689697, -3.6510744094848633, -2.8491663932800293, -2.047258138656616, -1.2453498840332031, -0.44344186782836914, 0.35846614837646484, 1.160374641418457, 1.962282657623291, 2.764190673828125, 3.566098690032959, 4.368006706237793, 5.169915199279785, 5.971823215484619, 6.773731231689453, 7.575639724731445, 8.377548217773438, 9.179455757141113, 9.981364250183105, 10.783271789550781, 11.585180282592773, 12.387088775634766, 13.188996315002441, 13.990904808044434, 14.79281234741211, 15.594720840454102, 16.396629333496094, 17.198537826538086, 18.000446319580078, 18.802352905273438, 19.60426139831543, 20.406169891357422, 21.208078384399414, 22.009986877441406, 22.8118953704834, 23.61380386352539, 24.41571044921875, 25.217618942260742, 26.019527435302734, 26.821435928344727, 27.62334442138672, 28.425251007080078]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 12.0, 34.0, 31.0, 56.0, 92.0, 110.0, 206.0, 303.0, 441.0, 747.0, 1115.0, 1826.0, 2750.0, 4119.0, 6431.0, 9410.0, 14419.0, 21292.0, 30624.0, 43834.0, 61289.0, 82360.0, 105290.0, 124282.0, 126018.0, 110470.0, 87300.0, 65190.0, 46888.0, 32790.0, 23105.0, 15540.0, 10471.0, 6954.0, 4404.0, 3014.0, 1806.0, 1232.0, 823.0, 507.0, 346.0, 217.0, 151.0, 94.0, 39.0, 47.0, 29.0, 18.0, 12.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0], "bins": [-27.5625, -26.703857421875, -25.84521484375, -24.986572265625, -24.1279296875, -23.269287109375, -22.41064453125, -21.552001953125, -20.693359375, -19.834716796875, -18.97607421875, -18.117431640625, -17.2587890625, -16.400146484375, -15.54150390625, -14.682861328125, -13.82421875, -12.965576171875, -12.10693359375, -11.248291015625, -10.3896484375, -9.531005859375, -8.67236328125, -7.813720703125, -6.955078125, -6.096435546875, -5.23779296875, -4.379150390625, -3.5205078125, -2.661865234375, -1.80322265625, -0.944580078125, -0.0859375, 0.772705078125, 1.63134765625, 2.489990234375, 3.3486328125, 4.207275390625, 5.06591796875, 5.924560546875, 6.783203125, 7.641845703125, 8.50048828125, 9.359130859375, 10.2177734375, 11.076416015625, 11.93505859375, 12.793701171875, 13.65234375, 14.510986328125, 15.36962890625, 16.228271484375, 17.0869140625, 17.945556640625, 18.80419921875, 19.662841796875, 20.521484375, 21.380126953125, 22.23876953125, 23.097412109375, 23.9560546875, 24.814697265625, 25.67333984375, 26.531982421875, 27.390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 17.0, 12.0, 17.0, 18.0, 22.0, 22.0, 30.0, 26.0, 29.0, 29.0, 30.0, 37.0, 43.0, 23.0, 37.0, 43.0, 42.0, 46.0, 38.0, 32.0, 38.0, 33.0, 28.0, 30.0, 26.0, 38.0, 25.0, 26.0, 23.0, 20.0, 15.0, 17.0, 14.0, 15.0, 8.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.29052734375, -19.5966796875, -18.90283203125, -18.208984375, -17.51513671875, -16.8212890625, -16.12744140625, -15.43359375, -14.73974609375, -14.0458984375, -13.35205078125, -12.658203125, -11.96435546875, -11.2705078125, -10.57666015625, -9.8828125, -9.18896484375, -8.4951171875, -7.80126953125, -7.107421875, -6.41357421875, -5.7197265625, -5.02587890625, -4.33203125, -3.63818359375, -2.9443359375, -2.25048828125, -1.556640625, -0.86279296875, -0.1689453125, 0.52490234375, 1.21875, 1.91259765625, 2.6064453125, 3.30029296875, 3.994140625, 4.68798828125, 5.3818359375, 6.07568359375, 6.76953125, 7.46337890625, 8.1572265625, 8.85107421875, 9.544921875, 10.23876953125, 10.9326171875, 11.62646484375, 12.3203125, 13.01416015625, 13.7080078125, 14.40185546875, 15.095703125, 15.78955078125, 16.4833984375, 17.17724609375, 17.87109375, 18.56494140625, 19.2587890625, 19.95263671875, 20.646484375, 21.34033203125, 22.0341796875, 22.72802734375, 23.421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 18.0, 23.0, 33.0, 48.0, 60.0, 94.0, 125.0, 200.0, 279.0, 419.0, 640.0, 976.0, 1297.0, 2163.0, 3112.0, 4903.0, 7566.0, 11867.0, 19107.0, 30508.0, 49894.0, 80161.0, 124964.0, 172296.0, 177433.0, 132403.0, 85340.0, 52980.0, 33059.0, 20664.0, 12766.0, 7941.0, 5287.0, 3375.0, 2179.0, 1394.0, 966.0, 669.0, 439.0, 283.0, 207.0, 130.0, 102.0, 51.0, 35.0, 31.0, 22.0, 9.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.375, -34.27197265625, -33.1689453125, -32.06591796875, -30.962890625, -29.85986328125, -28.7568359375, -27.65380859375, -26.55078125, -25.44775390625, -24.3447265625, -23.24169921875, -22.138671875, -21.03564453125, -19.9326171875, -18.82958984375, -17.7265625, -16.62353515625, -15.5205078125, -14.41748046875, -13.314453125, -12.21142578125, -11.1083984375, -10.00537109375, -8.90234375, -7.79931640625, -6.6962890625, -5.59326171875, -4.490234375, -3.38720703125, -2.2841796875, -1.18115234375, -0.078125, 1.02490234375, 2.1279296875, 3.23095703125, 4.333984375, 5.43701171875, 6.5400390625, 7.64306640625, 8.74609375, 9.84912109375, 10.9521484375, 12.05517578125, 13.158203125, 14.26123046875, 15.3642578125, 16.46728515625, 17.5703125, 18.67333984375, 19.7763671875, 20.87939453125, 21.982421875, 23.08544921875, 24.1884765625, 25.29150390625, 26.39453125, 27.49755859375, 28.6005859375, 29.70361328125, 30.806640625, 31.90966796875, 33.0126953125, 34.11572265625, 35.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 6.0, 9.0, 10.0, 9.0, 11.0, 30.0, 26.0, 24.0, 32.0, 24.0, 30.0, 44.0, 40.0, 40.0, 32.0, 41.0, 66.0, 50.0, 48.0, 56.0, 56.0, 28.0, 43.0, 38.0, 27.0, 22.0, 31.0, 20.0, 16.0, 12.0, 19.0, 18.0, 10.0, 2.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.182861328125, -18.50634765625, -17.829833984375, -17.1533203125, -16.476806640625, -15.80029296875, -15.123779296875, -14.447265625, -13.770751953125, -13.09423828125, -12.417724609375, -11.7412109375, -11.064697265625, -10.38818359375, -9.711669921875, -9.03515625, -8.358642578125, -7.68212890625, -7.005615234375, -6.3291015625, -5.652587890625, -4.97607421875, -4.299560546875, -3.623046875, -2.946533203125, -2.27001953125, -1.593505859375, -0.9169921875, -0.240478515625, 0.43603515625, 1.112548828125, 1.7890625, 2.465576171875, 3.14208984375, 3.818603515625, 4.4951171875, 5.171630859375, 5.84814453125, 6.524658203125, 7.201171875, 7.877685546875, 8.55419921875, 9.230712890625, 9.9072265625, 10.583740234375, 11.26025390625, 11.936767578125, 12.61328125, 13.289794921875, 13.96630859375, 14.642822265625, 15.3193359375, 15.995849609375, 16.67236328125, 17.348876953125, 18.025390625, 18.701904296875, 19.37841796875, 20.054931640625, 20.7314453125, 21.407958984375, 22.08447265625, 22.760986328125, 23.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 12.0, 16.0, 40.0, 44.0, 80.0, 90.0, 169.0, 260.0, 365.0, 579.0, 954.0, 1555.0, 2670.0, 4804.0, 8696.0, 16852.0, 35099.0, 85035.0, 295588.0, 395284.0, 112982.0, 43274.0, 20209.0, 10317.0, 5637.0, 3121.0, 1910.0, 1066.0, 646.0, 435.0, 258.0, 158.0, 98.0, 87.0, 51.0, 34.0, 21.0, 17.0, 12.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.65625, -34.43212890625, -33.2080078125, -31.98388671875, -30.759765625, -29.53564453125, -28.3115234375, -27.08740234375, -25.86328125, -24.63916015625, -23.4150390625, -22.19091796875, -20.966796875, -19.74267578125, -18.5185546875, -17.29443359375, -16.0703125, -14.84619140625, -13.6220703125, -12.39794921875, -11.173828125, -9.94970703125, -8.7255859375, -7.50146484375, -6.27734375, -5.05322265625, -3.8291015625, -2.60498046875, -1.380859375, -0.15673828125, 1.0673828125, 2.29150390625, 3.515625, 4.73974609375, 5.9638671875, 7.18798828125, 8.412109375, 9.63623046875, 10.8603515625, 12.08447265625, 13.30859375, 14.53271484375, 15.7568359375, 16.98095703125, 18.205078125, 19.42919921875, 20.6533203125, 21.87744140625, 23.1015625, 24.32568359375, 25.5498046875, 26.77392578125, 27.998046875, 29.22216796875, 30.4462890625, 31.67041015625, 32.89453125, 34.11865234375, 35.3427734375, 36.56689453125, 37.791015625, 39.01513671875, 40.2392578125, 41.46337890625, 42.6875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 4.0, 11.0, 17.0, 5.0, 16.0, 13.0, 18.0, 28.0, 42.0, 62.0, 101.0, 140.0, 158.0, 120.0, 54.0, 46.0, 33.0, 19.0, 19.0, 18.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00560760498046875, -0.00545656681060791, -0.00530552864074707, -0.0051544904708862305, -0.005003452301025391, -0.004852414131164551, -0.004701375961303711, -0.004550337791442871, -0.004399299621582031, -0.004248261451721191, -0.0040972232818603516, -0.003946185111999512, -0.003795146942138672, -0.003644108772277832, -0.003493070602416992, -0.0033420324325561523, -0.0031909942626953125, -0.0030399560928344727, -0.002888917922973633, -0.002737879753112793, -0.002586841583251953, -0.0024358034133911133, -0.0022847652435302734, -0.0021337270736694336, -0.0019826889038085938, -0.001831650733947754, -0.001680612564086914, -0.0015295743942260742, -0.0013785362243652344, -0.0012274980545043945, -0.0010764598846435547, -0.0009254217147827148, -0.000774383544921875, -0.0006233453750610352, -0.0004723072052001953, -0.00032126903533935547, -0.00017023086547851562, -1.919269561767578e-05, 0.00013184547424316406, 0.0002828836441040039, 0.00043392181396484375, 0.0005849599838256836, 0.0007359981536865234, 0.0008870363235473633, 0.0010380744934082031, 0.001189112663269043, 0.0013401508331298828, 0.0014911890029907227, 0.0016422271728515625, 0.0017932653427124023, 0.0019443035125732422, 0.002095341682434082, 0.002246379852294922, 0.0023974180221557617, 0.0025484561920166016, 0.0026994943618774414, 0.0028505325317382812, 0.003001570701599121, 0.003152608871459961, 0.0033036470413208008, 0.0034546852111816406, 0.0036057233810424805, 0.0037567615509033203, 0.00390779972076416, 0.004058837890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 0.0, 7.0, 6.0, 10.0, 11.0, 9.0, 30.0, 28.0, 43.0, 65.0, 89.0, 121.0, 153.0, 223.0, 304.0, 423.0, 588.0, 914.0, 1305.0, 1830.0, 2865.0, 4285.0, 6688.0, 10677.0, 17285.0, 29078.0, 51291.0, 104194.0, 252375.0, 291439.0, 127156.0, 58906.0, 32964.0, 19295.0, 12036.0, 7292.0, 4710.0, 3139.0, 2025.0, 1417.0, 936.0, 709.0, 435.0, 340.0, 252.0, 179.0, 109.0, 93.0, 60.0, 57.0, 33.0, 22.0, 23.0, 14.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0], "bins": [-33.21875, -32.215576171875, -31.21240234375, -30.209228515625, -29.2060546875, -28.202880859375, -27.19970703125, -26.196533203125, -25.193359375, -24.190185546875, -23.18701171875, -22.183837890625, -21.1806640625, -20.177490234375, -19.17431640625, -18.171142578125, -17.16796875, -16.164794921875, -15.16162109375, -14.158447265625, -13.1552734375, -12.152099609375, -11.14892578125, -10.145751953125, -9.142578125, -8.139404296875, -7.13623046875, -6.133056640625, -5.1298828125, -4.126708984375, -3.12353515625, -2.120361328125, -1.1171875, -0.114013671875, 0.88916015625, 1.892333984375, 2.8955078125, 3.898681640625, 4.90185546875, 5.905029296875, 6.908203125, 7.911376953125, 8.91455078125, 9.917724609375, 10.9208984375, 11.924072265625, 12.92724609375, 13.930419921875, 14.93359375, 15.936767578125, 16.93994140625, 17.943115234375, 18.9462890625, 19.949462890625, 20.95263671875, 21.955810546875, 22.958984375, 23.962158203125, 24.96533203125, 25.968505859375, 26.9716796875, 27.974853515625, 28.97802734375, 29.981201171875, 30.984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 8.0, 12.0, 7.0, 9.0, 20.0, 13.0, 16.0, 24.0, 39.0, 59.0, 64.0, 102.0, 108.0, 117.0, 95.0, 72.0, 50.0, 35.0, 33.0, 24.0, 16.0, 10.0, 15.0, 8.0, 6.0, 6.0, 5.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0078125, -13.617919921875, -13.22802734375, -12.838134765625, -12.4482421875, -12.058349609375, -11.66845703125, -11.278564453125, -10.888671875, -10.498779296875, -10.10888671875, -9.718994140625, -9.3291015625, -8.939208984375, -8.54931640625, -8.159423828125, -7.76953125, -7.379638671875, -6.98974609375, -6.599853515625, -6.2099609375, -5.820068359375, -5.43017578125, -5.040283203125, -4.650390625, -4.260498046875, -3.87060546875, -3.480712890625, -3.0908203125, -2.700927734375, -2.31103515625, -1.921142578125, -1.53125, -1.141357421875, -0.75146484375, -0.361572265625, 0.0283203125, 0.418212890625, 0.80810546875, 1.197998046875, 1.587890625, 1.977783203125, 2.36767578125, 2.757568359375, 3.1474609375, 3.537353515625, 3.92724609375, 4.317138671875, 4.70703125, 5.096923828125, 5.48681640625, 5.876708984375, 6.2666015625, 6.656494140625, 7.04638671875, 7.436279296875, 7.826171875, 8.216064453125, 8.60595703125, 8.995849609375, 9.3857421875, 9.775634765625, 10.16552734375, 10.555419921875, 10.9453125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 7.0, 8.0, 7.0, 17.0, 20.0, 19.0, 18.0, 28.0, 27.0, 37.0, 47.0, 46.0, 43.0, 43.0, 51.0, 70.0, 48.0, 55.0, 40.0, 61.0, 39.0, 30.0, 35.0, 34.0, 25.0, 35.0, 25.0, 5.0, 13.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.15595054626465, -25.234140396118164, -24.31233024597168, -23.390522003173828, -22.468711853027344, -21.54690170288086, -20.625091552734375, -19.70328140258789, -18.781471252441406, -17.859661102294922, -16.937850952148438, -16.016040802001953, -15.094232559204102, -14.172422409057617, -13.250612258911133, -12.328802108764648, -11.406993865966797, -10.485183715820312, -9.563374519348145, -8.64156436920166, -7.719754695892334, -6.797945022583008, -5.876134872436523, -4.954325199127197, -4.032515525817871, -3.110705852508545, -2.1888959407806396, -1.2670860290527344, -0.3452763557434082, 0.576533317565918, 1.4983434677124023, 2.4201531410217285, 3.341960906982422, 4.263770580291748, 5.185580253601074, 6.107390403747559, 7.029200077056885, 7.951009750366211, 8.872819900512695, 9.79463005065918, 10.716439247131348, 11.638249397277832, 12.56005859375, 13.481868743896484, 14.403678894042969, 15.325488090515137, 16.247299194335938, 17.16910743713379, 18.090917587280273, 19.012727737426758, 19.934537887573242, 20.856346130371094, 21.778156280517578, 22.699966430664062, 23.621776580810547, 24.54358673095703, 25.465396881103516, 26.38720703125, 27.309017181396484, 28.23082733154297, 29.15263557434082, 30.074445724487305, 30.99625587463379, 31.918066024780273, 32.839874267578125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 6.0, 14.0, 12.0, 20.0, 10.0, 20.0, 17.0, 29.0, 29.0, 29.0, 31.0, 25.0, 30.0, 35.0, 37.0, 42.0, 39.0, 39.0, 30.0, 38.0, 41.0, 29.0, 36.0, 21.0, 32.0, 30.0, 22.0, 21.0, 26.0, 37.0, 20.0, 23.0, 15.0, 14.0, 14.0, 10.0, 13.0, 9.0, 8.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.073280334472656, -20.336767196655273, -19.600255966186523, -18.86374282836914, -18.12723159790039, -17.390718460083008, -16.654205322265625, -15.917693138122559, -15.181180953979492, -14.444668769836426, -13.70815658569336, -12.971643447875977, -12.23513126373291, -11.498619079589844, -10.762105941772461, -10.025593757629395, -9.289081573486328, -8.552569389343262, -7.816056728363037, -7.0795440673828125, -6.343031883239746, -5.60651969909668, -4.870007038116455, -4.1334943771362305, -3.396982192993164, -2.6604697704315186, -1.923957347869873, -1.1874449253082275, -0.45093250274658203, 0.2855799198150635, 1.022092342376709, 1.7586050033569336, 2.495119094848633, 3.2316315174102783, 3.968143939971924, 4.704656600952148, 5.441168785095215, 6.177680969238281, 6.914193630218506, 7.6507062911987305, 8.387218475341797, 9.123730659484863, 9.86024284362793, 10.596755981445312, 11.333268165588379, 12.069780349731445, 12.806293487548828, 13.542805671691895, 14.279317855834961, 15.015830039978027, 15.752342224121094, 16.488855361938477, 17.22536849975586, 17.96187973022461, 18.698392868041992, 19.434906005859375, 20.171417236328125, 20.907930374145508, 21.644441604614258, 22.38095474243164, 23.11746597290039, 23.853979110717773, 24.590492248535156, 25.327003479003906, 26.06351661682129]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 8.0, 16.0, 13.0, 15.0, 40.0, 68.0, 87.0, 129.0, 211.0, 358.0, 540.0, 842.0, 1375.0, 2091.0, 3279.0, 5229.0, 7976.0, 12688.0, 19454.0, 29588.0, 44231.0, 62864.0, 85066.0, 107439.0, 122676.0, 124653.0, 113154.0, 91851.0, 68980.0, 48732.0, 33120.0, 22123.0, 14353.0, 9075.0, 5908.0, 3815.0, 2389.0, 1484.0, 967.0, 609.0, 397.0, 235.0, 159.0, 98.0, 57.0, 39.0, 33.0, 11.0, 11.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.890625, -22.155517578125, -21.42041015625, -20.685302734375, -19.9501953125, -19.215087890625, -18.47998046875, -17.744873046875, -17.009765625, -16.274658203125, -15.53955078125, -14.804443359375, -14.0693359375, -13.334228515625, -12.59912109375, -11.864013671875, -11.12890625, -10.393798828125, -9.65869140625, -8.923583984375, -8.1884765625, -7.453369140625, -6.71826171875, -5.983154296875, -5.248046875, -4.512939453125, -3.77783203125, -3.042724609375, -2.3076171875, -1.572509765625, -0.83740234375, -0.102294921875, 0.6328125, 1.367919921875, 2.10302734375, 2.838134765625, 3.5732421875, 4.308349609375, 5.04345703125, 5.778564453125, 6.513671875, 7.248779296875, 7.98388671875, 8.718994140625, 9.4541015625, 10.189208984375, 10.92431640625, 11.659423828125, 12.39453125, 13.129638671875, 13.86474609375, 14.599853515625, 15.3349609375, 16.070068359375, 16.80517578125, 17.540283203125, 18.275390625, 19.010498046875, 19.74560546875, 20.480712890625, 21.2158203125, 21.950927734375, 22.68603515625, 23.421142578125, 24.15625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [6.0, 3.0, 6.0, 6.0, 5.0, 4.0, 4.0, 7.0, 6.0, 14.0, 13.0, 14.0, 22.0, 12.0, 19.0, 27.0, 25.0, 28.0, 36.0, 26.0, 36.0, 41.0, 25.0, 47.0, 29.0, 24.0, 44.0, 33.0, 41.0, 38.0, 35.0, 29.0, 37.0, 25.0, 30.0, 16.0, 33.0, 22.0, 28.0, 18.0, 17.0, 14.0, 10.0, 4.0, 10.0, 12.0, 9.0, 10.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.51123046875, -17.7880859375, -17.06494140625, -16.341796875, -15.61865234375, -14.8955078125, -14.17236328125, -13.44921875, -12.72607421875, -12.0029296875, -11.27978515625, -10.556640625, -9.83349609375, -9.1103515625, -8.38720703125, -7.6640625, -6.94091796875, -6.2177734375, -5.49462890625, -4.771484375, -4.04833984375, -3.3251953125, -2.60205078125, -1.87890625, -1.15576171875, -0.4326171875, 0.29052734375, 1.013671875, 1.73681640625, 2.4599609375, 3.18310546875, 3.90625, 4.62939453125, 5.3525390625, 6.07568359375, 6.798828125, 7.52197265625, 8.2451171875, 8.96826171875, 9.69140625, 10.41455078125, 11.1376953125, 11.86083984375, 12.583984375, 13.30712890625, 14.0302734375, 14.75341796875, 15.4765625, 16.19970703125, 16.9228515625, 17.64599609375, 18.369140625, 19.09228515625, 19.8154296875, 20.53857421875, 21.26171875, 21.98486328125, 22.7080078125, 23.43115234375, 24.154296875, 24.87744140625, 25.6005859375, 26.32373046875, 27.046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 16.0, 20.0, 21.0, 57.0, 74.0, 112.0, 123.0, 216.0, 312.0, 508.0, 756.0, 1140.0, 1805.0, 2824.0, 4306.0, 6967.0, 10976.0, 17368.0, 27893.0, 44798.0, 70822.0, 106069.0, 141233.0, 157298.0, 144133.0, 108795.0, 73672.0, 47180.0, 29426.0, 17973.0, 11303.0, 7408.0, 4627.0, 2970.0, 1904.0, 1168.0, 793.0, 489.0, 337.0, 223.0, 147.0, 99.0, 62.0, 38.0, 27.0, 24.0, 17.0, 12.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.625, -33.453125, -32.28125, -31.109375, -29.9375, -28.765625, -27.59375, -26.421875, -25.25, -24.078125, -22.90625, -21.734375, -20.5625, -19.390625, -18.21875, -17.046875, -15.875, -14.703125, -13.53125, -12.359375, -11.1875, -10.015625, -8.84375, -7.671875, -6.5, -5.328125, -4.15625, -2.984375, -1.8125, -0.640625, 0.53125, 1.703125, 2.875, 4.046875, 5.21875, 6.390625, 7.5625, 8.734375, 9.90625, 11.078125, 12.25, 13.421875, 14.59375, 15.765625, 16.9375, 18.109375, 19.28125, 20.453125, 21.625, 22.796875, 23.96875, 25.140625, 26.3125, 27.484375, 28.65625, 29.828125, 31.0, 32.171875, 33.34375, 34.515625, 35.6875, 36.859375, 38.03125, 39.203125, 40.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 8.0, 12.0, 11.0, 18.0, 13.0, 22.0, 19.0, 21.0, 26.0, 40.0, 32.0, 33.0, 37.0, 44.0, 37.0, 34.0, 31.0, 41.0, 43.0, 38.0, 42.0, 28.0, 38.0, 46.0, 35.0, 23.0, 25.0, 21.0, 31.0, 23.0, 14.0, 17.0, 16.0, 10.0, 7.0, 8.0, 7.0, 2.0, 5.0, 8.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.95166015625, -16.3251953125, -15.69873046875, -15.072265625, -14.44580078125, -13.8193359375, -13.19287109375, -12.56640625, -11.93994140625, -11.3134765625, -10.68701171875, -10.060546875, -9.43408203125, -8.8076171875, -8.18115234375, -7.5546875, -6.92822265625, -6.3017578125, -5.67529296875, -5.048828125, -4.42236328125, -3.7958984375, -3.16943359375, -2.54296875, -1.91650390625, -1.2900390625, -0.66357421875, -0.037109375, 0.58935546875, 1.2158203125, 1.84228515625, 2.46875, 3.09521484375, 3.7216796875, 4.34814453125, 4.974609375, 5.60107421875, 6.2275390625, 6.85400390625, 7.48046875, 8.10693359375, 8.7333984375, 9.35986328125, 9.986328125, 10.61279296875, 11.2392578125, 11.86572265625, 12.4921875, 13.11865234375, 13.7451171875, 14.37158203125, 14.998046875, 15.62451171875, 16.2509765625, 16.87744140625, 17.50390625, 18.13037109375, 18.7568359375, 19.38330078125, 20.009765625, 20.63623046875, 21.2626953125, 21.88916015625, 22.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 19.0, 17.0, 30.0, 36.0, 55.0, 101.0, 143.0, 210.0, 387.0, 719.0, 1342.0, 2807.0, 6392.0, 17343.0, 65814.0, 517127.0, 362299.0, 48846.0, 14307.0, 5346.0, 2435.0, 1193.0, 644.0, 345.0, 191.0, 112.0, 80.0, 62.0, 50.0, 27.0, 21.0, 12.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.25, -93.8857421875, -90.521484375, -87.1572265625, -83.79296875, -80.4287109375, -77.064453125, -73.7001953125, -70.3359375, -66.9716796875, -63.607421875, -60.2431640625, -56.87890625, -53.5146484375, -50.150390625, -46.7861328125, -43.421875, -40.0576171875, -36.693359375, -33.3291015625, -29.96484375, -26.6005859375, -23.236328125, -19.8720703125, -16.5078125, -13.1435546875, -9.779296875, -6.4150390625, -3.05078125, 0.3134765625, 3.677734375, 7.0419921875, 10.40625, 13.7705078125, 17.134765625, 20.4990234375, 23.86328125, 27.2275390625, 30.591796875, 33.9560546875, 37.3203125, 40.6845703125, 44.048828125, 47.4130859375, 50.77734375, 54.1416015625, 57.505859375, 60.8701171875, 64.234375, 67.5986328125, 70.962890625, 74.3271484375, 77.69140625, 81.0556640625, 84.419921875, 87.7841796875, 91.1484375, 94.5126953125, 97.876953125, 101.2412109375, 104.60546875, 107.9697265625, 111.333984375, 114.6982421875, 118.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 13.0, 11.0, 11.0, 24.0, 25.0, 41.0, 51.0, 91.0, 96.0, 136.0, 136.0, 98.0, 75.0, 47.0, 28.0, 24.0, 18.0, 8.0, 10.0, 7.0, 5.0, 10.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0043792724609375, -0.004221916198730469, -0.0040645599365234375, -0.003907203674316406, -0.003749847412109375, -0.0035924911499023438, -0.0034351348876953125, -0.0032777786254882812, -0.00312042236328125, -0.0029630661010742188, -0.0028057098388671875, -0.0026483535766601562, -0.002490997314453125, -0.0023336410522460938, -0.0021762847900390625, -0.0020189285278320312, -0.001861572265625, -0.0017042160034179688, -0.0015468597412109375, -0.0013895034790039062, -0.001232147216796875, -0.0010747909545898438, -0.0009174346923828125, -0.0007600784301757812, -0.00060272216796875, -0.00044536590576171875, -0.0002880096435546875, -0.00013065338134765625, 2.6702880859375e-05, 0.00018405914306640625, 0.0003414154052734375, 0.0004987716674804688, 0.0006561279296875, 0.0008134841918945312, 0.0009708404541015625, 0.0011281967163085938, 0.001285552978515625, 0.0014429092407226562, 0.0016002655029296875, 0.0017576217651367188, 0.00191497802734375, 0.0020723342895507812, 0.0022296905517578125, 0.0023870468139648438, 0.002544403076171875, 0.0027017593383789062, 0.0028591156005859375, 0.0030164718627929688, 0.003173828125, 0.0033311843872070312, 0.0034885406494140625, 0.0036458969116210938, 0.003803253173828125, 0.003960609436035156, 0.0041179656982421875, 0.004275321960449219, 0.00443267822265625, 0.004590034484863281, 0.0047473907470703125, 0.004904747009277344, 0.005062103271484375, 0.005219459533691406, 0.0053768157958984375, 0.005534172058105469, 0.0056915283203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 12.0, 11.0, 18.0, 21.0, 33.0, 46.0, 67.0, 84.0, 126.0, 174.0, 234.0, 371.0, 536.0, 835.0, 1394.0, 2258.0, 4071.0, 7495.0, 16160.0, 41667.0, 148869.0, 461451.0, 253533.0, 64474.0, 22227.0, 9769.0, 4989.0, 2847.0, 1682.0, 1036.0, 649.0, 434.0, 311.0, 194.0, 140.0, 89.0, 90.0, 31.0, 36.0, 26.0, 13.0, 7.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.78125, -52.99609375, -51.2109375, -49.42578125, -47.640625, -45.85546875, -44.0703125, -42.28515625, -40.5, -38.71484375, -36.9296875, -35.14453125, -33.359375, -31.57421875, -29.7890625, -28.00390625, -26.21875, -24.43359375, -22.6484375, -20.86328125, -19.078125, -17.29296875, -15.5078125, -13.72265625, -11.9375, -10.15234375, -8.3671875, -6.58203125, -4.796875, -3.01171875, -1.2265625, 0.55859375, 2.34375, 4.12890625, 5.9140625, 7.69921875, 9.484375, 11.26953125, 13.0546875, 14.83984375, 16.625, 18.41015625, 20.1953125, 21.98046875, 23.765625, 25.55078125, 27.3359375, 29.12109375, 30.90625, 32.69140625, 34.4765625, 36.26171875, 38.046875, 39.83203125, 41.6171875, 43.40234375, 45.1875, 46.97265625, 48.7578125, 50.54296875, 52.328125, 54.11328125, 55.8984375, 57.68359375, 59.46875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 15.0, 18.0, 29.0, 26.0, 40.0, 56.0, 67.0, 103.0, 103.0, 108.0, 112.0, 75.0, 67.0, 43.0, 28.0, 28.0, 21.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.564697265625, -11.06689453125, -10.569091796875, -10.0712890625, -9.573486328125, -9.07568359375, -8.577880859375, -8.080078125, -7.582275390625, -7.08447265625, -6.586669921875, -6.0888671875, -5.591064453125, -5.09326171875, -4.595458984375, -4.09765625, -3.599853515625, -3.10205078125, -2.604248046875, -2.1064453125, -1.608642578125, -1.11083984375, -0.613037109375, -0.115234375, 0.382568359375, 0.88037109375, 1.378173828125, 1.8759765625, 2.373779296875, 2.87158203125, 3.369384765625, 3.8671875, 4.364990234375, 4.86279296875, 5.360595703125, 5.8583984375, 6.356201171875, 6.85400390625, 7.351806640625, 7.849609375, 8.347412109375, 8.84521484375, 9.343017578125, 9.8408203125, 10.338623046875, 10.83642578125, 11.334228515625, 11.83203125, 12.329833984375, 12.82763671875, 13.325439453125, 13.8232421875, 14.321044921875, 14.81884765625, 15.316650390625, 15.814453125, 16.312255859375, 16.81005859375, 17.307861328125, 17.8056640625, 18.303466796875, 18.80126953125, 19.299072265625, 19.796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 6.0, 13.0, 13.0, 16.0, 22.0, 26.0, 33.0, 35.0, 28.0, 35.0, 42.0, 46.0, 49.0, 51.0, 56.0, 40.0, 59.0, 49.0, 36.0, 56.0, 33.0, 41.0, 35.0, 26.0, 22.0, 25.0, 12.0, 21.0, 6.0, 10.0, 9.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.917936325073242, -23.992137908935547, -23.06633758544922, -22.14053726196289, -21.214738845825195, -20.2889404296875, -19.363140106201172, -18.437339782714844, -17.51154136657715, -16.585742950439453, -15.659942626953125, -14.734143257141113, -13.808343887329102, -12.88254451751709, -11.956745147705078, -11.030945777893066, -10.105146408081055, -9.179347038269043, -8.253547668457031, -7.3277482986450195, -6.401948928833008, -5.476149559020996, -4.550350189208984, -3.6245508193969727, -2.698751449584961, -1.7729520797729492, -0.8471527099609375, 0.07864665985107422, 1.004446029663086, 1.9302453994750977, 2.8560447692871094, 3.781844139099121, 4.707645416259766, 5.633444786071777, 6.559244155883789, 7.485043525695801, 8.410842895507812, 9.336642265319824, 10.262441635131836, 11.188241004943848, 12.11404037475586, 13.039839744567871, 13.965639114379883, 14.891438484191895, 15.817237854003906, 16.743038177490234, 17.66883659362793, 18.594635009765625, 19.520435333251953, 20.44623565673828, 21.372034072875977, 22.297832489013672, 23.2236328125, 24.149433135986328, 25.075231552124023, 26.00102996826172, 26.926830291748047, 27.852630615234375, 28.77842903137207, 29.704227447509766, 30.630027770996094, 31.555828094482422, 32.48162841796875, 33.40742492675781, 34.33322525024414]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 7.0, 10.0, 2.0, 7.0, 13.0, 20.0, 19.0, 15.0, 23.0, 30.0, 21.0, 31.0, 34.0, 36.0, 34.0, 28.0, 42.0, 49.0, 43.0, 50.0, 39.0, 33.0, 37.0, 43.0, 37.0, 39.0, 34.0, 31.0, 30.0, 34.0, 25.0, 20.0, 16.0, 11.0, 9.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.683778762817383, -27.73978614807129, -26.795791625976562, -25.85179901123047, -24.907806396484375, -23.96381378173828, -23.019819259643555, -22.07582664489746, -21.131832122802734, -20.18783950805664, -19.243844985961914, -18.29985237121582, -17.355859756469727, -16.411865234375, -15.467872619628906, -14.523880004882812, -13.579887390136719, -12.635893821716309, -11.691901206970215, -10.747907638549805, -9.803915023803711, -8.8599214553833, -7.915927886962891, -6.971934795379639, -6.027941703796387, -5.083948612213135, -4.139955520629883, -3.1959619522094727, -2.2519688606262207, -1.3079757690429688, -0.3639822006225586, 0.5800108909606934, 1.5240020751953125, 2.4679951667785645, 3.4119884967803955, 4.355981826782227, 5.2999749183654785, 6.2439680099487305, 7.187961578369141, 8.131954193115234, 9.075947761535645, 10.019941329956055, 10.963933944702148, 11.907927513122559, 12.851921081542969, 13.795913696289062, 14.739907264709473, 15.683900833129883, 16.627893447875977, 17.57188606262207, 18.515880584716797, 19.45987319946289, 20.403865814208984, 21.347858428955078, 22.291852951049805, 23.2358455657959, 24.179840087890625, 25.12383270263672, 26.067827224731445, 27.01181983947754, 27.955812454223633, 28.89980697631836, 29.843799591064453, 30.787792205810547, 31.73178482055664]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 21.0, 30.0, 47.0, 82.0, 144.0, 207.0, 300.0, 550.0, 874.0, 1375.0, 2201.0, 3635.0, 6150.0, 10082.0, 17651.0, 30637.0, 54524.0, 97698.0, 181161.0, 326954.0, 547768.0, 748570.0, 765307.0, 587540.0, 361849.0, 200562.0, 108621.0, 60020.0, 33511.0, 18891.0, 11013.0, 6461.0, 3810.0, 2312.0, 1380.0, 855.0, 555.0, 335.0, 213.0, 135.0, 78.0, 47.0, 40.0, 31.0, 12.0, 13.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.46875, -23.6552734375, -22.841796875, -22.0283203125, -21.21484375, -20.4013671875, -19.587890625, -18.7744140625, -17.9609375, -17.1474609375, -16.333984375, -15.5205078125, -14.70703125, -13.8935546875, -13.080078125, -12.2666015625, -11.453125, -10.6396484375, -9.826171875, -9.0126953125, -8.19921875, -7.3857421875, -6.572265625, -5.7587890625, -4.9453125, -4.1318359375, -3.318359375, -2.5048828125, -1.69140625, -0.8779296875, -0.064453125, 0.7490234375, 1.5625, 2.3759765625, 3.189453125, 4.0029296875, 4.81640625, 5.6298828125, 6.443359375, 7.2568359375, 8.0703125, 8.8837890625, 9.697265625, 10.5107421875, 11.32421875, 12.1376953125, 12.951171875, 13.7646484375, 14.578125, 15.3916015625, 16.205078125, 17.0185546875, 17.83203125, 18.6455078125, 19.458984375, 20.2724609375, 21.0859375, 21.8994140625, 22.712890625, 23.5263671875, 24.33984375, 25.1533203125, 25.966796875, 26.7802734375, 27.59375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 10.0, 12.0, 11.0, 11.0, 11.0, 17.0, 19.0, 25.0, 28.0, 26.0, 33.0, 36.0, 36.0, 39.0, 34.0, 47.0, 41.0, 49.0, 34.0, 50.0, 57.0, 41.0, 38.0, 36.0, 28.0, 39.0, 28.0, 30.0, 34.0, 20.0, 17.0, 19.0, 8.0, 6.0, 15.0, 4.0, 5.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.12353515625, -22.2783203125, -21.43310546875, -20.587890625, -19.74267578125, -18.8974609375, -18.05224609375, -17.20703125, -16.36181640625, -15.5166015625, -14.67138671875, -13.826171875, -12.98095703125, -12.1357421875, -11.29052734375, -10.4453125, -9.60009765625, -8.7548828125, -7.90966796875, -7.064453125, -6.21923828125, -5.3740234375, -4.52880859375, -3.68359375, -2.83837890625, -1.9931640625, -1.14794921875, -0.302734375, 0.54248046875, 1.3876953125, 2.23291015625, 3.078125, 3.92333984375, 4.7685546875, 5.61376953125, 6.458984375, 7.30419921875, 8.1494140625, 8.99462890625, 9.83984375, 10.68505859375, 11.5302734375, 12.37548828125, 13.220703125, 14.06591796875, 14.9111328125, 15.75634765625, 16.6015625, 17.44677734375, 18.2919921875, 19.13720703125, 19.982421875, 20.82763671875, 21.6728515625, 22.51806640625, 23.36328125, 24.20849609375, 25.0537109375, 25.89892578125, 26.744140625, 27.58935546875, 28.4345703125, 29.27978515625, 30.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 16.0, 21.0, 37.0, 44.0, 69.0, 118.0, 151.0, 290.0, 420.0, 757.0, 1215.0, 2198.0, 3718.0, 6507.0, 11509.0, 21253.0, 39549.0, 74316.0, 143192.0, 274206.0, 492360.0, 760670.0, 858059.0, 659231.0, 394222.0, 212372.0, 110929.0, 57812.0, 30474.0, 16796.0, 9220.0, 5179.0, 3013.0, 1681.0, 1041.0, 617.0, 359.0, 221.0, 163.0, 82.0, 62.0, 45.0, 24.0, 19.0, 11.0, 9.0, 10.0, 3.0, 6.0, 0.0, 1.0], "bins": [-36.0, -34.980224609375, -33.96044921875, -32.940673828125, -31.9208984375, -30.901123046875, -29.88134765625, -28.861572265625, -27.841796875, -26.822021484375, -25.80224609375, -24.782470703125, -23.7626953125, -22.742919921875, -21.72314453125, -20.703369140625, -19.68359375, -18.663818359375, -17.64404296875, -16.624267578125, -15.6044921875, -14.584716796875, -13.56494140625, -12.545166015625, -11.525390625, -10.505615234375, -9.48583984375, -8.466064453125, -7.4462890625, -6.426513671875, -5.40673828125, -4.386962890625, -3.3671875, -2.347412109375, -1.32763671875, -0.307861328125, 0.7119140625, 1.731689453125, 2.75146484375, 3.771240234375, 4.791015625, 5.810791015625, 6.83056640625, 7.850341796875, 8.8701171875, 9.889892578125, 10.90966796875, 11.929443359375, 12.94921875, 13.968994140625, 14.98876953125, 16.008544921875, 17.0283203125, 18.048095703125, 19.06787109375, 20.087646484375, 21.107421875, 22.127197265625, 23.14697265625, 24.166748046875, 25.1865234375, 26.206298828125, 27.22607421875, 28.245849609375, 29.265625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 8.0, 11.0, 18.0, 23.0, 30.0, 27.0, 46.0, 54.0, 84.0, 87.0, 116.0, 149.0, 167.0, 184.0, 211.0, 245.0, 245.0, 286.0, 280.0, 278.0, 239.0, 248.0, 190.0, 156.0, 153.0, 109.0, 89.0, 74.0, 60.0, 39.0, 41.0, 25.0, 18.0, 25.0, 10.0, 14.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.4609375, -14.0726318359375, -13.684326171875, -13.2960205078125, -12.90771484375, -12.5194091796875, -12.131103515625, -11.7427978515625, -11.3544921875, -10.9661865234375, -10.577880859375, -10.1895751953125, -9.80126953125, -9.4129638671875, -9.024658203125, -8.6363525390625, -8.248046875, -7.8597412109375, -7.471435546875, -7.0831298828125, -6.69482421875, -6.3065185546875, -5.918212890625, -5.5299072265625, -5.1416015625, -4.7532958984375, -4.364990234375, -3.9766845703125, -3.58837890625, -3.2000732421875, -2.811767578125, -2.4234619140625, -2.03515625, -1.6468505859375, -1.258544921875, -0.8702392578125, -0.48193359375, -0.0936279296875, 0.294677734375, 0.6829833984375, 1.0712890625, 1.4595947265625, 1.847900390625, 2.2362060546875, 2.62451171875, 3.0128173828125, 3.401123046875, 3.7894287109375, 4.177734375, 4.5660400390625, 4.954345703125, 5.3426513671875, 5.73095703125, 6.1192626953125, 6.507568359375, 6.8958740234375, 7.2841796875, 7.6724853515625, 8.060791015625, 8.4490966796875, 8.83740234375, 9.2257080078125, 9.614013671875, 10.0023193359375, 10.390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 4.0, 14.0, 14.0, 15.0, 15.0, 23.0, 20.0, 36.0, 36.0, 36.0, 42.0, 32.0, 32.0, 57.0, 50.0, 56.0, 51.0, 59.0, 46.0, 51.0, 47.0, 37.0, 26.0, 27.0, 17.0, 25.0, 25.0, 12.0, 15.0, 11.0, 13.0, 8.0, 8.0, 8.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.204660415649414, -25.30303192138672, -24.401405334472656, -23.49977684020996, -22.598148345947266, -21.696521759033203, -20.794893264770508, -19.893264770507812, -18.99163818359375, -18.090009689331055, -17.188383102416992, -16.286754608154297, -15.385126113891602, -14.483498573303223, -13.581871032714844, -12.680242538452148, -11.778614044189453, -10.876986503601074, -9.975358009338379, -9.07373046875, -8.172101974487305, -7.270474433898926, -6.368846893310547, -5.46721887588501, -4.565590858459473, -3.6639628410339355, -2.7623350620269775, -1.8607072830200195, -0.9590792655944824, -0.05745124816894531, 0.8441762924194336, 1.7458043098449707, 2.6474342346191406, 3.5490622520446777, 4.450690269470215, 5.352317810058594, 6.253945827484131, 7.155573844909668, 8.057201385498047, 8.958829879760742, 9.860457420349121, 10.7620849609375, 11.663713455200195, 12.565340995788574, 13.466968536376953, 14.368597030639648, 15.270224571228027, 16.171852111816406, 17.0734806060791, 17.975109100341797, 18.87673568725586, 19.778364181518555, 20.67999267578125, 21.581619262695312, 22.483247756958008, 23.384876251220703, 24.286502838134766, 25.18813133239746, 26.089757919311523, 26.99138641357422, 27.893014907836914, 28.79464340209961, 29.696269989013672, 30.597898483276367, 31.499526977539062]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 8.0, 7.0, 12.0, 13.0, 12.0, 27.0, 13.0, 28.0, 12.0, 23.0, 23.0, 27.0, 28.0, 30.0, 34.0, 33.0, 50.0, 42.0, 33.0, 49.0, 45.0, 54.0, 42.0, 37.0, 30.0, 45.0, 33.0, 31.0, 21.0, 26.0, 16.0, 15.0, 14.0, 19.0, 12.0, 19.0, 7.0, 9.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.648866653442383, -26.766971588134766, -25.885074615478516, -25.0031795501709, -24.12128448486328, -23.23938751220703, -22.357492446899414, -21.475597381591797, -20.593700408935547, -19.71180534362793, -18.82990837097168, -17.948013305664062, -17.066118240356445, -16.184223175048828, -15.302326202392578, -14.420431137084961, -13.538536071777344, -12.65664005279541, -11.774744987487793, -10.89284896850586, -10.010953903198242, -9.129057884216309, -8.247161865234375, -7.3652663230896, -6.483370780944824, -5.601475238800049, -4.719579696655273, -3.83768367767334, -2.9557881355285645, -2.073892593383789, -1.1919965744018555, -0.3101010322570801, 0.5717926025390625, 1.4536882638931274, 2.3355839252471924, 3.217479705810547, 4.099375247955322, 4.981270790100098, 5.863166809082031, 6.745062351226807, 7.626957893371582, 8.508853912353516, 9.390748977661133, 10.272644996643066, 11.154541015625, 12.036436080932617, 12.91833209991455, 13.800228118896484, 14.682123184204102, 15.564019203186035, 16.44591522216797, 17.327810287475586, 18.209705352783203, 19.091602325439453, 19.97349739074707, 20.855392456054688, 21.737289428710938, 22.619184494018555, 23.501081466674805, 24.382976531982422, 25.26487159729004, 26.146766662597656, 27.028663635253906, 27.910558700561523, 28.79245376586914]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 23.0, 19.0, 28.0, 32.0, 55.0, 83.0, 137.0, 178.0, 220.0, 334.0, 476.0, 718.0, 990.0, 1494.0, 2409.0, 3759.0, 6065.0, 10199.0, 17286.0, 30708.0, 56765.0, 109912.0, 200249.0, 245652.0, 166052.0, 86842.0, 45487.0, 25086.0, 14256.0, 8412.0, 5213.0, 3191.0, 2070.0, 1326.0, 841.0, 578.0, 428.0, 292.0, 221.0, 126.0, 92.0, 77.0, 59.0, 32.0, 28.0, 20.0, 15.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-44.9375, -43.54736328125, -42.1572265625, -40.76708984375, -39.376953125, -37.98681640625, -36.5966796875, -35.20654296875, -33.81640625, -32.42626953125, -31.0361328125, -29.64599609375, -28.255859375, -26.86572265625, -25.4755859375, -24.08544921875, -22.6953125, -21.30517578125, -19.9150390625, -18.52490234375, -17.134765625, -15.74462890625, -14.3544921875, -12.96435546875, -11.57421875, -10.18408203125, -8.7939453125, -7.40380859375, -6.013671875, -4.62353515625, -3.2333984375, -1.84326171875, -0.453125, 0.93701171875, 2.3271484375, 3.71728515625, 5.107421875, 6.49755859375, 7.8876953125, 9.27783203125, 10.66796875, 12.05810546875, 13.4482421875, 14.83837890625, 16.228515625, 17.61865234375, 19.0087890625, 20.39892578125, 21.7890625, 23.17919921875, 24.5693359375, 25.95947265625, 27.349609375, 28.73974609375, 30.1298828125, 31.52001953125, 32.91015625, 34.30029296875, 35.6904296875, 37.08056640625, 38.470703125, 39.86083984375, 41.2509765625, 42.64111328125, 44.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 6.0, 4.0, 3.0, 9.0, 12.0, 3.0, 16.0, 16.0, 19.0, 21.0, 25.0, 18.0, 24.0, 25.0, 29.0, 29.0, 30.0, 37.0, 34.0, 47.0, 50.0, 35.0, 51.0, 47.0, 43.0, 45.0, 37.0, 42.0, 38.0, 23.0, 24.0, 26.0, 19.0, 18.0, 16.0, 14.0, 12.0, 8.0, 12.0, 13.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.671875, -24.80126953125, -23.9306640625, -23.06005859375, -22.189453125, -21.31884765625, -20.4482421875, -19.57763671875, -18.70703125, -17.83642578125, -16.9658203125, -16.09521484375, -15.224609375, -14.35400390625, -13.4833984375, -12.61279296875, -11.7421875, -10.87158203125, -10.0009765625, -9.13037109375, -8.259765625, -7.38916015625, -6.5185546875, -5.64794921875, -4.77734375, -3.90673828125, -3.0361328125, -2.16552734375, -1.294921875, -0.42431640625, 0.4462890625, 1.31689453125, 2.1875, 3.05810546875, 3.9287109375, 4.79931640625, 5.669921875, 6.54052734375, 7.4111328125, 8.28173828125, 9.15234375, 10.02294921875, 10.8935546875, 11.76416015625, 12.634765625, 13.50537109375, 14.3759765625, 15.24658203125, 16.1171875, 16.98779296875, 17.8583984375, 18.72900390625, 19.599609375, 20.47021484375, 21.3408203125, 22.21142578125, 23.08203125, 23.95263671875, 24.8232421875, 25.69384765625, 26.564453125, 27.43505859375, 28.3056640625, 29.17626953125, 30.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 22.0, 24.0, 36.0, 57.0, 92.0, 128.0, 199.0, 289.0, 432.0, 686.0, 1170.0, 1943.0, 3297.0, 5702.0, 10592.0, 20392.0, 42266.0, 97294.0, 232380.0, 324786.0, 169309.0, 70000.0, 31657.0, 15793.0, 8390.0, 4565.0, 2741.0, 1609.0, 998.0, 570.0, 384.0, 257.0, 168.0, 103.0, 53.0, 44.0, 41.0, 17.0, 8.0, 16.0, 13.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-62.8125, -61.03369140625, -59.2548828125, -57.47607421875, -55.697265625, -53.91845703125, -52.1396484375, -50.36083984375, -48.58203125, -46.80322265625, -45.0244140625, -43.24560546875, -41.466796875, -39.68798828125, -37.9091796875, -36.13037109375, -34.3515625, -32.57275390625, -30.7939453125, -29.01513671875, -27.236328125, -25.45751953125, -23.6787109375, -21.89990234375, -20.12109375, -18.34228515625, -16.5634765625, -14.78466796875, -13.005859375, -11.22705078125, -9.4482421875, -7.66943359375, -5.890625, -4.11181640625, -2.3330078125, -0.55419921875, 1.224609375, 3.00341796875, 4.7822265625, 6.56103515625, 8.33984375, 10.11865234375, 11.8974609375, 13.67626953125, 15.455078125, 17.23388671875, 19.0126953125, 20.79150390625, 22.5703125, 24.34912109375, 26.1279296875, 27.90673828125, 29.685546875, 31.46435546875, 33.2431640625, 35.02197265625, 36.80078125, 38.57958984375, 40.3583984375, 42.13720703125, 43.916015625, 45.69482421875, 47.4736328125, 49.25244140625, 51.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 14.0, 12.0, 27.0, 23.0, 33.0, 44.0, 40.0, 36.0, 43.0, 68.0, 64.0, 57.0, 53.0, 46.0, 58.0, 52.0, 56.0, 62.0, 30.0, 40.0, 26.0, 19.0, 13.0, 20.0, 12.0, 8.0, 8.0, 4.0, 1.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.435791015625, -32.46533203125, -31.494873046875, -30.5244140625, -29.553955078125, -28.58349609375, -27.613037109375, -26.642578125, -25.672119140625, -24.70166015625, -23.731201171875, -22.7607421875, -21.790283203125, -20.81982421875, -19.849365234375, -18.87890625, -17.908447265625, -16.93798828125, -15.967529296875, -14.9970703125, -14.026611328125, -13.05615234375, -12.085693359375, -11.115234375, -10.144775390625, -9.17431640625, -8.203857421875, -7.2333984375, -6.262939453125, -5.29248046875, -4.322021484375, -3.3515625, -2.381103515625, -1.41064453125, -0.440185546875, 0.5302734375, 1.500732421875, 2.47119140625, 3.441650390625, 4.412109375, 5.382568359375, 6.35302734375, 7.323486328125, 8.2939453125, 9.264404296875, 10.23486328125, 11.205322265625, 12.17578125, 13.146240234375, 14.11669921875, 15.087158203125, 16.0576171875, 17.028076171875, 17.99853515625, 18.968994140625, 19.939453125, 20.909912109375, 21.88037109375, 22.850830078125, 23.8212890625, 24.791748046875, 25.76220703125, 26.732666015625, 27.703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 15.0, 23.0, 27.0, 38.0, 60.0, 64.0, 77.0, 134.0, 188.0, 228.0, 324.0, 495.0, 669.0, 918.0, 1400.0, 1897.0, 2849.0, 4230.0, 6612.0, 10572.0, 19720.0, 51259.0, 261841.0, 519958.0, 98304.0, 28848.0, 13899.0, 7980.0, 4905.0, 3321.0, 2328.0, 1607.0, 1100.0, 736.0, 529.0, 374.0, 277.0, 171.0, 154.0, 95.0, 90.0, 69.0, 44.0, 30.0, 23.0, 15.0, 12.0, 5.0, 4.0, 12.0, 7.0, 5.0], "bins": [-44.3125, -43.0546875, -41.796875, -40.5390625, -39.28125, -38.0234375, -36.765625, -35.5078125, -34.25, -32.9921875, -31.734375, -30.4765625, -29.21875, -27.9609375, -26.703125, -25.4453125, -24.1875, -22.9296875, -21.671875, -20.4140625, -19.15625, -17.8984375, -16.640625, -15.3828125, -14.125, -12.8671875, -11.609375, -10.3515625, -9.09375, -7.8359375, -6.578125, -5.3203125, -4.0625, -2.8046875, -1.546875, -0.2890625, 0.96875, 2.2265625, 3.484375, 4.7421875, 6.0, 7.2578125, 8.515625, 9.7734375, 11.03125, 12.2890625, 13.546875, 14.8046875, 16.0625, 17.3203125, 18.578125, 19.8359375, 21.09375, 22.3515625, 23.609375, 24.8671875, 26.125, 27.3828125, 28.640625, 29.8984375, 31.15625, 32.4140625, 33.671875, 34.9296875, 36.1875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 10.0, 12.0, 23.0, 33.0, 172.0, 392.0, 171.0, 54.0, 24.0, 12.0, 14.0, 9.0, 8.0, 3.0, 4.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0084381103515625, -0.008170723915100098, -0.007903337478637695, -0.007635951042175293, -0.007368564605712891, -0.007101178169250488, -0.006833791732788086, -0.006566405296325684, -0.006299018859863281, -0.006031632423400879, -0.0057642459869384766, -0.005496859550476074, -0.005229473114013672, -0.0049620866775512695, -0.004694700241088867, -0.004427313804626465, -0.0041599273681640625, -0.00389254093170166, -0.003625154495239258, -0.0033577680587768555, -0.003090381622314453, -0.0028229951858520508, -0.0025556087493896484, -0.002288222312927246, -0.0020208358764648438, -0.0017534494400024414, -0.001486063003540039, -0.0012186765670776367, -0.0009512901306152344, -0.000683903694152832, -0.0004165172576904297, -0.00014913082122802734, 0.000118255615234375, 0.00038564205169677734, 0.0006530284881591797, 0.000920414924621582, 0.0011878013610839844, 0.0014551877975463867, 0.001722574234008789, 0.0019899606704711914, 0.0022573471069335938, 0.002524733543395996, 0.0027921199798583984, 0.0030595064163208008, 0.003326892852783203, 0.0035942792892456055, 0.003861665725708008, 0.00412905216217041, 0.0043964385986328125, 0.004663825035095215, 0.004931211471557617, 0.0051985979080200195, 0.005465984344482422, 0.005733370780944824, 0.0060007572174072266, 0.006268143653869629, 0.006535530090332031, 0.006802916526794434, 0.007070302963256836, 0.007337689399719238, 0.007605075836181641, 0.007872462272644043, 0.008139848709106445, 0.008407235145568848, 0.00867462158203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 13.0, 10.0, 23.0, 39.0, 46.0, 77.0, 95.0, 142.0, 222.0, 394.0, 591.0, 979.0, 1541.0, 2569.0, 4588.0, 7824.0, 14355.0, 29607.0, 100954.0, 492144.0, 288116.0, 56150.0, 21425.0, 11156.0, 6205.0, 3638.0, 2173.0, 1375.0, 790.0, 498.0, 290.0, 174.0, 116.0, 74.0, 56.0, 30.0, 28.0, 12.0, 11.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.15625, -45.57373046875, -43.9912109375, -42.40869140625, -40.826171875, -39.24365234375, -37.6611328125, -36.07861328125, -34.49609375, -32.91357421875, -31.3310546875, -29.74853515625, -28.166015625, -26.58349609375, -25.0009765625, -23.41845703125, -21.8359375, -20.25341796875, -18.6708984375, -17.08837890625, -15.505859375, -13.92333984375, -12.3408203125, -10.75830078125, -9.17578125, -7.59326171875, -6.0107421875, -4.42822265625, -2.845703125, -1.26318359375, 0.3193359375, 1.90185546875, 3.484375, 5.06689453125, 6.6494140625, 8.23193359375, 9.814453125, 11.39697265625, 12.9794921875, 14.56201171875, 16.14453125, 17.72705078125, 19.3095703125, 20.89208984375, 22.474609375, 24.05712890625, 25.6396484375, 27.22216796875, 28.8046875, 30.38720703125, 31.9697265625, 33.55224609375, 35.134765625, 36.71728515625, 38.2998046875, 39.88232421875, 41.46484375, 43.04736328125, 44.6298828125, 46.21240234375, 47.794921875, 49.37744140625, 50.9599609375, 52.54248046875, 54.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 10.0, 10.0, 15.0, 24.0, 39.0, 62.0, 95.0, 168.0, 152.0, 139.0, 81.0, 49.0, 30.0, 16.0, 11.0, 12.0, 4.0, 10.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.6873779296875, -15.187255859375, -14.6871337890625, -14.18701171875, -13.6868896484375, -13.186767578125, -12.6866455078125, -12.1865234375, -11.6864013671875, -11.186279296875, -10.6861572265625, -10.18603515625, -9.6859130859375, -9.185791015625, -8.6856689453125, -8.185546875, -7.6854248046875, -7.185302734375, -6.6851806640625, -6.18505859375, -5.6849365234375, -5.184814453125, -4.6846923828125, -4.1845703125, -3.6844482421875, -3.184326171875, -2.6842041015625, -2.18408203125, -1.6839599609375, -1.183837890625, -0.6837158203125, -0.18359375, 0.3165283203125, 0.816650390625, 1.3167724609375, 1.81689453125, 2.3170166015625, 2.817138671875, 3.3172607421875, 3.8173828125, 4.3175048828125, 4.817626953125, 5.3177490234375, 5.81787109375, 6.3179931640625, 6.818115234375, 7.3182373046875, 7.818359375, 8.3184814453125, 8.818603515625, 9.3187255859375, 9.81884765625, 10.3189697265625, 10.819091796875, 11.3192138671875, 11.8193359375, 12.3194580078125, 12.819580078125, 13.3197021484375, 13.81982421875, 14.3199462890625, 14.820068359375, 15.3201904296875, 15.8203125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 12.0, 3.0, 5.0, 9.0, 10.0, 13.0, 15.0, 16.0, 22.0, 28.0, 39.0, 55.0, 51.0, 55.0, 49.0, 61.0, 56.0, 65.0, 45.0, 64.0, 60.0, 37.0, 44.0, 33.0, 24.0, 24.0, 29.0, 19.0, 13.0, 16.0, 7.0, 6.0, 9.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.815786361694336, -28.7351131439209, -27.654438018798828, -26.57376480102539, -25.493091583251953, -24.412418365478516, -23.331743240356445, -22.251070022583008, -21.170394897460938, -20.0897216796875, -19.00904655456543, -17.928373336791992, -16.847700119018555, -15.7670259475708, -14.686351776123047, -13.60567855834961, -12.525005340576172, -11.444331169128418, -10.36365795135498, -9.282983779907227, -8.202310562133789, -7.121636390686035, -6.040962219238281, -4.9602885246276855, -3.87961483001709, -2.798941135406494, -1.7182672023773193, -0.6375932693481445, 0.44308042526245117, 1.5237541198730469, 2.604428291320801, 3.6851019859313965, 4.765777587890625, 5.846451282501221, 6.927124977111816, 8.00779914855957, 9.088472366333008, 10.169146537780762, 11.249820709228516, 12.330493927001953, 13.411168098449707, 14.491842269897461, 15.572515487670898, 16.65319061279297, 17.733863830566406, 18.814537048339844, 19.89521026611328, 20.97588539123535, 22.05655860900879, 23.137231826782227, 24.217906951904297, 25.298580169677734, 26.379253387451172, 27.45992660522461, 28.54060173034668, 29.621274948120117, 30.701950073242188, 31.782623291015625, 32.86329650878906, 33.9439697265625, 35.0246467590332, 36.10531997680664, 37.18599319458008, 38.266666412353516, 39.34733963012695]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 5.0, 11.0, 8.0, 21.0, 20.0, 13.0, 24.0, 17.0, 25.0, 33.0, 30.0, 38.0, 38.0, 30.0, 47.0, 33.0, 42.0, 42.0, 37.0, 49.0, 46.0, 44.0, 50.0, 38.0, 39.0, 26.0, 30.0, 21.0, 25.0, 28.0, 17.0, 16.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.58155059814453, -26.625232696533203, -25.668916702270508, -24.71259880065918, -23.756282806396484, -22.799964904785156, -21.84364891052246, -20.887331008911133, -19.931015014648438, -18.97469711303711, -18.018381118774414, -17.062063217163086, -16.10574722290039, -15.149429321289062, -14.193113327026367, -13.236795425415039, -12.280478477478027, -11.324161529541016, -10.367844581604004, -9.411527633666992, -8.45521068572998, -7.4988932609558105, -6.542576313018799, -5.586259365081787, -4.629942417144775, -3.6736254692077637, -2.717308521270752, -1.7609913349151611, -0.8046743869781494, 0.1516427993774414, 1.1079597473144531, 2.064276695251465, 3.0205936431884766, 3.9769105911254883, 4.9332275390625, 5.889544486999512, 6.845861434936523, 7.802178859710693, 8.758495330810547, 9.714813232421875, 10.67112922668457, 11.627446174621582, 12.583763122558594, 13.540080070495605, 14.496397018432617, 15.452714920043945, 16.40903091430664, 17.36534881591797, 18.321666717529297, 19.277984619140625, 20.23430061340332, 21.19061851501465, 22.146934509277344, 23.103252410888672, 24.059568405151367, 25.015886306762695, 25.97220230102539, 26.92852020263672, 27.884836196899414, 28.841154098510742, 29.797470092773438, 30.753787994384766, 31.71010398864746, 32.666419982910156, 33.622737884521484]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 9.0, 30.0, 37.0, 53.0, 82.0, 130.0, 203.0, 308.0, 487.0, 768.0, 1125.0, 1865.0, 2887.0, 4666.0, 7599.0, 11832.0, 19014.0, 29574.0, 46537.0, 68938.0, 96982.0, 124774.0, 141477.0, 136109.0, 111797.0, 82614.0, 57115.0, 37283.0, 23539.0, 14905.0, 9446.0, 6013.0, 3752.0, 2376.0, 1539.0, 941.0, 615.0, 423.0, 267.0, 148.0, 98.0, 58.0, 41.0, 24.0, 20.0, 20.0, 4.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-29.484375, -28.61083984375, -27.7373046875, -26.86376953125, -25.990234375, -25.11669921875, -24.2431640625, -23.36962890625, -22.49609375, -21.62255859375, -20.7490234375, -19.87548828125, -19.001953125, -18.12841796875, -17.2548828125, -16.38134765625, -15.5078125, -14.63427734375, -13.7607421875, -12.88720703125, -12.013671875, -11.14013671875, -10.2666015625, -9.39306640625, -8.51953125, -7.64599609375, -6.7724609375, -5.89892578125, -5.025390625, -4.15185546875, -3.2783203125, -2.40478515625, -1.53125, -0.65771484375, 0.2158203125, 1.08935546875, 1.962890625, 2.83642578125, 3.7099609375, 4.58349609375, 5.45703125, 6.33056640625, 7.2041015625, 8.07763671875, 8.951171875, 9.82470703125, 10.6982421875, 11.57177734375, 12.4453125, 13.31884765625, 14.1923828125, 15.06591796875, 15.939453125, 16.81298828125, 17.6865234375, 18.56005859375, 19.43359375, 20.30712890625, 21.1806640625, 22.05419921875, 22.927734375, 23.80126953125, 24.6748046875, 25.54833984375, 26.421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 8.0, 6.0, 14.0, 6.0, 20.0, 24.0, 16.0, 15.0, 23.0, 30.0, 28.0, 36.0, 34.0, 34.0, 37.0, 44.0, 50.0, 43.0, 53.0, 51.0, 49.0, 55.0, 40.0, 40.0, 26.0, 40.0, 30.0, 29.0, 22.0, 18.0, 21.0, 12.0, 9.0, 9.0, 4.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.078125, -27.083251953125, -26.08837890625, -25.093505859375, -24.0986328125, -23.103759765625, -22.10888671875, -21.114013671875, -20.119140625, -19.124267578125, -18.12939453125, -17.134521484375, -16.1396484375, -15.144775390625, -14.14990234375, -13.155029296875, -12.16015625, -11.165283203125, -10.17041015625, -9.175537109375, -8.1806640625, -7.185791015625, -6.19091796875, -5.196044921875, -4.201171875, -3.206298828125, -2.21142578125, -1.216552734375, -0.2216796875, 0.773193359375, 1.76806640625, 2.762939453125, 3.7578125, 4.752685546875, 5.74755859375, 6.742431640625, 7.7373046875, 8.732177734375, 9.72705078125, 10.721923828125, 11.716796875, 12.711669921875, 13.70654296875, 14.701416015625, 15.6962890625, 16.691162109375, 17.68603515625, 18.680908203125, 19.67578125, 20.670654296875, 21.66552734375, 22.660400390625, 23.6552734375, 24.650146484375, 25.64501953125, 26.639892578125, 27.634765625, 28.629638671875, 29.62451171875, 30.619384765625, 31.6142578125, 32.609130859375, 33.60400390625, 34.598876953125, 35.59375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 11.0, 23.0, 26.0, 28.0, 45.0, 81.0, 107.0, 193.0, 343.0, 536.0, 914.0, 1673.0, 2870.0, 5250.0, 9889.0, 18584.0, 35513.0, 66306.0, 117412.0, 179854.0, 208078.0, 168507.0, 105873.0, 58829.0, 31403.0, 16669.0, 8659.0, 4681.0, 2621.0, 1460.0, 835.0, 441.0, 292.0, 202.0, 113.0, 68.0, 55.0, 31.0, 19.0, 17.0, 14.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-46.9375, -45.44287109375, -43.9482421875, -42.45361328125, -40.958984375, -39.46435546875, -37.9697265625, -36.47509765625, -34.98046875, -33.48583984375, -31.9912109375, -30.49658203125, -29.001953125, -27.50732421875, -26.0126953125, -24.51806640625, -23.0234375, -21.52880859375, -20.0341796875, -18.53955078125, -17.044921875, -15.55029296875, -14.0556640625, -12.56103515625, -11.06640625, -9.57177734375, -8.0771484375, -6.58251953125, -5.087890625, -3.59326171875, -2.0986328125, -0.60400390625, 0.890625, 2.38525390625, 3.8798828125, 5.37451171875, 6.869140625, 8.36376953125, 9.8583984375, 11.35302734375, 12.84765625, 14.34228515625, 15.8369140625, 17.33154296875, 18.826171875, 20.32080078125, 21.8154296875, 23.31005859375, 24.8046875, 26.29931640625, 27.7939453125, 29.28857421875, 30.783203125, 32.27783203125, 33.7724609375, 35.26708984375, 36.76171875, 38.25634765625, 39.7509765625, 41.24560546875, 42.740234375, 44.23486328125, 45.7294921875, 47.22412109375, 48.71875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 7.0, 4.0, 7.0, 6.0, 10.0, 11.0, 11.0, 10.0, 18.0, 27.0, 26.0, 30.0, 36.0, 37.0, 50.0, 36.0, 54.0, 48.0, 48.0, 50.0, 64.0, 53.0, 57.0, 47.0, 36.0, 42.0, 37.0, 32.0, 26.0, 16.0, 22.0, 11.0, 7.0, 7.0, 13.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.015625, -26.24169921875, -25.4677734375, -24.69384765625, -23.919921875, -23.14599609375, -22.3720703125, -21.59814453125, -20.82421875, -20.05029296875, -19.2763671875, -18.50244140625, -17.728515625, -16.95458984375, -16.1806640625, -15.40673828125, -14.6328125, -13.85888671875, -13.0849609375, -12.31103515625, -11.537109375, -10.76318359375, -9.9892578125, -9.21533203125, -8.44140625, -7.66748046875, -6.8935546875, -6.11962890625, -5.345703125, -4.57177734375, -3.7978515625, -3.02392578125, -2.25, -1.47607421875, -0.7021484375, 0.07177734375, 0.845703125, 1.61962890625, 2.3935546875, 3.16748046875, 3.94140625, 4.71533203125, 5.4892578125, 6.26318359375, 7.037109375, 7.81103515625, 8.5849609375, 9.35888671875, 10.1328125, 10.90673828125, 11.6806640625, 12.45458984375, 13.228515625, 14.00244140625, 14.7763671875, 15.55029296875, 16.32421875, 17.09814453125, 17.8720703125, 18.64599609375, 19.419921875, 20.19384765625, 20.9677734375, 21.74169921875, 22.515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 9.0, 13.0, 20.0, 31.0, 39.0, 61.0, 96.0, 134.0, 189.0, 297.0, 532.0, 775.0, 1351.0, 2183.0, 3690.0, 6456.0, 11488.0, 22805.0, 47416.0, 112802.0, 272519.0, 311081.0, 139947.0, 56761.0, 26551.0, 13515.0, 7439.0, 4049.0, 2335.0, 1464.0, 840.0, 555.0, 366.0, 258.0, 156.0, 94.0, 63.0, 57.0, 32.0, 22.0, 16.0, 9.0, 10.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.49462890625, -30.3330078125, -29.17138671875, -28.009765625, -26.84814453125, -25.6865234375, -24.52490234375, -23.36328125, -22.20166015625, -21.0400390625, -19.87841796875, -18.716796875, -17.55517578125, -16.3935546875, -15.23193359375, -14.0703125, -12.90869140625, -11.7470703125, -10.58544921875, -9.423828125, -8.26220703125, -7.1005859375, -5.93896484375, -4.77734375, -3.61572265625, -2.4541015625, -1.29248046875, -0.130859375, 1.03076171875, 2.1923828125, 3.35400390625, 4.515625, 5.67724609375, 6.8388671875, 8.00048828125, 9.162109375, 10.32373046875, 11.4853515625, 12.64697265625, 13.80859375, 14.97021484375, 16.1318359375, 17.29345703125, 18.455078125, 19.61669921875, 20.7783203125, 21.93994140625, 23.1015625, 24.26318359375, 25.4248046875, 26.58642578125, 27.748046875, 28.90966796875, 30.0712890625, 31.23291015625, 32.39453125, 33.55615234375, 34.7177734375, 35.87939453125, 37.041015625, 38.20263671875, 39.3642578125, 40.52587890625, 41.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 10.0, 9.0, 12.0, 14.0, 17.0, 26.0, 33.0, 42.0, 66.0, 73.0, 71.0, 79.0, 104.0, 92.0, 75.0, 58.0, 47.0, 29.0, 23.0, 20.0, 15.0, 9.0, 15.0, 6.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0035305023193359375, -0.003426879644393921, -0.0033232569694519043, -0.0032196342945098877, -0.003116011619567871, -0.0030123889446258545, -0.002908766269683838, -0.0028051435947418213, -0.0027015209197998047, -0.002597898244857788, -0.0024942755699157715, -0.002390652894973755, -0.0022870302200317383, -0.0021834075450897217, -0.002079784870147705, -0.0019761621952056885, -0.0018725395202636719, -0.0017689168453216553, -0.0016652941703796387, -0.001561671495437622, -0.0014580488204956055, -0.0013544261455535889, -0.0012508034706115723, -0.0011471807956695557, -0.001043558120727539, -0.0009399354457855225, -0.0008363127708435059, -0.0007326900959014893, -0.0006290674209594727, -0.0005254447460174561, -0.00042182207107543945, -0.00031819939613342285, -0.00021457672119140625, -0.00011095404624938965, -7.331371307373047e-06, 9.629130363464355e-05, 0.00019991397857666016, 0.00030353665351867676, 0.00040715932846069336, 0.00051078200340271, 0.0006144046783447266, 0.0007180273532867432, 0.0008216500282287598, 0.0009252727031707764, 0.001028895378112793, 0.0011325180530548096, 0.0012361407279968262, 0.0013397634029388428, 0.0014433860778808594, 0.001547008752822876, 0.0016506314277648926, 0.0017542541027069092, 0.0018578767776489258, 0.0019614994525909424, 0.002065122127532959, 0.0021687448024749756, 0.002272367477416992, 0.002375990152359009, 0.0024796128273010254, 0.002583235502243042, 0.0026868581771850586, 0.002790480852127075, 0.002894103527069092, 0.0029977262020111084, 0.003101348876953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 13.0, 10.0, 9.0, 13.0, 25.0, 33.0, 38.0, 45.0, 60.0, 101.0, 144.0, 180.0, 302.0, 424.0, 673.0, 1068.0, 1799.0, 3154.0, 5878.0, 12352.0, 28577.0, 78555.0, 232677.0, 381356.0, 190279.0, 63367.0, 24062.0, 10783.0, 5207.0, 2885.0, 1645.0, 925.0, 592.0, 405.0, 274.0, 191.0, 141.0, 74.0, 64.0, 45.0, 39.0, 28.0, 12.0, 21.0, 11.0, 4.0, 4.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.810546875, -35.55859375, -34.306640625, -33.0546875, -31.802734375, -30.55078125, -29.298828125, -28.046875, -26.794921875, -25.54296875, -24.291015625, -23.0390625, -21.787109375, -20.53515625, -19.283203125, -18.03125, -16.779296875, -15.52734375, -14.275390625, -13.0234375, -11.771484375, -10.51953125, -9.267578125, -8.015625, -6.763671875, -5.51171875, -4.259765625, -3.0078125, -1.755859375, -0.50390625, 0.748046875, 2.0, 3.251953125, 4.50390625, 5.755859375, 7.0078125, 8.259765625, 9.51171875, 10.763671875, 12.015625, 13.267578125, 14.51953125, 15.771484375, 17.0234375, 18.275390625, 19.52734375, 20.779296875, 22.03125, 23.283203125, 24.53515625, 25.787109375, 27.0390625, 28.291015625, 29.54296875, 30.794921875, 32.046875, 33.298828125, 34.55078125, 35.802734375, 37.0546875, 38.306640625, 39.55859375, 40.810546875, 42.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 16.0, 13.0, 11.0, 18.0, 19.0, 31.0, 35.0, 44.0, 52.0, 76.0, 57.0, 81.0, 73.0, 76.0, 64.0, 70.0, 54.0, 36.0, 37.0, 24.0, 19.0, 16.0, 21.0, 14.0, 12.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.890625, -10.5810546875, -10.271484375, -9.9619140625, -9.65234375, -9.3427734375, -9.033203125, -8.7236328125, -8.4140625, -8.1044921875, -7.794921875, -7.4853515625, -7.17578125, -6.8662109375, -6.556640625, -6.2470703125, -5.9375, -5.6279296875, -5.318359375, -5.0087890625, -4.69921875, -4.3896484375, -4.080078125, -3.7705078125, -3.4609375, -3.1513671875, -2.841796875, -2.5322265625, -2.22265625, -1.9130859375, -1.603515625, -1.2939453125, -0.984375, -0.6748046875, -0.365234375, -0.0556640625, 0.25390625, 0.5634765625, 0.873046875, 1.1826171875, 1.4921875, 1.8017578125, 2.111328125, 2.4208984375, 2.73046875, 3.0400390625, 3.349609375, 3.6591796875, 3.96875, 4.2783203125, 4.587890625, 4.8974609375, 5.20703125, 5.5166015625, 5.826171875, 6.1357421875, 6.4453125, 6.7548828125, 7.064453125, 7.3740234375, 7.68359375, 7.9931640625, 8.302734375, 8.6123046875, 8.921875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 12.0, 12.0, 8.0, 11.0, 13.0, 22.0, 31.0, 29.0, 46.0, 40.0, 46.0, 54.0, 58.0, 49.0, 62.0, 51.0, 56.0, 54.0, 38.0, 33.0, 39.0, 45.0, 42.0, 24.0, 19.0, 16.0, 13.0, 22.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.433563232421875, -26.409563064575195, -25.385562896728516, -24.361562728881836, -23.337562561035156, -22.31356430053711, -21.28956413269043, -20.26556396484375, -19.24156379699707, -18.21756362915039, -17.19356346130371, -16.16956329345703, -15.145564079284668, -14.121563911437988, -13.097564697265625, -12.073564529418945, -11.049564361572266, -10.025564193725586, -9.001564025878906, -7.977564811706543, -6.953564643859863, -5.929564476013184, -4.905564785003662, -3.8815650939941406, -2.857564926147461, -1.8335649967193604, -0.8095650672912598, 0.21443486213684082, 1.2384347915649414, 2.262434959411621, 3.2864346504211426, 4.310434341430664, 5.334434509277344, 6.358434677124023, 7.382434368133545, 8.406434059143066, 9.430434226989746, 10.454434394836426, 11.478433609008789, 12.502433776855469, 13.526433944702148, 14.550434112548828, 15.574434280395508, 16.598434448242188, 17.622432708740234, 18.646434783935547, 19.670433044433594, 20.694433212280273, 21.718433380126953, 22.742433547973633, 23.766433715820312, 24.790433883666992, 25.814434051513672, 26.83843231201172, 27.8624324798584, 28.886432647705078, 29.910432815551758, 30.934432983398438, 31.958433151245117, 32.9824333190918, 34.006431579589844, 35.030433654785156, 36.0544319152832, 37.07843017578125, 38.10243225097656]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 11.0, 10.0, 8.0, 24.0, 18.0, 21.0, 18.0, 30.0, 28.0, 24.0, 36.0, 37.0, 33.0, 32.0, 53.0, 40.0, 45.0, 39.0, 47.0, 42.0, 37.0, 40.0, 35.0, 29.0, 33.0, 36.0, 28.0, 16.0, 22.0, 17.0, 16.0, 17.0, 6.0, 11.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.413799285888672, -26.500789642333984, -25.587778091430664, -24.674766540527344, -23.761756896972656, -22.84874725341797, -21.93573570251465, -21.022724151611328, -20.10971450805664, -19.196704864501953, -18.283693313598633, -17.370681762695312, -16.457672119140625, -15.544661521911621, -14.631650924682617, -13.718640327453613, -12.80562973022461, -11.892619132995605, -10.979608535766602, -10.066597938537598, -9.153587341308594, -8.24057674407959, -7.327566146850586, -6.414555549621582, -5.501544952392578, -4.588534355163574, -3.6755237579345703, -2.7625131607055664, -1.8495025634765625, -0.9364919662475586, -0.023481369018554688, 0.8895292282104492, 1.802541732788086, 2.71555233001709, 3.6285629272460938, 4.541573524475098, 5.454584121704102, 6.3675947189331055, 7.280605316162109, 8.193615913391113, 9.106626510620117, 10.019637107849121, 10.932647705078125, 11.845658302307129, 12.758668899536133, 13.671679496765137, 14.58469009399414, 15.497700691223145, 16.41071128845215, 17.32372283935547, 18.236732482910156, 19.149742126464844, 20.062753677368164, 20.975765228271484, 21.888774871826172, 22.80178451538086, 23.71479606628418, 24.6278076171875, 25.540817260742188, 26.453826904296875, 27.366838455200195, 28.279850006103516, 29.192859649658203, 30.10586929321289, 31.01888084411621]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 6.0, 11.0, 21.0, 36.0, 52.0, 56.0, 136.0, 203.0, 344.0, 535.0, 844.0, 1346.0, 2225.0, 3514.0, 5793.0, 9512.0, 16231.0, 28510.0, 52314.0, 99857.0, 200680.0, 407846.0, 736519.0, 945563.0, 777592.0, 445445.0, 220266.0, 108409.0, 56690.0, 30864.0, 17104.0, 9872.0, 5943.0, 3691.0, 2327.0, 1448.0, 871.0, 550.0, 400.0, 224.0, 141.0, 93.0, 58.0, 47.0, 29.0, 18.0, 19.0, 12.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.35791015625, -24.4033203125, -23.44873046875, -22.494140625, -21.53955078125, -20.5849609375, -19.63037109375, -18.67578125, -17.72119140625, -16.7666015625, -15.81201171875, -14.857421875, -13.90283203125, -12.9482421875, -11.99365234375, -11.0390625, -10.08447265625, -9.1298828125, -8.17529296875, -7.220703125, -6.26611328125, -5.3115234375, -4.35693359375, -3.40234375, -2.44775390625, -1.4931640625, -0.53857421875, 0.416015625, 1.37060546875, 2.3251953125, 3.27978515625, 4.234375, 5.18896484375, 6.1435546875, 7.09814453125, 8.052734375, 9.00732421875, 9.9619140625, 10.91650390625, 11.87109375, 12.82568359375, 13.7802734375, 14.73486328125, 15.689453125, 16.64404296875, 17.5986328125, 18.55322265625, 19.5078125, 20.46240234375, 21.4169921875, 22.37158203125, 23.326171875, 24.28076171875, 25.2353515625, 26.18994140625, 27.14453125, 28.09912109375, 29.0537109375, 30.00830078125, 30.962890625, 31.91748046875, 32.8720703125, 33.82666015625, 34.78125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 1.0, 9.0, 9.0, 5.0, 6.0, 9.0, 11.0, 15.0, 23.0, 21.0, 27.0, 17.0, 42.0, 34.0, 29.0, 24.0, 38.0, 35.0, 30.0, 41.0, 45.0, 46.0, 35.0, 47.0, 40.0, 42.0, 34.0, 31.0, 36.0, 31.0, 27.0, 21.0, 18.0, 20.0, 17.0, 10.0, 8.0, 11.0, 18.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.109375, -21.3740234375, -20.638671875, -19.9033203125, -19.16796875, -18.4326171875, -17.697265625, -16.9619140625, -16.2265625, -15.4912109375, -14.755859375, -14.0205078125, -13.28515625, -12.5498046875, -11.814453125, -11.0791015625, -10.34375, -9.6083984375, -8.873046875, -8.1376953125, -7.40234375, -6.6669921875, -5.931640625, -5.1962890625, -4.4609375, -3.7255859375, -2.990234375, -2.2548828125, -1.51953125, -0.7841796875, -0.048828125, 0.6865234375, 1.421875, 2.1572265625, 2.892578125, 3.6279296875, 4.36328125, 5.0986328125, 5.833984375, 6.5693359375, 7.3046875, 8.0400390625, 8.775390625, 9.5107421875, 10.24609375, 10.9814453125, 11.716796875, 12.4521484375, 13.1875, 13.9228515625, 14.658203125, 15.3935546875, 16.12890625, 16.8642578125, 17.599609375, 18.3349609375, 19.0703125, 19.8056640625, 20.541015625, 21.2763671875, 22.01171875, 22.7470703125, 23.482421875, 24.2177734375, 24.953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 21.0, 20.0, 20.0, 47.0, 69.0, 104.0, 154.0, 241.0, 386.0, 561.0, 877.0, 1410.0, 2189.0, 3592.0, 5726.0, 9337.0, 15481.0, 26347.0, 45203.0, 80555.0, 146782.0, 268056.0, 475989.0, 742071.0, 847481.0, 645143.0, 387409.0, 214092.0, 116982.0, 64904.0, 37323.0, 21646.0, 12894.0, 7887.0, 4885.0, 3001.0, 1964.0, 1246.0, 746.0, 494.0, 311.0, 226.0, 145.0, 88.0, 51.0, 41.0, 27.0, 14.0, 13.0, 9.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0], "bins": [-31.1875, -30.222412109375, -29.25732421875, -28.292236328125, -27.3271484375, -26.362060546875, -25.39697265625, -24.431884765625, -23.466796875, -22.501708984375, -21.53662109375, -20.571533203125, -19.6064453125, -18.641357421875, -17.67626953125, -16.711181640625, -15.74609375, -14.781005859375, -13.81591796875, -12.850830078125, -11.8857421875, -10.920654296875, -9.95556640625, -8.990478515625, -8.025390625, -7.060302734375, -6.09521484375, -5.130126953125, -4.1650390625, -3.199951171875, -2.23486328125, -1.269775390625, -0.3046875, 0.660400390625, 1.62548828125, 2.590576171875, 3.5556640625, 4.520751953125, 5.48583984375, 6.450927734375, 7.416015625, 8.381103515625, 9.34619140625, 10.311279296875, 11.2763671875, 12.241455078125, 13.20654296875, 14.171630859375, 15.13671875, 16.101806640625, 17.06689453125, 18.031982421875, 18.9970703125, 19.962158203125, 20.92724609375, 21.892333984375, 22.857421875, 23.822509765625, 24.78759765625, 25.752685546875, 26.7177734375, 27.682861328125, 28.64794921875, 29.613037109375, 30.578125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 9.0, 17.0, 16.0, 20.0, 30.0, 37.0, 33.0, 50.0, 68.0, 84.0, 105.0, 132.0, 148.0, 196.0, 204.0, 211.0, 272.0, 282.0, 284.0, 283.0, 257.0, 245.0, 208.0, 147.0, 139.0, 125.0, 105.0, 75.0, 61.0, 44.0, 38.0, 21.0, 24.0, 19.0, 16.0, 15.0, 18.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.0703125, -12.6917724609375, -12.313232421875, -11.9346923828125, -11.55615234375, -11.1776123046875, -10.799072265625, -10.4205322265625, -10.0419921875, -9.6634521484375, -9.284912109375, -8.9063720703125, -8.52783203125, -8.1492919921875, -7.770751953125, -7.3922119140625, -7.013671875, -6.6351318359375, -6.256591796875, -5.8780517578125, -5.49951171875, -5.1209716796875, -4.742431640625, -4.3638916015625, -3.9853515625, -3.6068115234375, -3.228271484375, -2.8497314453125, -2.47119140625, -2.0926513671875, -1.714111328125, -1.3355712890625, -0.95703125, -0.5784912109375, -0.199951171875, 0.1785888671875, 0.55712890625, 0.9356689453125, 1.314208984375, 1.6927490234375, 2.0712890625, 2.4498291015625, 2.828369140625, 3.2069091796875, 3.58544921875, 3.9639892578125, 4.342529296875, 4.7210693359375, 5.099609375, 5.4781494140625, 5.856689453125, 6.2352294921875, 6.61376953125, 6.9923095703125, 7.370849609375, 7.7493896484375, 8.1279296875, 8.5064697265625, 8.885009765625, 9.2635498046875, 9.64208984375, 10.0206298828125, 10.399169921875, 10.7777099609375, 11.15625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 13.0, 19.0, 19.0, 25.0, 20.0, 27.0, 31.0, 37.0, 34.0, 43.0, 46.0, 39.0, 56.0, 51.0, 60.0, 46.0, 55.0, 53.0, 45.0, 36.0, 46.0, 28.0, 24.0, 22.0, 20.0, 20.0, 14.0, 13.0, 12.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.818099975585938, -27.872392654418945, -26.926685333251953, -25.98097801208496, -25.03527069091797, -24.089563369750977, -23.143856048583984, -22.198148727416992, -21.25244140625, -20.306734085083008, -19.361026763916016, -18.415319442749023, -17.46961212158203, -16.52390480041504, -15.578197479248047, -14.632490158081055, -13.686782836914062, -12.74107551574707, -11.795368194580078, -10.849660873413086, -9.903953552246094, -8.958246231079102, -8.01253890991211, -7.066831588745117, -6.121124267578125, -5.175416946411133, -4.229709625244141, -3.2840023040771484, -2.3382949829101562, -1.392587661743164, -0.4468803405761719, 0.4988269805908203, 1.4445323944091797, 2.390239715576172, 3.335947036743164, 4.281654357910156, 5.227361679077148, 6.173069000244141, 7.118776321411133, 8.064483642578125, 9.010190963745117, 9.95589828491211, 10.901605606079102, 11.847312927246094, 12.793020248413086, 13.738727569580078, 14.68443489074707, 15.630142211914062, 16.575849533081055, 17.521556854248047, 18.46726417541504, 19.41297149658203, 20.358678817749023, 21.304386138916016, 22.250093460083008, 23.19580078125, 24.141508102416992, 25.087215423583984, 26.032922744750977, 26.97863006591797, 27.92433738708496, 28.870044708251953, 29.815752029418945, 30.761459350585938, 31.70716667175293]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 12.0, 9.0, 21.0, 18.0, 17.0, 25.0, 23.0, 26.0, 21.0, 28.0, 30.0, 20.0, 35.0, 43.0, 37.0, 37.0, 33.0, 51.0, 44.0, 35.0, 47.0, 41.0, 33.0, 33.0, 33.0, 22.0, 28.0, 24.0, 25.0, 22.0, 23.0, 9.0, 20.0, 9.0, 9.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.12867546081543, -23.302513122558594, -22.476348876953125, -21.65018653869629, -20.824024200439453, -19.997859954833984, -19.17169761657715, -18.345535278320312, -17.519371032714844, -16.693208694458008, -15.867044448852539, -15.040882110595703, -14.21471881866455, -13.388555526733398, -12.562393188476562, -11.73622989654541, -10.910066604614258, -10.083903312683105, -9.257740020751953, -8.431577682495117, -7.605414390563965, -6.7792510986328125, -5.953088283538818, -5.126925468444824, -4.300762176513672, -3.4745991230010986, -2.6484360694885254, -1.8222730159759521, -0.9961099624633789, -0.16994667053222656, 0.6562161445617676, 1.4823789596557617, 2.3085403442382812, 3.1347033977508545, 3.9608664512634277, 4.787029266357422, 5.613192558288574, 6.439355850219727, 7.265518665313721, 8.091681480407715, 8.917844772338867, 9.74400806427002, 10.570171356201172, 11.396333694458008, 12.22249698638916, 13.048660278320312, 13.874822616577148, 14.7009859085083, 15.527149200439453, 16.35331153869629, 17.179475784301758, 18.005638122558594, 18.831802368164062, 19.6579647064209, 20.484127044677734, 21.310291290283203, 22.13645362854004, 22.962615966796875, 23.788780212402344, 24.61494255065918, 25.441104888916016, 26.267269134521484, 27.09343147277832, 27.919593811035156, 28.745758056640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 14.0, 14.0, 17.0, 21.0, 39.0, 64.0, 79.0, 135.0, 192.0, 288.0, 394.0, 591.0, 912.0, 1520.0, 2533.0, 4514.0, 9067.0, 18197.0, 39050.0, 86705.0, 181037.0, 286228.0, 215337.0, 106119.0, 48585.0, 22604.0, 10884.0, 5531.0, 3003.0, 1760.0, 1079.0, 651.0, 486.0, 286.0, 209.0, 135.0, 84.0, 62.0, 49.0, 22.0, 21.0, 12.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.46875, -41.08251953125, -39.6962890625, -38.31005859375, -36.923828125, -35.53759765625, -34.1513671875, -32.76513671875, -31.37890625, -29.99267578125, -28.6064453125, -27.22021484375, -25.833984375, -24.44775390625, -23.0615234375, -21.67529296875, -20.2890625, -18.90283203125, -17.5166015625, -16.13037109375, -14.744140625, -13.35791015625, -11.9716796875, -10.58544921875, -9.19921875, -7.81298828125, -6.4267578125, -5.04052734375, -3.654296875, -2.26806640625, -0.8818359375, 0.50439453125, 1.890625, 3.27685546875, 4.6630859375, 6.04931640625, 7.435546875, 8.82177734375, 10.2080078125, 11.59423828125, 12.98046875, 14.36669921875, 15.7529296875, 17.13916015625, 18.525390625, 19.91162109375, 21.2978515625, 22.68408203125, 24.0703125, 25.45654296875, 26.8427734375, 28.22900390625, 29.615234375, 31.00146484375, 32.3876953125, 33.77392578125, 35.16015625, 36.54638671875, 37.9326171875, 39.31884765625, 40.705078125, 42.09130859375, 43.4775390625, 44.86376953125, 46.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 6.0, 9.0, 15.0, 13.0, 19.0, 16.0, 20.0, 24.0, 21.0, 25.0, 31.0, 38.0, 26.0, 32.0, 33.0, 30.0, 46.0, 35.0, 38.0, 38.0, 41.0, 44.0, 53.0, 39.0, 38.0, 18.0, 34.0, 27.0, 28.0, 21.0, 28.0, 26.0, 12.0, 16.0, 11.0, 6.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-28.21875, -27.362548828125, -26.50634765625, -25.650146484375, -24.7939453125, -23.937744140625, -23.08154296875, -22.225341796875, -21.369140625, -20.512939453125, -19.65673828125, -18.800537109375, -17.9443359375, -17.088134765625, -16.23193359375, -15.375732421875, -14.51953125, -13.663330078125, -12.80712890625, -11.950927734375, -11.0947265625, -10.238525390625, -9.38232421875, -8.526123046875, -7.669921875, -6.813720703125, -5.95751953125, -5.101318359375, -4.2451171875, -3.388916015625, -2.53271484375, -1.676513671875, -0.8203125, 0.035888671875, 0.89208984375, 1.748291015625, 2.6044921875, 3.460693359375, 4.31689453125, 5.173095703125, 6.029296875, 6.885498046875, 7.74169921875, 8.597900390625, 9.4541015625, 10.310302734375, 11.16650390625, 12.022705078125, 12.87890625, 13.735107421875, 14.59130859375, 15.447509765625, 16.3037109375, 17.159912109375, 18.01611328125, 18.872314453125, 19.728515625, 20.584716796875, 21.44091796875, 22.297119140625, 23.1533203125, 24.009521484375, 24.86572265625, 25.721923828125, 26.578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 12.0, 12.0, 11.0, 13.0, 30.0, 34.0, 49.0, 79.0, 127.0, 197.0, 270.0, 426.0, 657.0, 1034.0, 1577.0, 2644.0, 4418.0, 7863.0, 14255.0, 28216.0, 56593.0, 117973.0, 227217.0, 267745.0, 158814.0, 77011.0, 37729.0, 19231.0, 9936.0, 5667.0, 3232.0, 2017.0, 1210.0, 749.0, 517.0, 299.0, 220.0, 155.0, 97.0, 68.0, 51.0, 31.0, 34.0, 14.0, 14.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-44.90625, -43.630859375, -42.35546875, -41.080078125, -39.8046875, -38.529296875, -37.25390625, -35.978515625, -34.703125, -33.427734375, -32.15234375, -30.876953125, -29.6015625, -28.326171875, -27.05078125, -25.775390625, -24.5, -23.224609375, -21.94921875, -20.673828125, -19.3984375, -18.123046875, -16.84765625, -15.572265625, -14.296875, -13.021484375, -11.74609375, -10.470703125, -9.1953125, -7.919921875, -6.64453125, -5.369140625, -4.09375, -2.818359375, -1.54296875, -0.267578125, 1.0078125, 2.283203125, 3.55859375, 4.833984375, 6.109375, 7.384765625, 8.66015625, 9.935546875, 11.2109375, 12.486328125, 13.76171875, 15.037109375, 16.3125, 17.587890625, 18.86328125, 20.138671875, 21.4140625, 22.689453125, 23.96484375, 25.240234375, 26.515625, 27.791015625, 29.06640625, 30.341796875, 31.6171875, 32.892578125, 34.16796875, 35.443359375, 36.71875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 7.0, 22.0, 10.0, 9.0, 18.0, 32.0, 34.0, 34.0, 38.0, 25.0, 44.0, 54.0, 49.0, 44.0, 64.0, 51.0, 50.0, 48.0, 44.0, 59.0, 36.0, 37.0, 30.0, 24.0, 26.0, 22.0, 16.0, 12.0, 15.0, 9.0, 6.0, 6.0, 8.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.46875, -28.689453125, -27.91015625, -27.130859375, -26.3515625, -25.572265625, -24.79296875, -24.013671875, -23.234375, -22.455078125, -21.67578125, -20.896484375, -20.1171875, -19.337890625, -18.55859375, -17.779296875, -17.0, -16.220703125, -15.44140625, -14.662109375, -13.8828125, -13.103515625, -12.32421875, -11.544921875, -10.765625, -9.986328125, -9.20703125, -8.427734375, -7.6484375, -6.869140625, -6.08984375, -5.310546875, -4.53125, -3.751953125, -2.97265625, -2.193359375, -1.4140625, -0.634765625, 0.14453125, 0.923828125, 1.703125, 2.482421875, 3.26171875, 4.041015625, 4.8203125, 5.599609375, 6.37890625, 7.158203125, 7.9375, 8.716796875, 9.49609375, 10.275390625, 11.0546875, 11.833984375, 12.61328125, 13.392578125, 14.171875, 14.951171875, 15.73046875, 16.509765625, 17.2890625, 18.068359375, 18.84765625, 19.626953125, 20.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 7.0, 13.0, 18.0, 19.0, 33.0, 54.0, 66.0, 82.0, 110.0, 188.0, 220.0, 359.0, 497.0, 749.0, 1150.0, 1910.0, 3592.0, 7565.0, 19644.0, 65872.0, 279953.0, 473455.0, 134874.0, 34286.0, 11656.0, 5271.0, 2625.0, 1448.0, 883.0, 588.0, 392.0, 251.0, 204.0, 133.0, 108.0, 59.0, 51.0, 37.0, 25.0, 27.0, 22.0, 12.0, 10.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0], "bins": [-25.78125, -25.070068359375, -24.35888671875, -23.647705078125, -22.9365234375, -22.225341796875, -21.51416015625, -20.802978515625, -20.091796875, -19.380615234375, -18.66943359375, -17.958251953125, -17.2470703125, -16.535888671875, -15.82470703125, -15.113525390625, -14.40234375, -13.691162109375, -12.97998046875, -12.268798828125, -11.5576171875, -10.846435546875, -10.13525390625, -9.424072265625, -8.712890625, -8.001708984375, -7.29052734375, -6.579345703125, -5.8681640625, -5.156982421875, -4.44580078125, -3.734619140625, -3.0234375, -2.312255859375, -1.60107421875, -0.889892578125, -0.1787109375, 0.532470703125, 1.24365234375, 1.954833984375, 2.666015625, 3.377197265625, 4.08837890625, 4.799560546875, 5.5107421875, 6.221923828125, 6.93310546875, 7.644287109375, 8.35546875, 9.066650390625, 9.77783203125, 10.489013671875, 11.2001953125, 11.911376953125, 12.62255859375, 13.333740234375, 14.044921875, 14.756103515625, 15.46728515625, 16.178466796875, 16.8896484375, 17.600830078125, 18.31201171875, 19.023193359375, 19.734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 8.0, 5.0, 6.0, 10.0, 10.0, 20.0, 52.0, 144.0, 255.0, 261.0, 126.0, 53.0, 23.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024566650390625, -0.0023118257522583008, -0.0021669864654541016, -0.0020221471786499023, -0.0018773078918457031, -0.001732468605041504, -0.0015876293182373047, -0.0014427900314331055, -0.0012979507446289062, -0.001153111457824707, -0.0010082721710205078, -0.0008634328842163086, -0.0007185935974121094, -0.0005737543106079102, -0.00042891502380371094, -0.0002840757369995117, -0.0001392364501953125, 5.602836608886719e-06, 0.00015044212341308594, 0.00029528141021728516, 0.0004401206970214844, 0.0005849599838256836, 0.0007297992706298828, 0.000874638557434082, 0.0010194778442382812, 0.0011643171310424805, 0.0013091564178466797, 0.001453995704650879, 0.0015988349914550781, 0.0017436742782592773, 0.0018885135650634766, 0.0020333528518676758, 0.002178192138671875, 0.0023230314254760742, 0.0024678707122802734, 0.0026127099990844727, 0.002757549285888672, 0.002902388572692871, 0.0030472278594970703, 0.0031920671463012695, 0.0033369064331054688, 0.003481745719909668, 0.003626585006713867, 0.0037714242935180664, 0.003916263580322266, 0.004061102867126465, 0.004205942153930664, 0.004350781440734863, 0.0044956207275390625, 0.004640460014343262, 0.004785299301147461, 0.00493013858795166, 0.005074977874755859, 0.005219817161560059, 0.005364656448364258, 0.005509495735168457, 0.005654335021972656, 0.0057991743087768555, 0.005944013595581055, 0.006088852882385254, 0.006233692169189453, 0.006378531455993652, 0.0065233707427978516, 0.006668210029602051, 0.00681304931640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 4.0, 24.0, 31.0, 39.0, 42.0, 64.0, 97.0, 133.0, 159.0, 249.0, 297.0, 412.0, 559.0, 679.0, 1091.0, 1558.0, 2358.0, 4030.0, 7364.0, 14625.0, 34619.0, 96638.0, 273448.0, 354491.0, 157112.0, 53000.0, 21010.0, 9810.0, 5185.0, 3025.0, 1883.0, 1269.0, 882.0, 614.0, 459.0, 367.0, 209.0, 210.0, 134.0, 99.0, 70.0, 51.0, 49.0, 27.0, 23.0, 17.0, 12.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.296875, -20.65576171875, -20.0146484375, -19.37353515625, -18.732421875, -18.09130859375, -17.4501953125, -16.80908203125, -16.16796875, -15.52685546875, -14.8857421875, -14.24462890625, -13.603515625, -12.96240234375, -12.3212890625, -11.68017578125, -11.0390625, -10.39794921875, -9.7568359375, -9.11572265625, -8.474609375, -7.83349609375, -7.1923828125, -6.55126953125, -5.91015625, -5.26904296875, -4.6279296875, -3.98681640625, -3.345703125, -2.70458984375, -2.0634765625, -1.42236328125, -0.78125, -0.14013671875, 0.5009765625, 1.14208984375, 1.783203125, 2.42431640625, 3.0654296875, 3.70654296875, 4.34765625, 4.98876953125, 5.6298828125, 6.27099609375, 6.912109375, 7.55322265625, 8.1943359375, 8.83544921875, 9.4765625, 10.11767578125, 10.7587890625, 11.39990234375, 12.041015625, 12.68212890625, 13.3232421875, 13.96435546875, 14.60546875, 15.24658203125, 15.8876953125, 16.52880859375, 17.169921875, 17.81103515625, 18.4521484375, 19.09326171875, 19.734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 9.0, 6.0, 13.0, 15.0, 37.0, 52.0, 84.0, 97.0, 115.0, 128.0, 130.0, 90.0, 74.0, 40.0, 23.0, 20.0, 15.0, 4.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.04290771484375, -6.7850341796875, -6.52716064453125, -6.269287109375, -6.01141357421875, -5.7535400390625, -5.49566650390625, -5.23779296875, -4.97991943359375, -4.7220458984375, -4.46417236328125, -4.206298828125, -3.94842529296875, -3.6905517578125, -3.43267822265625, -3.1748046875, -2.91693115234375, -2.6590576171875, -2.40118408203125, -2.143310546875, -1.88543701171875, -1.6275634765625, -1.36968994140625, -1.11181640625, -0.85394287109375, -0.5960693359375, -0.33819580078125, -0.080322265625, 0.17755126953125, 0.4354248046875, 0.69329833984375, 0.951171875, 1.20904541015625, 1.4669189453125, 1.72479248046875, 1.982666015625, 2.24053955078125, 2.4984130859375, 2.75628662109375, 3.01416015625, 3.27203369140625, 3.5299072265625, 3.78778076171875, 4.045654296875, 4.30352783203125, 4.5614013671875, 4.81927490234375, 5.0771484375, 5.33502197265625, 5.5928955078125, 5.85076904296875, 6.108642578125, 6.36651611328125, 6.6243896484375, 6.88226318359375, 7.14013671875, 7.39801025390625, 7.6558837890625, 7.91375732421875, 8.171630859375, 8.42950439453125, 8.6873779296875, 8.94525146484375, 9.203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 9.0, 16.0, 19.0, 16.0, 29.0, 28.0, 35.0, 49.0, 37.0, 52.0, 49.0, 55.0, 56.0, 58.0, 57.0, 51.0, 46.0, 35.0, 52.0, 42.0, 44.0, 18.0, 21.0, 25.0, 15.0, 10.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.20750617980957, -29.230022430419922, -28.252538681030273, -27.275054931640625, -26.297569274902344, -25.320085525512695, -24.342601776123047, -23.3651180267334, -22.38763427734375, -21.4101505279541, -20.432666778564453, -19.455181121826172, -18.477697372436523, -17.500213623046875, -16.522729873657227, -15.545246124267578, -14.567760467529297, -13.590276718139648, -12.612792015075684, -11.635308265686035, -10.65782356262207, -9.680339813232422, -8.702856063842773, -7.725371837615967, -6.74788761138916, -5.7704033851623535, -4.792919158935547, -3.8154354095458984, -2.837951183319092, -1.8604669570922852, -0.8829832077026367, 0.09450101852416992, 1.0719871520996094, 2.049471378326416, 3.0269553661346436, 4.004439353942871, 4.981923580169678, 5.959407806396484, 6.936891555786133, 7.9143757820129395, 8.891860008239746, 9.869343757629395, 10.84682846069336, 11.824312210083008, 12.801795959472656, 13.779280662536621, 14.75676441192627, 15.734249114990234, 16.711732864379883, 17.68921661376953, 18.66670036315918, 19.644184112548828, 20.62166976928711, 21.599153518676758, 22.576637268066406, 23.554121017456055, 24.531604766845703, 25.50908851623535, 26.486572265625, 27.46405792236328, 28.44154167175293, 29.419025421142578, 30.396509170532227, 31.373992919921875, 32.351478576660156]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 12.0, 17.0, 16.0, 18.0, 25.0, 25.0, 20.0, 34.0, 19.0, 36.0, 32.0, 33.0, 40.0, 47.0, 47.0, 51.0, 44.0, 37.0, 41.0, 44.0, 39.0, 35.0, 28.0, 26.0, 32.0, 31.0, 24.0, 25.0, 17.0, 12.0, 20.0, 7.0, 9.0, 2.0, 3.0, 8.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.00399398803711, -25.13258171081543, -24.261171340942383, -23.389759063720703, -22.518346786499023, -21.646934509277344, -20.775524139404297, -19.904111862182617, -19.032699584960938, -18.161287307739258, -17.28987693786621, -16.41846466064453, -15.547052383422852, -14.675641059875488, -13.804229736328125, -12.932817459106445, -12.061407089233398, -11.189995765686035, -10.318583488464355, -9.447172164916992, -8.575759887695312, -7.704348564147949, -6.832937240600586, -5.9615254402160645, -5.090113639831543, -4.2187018394470215, -3.347290277481079, -2.4758787155151367, -1.6044669151306152, -0.7330551147460938, 0.13835620880126953, 1.009768009185791, 1.8811798095703125, 2.752591609954834, 3.6240031719207764, 4.495414733886719, 5.36682653427124, 6.238238334655762, 7.109649658203125, 7.9810614585876465, 8.852473258972168, 9.723884582519531, 10.595296859741211, 11.466708183288574, 12.338119506835938, 13.209531784057617, 14.08094310760498, 14.952354431152344, 15.823766708374023, 16.695178985595703, 17.56658935546875, 18.43800163269043, 19.30941390991211, 20.180824279785156, 21.052236557006836, 21.923648834228516, 22.795059204101562, 23.666471481323242, 24.53788185119629, 25.40929412841797, 26.28070640563965, 27.152118682861328, 28.023529052734375, 28.894941329956055, 29.766353607177734]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 17.0, 29.0, 32.0, 58.0, 72.0, 126.0, 193.0, 287.0, 422.0, 683.0, 1025.0, 1577.0, 2469.0, 3930.0, 6025.0, 9444.0, 14690.0, 22644.0, 34995.0, 53014.0, 76424.0, 103712.0, 127862.0, 137354.0, 126727.0, 102437.0, 74718.0, 51338.0, 33909.0, 22315.0, 14306.0, 9132.0, 5825.0, 3799.0, 2435.0, 1579.0, 1053.0, 641.0, 431.0, 290.0, 186.0, 104.0, 91.0, 54.0, 33.0, 19.0, 10.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.625, -26.774169921875, -25.92333984375, -25.072509765625, -24.2216796875, -23.370849609375, -22.52001953125, -21.669189453125, -20.818359375, -19.967529296875, -19.11669921875, -18.265869140625, -17.4150390625, -16.564208984375, -15.71337890625, -14.862548828125, -14.01171875, -13.160888671875, -12.31005859375, -11.459228515625, -10.6083984375, -9.757568359375, -8.90673828125, -8.055908203125, -7.205078125, -6.354248046875, -5.50341796875, -4.652587890625, -3.8017578125, -2.950927734375, -2.10009765625, -1.249267578125, -0.3984375, 0.452392578125, 1.30322265625, 2.154052734375, 3.0048828125, 3.855712890625, 4.70654296875, 5.557373046875, 6.408203125, 7.259033203125, 8.10986328125, 8.960693359375, 9.8115234375, 10.662353515625, 11.51318359375, 12.364013671875, 13.21484375, 14.065673828125, 14.91650390625, 15.767333984375, 16.6181640625, 17.468994140625, 18.31982421875, 19.170654296875, 20.021484375, 20.872314453125, 21.72314453125, 22.573974609375, 23.4248046875, 24.275634765625, 25.12646484375, 25.977294921875, 26.828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 12.0, 21.0, 17.0, 26.0, 19.0, 31.0, 15.0, 27.0, 40.0, 23.0, 40.0, 35.0, 44.0, 32.0, 51.0, 47.0, 35.0, 35.0, 56.0, 48.0, 49.0, 35.0, 38.0, 22.0, 28.0, 18.0, 29.0, 18.0, 27.0, 15.0, 8.0, 9.0, 3.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.468994140625, -24.57861328125, -23.688232421875, -22.7978515625, -21.907470703125, -21.01708984375, -20.126708984375, -19.236328125, -18.345947265625, -17.45556640625, -16.565185546875, -15.6748046875, -14.784423828125, -13.89404296875, -13.003662109375, -12.11328125, -11.222900390625, -10.33251953125, -9.442138671875, -8.5517578125, -7.661376953125, -6.77099609375, -5.880615234375, -4.990234375, -4.099853515625, -3.20947265625, -2.319091796875, -1.4287109375, -0.538330078125, 0.35205078125, 1.242431640625, 2.1328125, 3.023193359375, 3.91357421875, 4.803955078125, 5.6943359375, 6.584716796875, 7.47509765625, 8.365478515625, 9.255859375, 10.146240234375, 11.03662109375, 11.927001953125, 12.8173828125, 13.707763671875, 14.59814453125, 15.488525390625, 16.37890625, 17.269287109375, 18.15966796875, 19.050048828125, 19.9404296875, 20.830810546875, 21.72119140625, 22.611572265625, 23.501953125, 24.392333984375, 25.28271484375, 26.173095703125, 27.0634765625, 27.953857421875, 28.84423828125, 29.734619140625, 30.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 5.0, 6.0, 5.0, 15.0, 26.0, 28.0, 49.0, 71.0, 115.0, 157.0, 243.0, 348.0, 534.0, 759.0, 1135.0, 1725.0, 2602.0, 4074.0, 6282.0, 9788.0, 14939.0, 23948.0, 36965.0, 56926.0, 83416.0, 115351.0, 140204.0, 144576.0, 124965.0, 93851.0, 64798.0, 43166.0, 27495.0, 17670.0, 11366.0, 7387.0, 4731.0, 2979.0, 1976.0, 1263.0, 802.0, 567.0, 398.0, 270.0, 179.0, 118.0, 88.0, 63.0, 54.0, 23.0, 20.0, 17.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.09619140625, -28.0986328125, -27.10107421875, -26.103515625, -25.10595703125, -24.1083984375, -23.11083984375, -22.11328125, -21.11572265625, -20.1181640625, -19.12060546875, -18.123046875, -17.12548828125, -16.1279296875, -15.13037109375, -14.1328125, -13.13525390625, -12.1376953125, -11.14013671875, -10.142578125, -9.14501953125, -8.1474609375, -7.14990234375, -6.15234375, -5.15478515625, -4.1572265625, -3.15966796875, -2.162109375, -1.16455078125, -0.1669921875, 0.83056640625, 1.828125, 2.82568359375, 3.8232421875, 4.82080078125, 5.818359375, 6.81591796875, 7.8134765625, 8.81103515625, 9.80859375, 10.80615234375, 11.8037109375, 12.80126953125, 13.798828125, 14.79638671875, 15.7939453125, 16.79150390625, 17.7890625, 18.78662109375, 19.7841796875, 20.78173828125, 21.779296875, 22.77685546875, 23.7744140625, 24.77197265625, 25.76953125, 26.76708984375, 27.7646484375, 28.76220703125, 29.759765625, 30.75732421875, 31.7548828125, 32.75244140625, 33.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 3.0, 4.0, 6.0, 6.0, 15.0, 13.0, 9.0, 13.0, 18.0, 19.0, 28.0, 31.0, 20.0, 25.0, 33.0, 30.0, 38.0, 55.0, 35.0, 56.0, 43.0, 45.0, 43.0, 39.0, 36.0, 43.0, 44.0, 29.0, 32.0, 27.0, 26.0, 27.0, 17.0, 13.0, 16.0, 8.0, 16.0, 7.0, 4.0, 8.0, 6.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.951904296875, -18.38818359375, -17.824462890625, -17.2607421875, -16.697021484375, -16.13330078125, -15.569580078125, -15.005859375, -14.442138671875, -13.87841796875, -13.314697265625, -12.7509765625, -12.187255859375, -11.62353515625, -11.059814453125, -10.49609375, -9.932373046875, -9.36865234375, -8.804931640625, -8.2412109375, -7.677490234375, -7.11376953125, -6.550048828125, -5.986328125, -5.422607421875, -4.85888671875, -4.295166015625, -3.7314453125, -3.167724609375, -2.60400390625, -2.040283203125, -1.4765625, -0.912841796875, -0.34912109375, 0.214599609375, 0.7783203125, 1.342041015625, 1.90576171875, 2.469482421875, 3.033203125, 3.596923828125, 4.16064453125, 4.724365234375, 5.2880859375, 5.851806640625, 6.41552734375, 6.979248046875, 7.54296875, 8.106689453125, 8.67041015625, 9.234130859375, 9.7978515625, 10.361572265625, 10.92529296875, 11.489013671875, 12.052734375, 12.616455078125, 13.18017578125, 13.743896484375, 14.3076171875, 14.871337890625, 15.43505859375, 15.998779296875, 16.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 7.0, 8.0, 16.0, 30.0, 34.0, 36.0, 44.0, 63.0, 83.0, 118.0, 184.0, 254.0, 378.0, 486.0, 736.0, 1191.0, 1662.0, 2621.0, 4208.0, 7303.0, 13662.0, 31133.0, 87290.0, 265575.0, 377011.0, 157424.0, 51213.0, 20405.0, 9889.0, 5596.0, 3351.0, 2093.0, 1415.0, 904.0, 606.0, 447.0, 292.0, 231.0, 168.0, 115.0, 74.0, 55.0, 44.0, 26.0, 20.0, 15.0, 9.0, 11.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.34375, -36.18603515625, -35.0283203125, -33.87060546875, -32.712890625, -31.55517578125, -30.3974609375, -29.23974609375, -28.08203125, -26.92431640625, -25.7666015625, -24.60888671875, -23.451171875, -22.29345703125, -21.1357421875, -19.97802734375, -18.8203125, -17.66259765625, -16.5048828125, -15.34716796875, -14.189453125, -13.03173828125, -11.8740234375, -10.71630859375, -9.55859375, -8.40087890625, -7.2431640625, -6.08544921875, -4.927734375, -3.77001953125, -2.6123046875, -1.45458984375, -0.296875, 0.86083984375, 2.0185546875, 3.17626953125, 4.333984375, 5.49169921875, 6.6494140625, 7.80712890625, 8.96484375, 10.12255859375, 11.2802734375, 12.43798828125, 13.595703125, 14.75341796875, 15.9111328125, 17.06884765625, 18.2265625, 19.38427734375, 20.5419921875, 21.69970703125, 22.857421875, 24.01513671875, 25.1728515625, 26.33056640625, 27.48828125, 28.64599609375, 29.8037109375, 30.96142578125, 32.119140625, 33.27685546875, 34.4345703125, 35.59228515625, 36.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 5.0, 6.0, 4.0, 9.0, 12.0, 12.0, 12.0, 19.0, 14.0, 17.0, 29.0, 46.0, 61.0, 55.0, 59.0, 76.0, 66.0, 81.0, 74.0, 62.0, 50.0, 37.0, 45.0, 34.0, 13.0, 19.0, 8.0, 14.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002613067626953125, -0.0025361180305480957, -0.0024591684341430664, -0.002382218837738037, -0.002305269241333008, -0.0022283196449279785, -0.0021513700485229492, -0.00207442045211792, -0.0019974708557128906, -0.0019205212593078613, -0.001843571662902832, -0.0017666220664978027, -0.0016896724700927734, -0.0016127228736877441, -0.0015357732772827148, -0.0014588236808776855, -0.0013818740844726562, -0.001304924488067627, -0.0012279748916625977, -0.0011510252952575684, -0.001074075698852539, -0.0009971261024475098, -0.0009201765060424805, -0.0008432269096374512, -0.0007662773132324219, -0.0006893277168273926, -0.0006123781204223633, -0.000535428524017334, -0.0004584789276123047, -0.0003815293312072754, -0.0003045797348022461, -0.0002276301383972168, -0.0001506805419921875, -7.37309455871582e-05, 3.2186508178710938e-06, 8.016824722290039e-05, 0.0001571178436279297, 0.00023406744003295898, 0.0003110170364379883, 0.0003879666328430176, 0.0004649162292480469, 0.0005418658256530762, 0.0006188154220581055, 0.0006957650184631348, 0.0007727146148681641, 0.0008496642112731934, 0.0009266138076782227, 0.001003563404083252, 0.0010805130004882812, 0.0011574625968933105, 0.0012344121932983398, 0.0013113617897033691, 0.0013883113861083984, 0.0014652609825134277, 0.001542210578918457, 0.0016191601753234863, 0.0016961097717285156, 0.001773059368133545, 0.0018500089645385742, 0.0019269585609436035, 0.002003908157348633, 0.002080857753753662, 0.0021578073501586914, 0.0022347569465637207, 0.00231170654296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 9.0, 11.0, 12.0, 14.0, 29.0, 43.0, 54.0, 63.0, 104.0, 124.0, 156.0, 243.0, 326.0, 435.0, 575.0, 792.0, 1080.0, 1484.0, 2234.0, 3223.0, 4800.0, 7469.0, 12776.0, 23292.0, 50112.0, 117597.0, 244449.0, 281861.0, 155904.0, 66727.0, 30216.0, 15253.0, 8999.0, 5569.0, 3705.0, 2519.0, 1781.0, 1230.0, 887.0, 653.0, 520.0, 327.0, 248.0, 187.0, 135.0, 98.0, 74.0, 47.0, 32.0, 25.0, 19.0, 15.0, 10.0, 6.0, 6.0, 1.0, 4.0, 2.0], "bins": [-26.96875, -26.15576171875, -25.3427734375, -24.52978515625, -23.716796875, -22.90380859375, -22.0908203125, -21.27783203125, -20.46484375, -19.65185546875, -18.8388671875, -18.02587890625, -17.212890625, -16.39990234375, -15.5869140625, -14.77392578125, -13.9609375, -13.14794921875, -12.3349609375, -11.52197265625, -10.708984375, -9.89599609375, -9.0830078125, -8.27001953125, -7.45703125, -6.64404296875, -5.8310546875, -5.01806640625, -4.205078125, -3.39208984375, -2.5791015625, -1.76611328125, -0.953125, -0.14013671875, 0.6728515625, 1.48583984375, 2.298828125, 3.11181640625, 3.9248046875, 4.73779296875, 5.55078125, 6.36376953125, 7.1767578125, 7.98974609375, 8.802734375, 9.61572265625, 10.4287109375, 11.24169921875, 12.0546875, 12.86767578125, 13.6806640625, 14.49365234375, 15.306640625, 16.11962890625, 16.9326171875, 17.74560546875, 18.55859375, 19.37158203125, 20.1845703125, 20.99755859375, 21.810546875, 22.62353515625, 23.4365234375, 24.24951171875, 25.0625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 10.0, 10.0, 8.0, 16.0, 10.0, 19.0, 22.0, 41.0, 37.0, 49.0, 59.0, 64.0, 105.0, 79.0, 85.0, 66.0, 50.0, 45.0, 42.0, 38.0, 26.0, 16.0, 19.0, 15.0, 12.0, 7.0, 5.0, 10.0, 5.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.25, -8.972900390625, -8.69580078125, -8.418701171875, -8.1416015625, -7.864501953125, -7.58740234375, -7.310302734375, -7.033203125, -6.756103515625, -6.47900390625, -6.201904296875, -5.9248046875, -5.647705078125, -5.37060546875, -5.093505859375, -4.81640625, -4.539306640625, -4.26220703125, -3.985107421875, -3.7080078125, -3.430908203125, -3.15380859375, -2.876708984375, -2.599609375, -2.322509765625, -2.04541015625, -1.768310546875, -1.4912109375, -1.214111328125, -0.93701171875, -0.659912109375, -0.3828125, -0.105712890625, 0.17138671875, 0.448486328125, 0.7255859375, 1.002685546875, 1.27978515625, 1.556884765625, 1.833984375, 2.111083984375, 2.38818359375, 2.665283203125, 2.9423828125, 3.219482421875, 3.49658203125, 3.773681640625, 4.05078125, 4.327880859375, 4.60498046875, 4.882080078125, 5.1591796875, 5.436279296875, 5.71337890625, 5.990478515625, 6.267578125, 6.544677734375, 6.82177734375, 7.098876953125, 7.3759765625, 7.653076171875, 7.93017578125, 8.207275390625, 8.484375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 6.0, 15.0, 19.0, 23.0, 26.0, 35.0, 41.0, 57.0, 49.0, 62.0, 67.0, 75.0, 41.0, 52.0, 70.0, 66.0, 45.0, 41.0, 38.0, 38.0, 30.0, 21.0, 7.0, 22.0, 9.0, 11.0, 10.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.146114349365234, -31.970399856567383, -30.79468536376953, -29.61897087097168, -28.443256378173828, -27.267539978027344, -26.091825485229492, -24.91611099243164, -23.74039649963379, -22.564682006835938, -21.388967514038086, -20.213253021240234, -19.03753662109375, -17.86182403564453, -16.686107635498047, -15.510393142700195, -14.334678649902344, -13.158964157104492, -11.98324966430664, -10.807534217834473, -9.631819725036621, -8.45610523223877, -7.28039026260376, -6.10467529296875, -4.928960800170898, -3.7532460689544678, -2.577531337738037, -1.4018166065216064, -0.22610187530517578, 0.9496126174926758, 2.1253275871276855, 3.3010425567626953, 4.4767608642578125, 5.652475357055664, 6.828190326690674, 8.003905296325684, 9.179619789123535, 10.355334281921387, 11.531049728393555, 12.706764221191406, 13.882478713989258, 15.05819320678711, 16.23390769958496, 17.409622192382812, 18.585338592529297, 19.761051177978516, 20.936767578125, 22.11248207092285, 23.288196563720703, 24.463911056518555, 25.639625549316406, 26.815340042114258, 27.99105453491211, 29.166770935058594, 30.342485427856445, 31.518199920654297, 32.69391632080078, 33.869632720947266, 35.045345306396484, 36.22106170654297, 37.39677429199219, 38.57249069213867, 39.74820327758789, 40.923919677734375, 42.099632263183594]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 10.0, 9.0, 11.0, 16.0, 25.0, 10.0, 19.0, 32.0, 21.0, 24.0, 24.0, 21.0, 26.0, 33.0, 27.0, 47.0, 40.0, 40.0, 45.0, 50.0, 45.0, 41.0, 41.0, 35.0, 30.0, 40.0, 40.0, 15.0, 26.0, 30.0, 24.0, 25.0, 14.0, 14.0, 8.0, 9.0, 8.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-28.99245834350586, -28.15785026550293, -27.3232421875, -26.48863410949707, -25.65402603149414, -24.81941795349121, -23.98480987548828, -23.15020179748535, -22.315593719482422, -21.480985641479492, -20.646377563476562, -19.811769485473633, -18.977161407470703, -18.142553329467773, -17.307945251464844, -16.473337173461914, -15.638729095458984, -14.804121017456055, -13.969512939453125, -13.134904861450195, -12.300296783447266, -11.465688705444336, -10.631080627441406, -9.796472549438477, -8.961864471435547, -8.127256393432617, -7.2926483154296875, -6.458040237426758, -5.623432159423828, -4.788824081420898, -3.9542160034179688, -3.119607925415039, -2.2849998474121094, -1.4503917694091797, -0.61578369140625, 0.2188243865966797, 1.0534324645996094, 1.888040542602539, 2.7226486206054688, 3.5572566986083984, 4.391864776611328, 5.226472854614258, 6.0610809326171875, 6.895689010620117, 7.730297088623047, 8.564905166625977, 9.399513244628906, 10.234121322631836, 11.068729400634766, 11.903337478637695, 12.737945556640625, 13.572553634643555, 14.407161712646484, 15.241769790649414, 16.076377868652344, 16.910985946655273, 17.745594024658203, 18.580202102661133, 19.414810180664062, 20.249418258666992, 21.084026336669922, 21.91863441467285, 22.75324249267578, 23.58785057067871, 24.42245864868164]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 6.0, 11.0, 11.0, 17.0, 41.0, 41.0, 77.0, 82.0, 142.0, 257.0, 359.0, 587.0, 1012.0, 1684.0, 2851.0, 4798.0, 8103.0, 14293.0, 26355.0, 48138.0, 93935.0, 191044.0, 409254.0, 785075.0, 1017686.0, 781667.0, 413493.0, 193334.0, 92919.0, 47677.0, 25414.0, 14013.0, 7964.0, 4750.0, 2846.0, 1702.0, 957.0, 618.0, 333.0, 262.0, 147.0, 118.0, 60.0, 53.0, 34.0, 19.0, 23.0, 9.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-33.125, -32.13623046875, -31.1474609375, -30.15869140625, -29.169921875, -28.18115234375, -27.1923828125, -26.20361328125, -25.21484375, -24.22607421875, -23.2373046875, -22.24853515625, -21.259765625, -20.27099609375, -19.2822265625, -18.29345703125, -17.3046875, -16.31591796875, -15.3271484375, -14.33837890625, -13.349609375, -12.36083984375, -11.3720703125, -10.38330078125, -9.39453125, -8.40576171875, -7.4169921875, -6.42822265625, -5.439453125, -4.45068359375, -3.4619140625, -2.47314453125, -1.484375, -0.49560546875, 0.4931640625, 1.48193359375, 2.470703125, 3.45947265625, 4.4482421875, 5.43701171875, 6.42578125, 7.41455078125, 8.4033203125, 9.39208984375, 10.380859375, 11.36962890625, 12.3583984375, 13.34716796875, 14.3359375, 15.32470703125, 16.3134765625, 17.30224609375, 18.291015625, 19.27978515625, 20.2685546875, 21.25732421875, 22.24609375, 23.23486328125, 24.2236328125, 25.21240234375, 26.201171875, 27.18994140625, 28.1787109375, 29.16748046875, 30.15625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 16.0, 16.0, 14.0, 19.0, 22.0, 17.0, 20.0, 26.0, 27.0, 32.0, 34.0, 31.0, 47.0, 39.0, 33.0, 36.0, 49.0, 37.0, 41.0, 51.0, 39.0, 55.0, 25.0, 29.0, 30.0, 25.0, 23.0, 25.0, 28.0, 16.0, 12.0, 12.0, 8.0, 7.0, 5.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.46875, -20.763671875, -20.05859375, -19.353515625, -18.6484375, -17.943359375, -17.23828125, -16.533203125, -15.828125, -15.123046875, -14.41796875, -13.712890625, -13.0078125, -12.302734375, -11.59765625, -10.892578125, -10.1875, -9.482421875, -8.77734375, -8.072265625, -7.3671875, -6.662109375, -5.95703125, -5.251953125, -4.546875, -3.841796875, -3.13671875, -2.431640625, -1.7265625, -1.021484375, -0.31640625, 0.388671875, 1.09375, 1.798828125, 2.50390625, 3.208984375, 3.9140625, 4.619140625, 5.32421875, 6.029296875, 6.734375, 7.439453125, 8.14453125, 8.849609375, 9.5546875, 10.259765625, 10.96484375, 11.669921875, 12.375, 13.080078125, 13.78515625, 14.490234375, 15.1953125, 15.900390625, 16.60546875, 17.310546875, 18.015625, 18.720703125, 19.42578125, 20.130859375, 20.8359375, 21.541015625, 22.24609375, 22.951171875, 23.65625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 8.0, 10.0, 11.0, 16.0, 39.0, 50.0, 59.0, 98.0, 141.0, 223.0, 385.0, 529.0, 818.0, 1305.0, 2096.0, 3269.0, 5137.0, 8536.0, 14480.0, 25285.0, 44260.0, 81035.0, 148131.0, 273714.0, 492411.0, 778330.0, 871112.0, 629407.0, 365439.0, 199602.0, 107925.0, 59267.0, 33178.0, 18928.0, 11202.0, 6662.0, 4077.0, 2495.0, 1628.0, 1048.0, 618.0, 439.0, 286.0, 218.0, 125.0, 82.0, 56.0, 35.0, 31.0, 16.0, 11.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-29.28125, -28.31298828125, -27.3447265625, -26.37646484375, -25.408203125, -24.43994140625, -23.4716796875, -22.50341796875, -21.53515625, -20.56689453125, -19.5986328125, -18.63037109375, -17.662109375, -16.69384765625, -15.7255859375, -14.75732421875, -13.7890625, -12.82080078125, -11.8525390625, -10.88427734375, -9.916015625, -8.94775390625, -7.9794921875, -7.01123046875, -6.04296875, -5.07470703125, -4.1064453125, -3.13818359375, -2.169921875, -1.20166015625, -0.2333984375, 0.73486328125, 1.703125, 2.67138671875, 3.6396484375, 4.60791015625, 5.576171875, 6.54443359375, 7.5126953125, 8.48095703125, 9.44921875, 10.41748046875, 11.3857421875, 12.35400390625, 13.322265625, 14.29052734375, 15.2587890625, 16.22705078125, 17.1953125, 18.16357421875, 19.1318359375, 20.10009765625, 21.068359375, 22.03662109375, 23.0048828125, 23.97314453125, 24.94140625, 25.90966796875, 26.8779296875, 27.84619140625, 28.814453125, 29.78271484375, 30.7509765625, 31.71923828125, 32.6875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 4.0, 10.0, 7.0, 14.0, 19.0, 34.0, 29.0, 51.0, 76.0, 87.0, 108.0, 126.0, 174.0, 174.0, 238.0, 256.0, 279.0, 318.0, 301.0, 297.0, 304.0, 246.0, 188.0, 151.0, 112.0, 90.0, 90.0, 55.0, 60.0, 35.0, 31.0, 30.0, 15.0, 12.0, 18.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.6875, -13.2861328125, -12.884765625, -12.4833984375, -12.08203125, -11.6806640625, -11.279296875, -10.8779296875, -10.4765625, -10.0751953125, -9.673828125, -9.2724609375, -8.87109375, -8.4697265625, -8.068359375, -7.6669921875, -7.265625, -6.8642578125, -6.462890625, -6.0615234375, -5.66015625, -5.2587890625, -4.857421875, -4.4560546875, -4.0546875, -3.6533203125, -3.251953125, -2.8505859375, -2.44921875, -2.0478515625, -1.646484375, -1.2451171875, -0.84375, -0.4423828125, -0.041015625, 0.3603515625, 0.76171875, 1.1630859375, 1.564453125, 1.9658203125, 2.3671875, 2.7685546875, 3.169921875, 3.5712890625, 3.97265625, 4.3740234375, 4.775390625, 5.1767578125, 5.578125, 5.9794921875, 6.380859375, 6.7822265625, 7.18359375, 7.5849609375, 7.986328125, 8.3876953125, 8.7890625, 9.1904296875, 9.591796875, 9.9931640625, 10.39453125, 10.7958984375, 11.197265625, 11.5986328125, 12.0]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 6.0, 5.0, 12.0, 18.0, 12.0, 26.0, 18.0, 21.0, 32.0, 29.0, 45.0, 46.0, 56.0, 63.0, 67.0, 49.0, 63.0, 62.0, 43.0, 49.0, 37.0, 32.0, 39.0, 29.0, 24.0, 29.0, 20.0, 13.0, 10.0, 8.0, 7.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.22088623046875, -33.20854568481445, -32.19620895385742, -31.183870315551758, -30.171531677246094, -29.159191131591797, -28.146852493286133, -27.13451385498047, -26.122175216674805, -25.10983657836914, -24.097497940063477, -23.085159301757812, -22.072818756103516, -21.060482025146484, -20.048141479492188, -19.035802841186523, -18.02346420288086, -17.011125564575195, -15.998786926269531, -14.98644733428955, -13.974108695983887, -12.961770057678223, -11.949430465698242, -10.937091827392578, -9.924753189086914, -8.91241455078125, -7.900075435638428, -6.8877363204956055, -5.875397682189941, -4.863059043884277, -3.850719928741455, -2.838380813598633, -1.8260459899902344, -0.8137071132659912, 0.19863176345825195, 1.2109706401824951, 2.2233095169067383, 3.2356481552124023, 4.247987270355225, 5.260326385498047, 6.272665023803711, 7.285003662109375, 8.297342300415039, 9.30968189239502, 10.322020530700684, 11.334359169006348, 12.346698760986328, 13.359037399291992, 14.371376037597656, 15.38371467590332, 16.396053314208984, 17.40839195251465, 18.420730590820312, 19.43307113647461, 20.445409774780273, 21.457748413085938, 22.4700870513916, 23.482425689697266, 24.49476432800293, 25.507102966308594, 26.51944351196289, 27.531780242919922, 28.54412078857422, 29.556459426879883, 30.568798065185547]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 12.0, 10.0, 18.0, 13.0, 12.0, 14.0, 21.0, 12.0, 25.0, 27.0, 27.0, 34.0, 30.0, 35.0, 50.0, 30.0, 38.0, 40.0, 38.0, 37.0, 41.0, 43.0, 43.0, 35.0, 36.0, 32.0, 39.0, 27.0, 27.0, 20.0, 31.0, 14.0, 15.0, 11.0, 7.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.25445556640625, -25.47844123840332, -24.702425003051758, -23.926410675048828, -23.150394439697266, -22.374380111694336, -21.598365783691406, -20.822349548339844, -20.04633331298828, -19.27031898498535, -18.49430274963379, -17.71828842163086, -16.942272186279297, -16.166257858276367, -15.390242576599121, -14.614227294921875, -13.838212966918945, -13.0621976852417, -12.286182403564453, -11.510168075561523, -10.734151840209961, -9.958137512207031, -9.182122230529785, -8.406106948852539, -7.630091667175293, -6.854076385498047, -6.078061103820801, -5.302046298980713, -4.526031017303467, -3.7500157356262207, -2.974000930786133, -2.1979856491088867, -1.4219703674316406, -0.6459552049636841, 0.13005995750427246, 0.9060750007629395, 1.6820902824401855, 2.4581055641174316, 3.2341203689575195, 4.010135650634766, 4.786150932312012, 5.562166213989258, 6.338181495666504, 7.114196300506592, 7.890211582183838, 8.666227340698242, 9.442241668701172, 10.218256950378418, 10.994272232055664, 11.77028751373291, 12.546302795410156, 13.322317123413086, 14.098333358764648, 14.874347686767578, 15.650362968444824, 16.42637825012207, 17.202392578125, 17.97840690612793, 18.754423141479492, 19.530437469482422, 20.306453704833984, 21.082468032836914, 21.858482360839844, 22.634498596191406, 23.41051483154297]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 11.0, 15.0, 20.0, 23.0, 43.0, 42.0, 79.0, 125.0, 152.0, 222.0, 322.0, 414.0, 634.0, 971.0, 1380.0, 2269.0, 3348.0, 5672.0, 9850.0, 18484.0, 36941.0, 78072.0, 158764.0, 251676.0, 226544.0, 126391.0, 60811.0, 28912.0, 14775.0, 8073.0, 4719.0, 2882.0, 1936.0, 1246.0, 851.0, 570.0, 423.0, 259.0, 180.0, 131.0, 96.0, 57.0, 65.0, 30.0, 20.0, 18.0, 12.0, 8.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.09375, -29.0849609375, -28.076171875, -27.0673828125, -26.05859375, -25.0498046875, -24.041015625, -23.0322265625, -22.0234375, -21.0146484375, -20.005859375, -18.9970703125, -17.98828125, -16.9794921875, -15.970703125, -14.9619140625, -13.953125, -12.9443359375, -11.935546875, -10.9267578125, -9.91796875, -8.9091796875, -7.900390625, -6.8916015625, -5.8828125, -4.8740234375, -3.865234375, -2.8564453125, -1.84765625, -0.8388671875, 0.169921875, 1.1787109375, 2.1875, 3.1962890625, 4.205078125, 5.2138671875, 6.22265625, 7.2314453125, 8.240234375, 9.2490234375, 10.2578125, 11.2666015625, 12.275390625, 13.2841796875, 14.29296875, 15.3017578125, 16.310546875, 17.3193359375, 18.328125, 19.3369140625, 20.345703125, 21.3544921875, 22.36328125, 23.3720703125, 24.380859375, 25.3896484375, 26.3984375, 27.4072265625, 28.416015625, 29.4248046875, 30.43359375, 31.4423828125, 32.451171875, 33.4599609375, 34.46875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 13.0, 10.0, 19.0, 17.0, 9.0, 15.0, 26.0, 25.0, 17.0, 33.0, 28.0, 37.0, 38.0, 39.0, 46.0, 42.0, 36.0, 45.0, 42.0, 38.0, 46.0, 36.0, 40.0, 44.0, 33.0, 35.0, 23.0, 22.0, 21.0, 16.0, 19.0, 12.0, 17.0, 8.0, 3.0, 10.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.5, -28.65673828125, -27.8134765625, -26.97021484375, -26.126953125, -25.28369140625, -24.4404296875, -23.59716796875, -22.75390625, -21.91064453125, -21.0673828125, -20.22412109375, -19.380859375, -18.53759765625, -17.6943359375, -16.85107421875, -16.0078125, -15.16455078125, -14.3212890625, -13.47802734375, -12.634765625, -11.79150390625, -10.9482421875, -10.10498046875, -9.26171875, -8.41845703125, -7.5751953125, -6.73193359375, -5.888671875, -5.04541015625, -4.2021484375, -3.35888671875, -2.515625, -1.67236328125, -0.8291015625, 0.01416015625, 0.857421875, 1.70068359375, 2.5439453125, 3.38720703125, 4.23046875, 5.07373046875, 5.9169921875, 6.76025390625, 7.603515625, 8.44677734375, 9.2900390625, 10.13330078125, 10.9765625, 11.81982421875, 12.6630859375, 13.50634765625, 14.349609375, 15.19287109375, 16.0361328125, 16.87939453125, 17.72265625, 18.56591796875, 19.4091796875, 20.25244140625, 21.095703125, 21.93896484375, 22.7822265625, 23.62548828125, 24.46875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 7.0, 16.0, 19.0, 13.0, 38.0, 55.0, 75.0, 79.0, 120.0, 181.0, 280.0, 407.0, 613.0, 912.0, 1392.0, 2110.0, 3481.0, 5805.0, 10017.0, 18332.0, 34565.0, 68868.0, 139676.0, 245364.0, 239120.0, 134452.0, 66647.0, 33645.0, 17384.0, 9728.0, 5656.0, 3290.0, 2072.0, 1363.0, 877.0, 570.0, 406.0, 295.0, 181.0, 116.0, 86.0, 71.0, 42.0, 26.0, 36.0, 13.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-31.609375, -30.588623046875, -29.56787109375, -28.547119140625, -27.5263671875, -26.505615234375, -25.48486328125, -24.464111328125, -23.443359375, -22.422607421875, -21.40185546875, -20.381103515625, -19.3603515625, -18.339599609375, -17.31884765625, -16.298095703125, -15.27734375, -14.256591796875, -13.23583984375, -12.215087890625, -11.1943359375, -10.173583984375, -9.15283203125, -8.132080078125, -7.111328125, -6.090576171875, -5.06982421875, -4.049072265625, -3.0283203125, -2.007568359375, -0.98681640625, 0.033935546875, 1.0546875, 2.075439453125, 3.09619140625, 4.116943359375, 5.1376953125, 6.158447265625, 7.17919921875, 8.199951171875, 9.220703125, 10.241455078125, 11.26220703125, 12.282958984375, 13.3037109375, 14.324462890625, 15.34521484375, 16.365966796875, 17.38671875, 18.407470703125, 19.42822265625, 20.448974609375, 21.4697265625, 22.490478515625, 23.51123046875, 24.531982421875, 25.552734375, 26.573486328125, 27.59423828125, 28.614990234375, 29.6357421875, 30.656494140625, 31.67724609375, 32.697998046875, 33.71875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 13.0, 22.0, 18.0, 17.0, 25.0, 37.0, 26.0, 43.0, 39.0, 47.0, 44.0, 60.0, 47.0, 30.0, 48.0, 50.0, 41.0, 40.0, 41.0, 31.0, 27.0, 34.0, 30.0, 35.0, 22.0, 17.0, 14.0, 13.0, 13.0, 6.0, 9.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.652099609375, -16.99169921875, -16.331298828125, -15.6708984375, -15.010498046875, -14.35009765625, -13.689697265625, -13.029296875, -12.368896484375, -11.70849609375, -11.048095703125, -10.3876953125, -9.727294921875, -9.06689453125, -8.406494140625, -7.74609375, -7.085693359375, -6.42529296875, -5.764892578125, -5.1044921875, -4.444091796875, -3.78369140625, -3.123291015625, -2.462890625, -1.802490234375, -1.14208984375, -0.481689453125, 0.1787109375, 0.839111328125, 1.49951171875, 2.159912109375, 2.8203125, 3.480712890625, 4.14111328125, 4.801513671875, 5.4619140625, 6.122314453125, 6.78271484375, 7.443115234375, 8.103515625, 8.763916015625, 9.42431640625, 10.084716796875, 10.7451171875, 11.405517578125, 12.06591796875, 12.726318359375, 13.38671875, 14.047119140625, 14.70751953125, 15.367919921875, 16.0283203125, 16.688720703125, 17.34912109375, 18.009521484375, 18.669921875, 19.330322265625, 19.99072265625, 20.651123046875, 21.3115234375, 21.971923828125, 22.63232421875, 23.292724609375, 23.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 3.0, 5.0, 10.0, 22.0, 10.0, 26.0, 36.0, 33.0, 61.0, 78.0, 107.0, 153.0, 245.0, 367.0, 593.0, 893.0, 1463.0, 2656.0, 5200.0, 12005.0, 36199.0, 167381.0, 570946.0, 186039.0, 38664.0, 12764.0, 5455.0, 2787.0, 1557.0, 946.0, 584.0, 391.0, 241.0, 161.0, 132.0, 89.0, 73.0, 54.0, 38.0, 19.0, 14.0, 11.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-28.625, -27.8193359375, -27.013671875, -26.2080078125, -25.40234375, -24.5966796875, -23.791015625, -22.9853515625, -22.1796875, -21.3740234375, -20.568359375, -19.7626953125, -18.95703125, -18.1513671875, -17.345703125, -16.5400390625, -15.734375, -14.9287109375, -14.123046875, -13.3173828125, -12.51171875, -11.7060546875, -10.900390625, -10.0947265625, -9.2890625, -8.4833984375, -7.677734375, -6.8720703125, -6.06640625, -5.2607421875, -4.455078125, -3.6494140625, -2.84375, -2.0380859375, -1.232421875, -0.4267578125, 0.37890625, 1.1845703125, 1.990234375, 2.7958984375, 3.6015625, 4.4072265625, 5.212890625, 6.0185546875, 6.82421875, 7.6298828125, 8.435546875, 9.2412109375, 10.046875, 10.8525390625, 11.658203125, 12.4638671875, 13.26953125, 14.0751953125, 14.880859375, 15.6865234375, 16.4921875, 17.2978515625, 18.103515625, 18.9091796875, 19.71484375, 20.5205078125, 21.326171875, 22.1318359375, 22.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 14.0, 25.0, 23.0, 41.0, 32.0, 50.0, 70.0, 85.0, 106.0, 81.0, 82.0, 77.0, 56.0, 39.0, 29.0, 32.0, 23.0, 16.0, 8.0, 13.0, 6.0, 12.0, 8.0, 2.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.001216888427734375, -0.001173555850982666, -0.001130223274230957, -0.001086890697479248, -0.001043558120727539, -0.00100022554397583, -0.0009568929672241211, -0.0009135603904724121, -0.0008702278137207031, -0.0008268952369689941, -0.0007835626602172852, -0.0007402300834655762, -0.0006968975067138672, -0.0006535649299621582, -0.0006102323532104492, -0.0005668997764587402, -0.0005235671997070312, -0.00048023462295532227, -0.0004369020462036133, -0.0003935694694519043, -0.0003502368927001953, -0.00030690431594848633, -0.00026357173919677734, -0.00022023916244506836, -0.00017690658569335938, -0.0001335740089416504, -9.02414321899414e-05, -4.690885543823242e-05, -3.5762786865234375e-06, 3.975629806518555e-05, 8.308887481689453e-05, 0.00012642145156860352, 0.0001697540283203125, 0.00021308660507202148, 0.00025641918182373047, 0.00029975175857543945, 0.00034308433532714844, 0.0003864169120788574, 0.0004297494888305664, 0.0004730820655822754, 0.0005164146423339844, 0.0005597472190856934, 0.0006030797958374023, 0.0006464123725891113, 0.0006897449493408203, 0.0007330775260925293, 0.0007764101028442383, 0.0008197426795959473, 0.0008630752563476562, 0.0009064078330993652, 0.0009497404098510742, 0.0009930729866027832, 0.0010364055633544922, 0.0010797381401062012, 0.0011230707168579102, 0.0011664032936096191, 0.0012097358703613281, 0.0012530684471130371, 0.001296401023864746, 0.001339733600616455, 0.001383066177368164, 0.001426398754119873, 0.001469731330871582, 0.001513063907623291, 0.001556396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 12.0, 10.0, 17.0, 28.0, 43.0, 50.0, 71.0, 76.0, 102.0, 188.0, 252.0, 342.0, 467.0, 661.0, 881.0, 1339.0, 1974.0, 3421.0, 6219.0, 14012.0, 41340.0, 156644.0, 457157.0, 258123.0, 65021.0, 20191.0, 8298.0, 4142.0, 2308.0, 1564.0, 1079.0, 734.0, 491.0, 352.0, 259.0, 164.0, 157.0, 106.0, 75.0, 56.0, 33.0, 27.0, 21.0, 11.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.546875, -23.746826171875, -22.94677734375, -22.146728515625, -21.3466796875, -20.546630859375, -19.74658203125, -18.946533203125, -18.146484375, -17.346435546875, -16.54638671875, -15.746337890625, -14.9462890625, -14.146240234375, -13.34619140625, -12.546142578125, -11.74609375, -10.946044921875, -10.14599609375, -9.345947265625, -8.5458984375, -7.745849609375, -6.94580078125, -6.145751953125, -5.345703125, -4.545654296875, -3.74560546875, -2.945556640625, -2.1455078125, -1.345458984375, -0.54541015625, 0.254638671875, 1.0546875, 1.854736328125, 2.65478515625, 3.454833984375, 4.2548828125, 5.054931640625, 5.85498046875, 6.655029296875, 7.455078125, 8.255126953125, 9.05517578125, 9.855224609375, 10.6552734375, 11.455322265625, 12.25537109375, 13.055419921875, 13.85546875, 14.655517578125, 15.45556640625, 16.255615234375, 17.0556640625, 17.855712890625, 18.65576171875, 19.455810546875, 20.255859375, 21.055908203125, 21.85595703125, 22.656005859375, 23.4560546875, 24.256103515625, 25.05615234375, 25.856201171875, 26.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 16.0, 17.0, 47.0, 64.0, 123.0, 191.0, 177.0, 150.0, 76.0, 31.0, 26.0, 18.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.498291015625, -10.16064453125, -9.822998046875, -9.4853515625, -9.147705078125, -8.81005859375, -8.472412109375, -8.134765625, -7.797119140625, -7.45947265625, -7.121826171875, -6.7841796875, -6.446533203125, -6.10888671875, -5.771240234375, -5.43359375, -5.095947265625, -4.75830078125, -4.420654296875, -4.0830078125, -3.745361328125, -3.40771484375, -3.070068359375, -2.732421875, -2.394775390625, -2.05712890625, -1.719482421875, -1.3818359375, -1.044189453125, -0.70654296875, -0.368896484375, -0.03125, 0.306396484375, 0.64404296875, 0.981689453125, 1.3193359375, 1.656982421875, 1.99462890625, 2.332275390625, 2.669921875, 3.007568359375, 3.34521484375, 3.682861328125, 4.0205078125, 4.358154296875, 4.69580078125, 5.033447265625, 5.37109375, 5.708740234375, 6.04638671875, 6.384033203125, 6.7216796875, 7.059326171875, 7.39697265625, 7.734619140625, 8.072265625, 8.409912109375, 8.74755859375, 9.085205078125, 9.4228515625, 9.760498046875, 10.09814453125, 10.435791015625, 10.7734375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 6.0, 3.0, 15.0, 12.0, 17.0, 23.0, 16.0, 29.0, 32.0, 41.0, 41.0, 47.0, 64.0, 61.0, 64.0, 56.0, 53.0, 46.0, 61.0, 52.0, 34.0, 41.0, 35.0, 26.0, 22.0, 19.0, 17.0, 12.0, 15.0, 5.0, 2.0, 5.0, 3.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-38.39461135864258, -37.37541198730469, -36.35620880126953, -35.33700942993164, -34.317806243896484, -33.298606872558594, -32.27940368652344, -31.260204315185547, -30.24100112915039, -29.221799850463867, -28.202598571777344, -27.18339729309082, -26.164196014404297, -25.144994735717773, -24.12579345703125, -23.10659408569336, -22.087392807006836, -21.068191528320312, -20.04899024963379, -19.029788970947266, -18.010587692260742, -16.99138641357422, -15.972186088562012, -14.952984809875488, -13.933783531188965, -12.914582252502441, -11.895380973815918, -10.876180648803711, -9.856979370117188, -8.837778091430664, -7.818576812744141, -6.799375534057617, -5.780176162719727, -4.760974884033203, -3.741773843765259, -2.7225728034973145, -1.703371524810791, -0.6841702461242676, 0.33503055572509766, 1.354231834411621, 2.3734331130981445, 3.392634391784668, 4.411835670471191, 5.431036472320557, 6.45023775100708, 7.4694390296936035, 8.488639831542969, 9.507841110229492, 10.527042388916016, 11.546243667602539, 12.565444946289062, 13.584646224975586, 14.60384750366211, 15.623048782348633, 16.642250061035156, 17.661449432373047, 18.680652618408203, 19.699853897094727, 20.71905517578125, 21.738256454467773, 22.757457733154297, 23.77665901184082, 24.795860290527344, 25.815059661865234, 26.834260940551758]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 5.0, 11.0, 15.0, 11.0, 12.0, 20.0, 12.0, 12.0, 18.0, 27.0, 25.0, 33.0, 34.0, 32.0, 35.0, 43.0, 43.0, 49.0, 39.0, 49.0, 44.0, 36.0, 44.0, 36.0, 37.0, 42.0, 33.0, 31.0, 21.0, 24.0, 18.0, 15.0, 16.0, 17.0, 13.0, 10.0, 5.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-27.41048812866211, -26.582136154174805, -25.7537841796875, -24.925432205200195, -24.09708023071289, -23.268728256225586, -22.44037628173828, -21.61202621459961, -20.783672332763672, -19.955320358276367, -19.126968383789062, -18.298616409301758, -17.470264434814453, -16.64191246032715, -15.81356143951416, -14.985209465026855, -14.156858444213867, -13.328506469726562, -12.500154495239258, -11.671802520751953, -10.843450546264648, -10.015098571777344, -9.186747550964355, -8.35839557647705, -7.530043601989746, -6.701691627502441, -5.873339653015137, -5.04498815536499, -4.2166361808776855, -3.388284206390381, -2.5599327087402344, -1.7315807342529297, -0.9032268524169922, -0.07487499713897705, 0.7534768581390381, 1.5818285942077637, 2.4101805686950684, 3.238532543182373, 4.0668840408325195, 4.895236015319824, 5.723587989807129, 6.551939964294434, 7.380291938781738, 8.208642959594727, 9.036994934082031, 9.865346908569336, 10.69369888305664, 11.522050857543945, 12.35040283203125, 13.178754806518555, 14.00710678100586, 14.835458755493164, 15.663810729980469, 16.492162704467773, 17.320514678955078, 18.14886474609375, 18.977218627929688, 19.805570602416992, 20.633922576904297, 21.4622745513916, 22.290626525878906, 23.11897850036621, 23.947330474853516, 24.775680541992188, 25.604032516479492]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 5.0, 6.0, 8.0, 8.0, 21.0, 25.0, 34.0, 76.0, 114.0, 157.0, 219.0, 352.0, 524.0, 770.0, 1195.0, 1851.0, 2763.0, 4231.0, 6705.0, 10238.0, 15846.0, 23611.0, 35473.0, 51175.0, 71283.0, 93891.0, 114369.0, 124486.0, 120001.0, 103018.0, 81177.0, 60085.0, 42131.0, 28254.0, 18824.0, 12237.0, 8066.0, 5423.0, 3357.0, 2248.0, 1496.0, 982.0, 635.0, 385.0, 265.0, 203.0, 108.0, 88.0, 47.0, 33.0, 23.0, 21.0, 8.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.4951171875, -19.755859375, -19.0166015625, -18.27734375, -17.5380859375, -16.798828125, -16.0595703125, -15.3203125, -14.5810546875, -13.841796875, -13.1025390625, -12.36328125, -11.6240234375, -10.884765625, -10.1455078125, -9.40625, -8.6669921875, -7.927734375, -7.1884765625, -6.44921875, -5.7099609375, -4.970703125, -4.2314453125, -3.4921875, -2.7529296875, -2.013671875, -1.2744140625, -0.53515625, 0.2041015625, 0.943359375, 1.6826171875, 2.421875, 3.1611328125, 3.900390625, 4.6396484375, 5.37890625, 6.1181640625, 6.857421875, 7.5966796875, 8.3359375, 9.0751953125, 9.814453125, 10.5537109375, 11.29296875, 12.0322265625, 12.771484375, 13.5107421875, 14.25, 14.9892578125, 15.728515625, 16.4677734375, 17.20703125, 17.9462890625, 18.685546875, 19.4248046875, 20.1640625, 20.9033203125, 21.642578125, 22.3818359375, 23.12109375, 23.8603515625, 24.599609375, 25.3388671875, 26.078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 10.0, 9.0, 13.0, 10.0, 11.0, 16.0, 18.0, 21.0, 30.0, 19.0, 29.0, 33.0, 36.0, 29.0, 33.0, 41.0, 52.0, 47.0, 46.0, 42.0, 39.0, 36.0, 42.0, 38.0, 30.0, 37.0, 41.0, 25.0, 17.0, 24.0, 18.0, 18.0, 15.0, 15.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-25.640625, -24.82861328125, -24.0166015625, -23.20458984375, -22.392578125, -21.58056640625, -20.7685546875, -19.95654296875, -19.14453125, -18.33251953125, -17.5205078125, -16.70849609375, -15.896484375, -15.08447265625, -14.2724609375, -13.46044921875, -12.6484375, -11.83642578125, -11.0244140625, -10.21240234375, -9.400390625, -8.58837890625, -7.7763671875, -6.96435546875, -6.15234375, -5.34033203125, -4.5283203125, -3.71630859375, -2.904296875, -2.09228515625, -1.2802734375, -0.46826171875, 0.34375, 1.15576171875, 1.9677734375, 2.77978515625, 3.591796875, 4.40380859375, 5.2158203125, 6.02783203125, 6.83984375, 7.65185546875, 8.4638671875, 9.27587890625, 10.087890625, 10.89990234375, 11.7119140625, 12.52392578125, 13.3359375, 14.14794921875, 14.9599609375, 15.77197265625, 16.583984375, 17.39599609375, 18.2080078125, 19.02001953125, 19.83203125, 20.64404296875, 21.4560546875, 22.26806640625, 23.080078125, 23.89208984375, 24.7041015625, 25.51611328125, 26.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 15.0, 29.0, 41.0, 52.0, 90.0, 156.0, 226.0, 357.0, 603.0, 955.0, 1483.0, 2519.0, 4256.0, 6886.0, 11770.0, 19133.0, 30908.0, 50875.0, 79786.0, 115669.0, 149662.0, 159265.0, 138178.0, 101016.0, 67076.0, 42365.0, 25654.0, 15617.0, 9205.0, 5761.0, 3484.0, 2100.0, 1241.0, 779.0, 486.0, 324.0, 202.0, 128.0, 64.0, 48.0, 39.0, 19.0, 9.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.40625, -32.3720703125, -31.337890625, -30.3037109375, -29.26953125, -28.2353515625, -27.201171875, -26.1669921875, -25.1328125, -24.0986328125, -23.064453125, -22.0302734375, -20.99609375, -19.9619140625, -18.927734375, -17.8935546875, -16.859375, -15.8251953125, -14.791015625, -13.7568359375, -12.72265625, -11.6884765625, -10.654296875, -9.6201171875, -8.5859375, -7.5517578125, -6.517578125, -5.4833984375, -4.44921875, -3.4150390625, -2.380859375, -1.3466796875, -0.3125, 0.7216796875, 1.755859375, 2.7900390625, 3.82421875, 4.8583984375, 5.892578125, 6.9267578125, 7.9609375, 8.9951171875, 10.029296875, 11.0634765625, 12.09765625, 13.1318359375, 14.166015625, 15.2001953125, 16.234375, 17.2685546875, 18.302734375, 19.3369140625, 20.37109375, 21.4052734375, 22.439453125, 23.4736328125, 24.5078125, 25.5419921875, 26.576171875, 27.6103515625, 28.64453125, 29.6787109375, 30.712890625, 31.7470703125, 32.78125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 10.0, 7.0, 12.0, 13.0, 20.0, 30.0, 21.0, 13.0, 23.0, 26.0, 37.0, 34.0, 28.0, 36.0, 38.0, 40.0, 37.0, 42.0, 36.0, 37.0, 39.0, 43.0, 27.0, 40.0, 28.0, 36.0, 35.0, 22.0, 24.0, 18.0, 16.0, 16.0, 17.0, 10.0, 16.0, 8.0, 5.0, 13.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.730224609375, -16.19482421875, -15.659423828125, -15.1240234375, -14.588623046875, -14.05322265625, -13.517822265625, -12.982421875, -12.447021484375, -11.91162109375, -11.376220703125, -10.8408203125, -10.305419921875, -9.77001953125, -9.234619140625, -8.69921875, -8.163818359375, -7.62841796875, -7.093017578125, -6.5576171875, -6.022216796875, -5.48681640625, -4.951416015625, -4.416015625, -3.880615234375, -3.34521484375, -2.809814453125, -2.2744140625, -1.739013671875, -1.20361328125, -0.668212890625, -0.1328125, 0.402587890625, 0.93798828125, 1.473388671875, 2.0087890625, 2.544189453125, 3.07958984375, 3.614990234375, 4.150390625, 4.685791015625, 5.22119140625, 5.756591796875, 6.2919921875, 6.827392578125, 7.36279296875, 7.898193359375, 8.43359375, 8.968994140625, 9.50439453125, 10.039794921875, 10.5751953125, 11.110595703125, 11.64599609375, 12.181396484375, 12.716796875, 13.252197265625, 13.78759765625, 14.322998046875, 14.8583984375, 15.393798828125, 15.92919921875, 16.464599609375, 17.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 8.0, 8.0, 16.0, 27.0, 40.0, 48.0, 80.0, 122.0, 198.0, 291.0, 455.0, 673.0, 1093.0, 1786.0, 3151.0, 5695.0, 12047.0, 29781.0, 90323.0, 284125.0, 385485.0, 150756.0, 47163.0, 17557.0, 7804.0, 3868.0, 2338.0, 1279.0, 823.0, 508.0, 324.0, 236.0, 142.0, 102.0, 60.0, 49.0, 30.0, 18.0, 12.0, 10.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.59375, -38.4365234375, -37.279296875, -36.1220703125, -34.96484375, -33.8076171875, -32.650390625, -31.4931640625, -30.3359375, -29.1787109375, -28.021484375, -26.8642578125, -25.70703125, -24.5498046875, -23.392578125, -22.2353515625, -21.078125, -19.9208984375, -18.763671875, -17.6064453125, -16.44921875, -15.2919921875, -14.134765625, -12.9775390625, -11.8203125, -10.6630859375, -9.505859375, -8.3486328125, -7.19140625, -6.0341796875, -4.876953125, -3.7197265625, -2.5625, -1.4052734375, -0.248046875, 0.9091796875, 2.06640625, 3.2236328125, 4.380859375, 5.5380859375, 6.6953125, 7.8525390625, 9.009765625, 10.1669921875, 11.32421875, 12.4814453125, 13.638671875, 14.7958984375, 15.953125, 17.1103515625, 18.267578125, 19.4248046875, 20.58203125, 21.7392578125, 22.896484375, 24.0537109375, 25.2109375, 26.3681640625, 27.525390625, 28.6826171875, 29.83984375, 30.9970703125, 32.154296875, 33.3115234375, 34.46875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 11.0, 19.0, 33.0, 43.0, 49.0, 81.0, 106.0, 135.0, 135.0, 91.0, 83.0, 57.0, 43.0, 29.0, 18.0, 11.0, 10.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003662109375, -0.0035507678985595703, -0.0034394264221191406, -0.003328084945678711, -0.0032167434692382812, -0.0031054019927978516, -0.002994060516357422, -0.002882719039916992, -0.0027713775634765625, -0.002660036087036133, -0.002548694610595703, -0.0024373531341552734, -0.0023260116577148438, -0.002214670181274414, -0.0021033287048339844, -0.0019919872283935547, -0.001880645751953125, -0.0017693042755126953, -0.0016579627990722656, -0.001546621322631836, -0.0014352798461914062, -0.0013239383697509766, -0.0012125968933105469, -0.0011012554168701172, -0.0009899139404296875, -0.0008785724639892578, -0.0007672309875488281, -0.0006558895111083984, -0.0005445480346679688, -0.00043320655822753906, -0.0003218650817871094, -0.0002105236053466797, -9.918212890625e-05, 1.2159347534179688e-05, 0.00012350082397460938, 0.00023484230041503906, 0.00034618377685546875, 0.00045752525329589844, 0.0005688667297363281, 0.0006802082061767578, 0.0007915496826171875, 0.0009028911590576172, 0.0010142326354980469, 0.0011255741119384766, 0.0012369155883789062, 0.001348257064819336, 0.0014595985412597656, 0.0015709400177001953, 0.001682281494140625, 0.0017936229705810547, 0.0019049644470214844, 0.002016305923461914, 0.0021276473999023438, 0.0022389888763427734, 0.002350330352783203, 0.002461671829223633, 0.0025730133056640625, 0.002684354782104492, 0.002795696258544922, 0.0029070377349853516, 0.0030183792114257812, 0.003129720687866211, 0.0032410621643066406, 0.0033524036407470703, 0.0034637451171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 9.0, 15.0, 13.0, 26.0, 44.0, 58.0, 76.0, 108.0, 123.0, 246.0, 346.0, 599.0, 1040.0, 1789.0, 3489.0, 6741.0, 14972.0, 35618.0, 100705.0, 285386.0, 357986.0, 149698.0, 50719.0, 19802.0, 8915.0, 4405.0, 2296.0, 1274.0, 733.0, 471.0, 249.0, 189.0, 101.0, 81.0, 49.0, 33.0, 34.0, 25.0, 20.0, 9.0, 12.0, 6.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-36.59375, -35.582275390625, -34.57080078125, -33.559326171875, -32.5478515625, -31.536376953125, -30.52490234375, -29.513427734375, -28.501953125, -27.490478515625, -26.47900390625, -25.467529296875, -24.4560546875, -23.444580078125, -22.43310546875, -21.421630859375, -20.41015625, -19.398681640625, -18.38720703125, -17.375732421875, -16.3642578125, -15.352783203125, -14.34130859375, -13.329833984375, -12.318359375, -11.306884765625, -10.29541015625, -9.283935546875, -8.2724609375, -7.260986328125, -6.24951171875, -5.238037109375, -4.2265625, -3.215087890625, -2.20361328125, -1.192138671875, -0.1806640625, 0.830810546875, 1.84228515625, 2.853759765625, 3.865234375, 4.876708984375, 5.88818359375, 6.899658203125, 7.9111328125, 8.922607421875, 9.93408203125, 10.945556640625, 11.95703125, 12.968505859375, 13.97998046875, 14.991455078125, 16.0029296875, 17.014404296875, 18.02587890625, 19.037353515625, 20.048828125, 21.060302734375, 22.07177734375, 23.083251953125, 24.0947265625, 25.106201171875, 26.11767578125, 27.129150390625, 28.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 4.0, 5.0, 11.0, 17.0, 11.0, 21.0, 26.0, 36.0, 45.0, 50.0, 76.0, 99.0, 102.0, 89.0, 93.0, 62.0, 43.0, 40.0, 40.0, 25.0, 16.0, 10.0, 15.0, 10.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.75390625, -6.47296142578125, -6.1920166015625, -5.91107177734375, -5.630126953125, -5.34918212890625, -5.0682373046875, -4.78729248046875, -4.50634765625, -4.22540283203125, -3.9444580078125, -3.66351318359375, -3.382568359375, -3.10162353515625, -2.8206787109375, -2.53973388671875, -2.2587890625, -1.97784423828125, -1.6968994140625, -1.41595458984375, -1.135009765625, -0.85406494140625, -0.5731201171875, -0.29217529296875, -0.01123046875, 0.26971435546875, 0.5506591796875, 0.83160400390625, 1.112548828125, 1.39349365234375, 1.6744384765625, 1.95538330078125, 2.236328125, 2.51727294921875, 2.7982177734375, 3.07916259765625, 3.360107421875, 3.64105224609375, 3.9219970703125, 4.20294189453125, 4.48388671875, 4.76483154296875, 5.0457763671875, 5.32672119140625, 5.607666015625, 5.88861083984375, 6.1695556640625, 6.45050048828125, 6.7314453125, 7.01239013671875, 7.2933349609375, 7.57427978515625, 7.855224609375, 8.13616943359375, 8.4171142578125, 8.69805908203125, 8.97900390625, 9.25994873046875, 9.5408935546875, 9.82183837890625, 10.102783203125, 10.38372802734375, 10.6646728515625, 10.94561767578125, 11.2265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 9.0, 20.0, 17.0, 18.0, 21.0, 21.0, 23.0, 35.0, 43.0, 41.0, 45.0, 45.0, 55.0, 50.0, 45.0, 60.0, 38.0, 40.0, 55.0, 38.0, 47.0, 31.0, 35.0, 36.0, 16.0, 17.0, 15.0, 8.0, 14.0, 8.0, 5.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.01079559326172, -31.08550453186035, -30.160213470458984, -29.23492431640625, -28.309633255004883, -27.384342193603516, -26.45905303955078, -25.533761978149414, -24.608470916748047, -23.68317985534668, -22.757888793945312, -21.832599639892578, -20.90730857849121, -19.982017517089844, -19.05672836303711, -18.131437301635742, -17.206146240234375, -16.280855178833008, -15.355565071105957, -14.430274963378906, -13.504983901977539, -12.579692840576172, -11.654402732849121, -10.72911262512207, -9.803821563720703, -8.878530502319336, -7.953240394592285, -7.027949810028076, -6.102659225463867, -5.177368640899658, -4.252078056335449, -3.3267874717712402, -2.4014949798583984, -1.4762043952941895, -0.5509138107299805, 0.3743767738342285, 1.2996673583984375, 2.2249579429626465, 3.1502485275268555, 4.0755391120910645, 5.000829696655273, 5.926120281219482, 6.851410865783691, 7.7767014503479, 8.70199203491211, 9.627283096313477, 10.552573204040527, 11.477863311767578, 12.403154373168945, 13.328445434570312, 14.253735542297363, 15.179025650024414, 16.10431671142578, 17.02960777282715, 17.954898834228516, 18.88018798828125, 19.805479049682617, 20.730770111083984, 21.65605926513672, 22.581350326538086, 23.506641387939453, 24.43193244934082, 25.357223510742188, 26.282512664794922, 27.20780372619629]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 5.0, 11.0, 15.0, 14.0, 18.0, 11.0, 16.0, 21.0, 28.0, 31.0, 28.0, 31.0, 23.0, 38.0, 53.0, 36.0, 32.0, 44.0, 43.0, 40.0, 49.0, 46.0, 36.0, 39.0, 28.0, 37.0, 37.0, 27.0, 27.0, 18.0, 22.0, 13.0, 8.0, 12.0, 13.0, 10.0, 9.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.625940322875977, -24.803417205810547, -23.98089599609375, -23.15837287902832, -22.335851669311523, -21.513328552246094, -20.690807342529297, -19.868284225463867, -19.045761108398438, -18.223237991333008, -17.40071678161621, -16.57819366455078, -15.755671501159668, -14.933149337768555, -14.110627174377441, -13.288105010986328, -12.465582847595215, -11.643060684204102, -10.820538520812988, -9.998016357421875, -9.175493240356445, -8.352971076965332, -7.530448913574219, -6.707926273345947, -5.885404109954834, -5.062881946563721, -4.240359306335449, -3.417837142944336, -2.5953147411346436, -1.7727923393249512, -0.9502701759338379, -0.1277475357055664, 0.6947746276855469, 1.5172970294952393, 2.3398194313049316, 3.162341594696045, 3.9848639965057373, 4.80738639831543, 5.629908561706543, 6.4524312019348145, 7.274953365325928, 8.0974760055542, 8.919998168945312, 9.742520332336426, 10.565042495727539, 11.387565612792969, 12.210086822509766, 13.032609939575195, 13.855132102966309, 14.677654266357422, 15.500176429748535, 16.32269859313965, 17.145221710205078, 17.967742919921875, 18.790266036987305, 19.612789154052734, 20.43531036376953, 21.25783348083496, 22.080354690551758, 22.902877807617188, 23.725399017333984, 24.547922134399414, 25.370445251464844, 26.19296646118164, 27.01548957824707]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 13.0, 13.0, 18.0, 30.0, 37.0, 62.0, 70.0, 98.0, 178.0, 260.0, 372.0, 573.0, 820.0, 1245.0, 1940.0, 2876.0, 4783.0, 7807.0, 12727.0, 21680.0, 37594.0, 67850.0, 124283.0, 238435.0, 458588.0, 759983.0, 894242.0, 693349.0, 401915.0, 208880.0, 110298.0, 60257.0, 33669.0, 19593.0, 11341.0, 6792.0, 4294.0, 2591.0, 1657.0, 1060.0, 644.0, 442.0, 291.0, 212.0, 139.0, 83.0, 67.0, 43.0, 35.0, 26.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.046875, -28.177001953125, -27.30712890625, -26.437255859375, -25.5673828125, -24.697509765625, -23.82763671875, -22.957763671875, -22.087890625, -21.218017578125, -20.34814453125, -19.478271484375, -18.6083984375, -17.738525390625, -16.86865234375, -15.998779296875, -15.12890625, -14.259033203125, -13.38916015625, -12.519287109375, -11.6494140625, -10.779541015625, -9.90966796875, -9.039794921875, -8.169921875, -7.300048828125, -6.43017578125, -5.560302734375, -4.6904296875, -3.820556640625, -2.95068359375, -2.080810546875, -1.2109375, -0.341064453125, 0.52880859375, 1.398681640625, 2.2685546875, 3.138427734375, 4.00830078125, 4.878173828125, 5.748046875, 6.617919921875, 7.48779296875, 8.357666015625, 9.2275390625, 10.097412109375, 10.96728515625, 11.837158203125, 12.70703125, 13.576904296875, 14.44677734375, 15.316650390625, 16.1865234375, 17.056396484375, 17.92626953125, 18.796142578125, 19.666015625, 20.535888671875, 21.40576171875, 22.275634765625, 23.1455078125, 24.015380859375, 24.88525390625, 25.755126953125, 26.625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 8.0, 7.0, 13.0, 10.0, 17.0, 16.0, 24.0, 28.0, 23.0, 29.0, 25.0, 31.0, 38.0, 44.0, 40.0, 43.0, 50.0, 33.0, 40.0, 44.0, 52.0, 36.0, 35.0, 44.0, 27.0, 38.0, 41.0, 20.0, 21.0, 8.0, 16.0, 11.0, 11.0, 12.0, 14.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.625, -20.917236328125, -20.20947265625, -19.501708984375, -18.7939453125, -18.086181640625, -17.37841796875, -16.670654296875, -15.962890625, -15.255126953125, -14.54736328125, -13.839599609375, -13.1318359375, -12.424072265625, -11.71630859375, -11.008544921875, -10.30078125, -9.593017578125, -8.88525390625, -8.177490234375, -7.4697265625, -6.761962890625, -6.05419921875, -5.346435546875, -4.638671875, -3.930908203125, -3.22314453125, -2.515380859375, -1.8076171875, -1.099853515625, -0.39208984375, 0.315673828125, 1.0234375, 1.731201171875, 2.43896484375, 3.146728515625, 3.8544921875, 4.562255859375, 5.27001953125, 5.977783203125, 6.685546875, 7.393310546875, 8.10107421875, 8.808837890625, 9.5166015625, 10.224365234375, 10.93212890625, 11.639892578125, 12.34765625, 13.055419921875, 13.76318359375, 14.470947265625, 15.1787109375, 15.886474609375, 16.59423828125, 17.302001953125, 18.009765625, 18.717529296875, 19.42529296875, 20.133056640625, 20.8408203125, 21.548583984375, 22.25634765625, 22.964111328125, 23.671875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 6.0, 9.0, 16.0, 22.0, 35.0, 51.0, 78.0, 135.0, 235.0, 315.0, 467.0, 792.0, 1193.0, 1886.0, 3226.0, 5148.0, 8970.0, 15778.0, 27826.0, 50651.0, 94034.0, 176513.0, 334544.0, 597600.0, 881239.0, 833396.0, 531283.0, 290147.0, 154001.0, 81938.0, 44177.0, 24511.0, 13771.0, 8044.0, 4711.0, 2795.0, 1717.0, 1137.0, 680.0, 420.0, 288.0, 173.0, 119.0, 85.0, 47.0, 37.0, 15.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-35.0, -33.996826171875, -32.99365234375, -31.990478515625, -30.9873046875, -29.984130859375, -28.98095703125, -27.977783203125, -26.974609375, -25.971435546875, -24.96826171875, -23.965087890625, -22.9619140625, -21.958740234375, -20.95556640625, -19.952392578125, -18.94921875, -17.946044921875, -16.94287109375, -15.939697265625, -14.9365234375, -13.933349609375, -12.93017578125, -11.927001953125, -10.923828125, -9.920654296875, -8.91748046875, -7.914306640625, -6.9111328125, -5.907958984375, -4.90478515625, -3.901611328125, -2.8984375, -1.895263671875, -0.89208984375, 0.111083984375, 1.1142578125, 2.117431640625, 3.12060546875, 4.123779296875, 5.126953125, 6.130126953125, 7.13330078125, 8.136474609375, 9.1396484375, 10.142822265625, 11.14599609375, 12.149169921875, 13.15234375, 14.155517578125, 15.15869140625, 16.161865234375, 17.1650390625, 18.168212890625, 19.17138671875, 20.174560546875, 21.177734375, 22.180908203125, 23.18408203125, 24.187255859375, 25.1904296875, 26.193603515625, 27.19677734375, 28.199951171875, 29.203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 5.0, 8.0, 5.0, 8.0, 12.0, 17.0, 14.0, 20.0, 18.0, 32.0, 35.0, 55.0, 69.0, 87.0, 89.0, 100.0, 110.0, 152.0, 156.0, 160.0, 207.0, 232.0, 241.0, 260.0, 242.0, 231.0, 228.0, 180.0, 173.0, 146.0, 137.0, 117.0, 106.0, 74.0, 64.0, 63.0, 53.0, 30.0, 38.0, 20.0, 13.0, 12.0, 11.0, 18.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.578125, -10.25830078125, -9.9384765625, -9.61865234375, -9.298828125, -8.97900390625, -8.6591796875, -8.33935546875, -8.01953125, -7.69970703125, -7.3798828125, -7.06005859375, -6.740234375, -6.42041015625, -6.1005859375, -5.78076171875, -5.4609375, -5.14111328125, -4.8212890625, -4.50146484375, -4.181640625, -3.86181640625, -3.5419921875, -3.22216796875, -2.90234375, -2.58251953125, -2.2626953125, -1.94287109375, -1.623046875, -1.30322265625, -0.9833984375, -0.66357421875, -0.34375, -0.02392578125, 0.2958984375, 0.61572265625, 0.935546875, 1.25537109375, 1.5751953125, 1.89501953125, 2.21484375, 2.53466796875, 2.8544921875, 3.17431640625, 3.494140625, 3.81396484375, 4.1337890625, 4.45361328125, 4.7734375, 5.09326171875, 5.4130859375, 5.73291015625, 6.052734375, 6.37255859375, 6.6923828125, 7.01220703125, 7.33203125, 7.65185546875, 7.9716796875, 8.29150390625, 8.611328125, 8.93115234375, 9.2509765625, 9.57080078125, 9.890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 3.0, 9.0, 7.0, 11.0, 11.0, 10.0, 18.0, 20.0, 23.0, 28.0, 40.0, 34.0, 53.0, 53.0, 55.0, 49.0, 71.0, 56.0, 64.0, 50.0, 48.0, 56.0, 47.0, 26.0, 34.0, 27.0, 20.0, 12.0, 16.0, 7.0, 12.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.280052185058594, -32.23918533325195, -31.19831657409668, -30.157447814941406, -29.116580963134766, -28.075712203979492, -27.03484344482422, -25.993976593017578, -24.953107833862305, -23.91223907470703, -22.87137222290039, -21.830503463745117, -20.789634704589844, -19.748767852783203, -18.70789909362793, -17.667030334472656, -16.626163482666016, -15.585295677185059, -14.544427871704102, -13.503559112548828, -12.462691307067871, -11.421823501586914, -10.38095474243164, -9.340086936950684, -8.299219131469727, -7.2583513259887695, -6.217483043670654, -5.176614761352539, -4.135746955871582, -3.094879150390625, -2.0540108680725098, -1.0131425857543945, 0.0277252197265625, 1.0685932636260986, 2.1094613075256348, 3.150329351425171, 4.191197395324707, 5.232065200805664, 6.272933483123779, 7.3138017654418945, 8.354669570922852, 9.395537376403809, 10.436405181884766, 11.477273941040039, 12.518141746520996, 13.559009552001953, 14.599878311157227, 15.640746116638184, 16.68161392211914, 17.722482681274414, 18.763349533081055, 19.804218292236328, 20.84508514404297, 21.885953903198242, 22.926822662353516, 23.967689514160156, 25.00855827331543, 26.049427032470703, 27.090293884277344, 28.131162643432617, 29.17203140258789, 30.21289825439453, 31.253767013549805, 32.29463577270508, 33.33550262451172]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 10.0, 12.0, 9.0, 11.0, 13.0, 19.0, 21.0, 25.0, 41.0, 36.0, 42.0, 28.0, 38.0, 40.0, 35.0, 45.0, 43.0, 49.0, 44.0, 48.0, 48.0, 44.0, 35.0, 43.0, 36.0, 19.0, 29.0, 16.0, 19.0, 23.0, 11.0, 11.0, 12.0, 11.0, 8.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.848255157470703, -27.998109817504883, -27.14796257019043, -26.29781723022461, -25.447669982910156, -24.597524642944336, -23.747379302978516, -22.897232055664062, -22.047086715698242, -21.196941375732422, -20.34679412841797, -19.49664878845215, -18.646503448486328, -17.796356201171875, -16.946210861206055, -16.096065521240234, -15.245918273925781, -14.395771980285645, -13.545625686645508, -12.695480346679688, -11.84533405303955, -10.995187759399414, -10.145042419433594, -9.294896125793457, -8.44474983215332, -7.594603538513184, -6.744457721710205, -5.894311904907227, -5.04416561126709, -4.194019317626953, -3.3438735008239746, -2.493727684020996, -1.6435813903808594, -0.7934353351593018, 0.05671072006225586, 0.9068567752838135, 1.757002830505371, 2.607149124145508, 3.4572949409484863, 4.307440757751465, 5.157587051391602, 6.007733345031738, 6.857879161834717, 7.708024978637695, 8.558171272277832, 9.408317565917969, 10.258462905883789, 11.108609199523926, 11.958755493164062, 12.8089017868042, 13.659048080444336, 14.509193420410156, 15.359339714050293, 16.20948600769043, 17.05963134765625, 17.909778594970703, 18.759923934936523, 19.610069274902344, 20.460216522216797, 21.310361862182617, 22.160507202148438, 23.01065444946289, 23.86079978942871, 24.71094512939453, 25.561092376708984]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 7.0, 13.0, 16.0, 53.0, 61.0, 90.0, 111.0, 192.0, 306.0, 535.0, 781.0, 1214.0, 1933.0, 3098.0, 4689.0, 7582.0, 11648.0, 18359.0, 29639.0, 46593.0, 72918.0, 107820.0, 145534.0, 161365.0, 141340.0, 103597.0, 68489.0, 44444.0, 27919.0, 17599.0, 10846.0, 7118.0, 4500.0, 2978.0, 1757.0, 1244.0, 799.0, 492.0, 332.0, 188.0, 132.0, 81.0, 51.0, 33.0, 29.0, 17.0, 8.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.4921875, -15.0289306640625, -14.565673828125, -14.1024169921875, -13.63916015625, -13.1759033203125, -12.712646484375, -12.2493896484375, -11.7861328125, -11.3228759765625, -10.859619140625, -10.3963623046875, -9.93310546875, -9.4698486328125, -9.006591796875, -8.5433349609375, -8.080078125, -7.6168212890625, -7.153564453125, -6.6903076171875, -6.22705078125, -5.7637939453125, -5.300537109375, -4.8372802734375, -4.3740234375, -3.9107666015625, -3.447509765625, -2.9842529296875, -2.52099609375, -2.0577392578125, -1.594482421875, -1.1312255859375, -0.66796875, -0.2047119140625, 0.258544921875, 0.7218017578125, 1.18505859375, 1.6483154296875, 2.111572265625, 2.5748291015625, 3.0380859375, 3.5013427734375, 3.964599609375, 4.4278564453125, 4.89111328125, 5.3543701171875, 5.817626953125, 6.2808837890625, 6.744140625, 7.2073974609375, 7.670654296875, 8.1339111328125, 8.59716796875, 9.0604248046875, 9.523681640625, 9.9869384765625, 10.4501953125, 10.9134521484375, 11.376708984375, 11.8399658203125, 12.30322265625, 12.7664794921875, 13.229736328125, 13.6929931640625, 14.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 9.0, 19.0, 16.0, 24.0, 29.0, 33.0, 26.0, 34.0, 40.0, 34.0, 38.0, 38.0, 45.0, 37.0, 35.0, 54.0, 53.0, 35.0, 37.0, 45.0, 37.0, 32.0, 27.0, 24.0, 18.0, 21.0, 20.0, 19.0, 16.0, 12.0, 9.0, 10.0, 8.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.734375, -23.920654296875, -23.10693359375, -22.293212890625, -21.4794921875, -20.665771484375, -19.85205078125, -19.038330078125, -18.224609375, -17.410888671875, -16.59716796875, -15.783447265625, -14.9697265625, -14.156005859375, -13.34228515625, -12.528564453125, -11.71484375, -10.901123046875, -10.08740234375, -9.273681640625, -8.4599609375, -7.646240234375, -6.83251953125, -6.018798828125, -5.205078125, -4.391357421875, -3.57763671875, -2.763916015625, -1.9501953125, -1.136474609375, -0.32275390625, 0.490966796875, 1.3046875, 2.118408203125, 2.93212890625, 3.745849609375, 4.5595703125, 5.373291015625, 6.18701171875, 7.000732421875, 7.814453125, 8.628173828125, 9.44189453125, 10.255615234375, 11.0693359375, 11.883056640625, 12.69677734375, 13.510498046875, 14.32421875, 15.137939453125, 15.95166015625, 16.765380859375, 17.5791015625, 18.392822265625, 19.20654296875, 20.020263671875, 20.833984375, 21.647705078125, 22.46142578125, 23.275146484375, 24.0888671875, 24.902587890625, 25.71630859375, 26.530029296875, 27.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 14.0, 13.0, 22.0, 37.0, 42.0, 88.0, 115.0, 156.0, 265.0, 413.0, 685.0, 1118.0, 1773.0, 2980.0, 4989.0, 8827.0, 15687.0, 28470.0, 54186.0, 101993.0, 178774.0, 233048.0, 184461.0, 105581.0, 56126.0, 29975.0, 16250.0, 9302.0, 5223.0, 3057.0, 1822.0, 1138.0, 689.0, 419.0, 292.0, 177.0, 110.0, 74.0, 45.0, 37.0, 21.0, 16.0, 16.0, 12.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-22.515625, -21.801513671875, -21.08740234375, -20.373291015625, -19.6591796875, -18.945068359375, -18.23095703125, -17.516845703125, -16.802734375, -16.088623046875, -15.37451171875, -14.660400390625, -13.9462890625, -13.232177734375, -12.51806640625, -11.803955078125, -11.08984375, -10.375732421875, -9.66162109375, -8.947509765625, -8.2333984375, -7.519287109375, -6.80517578125, -6.091064453125, -5.376953125, -4.662841796875, -3.94873046875, -3.234619140625, -2.5205078125, -1.806396484375, -1.09228515625, -0.378173828125, 0.3359375, 1.050048828125, 1.76416015625, 2.478271484375, 3.1923828125, 3.906494140625, 4.62060546875, 5.334716796875, 6.048828125, 6.762939453125, 7.47705078125, 8.191162109375, 8.9052734375, 9.619384765625, 10.33349609375, 11.047607421875, 11.76171875, 12.475830078125, 13.18994140625, 13.904052734375, 14.6181640625, 15.332275390625, 16.04638671875, 16.760498046875, 17.474609375, 18.188720703125, 18.90283203125, 19.616943359375, 20.3310546875, 21.045166015625, 21.75927734375, 22.473388671875, 23.1875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 3.0, 10.0, 4.0, 11.0, 13.0, 11.0, 11.0, 17.0, 19.0, 25.0, 14.0, 26.0, 27.0, 30.0, 35.0, 33.0, 49.0, 31.0, 37.0, 29.0, 28.0, 35.0, 36.0, 42.0, 50.0, 40.0, 30.0, 38.0, 39.0, 26.0, 29.0, 16.0, 24.0, 17.0, 11.0, 15.0, 14.0, 9.0, 13.0, 11.0, 4.0, 6.0, 11.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.3046875, -14.8265380859375, -14.348388671875, -13.8702392578125, -13.39208984375, -12.9139404296875, -12.435791015625, -11.9576416015625, -11.4794921875, -11.0013427734375, -10.523193359375, -10.0450439453125, -9.56689453125, -9.0887451171875, -8.610595703125, -8.1324462890625, -7.654296875, -7.1761474609375, -6.697998046875, -6.2198486328125, -5.74169921875, -5.2635498046875, -4.785400390625, -4.3072509765625, -3.8291015625, -3.3509521484375, -2.872802734375, -2.3946533203125, -1.91650390625, -1.4383544921875, -0.960205078125, -0.4820556640625, -0.00390625, 0.4742431640625, 0.952392578125, 1.4305419921875, 1.90869140625, 2.3868408203125, 2.864990234375, 3.3431396484375, 3.8212890625, 4.2994384765625, 4.777587890625, 5.2557373046875, 5.73388671875, 6.2120361328125, 6.690185546875, 7.1683349609375, 7.646484375, 8.1246337890625, 8.602783203125, 9.0809326171875, 9.55908203125, 10.0372314453125, 10.515380859375, 10.9935302734375, 11.4716796875, 11.9498291015625, 12.427978515625, 12.9061279296875, 13.38427734375, 13.8624267578125, 14.340576171875, 14.8187255859375, 15.296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 11.0, 14.0, 9.0, 19.0, 26.0, 37.0, 54.0, 79.0, 115.0, 175.0, 198.0, 302.0, 388.0, 591.0, 846.0, 1273.0, 1882.0, 2853.0, 4518.0, 6802.0, 10974.0, 17866.0, 29681.0, 50517.0, 87119.0, 148839.0, 212241.0, 186842.0, 116349.0, 66468.0, 39000.0, 23234.0, 14269.0, 8703.0, 5455.0, 3585.0, 2333.0, 1529.0, 1038.0, 683.0, 504.0, 340.0, 225.0, 154.0, 126.0, 81.0, 54.0, 50.0, 36.0, 22.0, 17.0, 7.0, 6.0, 5.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.51171875, -5.32647705078125, -5.1412353515625, -4.95599365234375, -4.770751953125, -4.58551025390625, -4.4002685546875, -4.21502685546875, -4.02978515625, -3.84454345703125, -3.6593017578125, -3.47406005859375, -3.288818359375, -3.10357666015625, -2.9183349609375, -2.73309326171875, -2.5478515625, -2.36260986328125, -2.1773681640625, -1.99212646484375, -1.806884765625, -1.62164306640625, -1.4364013671875, -1.25115966796875, -1.06591796875, -0.88067626953125, -0.6954345703125, -0.51019287109375, -0.324951171875, -0.13970947265625, 0.0455322265625, 0.23077392578125, 0.416015625, 0.60125732421875, 0.7864990234375, 0.97174072265625, 1.156982421875, 1.34222412109375, 1.5274658203125, 1.71270751953125, 1.89794921875, 2.08319091796875, 2.2684326171875, 2.45367431640625, 2.638916015625, 2.82415771484375, 3.0093994140625, 3.19464111328125, 3.3798828125, 3.56512451171875, 3.7503662109375, 3.93560791015625, 4.120849609375, 4.30609130859375, 4.4913330078125, 4.67657470703125, 4.86181640625, 5.04705810546875, 5.2322998046875, 5.41754150390625, 5.602783203125, 5.78802490234375, 5.9732666015625, 6.15850830078125, 6.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 12.0, 4.0, 8.0, 3.0, 13.0, 6.0, 13.0, 17.0, 10.0, 24.0, 21.0, 32.0, 28.0, 40.0, 48.0, 56.0, 42.0, 64.0, 52.0, 59.0, 44.0, 46.0, 64.0, 41.0, 32.0, 40.0, 24.0, 22.0, 19.0, 21.0, 19.0, 13.0, 16.0, 13.0, 2.0, 9.0, 3.0, 9.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005884170532226562, -0.0005707666277885437, -0.0005531162023544312, -0.0005354657769203186, -0.0005178153514862061, -0.0005001649260520935, -0.00048251450061798096, -0.0004648640751838684, -0.00044721364974975586, -0.0004295632243156433, -0.00041191279888153076, -0.0003942623734474182, -0.00037661194801330566, -0.0003589615225791931, -0.00034131109714508057, -0.000323660671710968, -0.00030601024627685547, -0.0002883598208427429, -0.00027070939540863037, -0.0002530589699745178, -0.00023540854454040527, -0.00021775811910629272, -0.00020010769367218018, -0.00018245726823806763, -0.00016480684280395508, -0.00014715641736984253, -0.00012950599193572998, -0.00011185556650161743, -9.420514106750488e-05, -7.655471563339233e-05, -5.8904290199279785e-05, -4.1253864765167236e-05, -2.3603439331054688e-05, -5.953013896942139e-06, 1.169741153717041e-05, 2.934783697128296e-05, 4.699826240539551e-05, 6.464868783950806e-05, 8.22991132736206e-05, 9.994953870773315e-05, 0.0001175999641418457, 0.00013525038957595825, 0.0001529008150100708, 0.00017055124044418335, 0.0001882016658782959, 0.00020585209131240845, 0.000223502516746521, 0.00024115294218063354, 0.0002588033676147461, 0.00027645379304885864, 0.0002941042184829712, 0.00031175464391708374, 0.0003294050693511963, 0.00034705549478530884, 0.0003647059202194214, 0.00038235634565353394, 0.0004000067710876465, 0.00041765719652175903, 0.0004353076219558716, 0.00045295804738998413, 0.0004706084728240967, 0.00048825889825820923, 0.0005059093236923218, 0.0005235597491264343, 0.0005412101745605469]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 15.0, 21.0, 15.0, 30.0, 55.0, 67.0, 90.0, 114.0, 175.0, 256.0, 346.0, 594.0, 811.0, 1188.0, 1754.0, 2934.0, 4276.0, 6834.0, 10904.0, 18161.0, 30621.0, 52054.0, 90856.0, 152621.0, 207515.0, 183408.0, 116539.0, 67110.0, 38762.0, 22808.0, 13721.0, 8447.0, 5307.0, 3329.0, 2270.0, 1459.0, 941.0, 650.0, 423.0, 330.0, 237.0, 148.0, 114.0, 74.0, 49.0, 33.0, 22.0, 23.0, 11.0, 8.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.27734375, -7.0479736328125, -6.818603515625, -6.5892333984375, -6.35986328125, -6.1304931640625, -5.901123046875, -5.6717529296875, -5.4423828125, -5.2130126953125, -4.983642578125, -4.7542724609375, -4.52490234375, -4.2955322265625, -4.066162109375, -3.8367919921875, -3.607421875, -3.3780517578125, -3.148681640625, -2.9193115234375, -2.68994140625, -2.4605712890625, -2.231201171875, -2.0018310546875, -1.7724609375, -1.5430908203125, -1.313720703125, -1.0843505859375, -0.85498046875, -0.6256103515625, -0.396240234375, -0.1668701171875, 0.0625, 0.2918701171875, 0.521240234375, 0.7506103515625, 0.97998046875, 1.2093505859375, 1.438720703125, 1.6680908203125, 1.8974609375, 2.1268310546875, 2.356201171875, 2.5855712890625, 2.81494140625, 3.0443115234375, 3.273681640625, 3.5030517578125, 3.732421875, 3.9617919921875, 4.191162109375, 4.4205322265625, 4.64990234375, 4.8792724609375, 5.108642578125, 5.3380126953125, 5.5673828125, 5.7967529296875, 6.026123046875, 6.2554931640625, 6.48486328125, 6.7142333984375, 6.943603515625, 7.1729736328125, 7.40234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 19.0, 27.0, 30.0, 46.0, 45.0, 73.0, 86.0, 91.0, 113.0, 75.0, 78.0, 70.0, 57.0, 33.0, 34.0, 27.0, 19.0, 11.0, 11.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8828125, -3.75189208984375, -3.6209716796875, -3.49005126953125, -3.359130859375, -3.22821044921875, -3.0972900390625, -2.96636962890625, -2.83544921875, -2.70452880859375, -2.5736083984375, -2.44268798828125, -2.311767578125, -2.18084716796875, -2.0499267578125, -1.91900634765625, -1.7880859375, -1.65716552734375, -1.5262451171875, -1.39532470703125, -1.264404296875, -1.13348388671875, -1.0025634765625, -0.87164306640625, -0.74072265625, -0.60980224609375, -0.4788818359375, -0.34796142578125, -0.217041015625, -0.08612060546875, 0.0447998046875, 0.17572021484375, 0.306640625, 0.43756103515625, 0.5684814453125, 0.69940185546875, 0.830322265625, 0.96124267578125, 1.0921630859375, 1.22308349609375, 1.35400390625, 1.48492431640625, 1.6158447265625, 1.74676513671875, 1.877685546875, 2.00860595703125, 2.1395263671875, 2.27044677734375, 2.4013671875, 2.53228759765625, 2.6632080078125, 2.79412841796875, 2.925048828125, 3.05596923828125, 3.1868896484375, 3.31781005859375, 3.44873046875, 3.57965087890625, 3.7105712890625, 3.84149169921875, 3.972412109375, 4.10333251953125, 4.2342529296875, 4.36517333984375, 4.49609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 9.0, 6.0, 12.0, 13.0, 11.0, 17.0, 18.0, 24.0, 30.0, 35.0, 36.0, 51.0, 54.0, 51.0, 58.0, 74.0, 54.0, 67.0, 56.0, 47.0, 42.0, 46.0, 29.0, 31.0, 28.0, 24.0, 16.0, 16.0, 8.0, 5.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.29232406616211, -32.246097564697266, -31.199871063232422, -30.153644561767578, -29.107419967651367, -28.061193466186523, -27.01496696472168, -25.968740463256836, -24.922515869140625, -23.87628936767578, -22.830062866210938, -21.783836364746094, -20.737611770629883, -19.69138526916504, -18.645158767700195, -17.59893226623535, -16.552705764770508, -15.506479263305664, -14.460253715515137, -13.414027214050293, -12.367801666259766, -11.321575164794922, -10.275348663330078, -9.229122161865234, -8.182896614074707, -7.1366705894470215, -6.090444564819336, -5.044218063354492, -3.9979920387268066, -2.951766014099121, -1.9055395126342773, -0.8593134880065918, 0.18691253662109375, 1.2331386804580688, 2.279364824295044, 3.3255910873413086, 4.371817111968994, 5.41804313659668, 6.464269638061523, 7.510495662689209, 8.556721687316895, 9.602948188781738, 10.649173736572266, 11.69540023803711, 12.741626739501953, 13.78785228729248, 14.834078788757324, 15.880304336547852, 16.926530838012695, 17.97275733947754, 19.018983840942383, 20.065208435058594, 21.111434936523438, 22.15766143798828, 23.203887939453125, 24.25011444091797, 25.296340942382812, 26.342567443847656, 27.3887939453125, 28.435020446777344, 29.481245040893555, 30.5274715423584, 31.573698043823242, 32.61992263793945, 33.6661491394043]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 10.0, 7.0, 11.0, 12.0, 16.0, 18.0, 18.0, 29.0, 30.0, 44.0, 28.0, 37.0, 35.0, 39.0, 43.0, 35.0, 42.0, 49.0, 42.0, 46.0, 45.0, 45.0, 42.0, 35.0, 44.0, 29.0, 19.0, 20.0, 25.0, 11.0, 20.0, 12.0, 12.0, 12.0, 10.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.941328048706055, -28.097658157348633, -27.253990173339844, -26.410320281982422, -25.566650390625, -24.722980499267578, -23.879310607910156, -23.035642623901367, -22.191972732543945, -21.348302841186523, -20.504634857177734, -19.660964965820312, -18.81729507446289, -17.97362518310547, -17.129955291748047, -16.286287307739258, -15.442617416381836, -14.598947525024414, -13.755278587341309, -12.911609649658203, -12.067939758300781, -11.22426986694336, -10.380600929260254, -9.536931991577148, -8.693262100219727, -7.849592685699463, -7.005923271179199, -6.1622538566589355, -5.318584442138672, -4.474915027618408, -3.6312456130981445, -2.787576198577881, -1.9439048767089844, -1.1002354621887207, -0.25656604766845703, 0.5871033668518066, 1.4307727813720703, 2.274442195892334, 3.1181116104125977, 3.9617810249328613, 4.805450439453125, 5.649119853973389, 6.492789268493652, 7.336458683013916, 8.18012809753418, 9.023797988891602, 9.867466926574707, 10.711135864257812, 11.554805755615234, 12.398475646972656, 13.242144584655762, 14.085813522338867, 14.929483413696289, 15.773153305053711, 16.6168212890625, 17.460491180419922, 18.304161071777344, 19.147830963134766, 19.991500854492188, 20.835168838500977, 21.6788387298584, 22.52250862121582, 23.36617660522461, 24.20984649658203, 25.053516387939453]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 10.0, 31.0, 41.0, 64.0, 81.0, 140.0, 221.0, 298.0, 517.0, 824.0, 1264.0, 2048.0, 3138.0, 4888.0, 7478.0, 11596.0, 17943.0, 27152.0, 40854.0, 59706.0, 82850.0, 107325.0, 124913.0, 129558.0, 117406.0, 94327.0, 69951.0, 48720.0, 33441.0, 21640.0, 14190.0, 9296.0, 5907.0, 3851.0, 2511.0, 1636.0, 980.0, 610.0, 412.0, 273.0, 156.0, 133.0, 61.0, 37.0, 27.0, 12.0, 12.0, 7.0, 10.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.359375, -21.6435546875, -20.927734375, -20.2119140625, -19.49609375, -18.7802734375, -18.064453125, -17.3486328125, -16.6328125, -15.9169921875, -15.201171875, -14.4853515625, -13.76953125, -13.0537109375, -12.337890625, -11.6220703125, -10.90625, -10.1904296875, -9.474609375, -8.7587890625, -8.04296875, -7.3271484375, -6.611328125, -5.8955078125, -5.1796875, -4.4638671875, -3.748046875, -3.0322265625, -2.31640625, -1.6005859375, -0.884765625, -0.1689453125, 0.546875, 1.2626953125, 1.978515625, 2.6943359375, 3.41015625, 4.1259765625, 4.841796875, 5.5576171875, 6.2734375, 6.9892578125, 7.705078125, 8.4208984375, 9.13671875, 9.8525390625, 10.568359375, 11.2841796875, 12.0, 12.7158203125, 13.431640625, 14.1474609375, 14.86328125, 15.5791015625, 16.294921875, 17.0107421875, 17.7265625, 18.4423828125, 19.158203125, 19.8740234375, 20.58984375, 21.3056640625, 22.021484375, 22.7373046875, 23.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 8.0, 8.0, 6.0, 11.0, 7.0, 12.0, 13.0, 18.0, 23.0, 15.0, 27.0, 26.0, 23.0, 34.0, 33.0, 47.0, 44.0, 31.0, 43.0, 39.0, 38.0, 52.0, 45.0, 34.0, 45.0, 30.0, 43.0, 33.0, 30.0, 27.0, 17.0, 22.0, 31.0, 21.0, 14.0, 11.0, 12.0, 4.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-26.453125, -25.636962890625, -24.82080078125, -24.004638671875, -23.1884765625, -22.372314453125, -21.55615234375, -20.739990234375, -19.923828125, -19.107666015625, -18.29150390625, -17.475341796875, -16.6591796875, -15.843017578125, -15.02685546875, -14.210693359375, -13.39453125, -12.578369140625, -11.76220703125, -10.946044921875, -10.1298828125, -9.313720703125, -8.49755859375, -7.681396484375, -6.865234375, -6.049072265625, -5.23291015625, -4.416748046875, -3.6005859375, -2.784423828125, -1.96826171875, -1.152099609375, -0.3359375, 0.480224609375, 1.29638671875, 2.112548828125, 2.9287109375, 3.744873046875, 4.56103515625, 5.377197265625, 6.193359375, 7.009521484375, 7.82568359375, 8.641845703125, 9.4580078125, 10.274169921875, 11.09033203125, 11.906494140625, 12.72265625, 13.538818359375, 14.35498046875, 15.171142578125, 15.9873046875, 16.803466796875, 17.61962890625, 18.435791015625, 19.251953125, 20.068115234375, 20.88427734375, 21.700439453125, 22.5166015625, 23.332763671875, 24.14892578125, 24.965087890625, 25.78125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 21.0, 27.0, 38.0, 53.0, 83.0, 108.0, 197.0, 250.0, 426.0, 574.0, 885.0, 1315.0, 2014.0, 3099.0, 4745.0, 7186.0, 11013.0, 16603.0, 24671.0, 36195.0, 52228.0, 72580.0, 94656.0, 113493.0, 123825.0, 118280.0, 102098.0, 79359.0, 57822.0, 41108.0, 28162.0, 18901.0, 12445.0, 8134.0, 5379.0, 3566.0, 2437.0, 1549.0, 1008.0, 680.0, 439.0, 297.0, 198.0, 138.0, 82.0, 55.0, 37.0, 38.0, 22.0, 13.0, 6.0, 4.0, 2.0, 2.0, 3.0], "bins": [-24.859375, -24.120849609375, -23.38232421875, -22.643798828125, -21.9052734375, -21.166748046875, -20.42822265625, -19.689697265625, -18.951171875, -18.212646484375, -17.47412109375, -16.735595703125, -15.9970703125, -15.258544921875, -14.52001953125, -13.781494140625, -13.04296875, -12.304443359375, -11.56591796875, -10.827392578125, -10.0888671875, -9.350341796875, -8.61181640625, -7.873291015625, -7.134765625, -6.396240234375, -5.65771484375, -4.919189453125, -4.1806640625, -3.442138671875, -2.70361328125, -1.965087890625, -1.2265625, -0.488037109375, 0.25048828125, 0.989013671875, 1.7275390625, 2.466064453125, 3.20458984375, 3.943115234375, 4.681640625, 5.420166015625, 6.15869140625, 6.897216796875, 7.6357421875, 8.374267578125, 9.11279296875, 9.851318359375, 10.58984375, 11.328369140625, 12.06689453125, 12.805419921875, 13.5439453125, 14.282470703125, 15.02099609375, 15.759521484375, 16.498046875, 17.236572265625, 17.97509765625, 18.713623046875, 19.4521484375, 20.190673828125, 20.92919921875, 21.667724609375, 22.40625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 6.0, 2.0, 6.0, 5.0, 1.0, 7.0, 16.0, 13.0, 14.0, 12.0, 15.0, 14.0, 24.0, 30.0, 21.0, 24.0, 20.0, 32.0, 31.0, 25.0, 37.0, 34.0, 36.0, 29.0, 29.0, 26.0, 49.0, 41.0, 34.0, 29.0, 32.0, 24.0, 28.0, 29.0, 24.0, 25.0, 23.0, 20.0, 16.0, 22.0, 16.0, 12.0, 19.0, 12.0, 8.0, 8.0, 9.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.421875, -12.95166015625, -12.4814453125, -12.01123046875, -11.541015625, -11.07080078125, -10.6005859375, -10.13037109375, -9.66015625, -9.18994140625, -8.7197265625, -8.24951171875, -7.779296875, -7.30908203125, -6.8388671875, -6.36865234375, -5.8984375, -5.42822265625, -4.9580078125, -4.48779296875, -4.017578125, -3.54736328125, -3.0771484375, -2.60693359375, -2.13671875, -1.66650390625, -1.1962890625, -0.72607421875, -0.255859375, 0.21435546875, 0.6845703125, 1.15478515625, 1.625, 2.09521484375, 2.5654296875, 3.03564453125, 3.505859375, 3.97607421875, 4.4462890625, 4.91650390625, 5.38671875, 5.85693359375, 6.3271484375, 6.79736328125, 7.267578125, 7.73779296875, 8.2080078125, 8.67822265625, 9.1484375, 9.61865234375, 10.0888671875, 10.55908203125, 11.029296875, 11.49951171875, 11.9697265625, 12.43994140625, 12.91015625, 13.38037109375, 13.8505859375, 14.32080078125, 14.791015625, 15.26123046875, 15.7314453125, 16.20166015625, 16.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 19.0, 28.0, 36.0, 50.0, 75.0, 76.0, 163.0, 226.0, 327.0, 476.0, 739.0, 1212.0, 1730.0, 2922.0, 4570.0, 7553.0, 12372.0, 20568.0, 35916.0, 62108.0, 106695.0, 165496.0, 198060.0, 166544.0, 107582.0, 62913.0, 36303.0, 21015.0, 12447.0, 7506.0, 4539.0, 2822.0, 1857.0, 1269.0, 759.0, 507.0, 352.0, 208.0, 150.0, 96.0, 79.0, 61.0, 36.0, 29.0, 16.0, 9.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-15.8515625, -15.3485107421875, -14.845458984375, -14.3424072265625, -13.83935546875, -13.3363037109375, -12.833251953125, -12.3302001953125, -11.8271484375, -11.3240966796875, -10.821044921875, -10.3179931640625, -9.81494140625, -9.3118896484375, -8.808837890625, -8.3057861328125, -7.802734375, -7.2996826171875, -6.796630859375, -6.2935791015625, -5.79052734375, -5.2874755859375, -4.784423828125, -4.2813720703125, -3.7783203125, -3.2752685546875, -2.772216796875, -2.2691650390625, -1.76611328125, -1.2630615234375, -0.760009765625, -0.2569580078125, 0.24609375, 0.7491455078125, 1.252197265625, 1.7552490234375, 2.25830078125, 2.7613525390625, 3.264404296875, 3.7674560546875, 4.2705078125, 4.7735595703125, 5.276611328125, 5.7796630859375, 6.28271484375, 6.7857666015625, 7.288818359375, 7.7918701171875, 8.294921875, 8.7979736328125, 9.301025390625, 9.8040771484375, 10.30712890625, 10.8101806640625, 11.313232421875, 11.8162841796875, 12.3193359375, 12.8223876953125, 13.325439453125, 13.8284912109375, 14.33154296875, 14.8345947265625, 15.337646484375, 15.8406982421875, 16.34375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 10.0, 4.0, 11.0, 8.0, 11.0, 19.0, 16.0, 19.0, 34.0, 23.0, 35.0, 37.0, 56.0, 68.0, 58.0, 76.0, 69.0, 62.0, 66.0, 62.0, 47.0, 39.0, 36.0, 23.0, 20.0, 19.0, 21.0, 10.0, 10.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018014907836914062, -0.0017462968826293945, -0.0016911029815673828, -0.001635909080505371, -0.0015807151794433594, -0.0015255212783813477, -0.001470327377319336, -0.0014151334762573242, -0.0013599395751953125, -0.0013047456741333008, -0.001249551773071289, -0.0011943578720092773, -0.0011391639709472656, -0.001083970069885254, -0.0010287761688232422, -0.0009735822677612305, -0.0009183883666992188, -0.000863194465637207, -0.0008080005645751953, -0.0007528066635131836, -0.0006976127624511719, -0.0006424188613891602, -0.0005872249603271484, -0.0005320310592651367, -0.000476837158203125, -0.0004216432571411133, -0.00036644935607910156, -0.00031125545501708984, -0.0002560615539550781, -0.0002008676528930664, -0.0001456737518310547, -9.047985076904297e-05, -3.528594970703125e-05, 1.990795135498047e-05, 7.510185241699219e-05, 0.0001302957534790039, 0.00018548965454101562, 0.00024068355560302734, 0.00029587745666503906, 0.0003510713577270508, 0.0004062652587890625, 0.0004614591598510742, 0.0005166530609130859, 0.0005718469619750977, 0.0006270408630371094, 0.0006822347640991211, 0.0007374286651611328, 0.0007926225662231445, 0.0008478164672851562, 0.000903010368347168, 0.0009582042694091797, 0.0010133981704711914, 0.0010685920715332031, 0.0011237859725952148, 0.0011789798736572266, 0.0012341737747192383, 0.00128936767578125, 0.0013445615768432617, 0.0013997554779052734, 0.0014549493789672852, 0.0015101432800292969, 0.0015653371810913086, 0.0016205310821533203, 0.001675724983215332, 0.0017309188842773438]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 12.0, 18.0, 20.0, 38.0, 47.0, 62.0, 103.0, 143.0, 230.0, 353.0, 505.0, 781.0, 1192.0, 1808.0, 3048.0, 5173.0, 8470.0, 14556.0, 25827.0, 45556.0, 79502.0, 131580.0, 184062.0, 191367.0, 143936.0, 89211.0, 51105.0, 29025.0, 16311.0, 9698.0, 5567.0, 3312.0, 2073.0, 1312.0, 863.0, 540.0, 361.0, 215.0, 192.0, 116.0, 85.0, 54.0, 34.0, 27.0, 15.0, 10.0, 8.0, 10.0, 4.0, 1.0, 4.0, 3.0], "bins": [-17.09375, -16.6068115234375, -16.119873046875, -15.6329345703125, -15.14599609375, -14.6590576171875, -14.172119140625, -13.6851806640625, -13.1982421875, -12.7113037109375, -12.224365234375, -11.7374267578125, -11.25048828125, -10.7635498046875, -10.276611328125, -9.7896728515625, -9.302734375, -8.8157958984375, -8.328857421875, -7.8419189453125, -7.35498046875, -6.8680419921875, -6.381103515625, -5.8941650390625, -5.4072265625, -4.9202880859375, -4.433349609375, -3.9464111328125, -3.45947265625, -2.9725341796875, -2.485595703125, -1.9986572265625, -1.51171875, -1.0247802734375, -0.537841796875, -0.0509033203125, 0.43603515625, 0.9229736328125, 1.409912109375, 1.8968505859375, 2.3837890625, 2.8707275390625, 3.357666015625, 3.8446044921875, 4.33154296875, 4.8184814453125, 5.305419921875, 5.7923583984375, 6.279296875, 6.7662353515625, 7.253173828125, 7.7401123046875, 8.22705078125, 8.7139892578125, 9.200927734375, 9.6878662109375, 10.1748046875, 10.6617431640625, 11.148681640625, 11.6356201171875, 12.12255859375, 12.6094970703125, 13.096435546875, 13.5833740234375, 14.0703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 16.0, 12.0, 7.0, 27.0, 23.0, 23.0, 33.0, 48.0, 40.0, 56.0, 48.0, 61.0, 47.0, 67.0, 56.0, 50.0, 45.0, 42.0, 47.0, 45.0, 36.0, 27.0, 31.0, 18.0, 20.0, 17.0, 5.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.43359375, -7.2098388671875, -6.986083984375, -6.7623291015625, -6.53857421875, -6.3148193359375, -6.091064453125, -5.8673095703125, -5.6435546875, -5.4197998046875, -5.196044921875, -4.9722900390625, -4.74853515625, -4.5247802734375, -4.301025390625, -4.0772705078125, -3.853515625, -3.6297607421875, -3.406005859375, -3.1822509765625, -2.95849609375, -2.7347412109375, -2.510986328125, -2.2872314453125, -2.0634765625, -1.8397216796875, -1.615966796875, -1.3922119140625, -1.16845703125, -0.9447021484375, -0.720947265625, -0.4971923828125, -0.2734375, -0.0496826171875, 0.174072265625, 0.3978271484375, 0.62158203125, 0.8453369140625, 1.069091796875, 1.2928466796875, 1.5166015625, 1.7403564453125, 1.964111328125, 2.1878662109375, 2.41162109375, 2.6353759765625, 2.859130859375, 3.0828857421875, 3.306640625, 3.5303955078125, 3.754150390625, 3.9779052734375, 4.20166015625, 4.4254150390625, 4.649169921875, 4.8729248046875, 5.0966796875, 5.3204345703125, 5.544189453125, 5.7679443359375, 5.99169921875, 6.2154541015625, 6.439208984375, 6.6629638671875, 6.88671875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 13.0, 10.0, 13.0, 11.0, 12.0, 25.0, 31.0, 24.0, 34.0, 45.0, 37.0, 55.0, 50.0, 44.0, 62.0, 44.0, 64.0, 60.0, 44.0, 62.0, 36.0, 36.0, 39.0, 27.0, 21.0, 18.0, 10.0, 11.0, 12.0, 10.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.07898712158203, -34.102783203125, -33.12657928466797, -32.15037536621094, -31.17417335510254, -30.19797134399414, -29.22176742553711, -28.245563507080078, -27.26936149597168, -26.29315757751465, -25.31695556640625, -24.34075164794922, -23.364547729492188, -22.38834571838379, -21.412141799926758, -20.43593978881836, -19.459735870361328, -18.483531951904297, -17.5073299407959, -16.531126022338867, -15.554923057556152, -14.578720092773438, -13.602516174316406, -12.626313209533691, -11.650108337402344, -10.673905372619629, -9.697701454162598, -8.721498489379883, -7.745295524597168, -6.769092082977295, -5.792888641357422, -4.816685676574707, -3.840482711791992, -2.8642795085906982, -1.8880761861801147, -0.9118728637695312, 0.0643303394317627, 1.0405335426330566, 2.0167369842529297, 2.9929399490356445, 3.9691433906555176, 4.945346832275391, 5.9215497970581055, 6.8977532386779785, 7.873956680297852, 8.850159645080566, 9.826362609863281, 10.802566528320312, 11.778769493103027, 12.754972457885742, 13.731176376342773, 14.707379341125488, 15.683582305908203, 16.659786224365234, 17.635990142822266, 18.612192153930664, 19.588396072387695, 20.564599990844727, 21.540802001953125, 22.517005920410156, 23.493209838867188, 24.469411849975586, 25.445615768432617, 26.421817779541016, 27.398021697998047]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 5.0, 7.0, 11.0, 14.0, 23.0, 19.0, 27.0, 19.0, 46.0, 40.0, 36.0, 44.0, 36.0, 50.0, 45.0, 53.0, 29.0, 55.0, 49.0, 52.0, 40.0, 26.0, 33.0, 37.0, 33.0, 28.0, 14.0, 16.0, 20.0, 20.0, 12.0, 10.0, 8.0, 6.0, 2.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.11524200439453, -27.210716247558594, -26.306190490722656, -25.40166473388672, -24.497140884399414, -23.592615127563477, -22.68808937072754, -21.7835636138916, -20.879039764404297, -19.97451400756836, -19.069988250732422, -18.165462493896484, -17.26093864440918, -16.356412887573242, -15.451887130737305, -14.547361373901367, -13.64283561706543, -12.738309860229492, -11.833785057067871, -10.929259300231934, -10.024734497070312, -9.120208740234375, -8.215682983398438, -7.311157703399658, -6.406632423400879, -5.5021071434021, -4.59758186340332, -3.693056106567383, -2.7885308265686035, -1.8840055465698242, -0.9794797897338867, -0.07495450973510742, 0.8295688629150391, 1.734094262123108, 2.6386196613311768, 3.543145179748535, 4.4476704597473145, 5.352195739746094, 6.256721496582031, 7.1612467765808105, 8.06577205657959, 8.970297813415527, 9.874822616577148, 10.779348373413086, 11.683874130249023, 12.588398933410645, 13.492924690246582, 14.397449493408203, 15.30197525024414, 16.206501007080078, 17.111026763916016, 18.015552520751953, 18.920076370239258, 19.824602127075195, 20.729127883911133, 21.63365364074707, 22.538177490234375, 23.442703247070312, 24.34722900390625, 25.251754760742188, 26.156278610229492, 27.06080436706543, 27.965330123901367, 28.869855880737305, 29.774381637573242]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 8.0, 17.0, 33.0, 43.0, 67.0, 98.0, 159.0, 249.0, 473.0, 725.0, 1252.0, 2067.0, 3714.0, 6613.0, 12529.0, 24275.0, 48454.0, 104671.0, 242856.0, 578258.0, 1071087.0, 1070192.0, 578315.0, 243804.0, 104971.0, 48566.0, 23868.0, 12156.0, 6477.0, 3557.0, 1982.0, 1131.0, 635.0, 353.0, 233.0, 145.0, 90.0, 50.0, 38.0, 19.0, 21.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-38.28125, -37.12109375, -35.9609375, -34.80078125, -33.640625, -32.48046875, -31.3203125, -30.16015625, -29.0, -27.83984375, -26.6796875, -25.51953125, -24.359375, -23.19921875, -22.0390625, -20.87890625, -19.71875, -18.55859375, -17.3984375, -16.23828125, -15.078125, -13.91796875, -12.7578125, -11.59765625, -10.4375, -9.27734375, -8.1171875, -6.95703125, -5.796875, -4.63671875, -3.4765625, -2.31640625, -1.15625, 0.00390625, 1.1640625, 2.32421875, 3.484375, 4.64453125, 5.8046875, 6.96484375, 8.125, 9.28515625, 10.4453125, 11.60546875, 12.765625, 13.92578125, 15.0859375, 16.24609375, 17.40625, 18.56640625, 19.7265625, 20.88671875, 22.046875, 23.20703125, 24.3671875, 25.52734375, 26.6875, 27.84765625, 29.0078125, 30.16796875, 31.328125, 32.48828125, 33.6484375, 34.80859375, 35.96875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 8.0, 13.0, 18.0, 26.0, 20.0, 27.0, 27.0, 28.0, 38.0, 23.0, 32.0, 39.0, 35.0, 42.0, 63.0, 54.0, 39.0, 49.0, 43.0, 40.0, 31.0, 36.0, 37.0, 32.0, 24.0, 32.0, 14.0, 15.0, 16.0, 15.0, 14.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.67822265625, -21.9345703125, -21.19091796875, -20.447265625, -19.70361328125, -18.9599609375, -18.21630859375, -17.47265625, -16.72900390625, -15.9853515625, -15.24169921875, -14.498046875, -13.75439453125, -13.0107421875, -12.26708984375, -11.5234375, -10.77978515625, -10.0361328125, -9.29248046875, -8.548828125, -7.80517578125, -7.0615234375, -6.31787109375, -5.57421875, -4.83056640625, -4.0869140625, -3.34326171875, -2.599609375, -1.85595703125, -1.1123046875, -0.36865234375, 0.375, 1.11865234375, 1.8623046875, 2.60595703125, 3.349609375, 4.09326171875, 4.8369140625, 5.58056640625, 6.32421875, 7.06787109375, 7.8115234375, 8.55517578125, 9.298828125, 10.04248046875, 10.7861328125, 11.52978515625, 12.2734375, 13.01708984375, 13.7607421875, 14.50439453125, 15.248046875, 15.99169921875, 16.7353515625, 17.47900390625, 18.22265625, 18.96630859375, 19.7099609375, 20.45361328125, 21.197265625, 21.94091796875, 22.6845703125, 23.42822265625, 24.171875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 17.0, 29.0, 33.0, 48.0, 80.0, 99.0, 165.0, 260.0, 386.0, 597.0, 924.0, 1589.0, 2446.0, 3959.0, 6652.0, 11240.0, 19858.0, 34548.0, 62489.0, 116482.0, 218598.0, 403444.0, 684918.0, 888257.0, 741117.0, 453210.0, 246968.0, 131644.0, 71543.0, 38813.0, 21966.0, 12710.0, 7436.0, 4383.0, 2734.0, 1720.0, 1060.0, 658.0, 415.0, 242.0, 190.0, 116.0, 80.0, 57.0, 35.0, 29.0, 12.0, 6.0, 11.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-30.71875, -29.71484375, -28.7109375, -27.70703125, -26.703125, -25.69921875, -24.6953125, -23.69140625, -22.6875, -21.68359375, -20.6796875, -19.67578125, -18.671875, -17.66796875, -16.6640625, -15.66015625, -14.65625, -13.65234375, -12.6484375, -11.64453125, -10.640625, -9.63671875, -8.6328125, -7.62890625, -6.625, -5.62109375, -4.6171875, -3.61328125, -2.609375, -1.60546875, -0.6015625, 0.40234375, 1.40625, 2.41015625, 3.4140625, 4.41796875, 5.421875, 6.42578125, 7.4296875, 8.43359375, 9.4375, 10.44140625, 11.4453125, 12.44921875, 13.453125, 14.45703125, 15.4609375, 16.46484375, 17.46875, 18.47265625, 19.4765625, 20.48046875, 21.484375, 22.48828125, 23.4921875, 24.49609375, 25.5, 26.50390625, 27.5078125, 28.51171875, 29.515625, 30.51953125, 31.5234375, 32.52734375, 33.53125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 3.0, 10.0, 12.0, 19.0, 20.0, 26.0, 27.0, 55.0, 55.0, 74.0, 89.0, 97.0, 130.0, 190.0, 189.0, 215.0, 236.0, 269.0, 236.0, 291.0, 267.0, 243.0, 241.0, 161.0, 165.0, 140.0, 134.0, 96.0, 76.0, 55.0, 49.0, 37.0, 34.0, 31.0, 17.0, 21.0, 13.0, 9.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.2022705078125, -11.826416015625, -11.4505615234375, -11.07470703125, -10.6988525390625, -10.322998046875, -9.9471435546875, -9.5712890625, -9.1954345703125, -8.819580078125, -8.4437255859375, -8.06787109375, -7.6920166015625, -7.316162109375, -6.9403076171875, -6.564453125, -6.1885986328125, -5.812744140625, -5.4368896484375, -5.06103515625, -4.6851806640625, -4.309326171875, -3.9334716796875, -3.5576171875, -3.1817626953125, -2.805908203125, -2.4300537109375, -2.05419921875, -1.6783447265625, -1.302490234375, -0.9266357421875, -0.55078125, -0.1749267578125, 0.200927734375, 0.5767822265625, 0.95263671875, 1.3284912109375, 1.704345703125, 2.0802001953125, 2.4560546875, 2.8319091796875, 3.207763671875, 3.5836181640625, 3.95947265625, 4.3353271484375, 4.711181640625, 5.0870361328125, 5.462890625, 5.8387451171875, 6.214599609375, 6.5904541015625, 6.96630859375, 7.3421630859375, 7.718017578125, 8.0938720703125, 8.4697265625, 8.8455810546875, 9.221435546875, 9.5972900390625, 9.97314453125, 10.3489990234375, 10.724853515625, 11.1007080078125, 11.4765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 4.0, 7.0, 5.0, 13.0, 11.0, 11.0, 11.0, 12.0, 18.0, 28.0, 25.0, 32.0, 26.0, 39.0, 40.0, 42.0, 57.0, 44.0, 60.0, 61.0, 43.0, 48.0, 31.0, 43.0, 39.0, 46.0, 30.0, 24.0, 15.0, 23.0, 18.0, 19.0, 13.0, 14.0, 10.0, 9.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.190847396850586, -29.326860427856445, -28.462871551513672, -27.59888458251953, -26.73489761352539, -25.870908737182617, -25.006921768188477, -24.142932891845703, -23.278945922851562, -22.414958953857422, -21.55097007751465, -20.686983108520508, -19.822996139526367, -18.959007263183594, -18.095020294189453, -17.231033325195312, -16.367046356201172, -15.503058433532715, -14.639071464538574, -13.775083541870117, -12.91109561920166, -12.047107696533203, -11.183120727539062, -10.319132804870605, -9.455144882202148, -8.591156959533691, -7.727169513702393, -6.863182067871094, -5.999194145202637, -5.135206699371338, -4.271219253540039, -3.407231330871582, -2.543243408203125, -1.679255723953247, -0.8152681589126587, 0.04871940612792969, 0.9127070903778076, 1.7766947746276855, 2.6406822204589844, 3.5046701431274414, 4.36865758895874, 5.232645034790039, 6.096632957458496, 6.960620403289795, 7.824607849121094, 8.68859577178955, 9.552583694458008, 10.416570663452148, 11.280558586120605, 12.144546508789062, 13.008533477783203, 13.87252140045166, 14.736509323120117, 15.600496292114258, 16.46448516845703, 17.328472137451172, 18.192459106445312, 19.056446075439453, 19.920434951782227, 20.784421920776367, 21.648408889770508, 22.51239776611328, 23.376384735107422, 24.240371704101562, 25.104360580444336]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 6.0, 10.0, 13.0, 18.0, 18.0, 17.0, 29.0, 29.0, 21.0, 36.0, 39.0, 35.0, 43.0, 30.0, 46.0, 43.0, 34.0, 46.0, 42.0, 34.0, 51.0, 30.0, 44.0, 36.0, 32.0, 22.0, 24.0, 18.0, 24.0, 20.0, 9.0, 18.0, 9.0, 9.0, 11.0, 8.0, 3.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.226667404174805, -26.397836685180664, -25.56900405883789, -24.74017333984375, -23.91134262084961, -23.082509994506836, -22.253679275512695, -21.424846649169922, -20.59601593017578, -19.76718521118164, -18.938352584838867, -18.109521865844727, -17.280689239501953, -16.451858520507812, -15.623027801513672, -14.794196128845215, -13.965364456176758, -13.1365327835083, -12.307701110839844, -11.478870391845703, -10.650038719177246, -9.821207046508789, -8.992376327514648, -8.163544654846191, -7.334712982177734, -6.505881309509277, -5.6770501136779785, -4.84821891784668, -4.019387245178223, -3.1905555725097656, -2.361724376678467, -1.532893180847168, -0.7040634155273438, 0.12476801872253418, 0.9535994529724121, 1.78243088722229, 2.611262321472168, 3.440093994140625, 4.268925189971924, 5.097756385803223, 5.92658805847168, 6.755419731140137, 7.5842509269714355, 8.413082122802734, 9.241913795471191, 10.070745468139648, 10.899576187133789, 11.728407859802246, 12.557239532470703, 13.38607120513916, 14.214902877807617, 15.043733596801758, 15.872565269470215, 16.701396942138672, 17.530227661132812, 18.359058380126953, 19.187891006469727, 20.016721725463867, 20.84555435180664, 21.67438507080078, 22.503215789794922, 23.332048416137695, 24.160879135131836, 24.98971176147461, 25.81854248046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 4.0, 6.0, 26.0, 23.0, 37.0, 59.0, 67.0, 123.0, 201.0, 299.0, 465.0, 730.0, 1112.0, 1729.0, 2608.0, 4036.0, 6531.0, 9884.0, 15115.0, 23893.0, 35885.0, 54803.0, 80902.0, 112115.0, 139688.0, 145950.0, 126753.0, 94682.0, 65279.0, 43953.0, 28962.0, 18501.0, 12237.0, 7736.0, 5010.0, 3201.0, 2092.0, 1368.0, 844.0, 599.0, 372.0, 233.0, 171.0, 108.0, 63.0, 35.0, 22.0, 15.0, 8.0, 9.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.859375, -11.4796142578125, -11.099853515625, -10.7200927734375, -10.34033203125, -9.9605712890625, -9.580810546875, -9.2010498046875, -8.8212890625, -8.4415283203125, -8.061767578125, -7.6820068359375, -7.30224609375, -6.9224853515625, -6.542724609375, -6.1629638671875, -5.783203125, -5.4034423828125, -5.023681640625, -4.6439208984375, -4.26416015625, -3.8843994140625, -3.504638671875, -3.1248779296875, -2.7451171875, -2.3653564453125, -1.985595703125, -1.6058349609375, -1.22607421875, -0.8463134765625, -0.466552734375, -0.0867919921875, 0.29296875, 0.6727294921875, 1.052490234375, 1.4322509765625, 1.81201171875, 2.1917724609375, 2.571533203125, 2.9512939453125, 3.3310546875, 3.7108154296875, 4.090576171875, 4.4703369140625, 4.85009765625, 5.2298583984375, 5.609619140625, 5.9893798828125, 6.369140625, 6.7489013671875, 7.128662109375, 7.5084228515625, 7.88818359375, 8.2679443359375, 8.647705078125, 9.0274658203125, 9.4072265625, 9.7869873046875, 10.166748046875, 10.5465087890625, 10.92626953125, 11.3060302734375, 11.685791015625, 12.0655517578125, 12.4453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 13.0, 6.0, 10.0, 12.0, 12.0, 13.0, 17.0, 20.0, 21.0, 27.0, 35.0, 28.0, 31.0, 39.0, 38.0, 36.0, 32.0, 31.0, 49.0, 43.0, 49.0, 46.0, 37.0, 43.0, 44.0, 38.0, 38.0, 19.0, 27.0, 20.0, 17.0, 20.0, 14.0, 15.0, 6.0, 12.0, 10.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-30.671875, -29.820068359375, -28.96826171875, -28.116455078125, -27.2646484375, -26.412841796875, -25.56103515625, -24.709228515625, -23.857421875, -23.005615234375, -22.15380859375, -21.302001953125, -20.4501953125, -19.598388671875, -18.74658203125, -17.894775390625, -17.04296875, -16.191162109375, -15.33935546875, -14.487548828125, -13.6357421875, -12.783935546875, -11.93212890625, -11.080322265625, -10.228515625, -9.376708984375, -8.52490234375, -7.673095703125, -6.8212890625, -5.969482421875, -5.11767578125, -4.265869140625, -3.4140625, -2.562255859375, -1.71044921875, -0.858642578125, -0.0068359375, 0.844970703125, 1.69677734375, 2.548583984375, 3.400390625, 4.252197265625, 5.10400390625, 5.955810546875, 6.8076171875, 7.659423828125, 8.51123046875, 9.363037109375, 10.21484375, 11.066650390625, 11.91845703125, 12.770263671875, 13.6220703125, 14.473876953125, 15.32568359375, 16.177490234375, 17.029296875, 17.881103515625, 18.73291015625, 19.584716796875, 20.4365234375, 21.288330078125, 22.14013671875, 22.991943359375, 23.84375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 17.0, 23.0, 22.0, 46.0, 46.0, 97.0, 117.0, 187.0, 227.0, 348.0, 544.0, 813.0, 1238.0, 1991.0, 2982.0, 4706.0, 7807.0, 12802.0, 20791.0, 34093.0, 56425.0, 90852.0, 136564.0, 173405.0, 167349.0, 124520.0, 81333.0, 50010.0, 30072.0, 18676.0, 11300.0, 6842.0, 4454.0, 2742.0, 1703.0, 1178.0, 701.0, 454.0, 337.0, 236.0, 149.0, 105.0, 72.0, 50.0, 26.0, 22.0, 22.0, 14.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 4.0], "bins": [-14.9453125, -14.4764404296875, -14.007568359375, -13.5386962890625, -13.06982421875, -12.6009521484375, -12.132080078125, -11.6632080078125, -11.1943359375, -10.7254638671875, -10.256591796875, -9.7877197265625, -9.31884765625, -8.8499755859375, -8.381103515625, -7.9122314453125, -7.443359375, -6.9744873046875, -6.505615234375, -6.0367431640625, -5.56787109375, -5.0989990234375, -4.630126953125, -4.1612548828125, -3.6923828125, -3.2235107421875, -2.754638671875, -2.2857666015625, -1.81689453125, -1.3480224609375, -0.879150390625, -0.4102783203125, 0.05859375, 0.5274658203125, 0.996337890625, 1.4652099609375, 1.93408203125, 2.4029541015625, 2.871826171875, 3.3406982421875, 3.8095703125, 4.2784423828125, 4.747314453125, 5.2161865234375, 5.68505859375, 6.1539306640625, 6.622802734375, 7.0916748046875, 7.560546875, 8.0294189453125, 8.498291015625, 8.9671630859375, 9.43603515625, 9.9049072265625, 10.373779296875, 10.8426513671875, 11.3115234375, 11.7803955078125, 12.249267578125, 12.7181396484375, 13.18701171875, 13.6558837890625, 14.124755859375, 14.5936279296875, 15.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 8.0, 9.0, 7.0, 13.0, 18.0, 14.0, 13.0, 16.0, 18.0, 19.0, 21.0, 17.0, 31.0, 33.0, 26.0, 30.0, 34.0, 30.0, 35.0, 32.0, 35.0, 34.0, 43.0, 34.0, 29.0, 26.0, 34.0, 45.0, 39.0, 26.0, 25.0, 24.0, 26.0, 19.0, 13.0, 18.0, 18.0, 10.0, 12.0, 8.0, 9.0, 10.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0], "bins": [-15.0625, -14.6107177734375, -14.158935546875, -13.7071533203125, -13.25537109375, -12.8035888671875, -12.351806640625, -11.9000244140625, -11.4482421875, -10.9964599609375, -10.544677734375, -10.0928955078125, -9.64111328125, -9.1893310546875, -8.737548828125, -8.2857666015625, -7.833984375, -7.3822021484375, -6.930419921875, -6.4786376953125, -6.02685546875, -5.5750732421875, -5.123291015625, -4.6715087890625, -4.2197265625, -3.7679443359375, -3.316162109375, -2.8643798828125, -2.41259765625, -1.9608154296875, -1.509033203125, -1.0572509765625, -0.60546875, -0.1536865234375, 0.298095703125, 0.7498779296875, 1.20166015625, 1.6534423828125, 2.105224609375, 2.5570068359375, 3.0087890625, 3.4605712890625, 3.912353515625, 4.3641357421875, 4.81591796875, 5.2677001953125, 5.719482421875, 6.1712646484375, 6.623046875, 7.0748291015625, 7.526611328125, 7.9783935546875, 8.43017578125, 8.8819580078125, 9.333740234375, 9.7855224609375, 10.2373046875, 10.6890869140625, 11.140869140625, 11.5926513671875, 12.04443359375, 12.4962158203125, 12.947998046875, 13.3997802734375, 13.8515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 12.0, 6.0, 24.0, 19.0, 25.0, 46.0, 47.0, 89.0, 140.0, 244.0, 288.0, 468.0, 775.0, 1274.0, 2142.0, 3972.0, 7513.0, 15506.0, 35021.0, 85195.0, 202755.0, 322757.0, 210494.0, 89111.0, 36788.0, 16117.0, 7791.0, 4152.0, 2237.0, 1276.0, 835.0, 491.0, 317.0, 188.0, 126.0, 103.0, 75.0, 39.0, 30.0, 26.0, 13.0, 12.0, 8.0, 5.0, 0.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.9140625, -8.6558837890625, -8.397705078125, -8.1395263671875, -7.88134765625, -7.6231689453125, -7.364990234375, -7.1068115234375, -6.8486328125, -6.5904541015625, -6.332275390625, -6.0740966796875, -5.81591796875, -5.5577392578125, -5.299560546875, -5.0413818359375, -4.783203125, -4.5250244140625, -4.266845703125, -4.0086669921875, -3.75048828125, -3.4923095703125, -3.234130859375, -2.9759521484375, -2.7177734375, -2.4595947265625, -2.201416015625, -1.9432373046875, -1.68505859375, -1.4268798828125, -1.168701171875, -0.9105224609375, -0.65234375, -0.3941650390625, -0.135986328125, 0.1221923828125, 0.38037109375, 0.6385498046875, 0.896728515625, 1.1549072265625, 1.4130859375, 1.6712646484375, 1.929443359375, 2.1876220703125, 2.44580078125, 2.7039794921875, 2.962158203125, 3.2203369140625, 3.478515625, 3.7366943359375, 3.994873046875, 4.2530517578125, 4.51123046875, 4.7694091796875, 5.027587890625, 5.2857666015625, 5.5439453125, 5.8021240234375, 6.060302734375, 6.3184814453125, 6.57666015625, 6.8348388671875, 7.093017578125, 7.3511962890625, 7.609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 15.0, 15.0, 18.0, 23.0, 44.0, 41.0, 36.0, 61.0, 58.0, 69.0, 68.0, 77.0, 64.0, 59.0, 52.0, 47.0, 45.0, 34.0, 25.0, 24.0, 12.0, 10.0, 20.0, 8.0, 9.0, 8.0, 5.0, 2.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00060272216796875, -0.0005843937397003174, -0.0005660653114318848, -0.0005477368831634521, -0.0005294084548950195, -0.0005110800266265869, -0.0004927515983581543, -0.0004744231700897217, -0.00045609474182128906, -0.00043776631355285645, -0.00041943788528442383, -0.0004011094570159912, -0.0003827810287475586, -0.000364452600479126, -0.00034612417221069336, -0.00032779574394226074, -0.0003094673156738281, -0.0002911388874053955, -0.0002728104591369629, -0.0002544820308685303, -0.00023615360260009766, -0.00021782517433166504, -0.00019949674606323242, -0.0001811683177947998, -0.0001628398895263672, -0.00014451146125793457, -0.00012618303298950195, -0.00010785460472106934, -8.952617645263672e-05, -7.11977481842041e-05, -5.2869319915771484e-05, -3.454089164733887e-05, -1.621246337890625e-05, 2.115964889526367e-06, 2.0444393157958984e-05, 3.87728214263916e-05, 5.710124969482422e-05, 7.542967796325684e-05, 9.375810623168945e-05, 0.00011208653450012207, 0.0001304149627685547, 0.0001487433910369873, 0.00016707181930541992, 0.00018540024757385254, 0.00020372867584228516, 0.00022205710411071777, 0.0002403855323791504, 0.000258713960647583, 0.0002770423889160156, 0.00029537081718444824, 0.00031369924545288086, 0.0003320276737213135, 0.0003503561019897461, 0.0003686845302581787, 0.00038701295852661133, 0.00040534138679504395, 0.00042366981506347656, 0.0004419982433319092, 0.0004603266716003418, 0.0004786550998687744, 0.000496983528137207, 0.0005153119564056396, 0.0005336403846740723, 0.0005519688129425049, 0.0005702972412109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 1.0, 5.0, 7.0, 10.0, 15.0, 18.0, 29.0, 36.0, 55.0, 84.0, 110.0, 175.0, 213.0, 321.0, 519.0, 782.0, 1316.0, 2124.0, 3543.0, 6270.0, 11387.0, 22677.0, 46269.0, 97274.0, 190581.0, 265014.0, 197563.0, 101822.0, 48752.0, 23519.0, 11859.0, 6563.0, 3651.0, 2177.0, 1340.0, 832.0, 508.0, 367.0, 232.0, 158.0, 115.0, 72.0, 53.0, 44.0, 29.0, 18.0, 12.0, 16.0, 8.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.2421875, -7.98883056640625, -7.7354736328125, -7.48211669921875, -7.228759765625, -6.97540283203125, -6.7220458984375, -6.46868896484375, -6.21533203125, -5.96197509765625, -5.7086181640625, -5.45526123046875, -5.201904296875, -4.94854736328125, -4.6951904296875, -4.44183349609375, -4.1884765625, -3.93511962890625, -3.6817626953125, -3.42840576171875, -3.175048828125, -2.92169189453125, -2.6683349609375, -2.41497802734375, -2.16162109375, -1.90826416015625, -1.6549072265625, -1.40155029296875, -1.148193359375, -0.89483642578125, -0.6414794921875, -0.38812255859375, -0.134765625, 0.11859130859375, 0.3719482421875, 0.62530517578125, 0.878662109375, 1.13201904296875, 1.3853759765625, 1.63873291015625, 1.89208984375, 2.14544677734375, 2.3988037109375, 2.65216064453125, 2.905517578125, 3.15887451171875, 3.4122314453125, 3.66558837890625, 3.9189453125, 4.17230224609375, 4.4256591796875, 4.67901611328125, 4.932373046875, 5.18572998046875, 5.4390869140625, 5.69244384765625, 5.94580078125, 6.19915771484375, 6.4525146484375, 6.70587158203125, 6.959228515625, 7.21258544921875, 7.4659423828125, 7.71929931640625, 7.97265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 10.0, 14.0, 18.0, 26.0, 35.0, 43.0, 68.0, 84.0, 78.0, 104.0, 121.0, 86.0, 76.0, 60.0, 47.0, 28.0, 22.0, 18.0, 7.0, 9.0, 11.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.335845947265625, -3.22052001953125, -3.105194091796875, -2.9898681640625, -2.874542236328125, -2.75921630859375, -2.643890380859375, -2.528564453125, -2.413238525390625, -2.29791259765625, -2.182586669921875, -2.0672607421875, -1.951934814453125, -1.83660888671875, -1.721282958984375, -1.60595703125, -1.490631103515625, -1.37530517578125, -1.259979248046875, -1.1446533203125, -1.029327392578125, -0.91400146484375, -0.798675537109375, -0.683349609375, -0.568023681640625, -0.45269775390625, -0.337371826171875, -0.2220458984375, -0.106719970703125, 0.00860595703125, 0.123931884765625, 0.2392578125, 0.354583740234375, 0.46990966796875, 0.585235595703125, 0.7005615234375, 0.815887451171875, 0.93121337890625, 1.046539306640625, 1.161865234375, 1.277191162109375, 1.39251708984375, 1.507843017578125, 1.6231689453125, 1.738494873046875, 1.85382080078125, 1.969146728515625, 2.08447265625, 2.199798583984375, 2.31512451171875, 2.430450439453125, 2.5457763671875, 2.661102294921875, 2.77642822265625, 2.891754150390625, 3.007080078125, 3.122406005859375, 3.23773193359375, 3.353057861328125, 3.4683837890625, 3.583709716796875, 3.69903564453125, 3.814361572265625, 3.9296875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 10.0, 11.0, 6.0, 5.0, 9.0, 16.0, 15.0, 13.0, 13.0, 26.0, 30.0, 34.0, 34.0, 52.0, 44.0, 53.0, 40.0, 46.0, 71.0, 65.0, 41.0, 38.0, 47.0, 48.0, 35.0, 31.0, 28.0, 26.0, 14.0, 14.0, 15.0, 19.0, 14.0, 6.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.694002151489258, -30.791574478149414, -29.88914680480957, -28.986719131469727, -28.084291458129883, -27.18186378479004, -26.279436111450195, -25.37700843811035, -24.474580764770508, -23.572153091430664, -22.66972541809082, -21.767297744750977, -20.864870071411133, -19.96244239807129, -19.060014724731445, -18.1575870513916, -17.255159378051758, -16.352731704711914, -15.45030403137207, -14.547876358032227, -13.645448684692383, -12.743021011352539, -11.840593338012695, -10.938165664672852, -10.035737991333008, -9.133310317993164, -8.23088264465332, -7.328454971313477, -6.426027297973633, -5.523599624633789, -4.621171951293945, -3.7187442779541016, -2.816316604614258, -1.913888931274414, -1.0114612579345703, -0.10903358459472656, 0.7933940887451172, 1.695821762084961, 2.5982494354248047, 3.5006771087646484, 4.403104782104492, 5.305532455444336, 6.20796012878418, 7.110387802124023, 8.012815475463867, 8.915243148803711, 9.817670822143555, 10.720098495483398, 11.622526168823242, 12.524953842163086, 13.42738151550293, 14.329809188842773, 15.232236862182617, 16.13466453552246, 17.037092208862305, 17.93951988220215, 18.841947555541992, 19.744375228881836, 20.64680290222168, 21.549230575561523, 22.451658248901367, 23.35408592224121, 24.256513595581055, 25.1589412689209, 26.061368942260742]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 10.0, 10.0, 6.0, 12.0, 16.0, 20.0, 19.0, 26.0, 23.0, 30.0, 22.0, 32.0, 40.0, 39.0, 39.0, 41.0, 50.0, 37.0, 34.0, 44.0, 46.0, 36.0, 43.0, 36.0, 31.0, 40.0, 22.0, 22.0, 30.0, 21.0, 20.0, 13.0, 17.0, 6.0, 12.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.143665313720703, -26.327356338500977, -25.511049270629883, -24.694740295410156, -23.878433227539062, -23.062124252319336, -22.24581527709961, -21.429508209228516, -20.61319923400879, -19.796890258789062, -18.98058319091797, -18.164274215698242, -17.347965240478516, -16.531658172607422, -15.715349197387695, -14.899041175842285, -14.082733154296875, -13.266425132751465, -12.450117111206055, -11.633808135986328, -10.817500114440918, -10.001192092895508, -9.184883117675781, -8.368575096130371, -7.552267074584961, -6.735959053039551, -5.919650554656982, -5.103342056274414, -4.287034034729004, -3.4707260131835938, -2.6544175148010254, -1.838109016418457, -1.0218009948730469, -0.20549273490905762, 0.6108155250549316, 1.427123785018921, 2.24343204498291, 3.0597400665283203, 3.8760485649108887, 4.692357063293457, 5.508665084838867, 6.324973106384277, 7.141281604766846, 7.957590103149414, 8.773898124694824, 9.590206146240234, 10.406515121459961, 11.222823143005371, 12.039131164550781, 12.855439186096191, 13.671747207641602, 14.488056182861328, 15.304364204406738, 16.12067222595215, 16.936981201171875, 17.75328826904297, 18.569597244262695, 19.385906219482422, 20.202213287353516, 21.018522262573242, 21.83483123779297, 22.651138305664062, 23.46744728088379, 24.283756256103516, 25.10006332397461]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 13.0, 25.0, 54.0, 88.0, 121.0, 203.0, 299.0, 421.0, 703.0, 1098.0, 1724.0, 2577.0, 4027.0, 6127.0, 9359.0, 14524.0, 21688.0, 32774.0, 48272.0, 68588.0, 91370.0, 112651.0, 125655.0, 123659.0, 107670.0, 84395.0, 62137.0, 43224.0, 29043.0, 19441.0, 12804.0, 8273.0, 5508.0, 3551.0, 2266.0, 1470.0, 958.0, 633.0, 401.0, 260.0, 186.0, 112.0, 64.0, 56.0, 28.0, 20.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.453125, -20.7578125, -20.0625, -19.3671875, -18.671875, -17.9765625, -17.28125, -16.5859375, -15.890625, -15.1953125, -14.5, -13.8046875, -13.109375, -12.4140625, -11.71875, -11.0234375, -10.328125, -9.6328125, -8.9375, -8.2421875, -7.546875, -6.8515625, -6.15625, -5.4609375, -4.765625, -4.0703125, -3.375, -2.6796875, -1.984375, -1.2890625, -0.59375, 0.1015625, 0.796875, 1.4921875, 2.1875, 2.8828125, 3.578125, 4.2734375, 4.96875, 5.6640625, 6.359375, 7.0546875, 7.75, 8.4453125, 9.140625, 9.8359375, 10.53125, 11.2265625, 11.921875, 12.6171875, 13.3125, 14.0078125, 14.703125, 15.3984375, 16.09375, 16.7890625, 17.484375, 18.1796875, 18.875, 19.5703125, 20.265625, 20.9609375, 21.65625, 22.3515625, 23.046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 3.0, 5.0, 13.0, 7.0, 13.0, 18.0, 20.0, 16.0, 25.0, 35.0, 33.0, 21.0, 35.0, 40.0, 30.0, 35.0, 49.0, 44.0, 47.0, 47.0, 47.0, 43.0, 33.0, 35.0, 34.0, 34.0, 29.0, 28.0, 26.0, 20.0, 23.0, 15.0, 14.0, 11.0, 12.0, 8.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.703125, -24.867431640625, -24.03173828125, -23.196044921875, -22.3603515625, -21.524658203125, -20.68896484375, -19.853271484375, -19.017578125, -18.181884765625, -17.34619140625, -16.510498046875, -15.6748046875, -14.839111328125, -14.00341796875, -13.167724609375, -12.33203125, -11.496337890625, -10.66064453125, -9.824951171875, -8.9892578125, -8.153564453125, -7.31787109375, -6.482177734375, -5.646484375, -4.810791015625, -3.97509765625, -3.139404296875, -2.3037109375, -1.468017578125, -0.63232421875, 0.203369140625, 1.0390625, 1.874755859375, 2.71044921875, 3.546142578125, 4.3818359375, 5.217529296875, 6.05322265625, 6.888916015625, 7.724609375, 8.560302734375, 9.39599609375, 10.231689453125, 11.0673828125, 11.903076171875, 12.73876953125, 13.574462890625, 14.41015625, 15.245849609375, 16.08154296875, 16.917236328125, 17.7529296875, 18.588623046875, 19.42431640625, 20.260009765625, 21.095703125, 21.931396484375, 22.76708984375, 23.602783203125, 24.4384765625, 25.274169921875, 26.10986328125, 26.945556640625, 27.78125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 16.0, 34.0, 44.0, 74.0, 100.0, 144.0, 192.0, 319.0, 459.0, 688.0, 1076.0, 1629.0, 2419.0, 3812.0, 6004.0, 9512.0, 14689.0, 23024.0, 35279.0, 53812.0, 78933.0, 106410.0, 130111.0, 139212.0, 126937.0, 100434.0, 72690.0, 49209.0, 32618.0, 20729.0, 13567.0, 8594.0, 5491.0, 3481.0, 2285.0, 1538.0, 956.0, 643.0, 440.0, 313.0, 190.0, 145.0, 94.0, 78.0, 40.0, 22.0, 17.0, 15.0, 9.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-23.984375, -23.1953125, -22.40625, -21.6171875, -20.828125, -20.0390625, -19.25, -18.4609375, -17.671875, -16.8828125, -16.09375, -15.3046875, -14.515625, -13.7265625, -12.9375, -12.1484375, -11.359375, -10.5703125, -9.78125, -8.9921875, -8.203125, -7.4140625, -6.625, -5.8359375, -5.046875, -4.2578125, -3.46875, -2.6796875, -1.890625, -1.1015625, -0.3125, 0.4765625, 1.265625, 2.0546875, 2.84375, 3.6328125, 4.421875, 5.2109375, 6.0, 6.7890625, 7.578125, 8.3671875, 9.15625, 9.9453125, 10.734375, 11.5234375, 12.3125, 13.1015625, 13.890625, 14.6796875, 15.46875, 16.2578125, 17.046875, 17.8359375, 18.625, 19.4140625, 20.203125, 20.9921875, 21.78125, 22.5703125, 23.359375, 24.1484375, 24.9375, 25.7265625, 26.515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 14.0, 10.0, 15.0, 20.0, 14.0, 21.0, 21.0, 23.0, 27.0, 38.0, 28.0, 34.0, 27.0, 33.0, 38.0, 39.0, 42.0, 48.0, 44.0, 48.0, 37.0, 34.0, 33.0, 30.0, 28.0, 33.0, 29.0, 21.0, 34.0, 21.0, 22.0, 9.0, 15.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.703125, -18.15625, -17.609375, -17.0625, -16.515625, -15.96875, -15.421875, -14.875, -14.328125, -13.78125, -13.234375, -12.6875, -12.140625, -11.59375, -11.046875, -10.5, -9.953125, -9.40625, -8.859375, -8.3125, -7.765625, -7.21875, -6.671875, -6.125, -5.578125, -5.03125, -4.484375, -3.9375, -3.390625, -2.84375, -2.296875, -1.75, -1.203125, -0.65625, -0.109375, 0.4375, 0.984375, 1.53125, 2.078125, 2.625, 3.171875, 3.71875, 4.265625, 4.8125, 5.359375, 5.90625, 6.453125, 7.0, 7.546875, 8.09375, 8.640625, 9.1875, 9.734375, 10.28125, 10.828125, 11.375, 11.921875, 12.46875, 13.015625, 13.5625, 14.109375, 14.65625, 15.203125, 15.75, 16.296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 15.0, 15.0, 19.0, 40.0, 54.0, 70.0, 126.0, 149.0, 232.0, 370.0, 533.0, 909.0, 1462.0, 2574.0, 4585.0, 8752.0, 17386.0, 37891.0, 86254.0, 189116.0, 289284.0, 217560.0, 102987.0, 44876.0, 20696.0, 10049.0, 5141.0, 2826.0, 1696.0, 1068.0, 620.0, 374.0, 266.0, 168.0, 121.0, 72.0, 58.0, 35.0, 24.0, 24.0, 14.0, 8.0, 4.0, 3.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.203125, -19.520751953125, -18.83837890625, -18.156005859375, -17.4736328125, -16.791259765625, -16.10888671875, -15.426513671875, -14.744140625, -14.061767578125, -13.37939453125, -12.697021484375, -12.0146484375, -11.332275390625, -10.64990234375, -9.967529296875, -9.28515625, -8.602783203125, -7.92041015625, -7.238037109375, -6.5556640625, -5.873291015625, -5.19091796875, -4.508544921875, -3.826171875, -3.143798828125, -2.46142578125, -1.779052734375, -1.0966796875, -0.414306640625, 0.26806640625, 0.950439453125, 1.6328125, 2.315185546875, 2.99755859375, 3.679931640625, 4.3623046875, 5.044677734375, 5.72705078125, 6.409423828125, 7.091796875, 7.774169921875, 8.45654296875, 9.138916015625, 9.8212890625, 10.503662109375, 11.18603515625, 11.868408203125, 12.55078125, 13.233154296875, 13.91552734375, 14.597900390625, 15.2802734375, 15.962646484375, 16.64501953125, 17.327392578125, 18.009765625, 18.692138671875, 19.37451171875, 20.056884765625, 20.7392578125, 21.421630859375, 22.10400390625, 22.786376953125, 23.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 8.0, 14.0, 9.0, 9.0, 18.0, 17.0, 33.0, 32.0, 50.0, 54.0, 55.0, 56.0, 60.0, 72.0, 70.0, 63.0, 58.0, 57.0, 50.0, 36.0, 30.0, 24.0, 23.0, 17.0, 15.0, 4.0, 9.0, 6.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013790130615234375, -0.001329660415649414, -0.0012803077697753906, -0.0012309551239013672, -0.0011816024780273438, -0.0011322498321533203, -0.0010828971862792969, -0.0010335445404052734, -0.00098419189453125, -0.0009348392486572266, -0.0008854866027832031, -0.0008361339569091797, -0.0007867813110351562, -0.0007374286651611328, -0.0006880760192871094, -0.0006387233734130859, -0.0005893707275390625, -0.0005400180816650391, -0.0004906654357910156, -0.0004413127899169922, -0.00039196014404296875, -0.0003426074981689453, -0.0002932548522949219, -0.00024390220642089844, -0.000194549560546875, -0.00014519691467285156, -9.584426879882812e-05, -4.649162292480469e-05, 2.86102294921875e-06, 5.221366882324219e-05, 0.00010156631469726562, 0.00015091896057128906, 0.0002002716064453125, 0.00024962425231933594, 0.0002989768981933594, 0.0003483295440673828, 0.00039768218994140625, 0.0004470348358154297, 0.0004963874816894531, 0.0005457401275634766, 0.0005950927734375, 0.0006444454193115234, 0.0006937980651855469, 0.0007431507110595703, 0.0007925033569335938, 0.0008418560028076172, 0.0008912086486816406, 0.0009405612945556641, 0.0009899139404296875, 0.001039266586303711, 0.0010886192321777344, 0.0011379718780517578, 0.0011873245239257812, 0.0012366771697998047, 0.0012860298156738281, 0.0013353824615478516, 0.001384735107421875, 0.0014340877532958984, 0.0014834403991699219, 0.0015327930450439453, 0.0015821456909179688, 0.0016314983367919922, 0.0016808509826660156, 0.001730203628540039, 0.0017795562744140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 4.0, 16.0, 14.0, 25.0, 24.0, 35.0, 57.0, 74.0, 132.0, 157.0, 237.0, 375.0, 583.0, 933.0, 1490.0, 2501.0, 4356.0, 7365.0, 13831.0, 26200.0, 51618.0, 101228.0, 180098.0, 233411.0, 191809.0, 111108.0, 56640.0, 28978.0, 15117.0, 8416.0, 4656.0, 2644.0, 1577.0, 985.0, 601.0, 384.0, 281.0, 179.0, 112.0, 77.0, 63.0, 44.0, 30.0, 25.0, 12.0, 10.0, 6.0, 11.0, 8.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0], "bins": [-17.34375, -16.811279296875, -16.27880859375, -15.746337890625, -15.2138671875, -14.681396484375, -14.14892578125, -13.616455078125, -13.083984375, -12.551513671875, -12.01904296875, -11.486572265625, -10.9541015625, -10.421630859375, -9.88916015625, -9.356689453125, -8.82421875, -8.291748046875, -7.75927734375, -7.226806640625, -6.6943359375, -6.161865234375, -5.62939453125, -5.096923828125, -4.564453125, -4.031982421875, -3.49951171875, -2.967041015625, -2.4345703125, -1.902099609375, -1.36962890625, -0.837158203125, -0.3046875, 0.227783203125, 0.76025390625, 1.292724609375, 1.8251953125, 2.357666015625, 2.89013671875, 3.422607421875, 3.955078125, 4.487548828125, 5.02001953125, 5.552490234375, 6.0849609375, 6.617431640625, 7.14990234375, 7.682373046875, 8.21484375, 8.747314453125, 9.27978515625, 9.812255859375, 10.3447265625, 10.877197265625, 11.40966796875, 11.942138671875, 12.474609375, 13.007080078125, 13.53955078125, 14.072021484375, 14.6044921875, 15.136962890625, 15.66943359375, 16.201904296875, 16.734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 13.0, 16.0, 10.0, 18.0, 22.0, 27.0, 46.0, 30.0, 53.0, 55.0, 44.0, 66.0, 55.0, 54.0, 50.0, 48.0, 56.0, 50.0, 39.0, 47.0, 28.0, 28.0, 15.0, 18.0, 19.0, 11.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.640625, -7.43414306640625, -7.2276611328125, -7.02117919921875, -6.814697265625, -6.60821533203125, -6.4017333984375, -6.19525146484375, -5.98876953125, -5.78228759765625, -5.5758056640625, -5.36932373046875, -5.162841796875, -4.95635986328125, -4.7498779296875, -4.54339599609375, -4.3369140625, -4.13043212890625, -3.9239501953125, -3.71746826171875, -3.510986328125, -3.30450439453125, -3.0980224609375, -2.89154052734375, -2.68505859375, -2.47857666015625, -2.2720947265625, -2.06561279296875, -1.859130859375, -1.65264892578125, -1.4461669921875, -1.23968505859375, -1.033203125, -0.82672119140625, -0.6202392578125, -0.41375732421875, -0.207275390625, -0.00079345703125, 0.2056884765625, 0.41217041015625, 0.61865234375, 0.82513427734375, 1.0316162109375, 1.23809814453125, 1.444580078125, 1.65106201171875, 1.8575439453125, 2.06402587890625, 2.2705078125, 2.47698974609375, 2.6834716796875, 2.88995361328125, 3.096435546875, 3.30291748046875, 3.5093994140625, 3.71588134765625, 3.92236328125, 4.12884521484375, 4.3353271484375, 4.54180908203125, 4.748291015625, 4.95477294921875, 5.1612548828125, 5.36773681640625, 5.57421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 7.0, 9.0, 7.0, 12.0, 15.0, 20.0, 26.0, 29.0, 25.0, 33.0, 41.0, 43.0, 52.0, 37.0, 47.0, 49.0, 66.0, 53.0, 68.0, 41.0, 47.0, 37.0, 31.0, 26.0, 29.0, 29.0, 19.0, 12.0, 10.0, 11.0, 7.0, 9.0, 10.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.415931701660156, -30.511384963989258, -29.60683822631836, -28.702293395996094, -27.797746658325195, -26.893199920654297, -25.9886531829834, -25.0841064453125, -24.179561614990234, -23.275014877319336, -22.370468139648438, -21.465923309326172, -20.561376571655273, -19.656829833984375, -18.752283096313477, -17.847736358642578, -16.94318962097168, -16.03864288330078, -15.1340970993042, -14.2295503616333, -13.325004577636719, -12.42045783996582, -11.515911102294922, -10.611364364624023, -9.706818580627441, -8.802271842956543, -7.897726058959961, -6.9931793212890625, -6.088633060455322, -5.184086799621582, -4.279540061950684, -3.3749938011169434, -2.4704456329345703, -1.5658992528915405, -0.6613528728485107, 0.2431936264038086, 1.1477398872375488, 2.052286148071289, 2.9568328857421875, 3.8613791465759277, 4.765925407409668, 5.670471668243408, 6.575017929077148, 7.479564666748047, 8.384111404418945, 9.288657188415527, 10.193203926086426, 11.097749710083008, 12.002296447753906, 12.906843185424805, 13.811388969421387, 14.715935707092285, 15.620481491088867, 16.525028228759766, 17.429574966430664, 18.334121704101562, 19.238666534423828, 20.143213272094727, 21.047760009765625, 21.95230484008789, 22.85685157775879, 23.761398315429688, 24.665945053100586, 25.570491790771484, 26.475038528442383]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 12.0, 9.0, 15.0, 11.0, 13.0, 15.0, 22.0, 16.0, 27.0, 26.0, 28.0, 31.0, 28.0, 36.0, 47.0, 51.0, 45.0, 49.0, 49.0, 42.0, 38.0, 38.0, 35.0, 26.0, 31.0, 33.0, 29.0, 20.0, 20.0, 22.0, 12.0, 20.0, 12.0, 21.0, 14.0, 4.0, 5.0, 7.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.35444450378418, -24.535263061523438, -23.716081619262695, -22.896900177001953, -22.077720642089844, -21.2585391998291, -20.43935775756836, -19.620176315307617, -18.800994873046875, -17.981813430786133, -17.16263198852539, -16.34345245361328, -15.524271011352539, -14.705089569091797, -13.885908126831055, -13.066726684570312, -12.247547149658203, -11.428365707397461, -10.609185218811035, -9.790003776550293, -8.970823287963867, -8.151641845703125, -7.332460403442383, -6.513279438018799, -5.694098472595215, -4.874917507171631, -4.055736541748047, -3.2365550994873047, -2.4173741340637207, -1.5981931686401367, -0.7790117263793945, 0.04016923904418945, 0.8593502044677734, 1.678531289100647, 2.4977123737335205, 3.3168935775756836, 4.136074542999268, 4.955255508422852, 5.774436950683594, 6.593617916107178, 7.412798881530762, 8.231980323791504, 9.05116081237793, 9.870342254638672, 10.689523696899414, 11.50870418548584, 12.327885627746582, 13.147066116333008, 13.96624755859375, 14.785429000854492, 15.604609489440918, 16.423789978027344, 17.242971420288086, 18.062152862548828, 18.88133430480957, 19.700515747070312, 20.519695281982422, 21.338876724243164, 22.158058166503906, 22.977237701416016, 23.796419143676758, 24.6156005859375, 25.434782028198242, 26.253963470458984, 27.073144912719727]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 12.0, 17.0, 25.0, 34.0, 71.0, 82.0, 121.0, 225.0, 336.0, 531.0, 820.0, 1416.0, 2274.0, 3745.0, 6217.0, 10769.0, 18359.0, 33212.0, 59825.0, 114175.0, 225603.0, 453964.0, 789933.0, 948465.0, 714992.0, 392864.0, 195404.0, 99669.0, 52873.0, 28931.0, 16475.0, 9486.0, 5371.0, 3200.0, 1908.0, 1138.0, 700.0, 398.0, 243.0, 160.0, 91.0, 63.0, 28.0, 22.0, 19.0, 4.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.860107421875, -30.87646484375, -29.892822265625, -28.9091796875, -27.925537109375, -26.94189453125, -25.958251953125, -24.974609375, -23.990966796875, -23.00732421875, -22.023681640625, -21.0400390625, -20.056396484375, -19.07275390625, -18.089111328125, -17.10546875, -16.121826171875, -15.13818359375, -14.154541015625, -13.1708984375, -12.187255859375, -11.20361328125, -10.219970703125, -9.236328125, -8.252685546875, -7.26904296875, -6.285400390625, -5.3017578125, -4.318115234375, -3.33447265625, -2.350830078125, -1.3671875, -0.383544921875, 0.60009765625, 1.583740234375, 2.5673828125, 3.551025390625, 4.53466796875, 5.518310546875, 6.501953125, 7.485595703125, 8.46923828125, 9.452880859375, 10.4365234375, 11.420166015625, 12.40380859375, 13.387451171875, 14.37109375, 15.354736328125, 16.33837890625, 17.322021484375, 18.3056640625, 19.289306640625, 20.27294921875, 21.256591796875, 22.240234375, 23.223876953125, 24.20751953125, 25.191162109375, 26.1748046875, 27.158447265625, 28.14208984375, 29.125732421875, 30.109375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 8.0, 6.0, 6.0, 8.0, 8.0, 19.0, 15.0, 12.0, 12.0, 18.0, 16.0, 26.0, 35.0, 27.0, 23.0, 36.0, 34.0, 53.0, 44.0, 51.0, 48.0, 46.0, 39.0, 49.0, 31.0, 38.0, 32.0, 31.0, 35.0, 22.0, 23.0, 26.0, 17.0, 13.0, 15.0, 14.0, 22.0, 11.0, 4.0, 13.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.828125, -22.114990234375, -21.40185546875, -20.688720703125, -19.9755859375, -19.262451171875, -18.54931640625, -17.836181640625, -17.123046875, -16.409912109375, -15.69677734375, -14.983642578125, -14.2705078125, -13.557373046875, -12.84423828125, -12.131103515625, -11.41796875, -10.704833984375, -9.99169921875, -9.278564453125, -8.5654296875, -7.852294921875, -7.13916015625, -6.426025390625, -5.712890625, -4.999755859375, -4.28662109375, -3.573486328125, -2.8603515625, -2.147216796875, -1.43408203125, -0.720947265625, -0.0078125, 0.705322265625, 1.41845703125, 2.131591796875, 2.8447265625, 3.557861328125, 4.27099609375, 4.984130859375, 5.697265625, 6.410400390625, 7.12353515625, 7.836669921875, 8.5498046875, 9.262939453125, 9.97607421875, 10.689208984375, 11.40234375, 12.115478515625, 12.82861328125, 13.541748046875, 14.2548828125, 14.968017578125, 15.68115234375, 16.394287109375, 17.107421875, 17.820556640625, 18.53369140625, 19.246826171875, 19.9599609375, 20.673095703125, 21.38623046875, 22.099365234375, 22.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 15.0, 7.0, 11.0, 27.0, 21.0, 50.0, 66.0, 84.0, 153.0, 201.0, 332.0, 480.0, 701.0, 1046.0, 1632.0, 2616.0, 3975.0, 6402.0, 9684.0, 16181.0, 25825.0, 42442.0, 70098.0, 118415.0, 200598.0, 333587.0, 523481.0, 702865.0, 713671.0, 543660.0, 350630.0, 211338.0, 123562.0, 73826.0, 44341.0, 26840.0, 16545.0, 10393.0, 6543.0, 4195.0, 2719.0, 1749.0, 1120.0, 710.0, 504.0, 321.0, 202.0, 126.0, 103.0, 57.0, 50.0, 36.0, 10.0, 14.0, 8.0, 9.0, 8.0, 4.0, 5.0], "bins": [-29.109375, -28.228515625, -27.34765625, -26.466796875, -25.5859375, -24.705078125, -23.82421875, -22.943359375, -22.0625, -21.181640625, -20.30078125, -19.419921875, -18.5390625, -17.658203125, -16.77734375, -15.896484375, -15.015625, -14.134765625, -13.25390625, -12.373046875, -11.4921875, -10.611328125, -9.73046875, -8.849609375, -7.96875, -7.087890625, -6.20703125, -5.326171875, -4.4453125, -3.564453125, -2.68359375, -1.802734375, -0.921875, -0.041015625, 0.83984375, 1.720703125, 2.6015625, 3.482421875, 4.36328125, 5.244140625, 6.125, 7.005859375, 7.88671875, 8.767578125, 9.6484375, 10.529296875, 11.41015625, 12.291015625, 13.171875, 14.052734375, 14.93359375, 15.814453125, 16.6953125, 17.576171875, 18.45703125, 19.337890625, 20.21875, 21.099609375, 21.98046875, 22.861328125, 23.7421875, 24.623046875, 25.50390625, 26.384765625, 27.265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 8.0, 9.0, 2.0, 10.0, 16.0, 17.0, 34.0, 40.0, 46.0, 56.0, 75.0, 96.0, 119.0, 141.0, 159.0, 178.0, 226.0, 226.0, 255.0, 278.0, 265.0, 255.0, 239.0, 213.0, 172.0, 195.0, 145.0, 127.0, 98.0, 80.0, 67.0, 46.0, 46.0, 33.0, 25.0, 23.0, 16.0, 9.0, 10.0, 6.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.625, -12.234375, -11.84375, -11.453125, -11.0625, -10.671875, -10.28125, -9.890625, -9.5, -9.109375, -8.71875, -8.328125, -7.9375, -7.546875, -7.15625, -6.765625, -6.375, -5.984375, -5.59375, -5.203125, -4.8125, -4.421875, -4.03125, -3.640625, -3.25, -2.859375, -2.46875, -2.078125, -1.6875, -1.296875, -0.90625, -0.515625, -0.125, 0.265625, 0.65625, 1.046875, 1.4375, 1.828125, 2.21875, 2.609375, 3.0, 3.390625, 3.78125, 4.171875, 4.5625, 4.953125, 5.34375, 5.734375, 6.125, 6.515625, 6.90625, 7.296875, 7.6875, 8.078125, 8.46875, 8.859375, 9.25, 9.640625, 10.03125, 10.421875, 10.8125, 11.203125, 11.59375, 11.984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 6.0, 6.0, 7.0, 3.0, 7.0, 7.0, 6.0, 10.0, 19.0, 12.0, 27.0, 30.0, 29.0, 30.0, 36.0, 43.0, 40.0, 55.0, 45.0, 44.0, 52.0, 47.0, 42.0, 46.0, 38.0, 48.0, 42.0, 34.0, 26.0, 25.0, 34.0, 21.0, 9.0, 8.0, 14.0, 9.0, 10.0, 5.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-33.33519744873047, -32.44449996948242, -31.553802490234375, -30.663105010986328, -29.77240753173828, -28.881710052490234, -27.991012573242188, -27.10031509399414, -26.209617614746094, -25.318920135498047, -24.42822265625, -23.537525177001953, -22.646827697753906, -21.75613021850586, -20.865432739257812, -19.974735260009766, -19.08403778076172, -18.193340301513672, -17.302642822265625, -16.411945343017578, -15.521247863769531, -14.630550384521484, -13.739852905273438, -12.84915542602539, -11.958457946777344, -11.067760467529297, -10.17706298828125, -9.286365509033203, -8.395668029785156, -7.504970550537109, -6.6142730712890625, -5.723575592041016, -4.832878112792969, -3.942180633544922, -3.051483154296875, -2.160785675048828, -1.2700881958007812, -0.3793907165527344, 0.5113067626953125, 1.4020042419433594, 2.2927017211914062, 3.183399200439453, 4.0740966796875, 4.964794158935547, 5.855491638183594, 6.746189117431641, 7.6368865966796875, 8.527584075927734, 9.418281555175781, 10.308979034423828, 11.199676513671875, 12.090373992919922, 12.981071472167969, 13.871768951416016, 14.762466430664062, 15.65316390991211, 16.543861389160156, 17.434558868408203, 18.32525634765625, 19.215953826904297, 20.106651306152344, 20.99734878540039, 21.888046264648438, 22.778743743896484, 23.66944122314453]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 8.0, 12.0, 11.0, 16.0, 9.0, 17.0, 22.0, 17.0, 21.0, 29.0, 37.0, 29.0, 28.0, 31.0, 48.0, 40.0, 30.0, 34.0, 43.0, 41.0, 47.0, 29.0, 34.0, 40.0, 32.0, 20.0, 29.0, 23.0, 25.0, 24.0, 24.0, 17.0, 20.0, 9.0, 18.0, 10.0, 8.0, 4.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.274375915527344, -22.53460121154785, -21.794824600219727, -21.055049896240234, -20.315275192260742, -19.57550048828125, -18.835723876953125, -18.095949172973633, -17.35617446899414, -16.61639976501465, -15.87662410736084, -15.136848449707031, -14.397073745727539, -13.65729808807373, -12.917522430419922, -12.17774772644043, -11.437971115112305, -10.698195457458496, -9.958420753479004, -9.218645095825195, -8.478870391845703, -7.7390947341918945, -6.999319076538086, -6.2595438957214355, -5.519768714904785, -4.779993534088135, -4.040218353271484, -3.300442695617676, -2.5606675148010254, -1.820892333984375, -1.0811166763305664, -0.341341495513916, 0.3984336853027344, 1.1382089853286743, 1.8779842853546143, 2.6177597045898438, 3.357534885406494, 4.0973100662231445, 4.837085723876953, 5.5768609046936035, 6.316636085510254, 7.056411266326904, 7.796186447143555, 8.535962104797363, 9.275737762451172, 10.015512466430664, 10.755288124084473, 11.495063781738281, 12.234838485717773, 12.974614143371582, 13.714388847351074, 14.454164505004883, 15.193939208984375, 15.933714866638184, 16.673490524291992, 17.413265228271484, 18.15304183959961, 18.8928165435791, 19.632593154907227, 20.37236785888672, 21.11214256286621, 21.851917266845703, 22.591693878173828, 23.33146858215332, 24.071243286132812]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 10.0, 19.0, 11.0, 25.0, 51.0, 68.0, 101.0, 177.0, 273.0, 400.0, 618.0, 1016.0, 1601.0, 2580.0, 4141.0, 6637.0, 10542.0, 17087.0, 27272.0, 43356.0, 67980.0, 102120.0, 138992.0, 159713.0, 146857.0, 111537.0, 75244.0, 48654.0, 30487.0, 19077.0, 12001.0, 7464.0, 4709.0, 2797.0, 1831.0, 1121.0, 727.0, 445.0, 288.0, 199.0, 119.0, 70.0, 47.0, 28.0, 29.0, 20.0, 7.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.7674560546875, -10.363037109375, -9.9586181640625, -9.55419921875, -9.1497802734375, -8.745361328125, -8.3409423828125, -7.9365234375, -7.5321044921875, -7.127685546875, -6.7232666015625, -6.31884765625, -5.9144287109375, -5.510009765625, -5.1055908203125, -4.701171875, -4.2967529296875, -3.892333984375, -3.4879150390625, -3.08349609375, -2.6790771484375, -2.274658203125, -1.8702392578125, -1.4658203125, -1.0614013671875, -0.656982421875, -0.2525634765625, 0.15185546875, 0.5562744140625, 0.960693359375, 1.3651123046875, 1.76953125, 2.1739501953125, 2.578369140625, 2.9827880859375, 3.38720703125, 3.7916259765625, 4.196044921875, 4.6004638671875, 5.0048828125, 5.4093017578125, 5.813720703125, 6.2181396484375, 6.62255859375, 7.0269775390625, 7.431396484375, 7.8358154296875, 8.240234375, 8.6446533203125, 9.049072265625, 9.4534912109375, 9.85791015625, 10.2623291015625, 10.666748046875, 11.0711669921875, 11.4755859375, 11.8800048828125, 12.284423828125, 12.6888427734375, 13.09326171875, 13.4976806640625, 13.902099609375, 14.3065185546875, 14.7109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 10.0, 10.0, 9.0, 5.0, 12.0, 13.0, 8.0, 12.0, 25.0, 26.0, 24.0, 27.0, 25.0, 29.0, 40.0, 40.0, 39.0, 38.0, 36.0, 42.0, 41.0, 41.0, 42.0, 35.0, 45.0, 35.0, 40.0, 21.0, 23.0, 32.0, 28.0, 21.0, 19.0, 21.0, 8.0, 10.0, 13.0, 10.0, 9.0, 13.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0], "bins": [-29.71875, -28.905029296875, -28.09130859375, -27.277587890625, -26.4638671875, -25.650146484375, -24.83642578125, -24.022705078125, -23.208984375, -22.395263671875, -21.58154296875, -20.767822265625, -19.9541015625, -19.140380859375, -18.32666015625, -17.512939453125, -16.69921875, -15.885498046875, -15.07177734375, -14.258056640625, -13.4443359375, -12.630615234375, -11.81689453125, -11.003173828125, -10.189453125, -9.375732421875, -8.56201171875, -7.748291015625, -6.9345703125, -6.120849609375, -5.30712890625, -4.493408203125, -3.6796875, -2.865966796875, -2.05224609375, -1.238525390625, -0.4248046875, 0.388916015625, 1.20263671875, 2.016357421875, 2.830078125, 3.643798828125, 4.45751953125, 5.271240234375, 6.0849609375, 6.898681640625, 7.71240234375, 8.526123046875, 9.33984375, 10.153564453125, 10.96728515625, 11.781005859375, 12.5947265625, 13.408447265625, 14.22216796875, 15.035888671875, 15.849609375, 16.663330078125, 17.47705078125, 18.290771484375, 19.1044921875, 19.918212890625, 20.73193359375, 21.545654296875, 22.359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 8.0, 13.0, 14.0, 20.0, 45.0, 49.0, 64.0, 93.0, 171.0, 248.0, 328.0, 541.0, 827.0, 1294.0, 1997.0, 3181.0, 5215.0, 8431.0, 14443.0, 24424.0, 41279.0, 71432.0, 116887.0, 171987.0, 192564.0, 152674.0, 97504.0, 58389.0, 34047.0, 19883.0, 11770.0, 7115.0, 4221.0, 2651.0, 1650.0, 1047.0, 719.0, 445.0, 295.0, 180.0, 118.0, 84.0, 56.0, 45.0, 37.0, 20.0, 18.0, 12.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.984375, -16.458740234375, -15.93310546875, -15.407470703125, -14.8818359375, -14.356201171875, -13.83056640625, -13.304931640625, -12.779296875, -12.253662109375, -11.72802734375, -11.202392578125, -10.6767578125, -10.151123046875, -9.62548828125, -9.099853515625, -8.57421875, -8.048583984375, -7.52294921875, -6.997314453125, -6.4716796875, -5.946044921875, -5.42041015625, -4.894775390625, -4.369140625, -3.843505859375, -3.31787109375, -2.792236328125, -2.2666015625, -1.740966796875, -1.21533203125, -0.689697265625, -0.1640625, 0.361572265625, 0.88720703125, 1.412841796875, 1.9384765625, 2.464111328125, 2.98974609375, 3.515380859375, 4.041015625, 4.566650390625, 5.09228515625, 5.617919921875, 6.1435546875, 6.669189453125, 7.19482421875, 7.720458984375, 8.24609375, 8.771728515625, 9.29736328125, 9.822998046875, 10.3486328125, 10.874267578125, 11.39990234375, 11.925537109375, 12.451171875, 12.976806640625, 13.50244140625, 14.028076171875, 14.5537109375, 15.079345703125, 15.60498046875, 16.130615234375, 16.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 8.0, 5.0, 7.0, 5.0, 11.0, 15.0, 12.0, 16.0, 19.0, 20.0, 17.0, 17.0, 28.0, 37.0, 42.0, 32.0, 30.0, 36.0, 27.0, 42.0, 38.0, 40.0, 41.0, 58.0, 34.0, 44.0, 34.0, 42.0, 24.0, 35.0, 29.0, 18.0, 15.0, 18.0, 21.0, 11.0, 12.0, 14.0, 10.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.90625, -16.3946533203125, -15.883056640625, -15.3714599609375, -14.85986328125, -14.3482666015625, -13.836669921875, -13.3250732421875, -12.8134765625, -12.3018798828125, -11.790283203125, -11.2786865234375, -10.76708984375, -10.2554931640625, -9.743896484375, -9.2322998046875, -8.720703125, -8.2091064453125, -7.697509765625, -7.1859130859375, -6.67431640625, -6.1627197265625, -5.651123046875, -5.1395263671875, -4.6279296875, -4.1163330078125, -3.604736328125, -3.0931396484375, -2.58154296875, -2.0699462890625, -1.558349609375, -1.0467529296875, -0.53515625, -0.0235595703125, 0.488037109375, 0.9996337890625, 1.51123046875, 2.0228271484375, 2.534423828125, 3.0460205078125, 3.5576171875, 4.0692138671875, 4.580810546875, 5.0924072265625, 5.60400390625, 6.1156005859375, 6.627197265625, 7.1387939453125, 7.650390625, 8.1619873046875, 8.673583984375, 9.1851806640625, 9.69677734375, 10.2083740234375, 10.719970703125, 11.2315673828125, 11.7431640625, 12.2547607421875, 12.766357421875, 13.2779541015625, 13.78955078125, 14.3011474609375, 14.812744140625, 15.3243408203125, 15.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 13.0, 19.0, 25.0, 28.0, 71.0, 92.0, 120.0, 211.0, 333.0, 516.0, 844.0, 1394.0, 2418.0, 4168.0, 8059.0, 15101.0, 29692.0, 62501.0, 130676.0, 240026.0, 256506.0, 150569.0, 72337.0, 35051.0, 17347.0, 8973.0, 4712.0, 2603.0, 1615.0, 1001.0, 551.0, 375.0, 224.0, 130.0, 85.0, 62.0, 29.0, 23.0, 17.0, 14.0, 10.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.10186767578125, -6.8873291015625, -6.67279052734375, -6.458251953125, -6.24371337890625, -6.0291748046875, -5.81463623046875, -5.60009765625, -5.38555908203125, -5.1710205078125, -4.95648193359375, -4.741943359375, -4.52740478515625, -4.3128662109375, -4.09832763671875, -3.8837890625, -3.66925048828125, -3.4547119140625, -3.24017333984375, -3.025634765625, -2.81109619140625, -2.5965576171875, -2.38201904296875, -2.16748046875, -1.95294189453125, -1.7384033203125, -1.52386474609375, -1.309326171875, -1.09478759765625, -0.8802490234375, -0.66571044921875, -0.451171875, -0.23663330078125, -0.0220947265625, 0.19244384765625, 0.406982421875, 0.62152099609375, 0.8360595703125, 1.05059814453125, 1.26513671875, 1.47967529296875, 1.6942138671875, 1.90875244140625, 2.123291015625, 2.33782958984375, 2.5523681640625, 2.76690673828125, 2.9814453125, 3.19598388671875, 3.4105224609375, 3.62506103515625, 3.839599609375, 4.05413818359375, 4.2686767578125, 4.48321533203125, 4.69775390625, 4.91229248046875, 5.1268310546875, 5.34136962890625, 5.555908203125, 5.77044677734375, 5.9849853515625, 6.19952392578125, 6.4140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 4.0, 12.0, 11.0, 10.0, 15.0, 16.0, 21.0, 21.0, 28.0, 46.0, 48.0, 47.0, 61.0, 57.0, 54.0, 67.0, 68.0, 56.0, 51.0, 59.0, 45.0, 36.0, 37.0, 31.0, 15.0, 17.0, 9.0, 12.0, 8.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006165504455566406, -0.0006001628935337067, -0.0005837753415107727, -0.0005673877894878387, -0.0005510002374649048, -0.0005346126854419708, -0.0005182251334190369, -0.0005018375813961029, -0.00048545002937316895, -0.000469062477350235, -0.000452674925327301, -0.00043628737330436707, -0.0004198998212814331, -0.00040351226925849915, -0.0003871247172355652, -0.0003707371652126312, -0.00035434961318969727, -0.0003379620611667633, -0.00032157450914382935, -0.0003051869571208954, -0.0002887994050979614, -0.00027241185307502747, -0.0002560243010520935, -0.00023963674902915955, -0.00022324919700622559, -0.00020686164498329163, -0.00019047409296035767, -0.0001740865409374237, -0.00015769898891448975, -0.00014131143689155579, -0.00012492388486862183, -0.00010853633284568787, -9.21487808227539e-05, -7.576122879981995e-05, -5.9373676776885986e-05, -4.2986124753952026e-05, -2.6598572731018066e-05, -1.0211020708084106e-05, 6.1765313148498535e-06, 2.2564083337783813e-05, 3.8951635360717773e-05, 5.5339187383651733e-05, 7.17267394065857e-05, 8.811429142951965e-05, 0.00010450184345245361, 0.00012088939547538757, 0.00013727694749832153, 0.0001536644995212555, 0.00017005205154418945, 0.0001864396035671234, 0.00020282715559005737, 0.00021921470761299133, 0.0002356022596359253, 0.00025198981165885925, 0.0002683773636817932, 0.00028476491570472717, 0.00030115246772766113, 0.0003175400197505951, 0.00033392757177352905, 0.000350315123796463, 0.00036670267581939697, 0.00038309022784233093, 0.0003994777798652649, 0.00041586533188819885, 0.0004322528839111328]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 13.0, 27.0, 34.0, 48.0, 83.0, 140.0, 203.0, 334.0, 481.0, 769.0, 1213.0, 2042.0, 3150.0, 5270.0, 8754.0, 15216.0, 26394.0, 48525.0, 87760.0, 150156.0, 206534.0, 194142.0, 129848.0, 73299.0, 39640.0, 22172.0, 12744.0, 7445.0, 4576.0, 2856.0, 1675.0, 1104.0, 697.0, 418.0, 290.0, 170.0, 128.0, 66.0, 44.0, 34.0, 18.0, 8.0, 4.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.7054443359375, -5.492919921875, -5.2803955078125, -5.06787109375, -4.8553466796875, -4.642822265625, -4.4302978515625, -4.2177734375, -4.0052490234375, -3.792724609375, -3.5802001953125, -3.36767578125, -3.1551513671875, -2.942626953125, -2.7301025390625, -2.517578125, -2.3050537109375, -2.092529296875, -1.8800048828125, -1.66748046875, -1.4549560546875, -1.242431640625, -1.0299072265625, -0.8173828125, -0.6048583984375, -0.392333984375, -0.1798095703125, 0.03271484375, 0.2452392578125, 0.457763671875, 0.6702880859375, 0.8828125, 1.0953369140625, 1.307861328125, 1.5203857421875, 1.73291015625, 1.9454345703125, 2.157958984375, 2.3704833984375, 2.5830078125, 2.7955322265625, 3.008056640625, 3.2205810546875, 3.43310546875, 3.6456298828125, 3.858154296875, 4.0706787109375, 4.283203125, 4.4957275390625, 4.708251953125, 4.9207763671875, 5.13330078125, 5.3458251953125, 5.558349609375, 5.7708740234375, 5.9833984375, 6.1959228515625, 6.408447265625, 6.6209716796875, 6.83349609375, 7.0460205078125, 7.258544921875, 7.4710693359375, 7.68359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 7.0, 8.0, 14.0, 14.0, 25.0, 28.0, 27.0, 26.0, 36.0, 52.0, 48.0, 47.0, 52.0, 53.0, 55.0, 58.0, 51.0, 51.0, 53.0, 39.0, 27.0, 41.0, 37.0, 26.0, 14.0, 28.0, 8.0, 5.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.2323150634765625, -2.167755126953125, -2.1031951904296875, -2.03863525390625, -1.9740753173828125, -1.909515380859375, -1.8449554443359375, -1.7803955078125, -1.7158355712890625, -1.651275634765625, -1.5867156982421875, -1.52215576171875, -1.4575958251953125, -1.393035888671875, -1.3284759521484375, -1.263916015625, -1.1993560791015625, -1.134796142578125, -1.0702362060546875, -1.00567626953125, -0.9411163330078125, -0.876556396484375, -0.8119964599609375, -0.7474365234375, -0.6828765869140625, -0.618316650390625, -0.5537567138671875, -0.48919677734375, -0.4246368408203125, -0.360076904296875, -0.2955169677734375, -0.23095703125, -0.1663970947265625, -0.101837158203125, -0.0372772216796875, 0.02728271484375, 0.0918426513671875, 0.156402587890625, 0.2209625244140625, 0.2855224609375, 0.3500823974609375, 0.414642333984375, 0.4792022705078125, 0.54376220703125, 0.6083221435546875, 0.672882080078125, 0.7374420166015625, 0.802001953125, 0.8665618896484375, 0.931121826171875, 0.9956817626953125, 1.06024169921875, 1.1248016357421875, 1.189361572265625, 1.2539215087890625, 1.3184814453125, 1.3830413818359375, 1.447601318359375, 1.5121612548828125, 1.57672119140625, 1.6412811279296875, 1.705841064453125, 1.7704010009765625, 1.8349609375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 9.0, 9.0, 17.0, 15.0, 16.0, 29.0, 32.0, 46.0, 29.0, 33.0, 37.0, 48.0, 44.0, 47.0, 51.0, 40.0, 36.0, 48.0, 44.0, 37.0, 50.0, 42.0, 38.0, 17.0, 23.0, 22.0, 15.0, 19.0, 10.0, 10.0, 15.0, 5.0, 4.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-30.283309936523438, -29.434499740600586, -28.5856876373291, -27.73687744140625, -26.8880672454834, -26.039255142211914, -25.190444946289062, -24.341632843017578, -23.492822647094727, -22.644012451171875, -21.79520034790039, -20.94639015197754, -20.097579956054688, -19.248767852783203, -18.39995765686035, -17.5511474609375, -16.702335357666016, -15.853524208068848, -15.004714012145996, -14.155902862548828, -13.30709171295166, -12.458280563354492, -11.60947036743164, -10.760659217834473, -9.911849975585938, -9.06303882598877, -8.214228630065918, -7.36541748046875, -6.516606330871582, -5.667795658111572, -4.8189849853515625, -3.9701738357543945, -3.1213626861572266, -2.2725517749786377, -1.4237409830093384, -0.5749301910400391, 0.2738807201385498, 1.1226916313171387, 1.9715023040771484, 2.8203134536743164, 3.669124126434326, 4.517934799194336, 5.366745948791504, 6.215556621551514, 7.064367294311523, 7.913178443908691, 8.76198959350586, 9.610799789428711, 10.459610939025879, 11.308422088623047, 12.157232284545898, 13.006043434143066, 13.854854583740234, 14.703664779663086, 15.552475929260254, 16.401287078857422, 17.250097274780273, 18.098907470703125, 18.94771957397461, 19.79652976989746, 20.645339965820312, 21.494152069091797, 22.34296226501465, 23.1917724609375, 24.040584564208984]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 9.0, 9.0, 9.0, 14.0, 14.0, 9.0, 16.0, 17.0, 24.0, 23.0, 22.0, 36.0, 33.0, 28.0, 30.0, 48.0, 34.0, 37.0, 36.0, 38.0, 47.0, 49.0, 33.0, 33.0, 37.0, 28.0, 28.0, 25.0, 22.0, 25.0, 29.0, 21.0, 20.0, 15.0, 8.0, 18.0, 8.0, 11.0, 8.0, 10.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.505081176757812, -22.764629364013672, -22.02417755126953, -21.28372573852539, -20.54327392578125, -19.80282211303711, -19.06237030029297, -18.321916580200195, -17.581464767456055, -16.841012954711914, -16.100561141967773, -15.360109329223633, -14.619656562805176, -13.879204750061035, -13.138752937316895, -12.398300170898438, -11.657849311828613, -10.917397499084473, -10.176945686340332, -9.436492919921875, -8.696041107177734, -7.955589294433594, -7.215137481689453, -6.474685192108154, -5.734233379364014, -4.993781566619873, -4.253329277038574, -3.5128774642944336, -2.772425413131714, -2.031973361968994, -1.2915215492248535, -0.5510692596435547, 0.18938255310058594, 0.9298345446586609, 1.6702865362167358, 2.410738468170166, 3.1511905193328857, 3.8916425704956055, 4.632094383239746, 5.372546672821045, 6.1129984855651855, 6.853450298309326, 7.593902587890625, 8.334354400634766, 9.074806213378906, 9.815258026123047, 10.555709838867188, 11.296162605285645, 12.036614418029785, 12.777066230773926, 13.517518043518066, 14.257970809936523, 14.998422622680664, 15.738874435424805, 16.479326248168945, 17.219778060913086, 17.960229873657227, 18.700681686401367, 19.441133499145508, 20.18158531188965, 20.92203712463379, 21.662490844726562, 22.402942657470703, 23.143394470214844, 23.883846282958984]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 17.0, 35.0, 75.0, 89.0, 165.0, 197.0, 314.0, 562.0, 781.0, 1269.0, 1949.0, 3098.0, 4678.0, 7389.0, 11126.0, 17075.0, 25770.0, 38388.0, 55518.0, 76083.0, 99117.0, 118152.0, 125218.0, 117204.0, 98708.0, 76438.0, 55907.0, 38621.0, 25850.0, 17051.0, 11317.0, 7237.0, 4770.0, 2993.0, 1907.0, 1256.0, 831.0, 511.0, 307.0, 217.0, 107.0, 91.0, 46.0, 32.0, 25.0, 21.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.029296875, -20.33984375, -19.650390625, -18.9609375, -18.271484375, -17.58203125, -16.892578125, -16.203125, -15.513671875, -14.82421875, -14.134765625, -13.4453125, -12.755859375, -12.06640625, -11.376953125, -10.6875, -9.998046875, -9.30859375, -8.619140625, -7.9296875, -7.240234375, -6.55078125, -5.861328125, -5.171875, -4.482421875, -3.79296875, -3.103515625, -2.4140625, -1.724609375, -1.03515625, -0.345703125, 0.34375, 1.033203125, 1.72265625, 2.412109375, 3.1015625, 3.791015625, 4.48046875, 5.169921875, 5.859375, 6.548828125, 7.23828125, 7.927734375, 8.6171875, 9.306640625, 9.99609375, 10.685546875, 11.375, 12.064453125, 12.75390625, 13.443359375, 14.1328125, 14.822265625, 15.51171875, 16.201171875, 16.890625, 17.580078125, 18.26953125, 18.958984375, 19.6484375, 20.337890625, 21.02734375, 21.716796875, 22.40625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 10.0, 12.0, 13.0, 6.0, 18.0, 19.0, 18.0, 17.0, 29.0, 18.0, 33.0, 29.0, 29.0, 30.0, 40.0, 37.0, 54.0, 48.0, 37.0, 35.0, 41.0, 46.0, 31.0, 27.0, 25.0, 33.0, 38.0, 35.0, 24.0, 24.0, 18.0, 13.0, 13.0, 19.0, 9.0, 8.0, 5.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.971435546875, -23.19287109375, -22.414306640625, -21.6357421875, -20.857177734375, -20.07861328125, -19.300048828125, -18.521484375, -17.742919921875, -16.96435546875, -16.185791015625, -15.4072265625, -14.628662109375, -13.85009765625, -13.071533203125, -12.29296875, -11.514404296875, -10.73583984375, -9.957275390625, -9.1787109375, -8.400146484375, -7.62158203125, -6.843017578125, -6.064453125, -5.285888671875, -4.50732421875, -3.728759765625, -2.9501953125, -2.171630859375, -1.39306640625, -0.614501953125, 0.1640625, 0.942626953125, 1.72119140625, 2.499755859375, 3.2783203125, 4.056884765625, 4.83544921875, 5.614013671875, 6.392578125, 7.171142578125, 7.94970703125, 8.728271484375, 9.5068359375, 10.285400390625, 11.06396484375, 11.842529296875, 12.62109375, 13.399658203125, 14.17822265625, 14.956787109375, 15.7353515625, 16.513916015625, 17.29248046875, 18.071044921875, 18.849609375, 19.628173828125, 20.40673828125, 21.185302734375, 21.9638671875, 22.742431640625, 23.52099609375, 24.299560546875, 25.078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 28.0, 25.0, 50.0, 58.0, 133.0, 171.0, 244.0, 407.0, 581.0, 955.0, 1365.0, 2157.0, 3447.0, 5215.0, 8039.0, 12681.0, 19462.0, 29628.0, 44375.0, 63620.0, 87563.0, 110439.0, 126369.0, 127265.0, 113232.0, 89830.0, 66389.0, 46456.0, 30855.0, 20357.0, 13135.0, 8460.0, 5598.0, 3647.0, 2113.0, 1499.0, 955.0, 624.0, 367.0, 259.0, 178.0, 105.0, 68.0, 45.0, 41.0, 22.0, 14.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.676025390625, -21.94580078125, -21.215576171875, -20.4853515625, -19.755126953125, -19.02490234375, -18.294677734375, -17.564453125, -16.834228515625, -16.10400390625, -15.373779296875, -14.6435546875, -13.913330078125, -13.18310546875, -12.452880859375, -11.72265625, -10.992431640625, -10.26220703125, -9.531982421875, -8.8017578125, -8.071533203125, -7.34130859375, -6.611083984375, -5.880859375, -5.150634765625, -4.42041015625, -3.690185546875, -2.9599609375, -2.229736328125, -1.49951171875, -0.769287109375, -0.0390625, 0.691162109375, 1.42138671875, 2.151611328125, 2.8818359375, 3.612060546875, 4.34228515625, 5.072509765625, 5.802734375, 6.532958984375, 7.26318359375, 7.993408203125, 8.7236328125, 9.453857421875, 10.18408203125, 10.914306640625, 11.64453125, 12.374755859375, 13.10498046875, 13.835205078125, 14.5654296875, 15.295654296875, 16.02587890625, 16.756103515625, 17.486328125, 18.216552734375, 18.94677734375, 19.677001953125, 20.4072265625, 21.137451171875, 21.86767578125, 22.597900390625, 23.328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 3.0, 16.0, 16.0, 18.0, 16.0, 22.0, 22.0, 25.0, 38.0, 29.0, 46.0, 26.0, 44.0, 40.0, 48.0, 48.0, 39.0, 38.0, 48.0, 40.0, 34.0, 36.0, 32.0, 29.0, 27.0, 32.0, 35.0, 27.0, 14.0, 19.0, 10.0, 14.0, 8.0, 13.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.359375, -14.8349609375, -14.310546875, -13.7861328125, -13.26171875, -12.7373046875, -12.212890625, -11.6884765625, -11.1640625, -10.6396484375, -10.115234375, -9.5908203125, -9.06640625, -8.5419921875, -8.017578125, -7.4931640625, -6.96875, -6.4443359375, -5.919921875, -5.3955078125, -4.87109375, -4.3466796875, -3.822265625, -3.2978515625, -2.7734375, -2.2490234375, -1.724609375, -1.2001953125, -0.67578125, -0.1513671875, 0.373046875, 0.8974609375, 1.421875, 1.9462890625, 2.470703125, 2.9951171875, 3.51953125, 4.0439453125, 4.568359375, 5.0927734375, 5.6171875, 6.1416015625, 6.666015625, 7.1904296875, 7.71484375, 8.2392578125, 8.763671875, 9.2880859375, 9.8125, 10.3369140625, 10.861328125, 11.3857421875, 11.91015625, 12.4345703125, 12.958984375, 13.4833984375, 14.0078125, 14.5322265625, 15.056640625, 15.5810546875, 16.10546875, 16.6298828125, 17.154296875, 17.6787109375, 18.203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 9.0, 18.0, 19.0, 22.0, 50.0, 44.0, 73.0, 105.0, 160.0, 235.0, 336.0, 469.0, 669.0, 1001.0, 1500.0, 2508.0, 4193.0, 7597.0, 15223.0, 31920.0, 71926.0, 149806.0, 242106.0, 238305.0, 146105.0, 69274.0, 31545.0, 14793.0, 7393.0, 4150.0, 2362.0, 1490.0, 1010.0, 673.0, 416.0, 324.0, 211.0, 152.0, 92.0, 80.0, 67.0, 33.0, 31.0, 14.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 6.0], "bins": [-17.65625, -17.1514892578125, -16.646728515625, -16.1419677734375, -15.63720703125, -15.1324462890625, -14.627685546875, -14.1229248046875, -13.6181640625, -13.1134033203125, -12.608642578125, -12.1038818359375, -11.59912109375, -11.0943603515625, -10.589599609375, -10.0848388671875, -9.580078125, -9.0753173828125, -8.570556640625, -8.0657958984375, -7.56103515625, -7.0562744140625, -6.551513671875, -6.0467529296875, -5.5419921875, -5.0372314453125, -4.532470703125, -4.0277099609375, -3.52294921875, -3.0181884765625, -2.513427734375, -2.0086669921875, -1.50390625, -0.9991455078125, -0.494384765625, 0.0103759765625, 0.51513671875, 1.0198974609375, 1.524658203125, 2.0294189453125, 2.5341796875, 3.0389404296875, 3.543701171875, 4.0484619140625, 4.55322265625, 5.0579833984375, 5.562744140625, 6.0675048828125, 6.572265625, 7.0770263671875, 7.581787109375, 8.0865478515625, 8.59130859375, 9.0960693359375, 9.600830078125, 10.1055908203125, 10.6103515625, 11.1151123046875, 11.619873046875, 12.1246337890625, 12.62939453125, 13.1341552734375, 13.638916015625, 14.1436767578125, 14.6484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 10.0, 4.0, 9.0, 8.0, 21.0, 38.0, 51.0, 49.0, 72.0, 77.0, 108.0, 108.0, 95.0, 89.0, 73.0, 52.0, 33.0, 27.0, 17.0, 19.0, 10.0, 3.0, 9.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002086639404296875, -0.0020223259925842285, -0.001958012580871582, -0.0018936991691589355, -0.001829385757446289, -0.0017650723457336426, -0.001700758934020996, -0.0016364455223083496, -0.0015721321105957031, -0.0015078186988830566, -0.0014435052871704102, -0.0013791918754577637, -0.0013148784637451172, -0.0012505650520324707, -0.0011862516403198242, -0.0011219382286071777, -0.0010576248168945312, -0.0009933114051818848, -0.0009289979934692383, -0.0008646845817565918, -0.0008003711700439453, -0.0007360577583312988, -0.0006717443466186523, -0.0006074309349060059, -0.0005431175231933594, -0.0004788041114807129, -0.0004144906997680664, -0.0003501772880554199, -0.00028586387634277344, -0.00022155046463012695, -0.00015723705291748047, -9.292364120483398e-05, -2.86102294921875e-05, 3.5703182220458984e-05, 0.00010001659393310547, 0.00016433000564575195, 0.00022864341735839844, 0.0002929568290710449, 0.0003572702407836914, 0.0004215836524963379, 0.0004858970642089844, 0.0005502104759216309, 0.0006145238876342773, 0.0006788372993469238, 0.0007431507110595703, 0.0008074641227722168, 0.0008717775344848633, 0.0009360909461975098, 0.0010004043579101562, 0.0010647177696228027, 0.0011290311813354492, 0.0011933445930480957, 0.0012576580047607422, 0.0013219714164733887, 0.0013862848281860352, 0.0014505982398986816, 0.0015149116516113281, 0.0015792250633239746, 0.001643538475036621, 0.0017078518867492676, 0.001772165298461914, 0.0018364787101745605, 0.001900792121887207, 0.0019651055335998535, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 7.0, 13.0, 17.0, 29.0, 30.0, 41.0, 63.0, 112.0, 143.0, 176.0, 252.0, 374.0, 520.0, 809.0, 1229.0, 1995.0, 3305.0, 5887.0, 11133.0, 22627.0, 48383.0, 102751.0, 190985.0, 248802.0, 198567.0, 108388.0, 50934.0, 23922.0, 11579.0, 5986.0, 3456.0, 2031.0, 1239.0, 804.0, 541.0, 404.0, 288.0, 200.0, 135.0, 128.0, 85.0, 44.0, 36.0, 23.0, 23.0, 11.0, 8.0, 5.0, 5.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.931396484375, -15.40966796875, -14.887939453125, -14.3662109375, -13.844482421875, -13.32275390625, -12.801025390625, -12.279296875, -11.757568359375, -11.23583984375, -10.714111328125, -10.1923828125, -9.670654296875, -9.14892578125, -8.627197265625, -8.10546875, -7.583740234375, -7.06201171875, -6.540283203125, -6.0185546875, -5.496826171875, -4.97509765625, -4.453369140625, -3.931640625, -3.409912109375, -2.88818359375, -2.366455078125, -1.8447265625, -1.322998046875, -0.80126953125, -0.279541015625, 0.2421875, 0.763916015625, 1.28564453125, 1.807373046875, 2.3291015625, 2.850830078125, 3.37255859375, 3.894287109375, 4.416015625, 4.937744140625, 5.45947265625, 5.981201171875, 6.5029296875, 7.024658203125, 7.54638671875, 8.068115234375, 8.58984375, 9.111572265625, 9.63330078125, 10.155029296875, 10.6767578125, 11.198486328125, 11.72021484375, 12.241943359375, 12.763671875, 13.285400390625, 13.80712890625, 14.328857421875, 14.8505859375, 15.372314453125, 15.89404296875, 16.415771484375, 16.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 12.0, 13.0, 23.0, 18.0, 38.0, 25.0, 53.0, 47.0, 79.0, 69.0, 81.0, 79.0, 82.0, 79.0, 58.0, 40.0, 46.0, 30.0, 23.0, 15.0, 18.0, 8.0, 12.0, 3.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2109375, -6.99395751953125, -6.7769775390625, -6.55999755859375, -6.343017578125, -6.12603759765625, -5.9090576171875, -5.69207763671875, -5.47509765625, -5.25811767578125, -5.0411376953125, -4.82415771484375, -4.607177734375, -4.39019775390625, -4.1732177734375, -3.95623779296875, -3.7392578125, -3.52227783203125, -3.3052978515625, -3.08831787109375, -2.871337890625, -2.65435791015625, -2.4373779296875, -2.22039794921875, -2.00341796875, -1.78643798828125, -1.5694580078125, -1.35247802734375, -1.135498046875, -0.91851806640625, -0.7015380859375, -0.48455810546875, -0.267578125, -0.05059814453125, 0.1663818359375, 0.38336181640625, 0.600341796875, 0.81732177734375, 1.0343017578125, 1.25128173828125, 1.46826171875, 1.68524169921875, 1.9022216796875, 2.11920166015625, 2.336181640625, 2.55316162109375, 2.7701416015625, 2.98712158203125, 3.2041015625, 3.42108154296875, 3.6380615234375, 3.85504150390625, 4.072021484375, 4.28900146484375, 4.5059814453125, 4.72296142578125, 4.93994140625, 5.15692138671875, 5.3739013671875, 5.59088134765625, 5.807861328125, 6.02484130859375, 6.2418212890625, 6.45880126953125, 6.67578125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 3.0, 8.0, 8.0, 9.0, 12.0, 18.0, 16.0, 21.0, 18.0, 32.0, 35.0, 24.0, 38.0, 42.0, 42.0, 41.0, 43.0, 44.0, 57.0, 48.0, 44.0, 43.0, 37.0, 35.0, 32.0, 35.0, 36.0, 22.0, 17.0, 20.0, 22.0, 14.0, 11.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-29.546329498291016, -28.719093322753906, -27.89185905456543, -27.06462287902832, -26.237388610839844, -25.410152435302734, -24.582916259765625, -23.75568199157715, -22.92844581604004, -22.10120964050293, -21.273975372314453, -20.446739196777344, -19.619504928588867, -18.792268753051758, -17.96503448486328, -17.137798309326172, -16.310562133789062, -15.48332691192627, -14.656091690063477, -13.828855514526367, -13.001620292663574, -12.174385070800781, -11.347149848937988, -10.519914627075195, -9.692680358886719, -8.865445137023926, -8.038209915161133, -7.210974216461182, -6.3837385177612305, -5.5565032958984375, -4.7292680740356445, -3.9020323753356934, -3.074796676635742, -2.24756121635437, -1.4203258752822876, -0.5930905342102051, 0.234144926071167, 1.061380386352539, 1.888615608215332, 2.715851306915283, 3.543086528778076, 4.370321750640869, 5.19755744934082, 6.024792671203613, 6.852027893066406, 7.679263591766357, 8.506498336791992, 9.333734512329102, 10.160969734191895, 10.988204956054688, 11.81544017791748, 12.642675399780273, 13.469911575317383, 14.297146797180176, 15.124382019042969, 15.951618194580078, 16.778852462768555, 17.606088638305664, 18.43332290649414, 19.26055908203125, 20.087793350219727, 20.915029525756836, 21.742263793945312, 22.569499969482422, 23.39673614501953]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 15.0, 9.0, 22.0, 16.0, 22.0, 26.0, 34.0, 27.0, 38.0, 28.0, 29.0, 26.0, 40.0, 33.0, 47.0, 32.0, 49.0, 42.0, 40.0, 36.0, 25.0, 36.0, 31.0, 24.0, 32.0, 31.0, 19.0, 27.0, 17.0, 15.0, 14.0, 18.0, 15.0, 5.0, 11.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.621994018554688, -23.85186767578125, -23.081741333007812, -22.311614990234375, -21.541488647460938, -20.7713623046875, -20.001235961914062, -19.231111526489258, -18.46098518371582, -17.690858840942383, -16.920732498168945, -16.150606155395508, -15.380480766296387, -14.61035442352295, -13.840228080749512, -13.07010269165039, -12.299975395202637, -11.5298490524292, -10.759722709655762, -9.98959732055664, -9.219470977783203, -8.449344635009766, -7.679218292236328, -6.909092426300049, -6.138966083526611, -5.368839740753174, -4.5987138748168945, -3.828587532043457, -3.0584614276885986, -2.2883353233337402, -1.5182089805603027, -0.7480831146240234, 0.022043228149414062, 0.7921693921089172, 1.5622955560684204, 2.3324217796325684, 3.1025478839874268, 3.872673988342285, 4.642800331115723, 5.412926197052002, 6.1830525398254395, 6.953178882598877, 7.723304748535156, 8.493431091308594, 9.263557434082031, 10.033683776855469, 10.803810119628906, 11.573935508728027, 12.344061851501465, 13.114188194274902, 13.88431453704834, 14.654439926147461, 15.424566268920898, 16.194692611694336, 16.964818954467773, 17.73494529724121, 18.50507164001465, 19.275197982788086, 20.045324325561523, 20.81545066833496, 21.5855770111084, 22.355701446533203, 23.12582778930664, 23.895954132080078, 24.666080474853516]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 13.0, 25.0, 45.0, 76.0, 134.0, 218.0, 324.0, 560.0, 897.0, 1610.0, 2750.0, 4810.0, 8204.0, 14979.0, 28084.0, 53127.0, 106015.0, 223524.0, 474716.0, 867551.0, 1022275.0, 702164.0, 350060.0, 163565.0, 79462.0, 41099.0, 21337.0, 11663.0, 6528.0, 3640.0, 2015.0, 1215.0, 670.0, 370.0, 213.0, 149.0, 88.0, 37.0, 26.0, 15.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.625, -35.49072265625, -34.3564453125, -33.22216796875, -32.087890625, -30.95361328125, -29.8193359375, -28.68505859375, -27.55078125, -26.41650390625, -25.2822265625, -24.14794921875, -23.013671875, -21.87939453125, -20.7451171875, -19.61083984375, -18.4765625, -17.34228515625, -16.2080078125, -15.07373046875, -13.939453125, -12.80517578125, -11.6708984375, -10.53662109375, -9.40234375, -8.26806640625, -7.1337890625, -5.99951171875, -4.865234375, -3.73095703125, -2.5966796875, -1.46240234375, -0.328125, 0.80615234375, 1.9404296875, 3.07470703125, 4.208984375, 5.34326171875, 6.4775390625, 7.61181640625, 8.74609375, 9.88037109375, 11.0146484375, 12.14892578125, 13.283203125, 14.41748046875, 15.5517578125, 16.68603515625, 17.8203125, 18.95458984375, 20.0888671875, 21.22314453125, 22.357421875, 23.49169921875, 24.6259765625, 25.76025390625, 26.89453125, 28.02880859375, 29.1630859375, 30.29736328125, 31.431640625, 32.56591796875, 33.7001953125, 34.83447265625, 35.96875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 3.0, 8.0, 4.0, 11.0, 7.0, 6.0, 15.0, 15.0, 17.0, 15.0, 21.0, 40.0, 23.0, 29.0, 30.0, 34.0, 24.0, 32.0, 29.0, 41.0, 42.0, 48.0, 43.0, 47.0, 38.0, 38.0, 31.0, 23.0, 19.0, 29.0, 35.0, 32.0, 24.0, 23.0, 19.0, 11.0, 18.0, 15.0, 12.0, 7.0, 8.0, 5.0, 6.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.40625, -19.74609375, -19.0859375, -18.42578125, -17.765625, -17.10546875, -16.4453125, -15.78515625, -15.125, -14.46484375, -13.8046875, -13.14453125, -12.484375, -11.82421875, -11.1640625, -10.50390625, -9.84375, -9.18359375, -8.5234375, -7.86328125, -7.203125, -6.54296875, -5.8828125, -5.22265625, -4.5625, -3.90234375, -3.2421875, -2.58203125, -1.921875, -1.26171875, -0.6015625, 0.05859375, 0.71875, 1.37890625, 2.0390625, 2.69921875, 3.359375, 4.01953125, 4.6796875, 5.33984375, 6.0, 6.66015625, 7.3203125, 7.98046875, 8.640625, 9.30078125, 9.9609375, 10.62109375, 11.28125, 11.94140625, 12.6015625, 13.26171875, 13.921875, 14.58203125, 15.2421875, 15.90234375, 16.5625, 17.22265625, 17.8828125, 18.54296875, 19.203125, 19.86328125, 20.5234375, 21.18359375, 21.84375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 13.0, 12.0, 25.0, 38.0, 71.0, 95.0, 135.0, 236.0, 376.0, 681.0, 1054.0, 1696.0, 2879.0, 4846.0, 8379.0, 14710.0, 26459.0, 47453.0, 88429.0, 164897.0, 304341.0, 531601.0, 788315.0, 828457.0, 601629.0, 354198.0, 192865.0, 103204.0, 55818.0, 30667.0, 17133.0, 9804.0, 5637.0, 3229.0, 1916.0, 1133.0, 713.0, 434.0, 253.0, 172.0, 88.0, 66.0, 43.0, 29.0, 17.0, 17.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.640625, -34.53125, -33.421875, -32.3125, -31.203125, -30.09375, -28.984375, -27.875, -26.765625, -25.65625, -24.546875, -23.4375, -22.328125, -21.21875, -20.109375, -19.0, -17.890625, -16.78125, -15.671875, -14.5625, -13.453125, -12.34375, -11.234375, -10.125, -9.015625, -7.90625, -6.796875, -5.6875, -4.578125, -3.46875, -2.359375, -1.25, -0.140625, 0.96875, 2.078125, 3.1875, 4.296875, 5.40625, 6.515625, 7.625, 8.734375, 9.84375, 10.953125, 12.0625, 13.171875, 14.28125, 15.390625, 16.5, 17.609375, 18.71875, 19.828125, 20.9375, 22.046875, 23.15625, 24.265625, 25.375, 26.484375, 27.59375, 28.703125, 29.8125, 30.921875, 32.03125, 33.140625, 34.25]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 18.0, 28.0, 28.0, 38.0, 62.0, 56.0, 89.0, 123.0, 120.0, 171.0, 204.0, 236.0, 242.0, 250.0, 281.0, 299.0, 293.0, 305.0, 243.0, 197.0, 155.0, 135.0, 125.0, 77.0, 72.0, 54.0, 39.0, 29.0, 27.0, 18.0, 18.0, 9.0, 2.0, 10.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.152587890625, -9.69580078125, -9.239013671875, -8.7822265625, -8.325439453125, -7.86865234375, -7.411865234375, -6.955078125, -6.498291015625, -6.04150390625, -5.584716796875, -5.1279296875, -4.671142578125, -4.21435546875, -3.757568359375, -3.30078125, -2.843994140625, -2.38720703125, -1.930419921875, -1.4736328125, -1.016845703125, -0.56005859375, -0.103271484375, 0.353515625, 0.810302734375, 1.26708984375, 1.723876953125, 2.1806640625, 2.637451171875, 3.09423828125, 3.551025390625, 4.0078125, 4.464599609375, 4.92138671875, 5.378173828125, 5.8349609375, 6.291748046875, 6.74853515625, 7.205322265625, 7.662109375, 8.118896484375, 8.57568359375, 9.032470703125, 9.4892578125, 9.946044921875, 10.40283203125, 10.859619140625, 11.31640625, 11.773193359375, 12.22998046875, 12.686767578125, 13.1435546875, 13.600341796875, 14.05712890625, 14.513916015625, 14.970703125, 15.427490234375, 15.88427734375, 16.341064453125, 16.7978515625, 17.254638671875, 17.71142578125, 18.168212890625, 18.625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 11.0, 21.0, 14.0, 29.0, 24.0, 31.0, 21.0, 23.0, 42.0, 33.0, 51.0, 48.0, 48.0, 54.0, 49.0, 58.0, 51.0, 33.0, 45.0, 31.0, 28.0, 34.0, 28.0, 34.0, 23.0, 10.0, 17.0, 8.0, 17.0, 16.0, 10.0, 4.0, 6.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.16241455078125, -31.269439697265625, -30.37646484375, -29.483489990234375, -28.590517044067383, -27.697542190551758, -26.804567337036133, -25.911592483520508, -25.018619537353516, -24.12564468383789, -23.232669830322266, -22.33969497680664, -21.44672203063965, -20.553747177124023, -19.6607723236084, -18.767797470092773, -17.87482261657715, -16.981847763061523, -16.0888729095459, -15.19589900970459, -14.302925109863281, -13.409950256347656, -12.516975402832031, -11.624000549316406, -10.731026649475098, -9.838051795959473, -8.945077896118164, -8.052103042602539, -7.159128665924072, -6.2661542892456055, -5.3731794357299805, -4.480205059051514, -3.587228775024414, -2.6942543983459473, -1.8012797832489014, -0.9083051681518555, -0.015330791473388672, 0.8776435852050781, 1.7706184387207031, 2.66359281539917, 3.5565671920776367, 4.4495415687561035, 5.34251594543457, 6.235490798950195, 7.128465175628662, 8.021439552307129, 8.914414405822754, 9.807388305664062, 10.700363159179688, 11.593338012695312, 12.486311912536621, 13.379286766052246, 14.272260665893555, 15.16523551940918, 16.058210372924805, 16.95118522644043, 17.844158172607422, 18.737133026123047, 19.630107879638672, 20.523082733154297, 21.41605567932129, 22.309030532836914, 23.20200538635254, 24.094980239868164, 24.98795509338379]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 4.0, 7.0, 5.0, 13.0, 7.0, 13.0, 14.0, 13.0, 28.0, 26.0, 30.0, 36.0, 40.0, 30.0, 25.0, 36.0, 29.0, 37.0, 42.0, 49.0, 42.0, 49.0, 37.0, 33.0, 44.0, 35.0, 36.0, 24.0, 33.0, 32.0, 18.0, 20.0, 14.0, 17.0, 12.0, 13.0, 10.0, 8.0, 10.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.61370277404785, -22.778467178344727, -21.9432315826416, -21.10799789428711, -20.272762298583984, -19.43752670288086, -18.602291107177734, -17.76705551147461, -16.931819915771484, -16.09658432006836, -15.26134967803955, -14.426114082336426, -13.590879440307617, -12.755643844604492, -11.920408248901367, -11.085172653198242, -10.24993896484375, -9.414703369140625, -8.579468727111816, -7.744233131408691, -6.908998012542725, -6.073762893676758, -5.238527297973633, -4.403292179107666, -3.568057060241699, -2.7328219413757324, -1.8975865840911865, -1.0623512268066406, -0.22711610794067383, 0.608119010925293, 1.443354606628418, 2.2785897254943848, 3.1138229370117188, 3.9490580558776855, 4.784293174743652, 5.619528770446777, 6.454763889312744, 7.289999008178711, 8.125234603881836, 8.960470199584961, 9.79570484161377, 10.630940437316895, 11.466175079345703, 12.301410675048828, 13.136646270751953, 13.971880912780762, 14.807116508483887, 15.642351150512695, 16.47758674621582, 17.312822341918945, 18.14805793762207, 18.983291625976562, 19.818527221679688, 20.653762817382812, 21.488998413085938, 22.324234008789062, 23.159469604492188, 23.994705200195312, 24.829940795898438, 25.665176391601562, 26.500410079956055, 27.33564567565918, 28.170881271362305, 29.00611686706543, 29.841350555419922]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 11.0, 19.0, 22.0, 41.0, 41.0, 67.0, 116.0, 156.0, 272.0, 420.0, 570.0, 875.0, 1251.0, 1784.0, 2739.0, 4041.0, 6054.0, 9018.0, 13178.0, 19951.0, 29334.0, 43731.0, 63971.0, 88842.0, 116367.0, 134585.0, 132679.0, 111202.0, 83746.0, 59069.0, 40788.0, 27303.0, 18468.0, 12361.0, 8207.0, 5670.0, 3762.0, 2552.0, 1703.0, 1184.0, 790.0, 559.0, 370.0, 218.0, 158.0, 104.0, 84.0, 40.0, 37.0, 19.0, 11.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.3671875, -9.0430908203125, -8.718994140625, -8.3948974609375, -8.07080078125, -7.7467041015625, -7.422607421875, -7.0985107421875, -6.7744140625, -6.4503173828125, -6.126220703125, -5.8021240234375, -5.47802734375, -5.1539306640625, -4.829833984375, -4.5057373046875, -4.181640625, -3.8575439453125, -3.533447265625, -3.2093505859375, -2.88525390625, -2.5611572265625, -2.237060546875, -1.9129638671875, -1.5888671875, -1.2647705078125, -0.940673828125, -0.6165771484375, -0.29248046875, 0.0316162109375, 0.355712890625, 0.6798095703125, 1.00390625, 1.3280029296875, 1.652099609375, 1.9761962890625, 2.30029296875, 2.6243896484375, 2.948486328125, 3.2725830078125, 3.5966796875, 3.9207763671875, 4.244873046875, 4.5689697265625, 4.89306640625, 5.2171630859375, 5.541259765625, 5.8653564453125, 6.189453125, 6.5135498046875, 6.837646484375, 7.1617431640625, 7.48583984375, 7.8099365234375, 8.134033203125, 8.4581298828125, 8.7822265625, 9.1063232421875, 9.430419921875, 9.7545166015625, 10.07861328125, 10.4027099609375, 10.726806640625, 11.0509033203125, 11.375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 9.0, 7.0, 12.0, 19.0, 14.0, 22.0, 20.0, 31.0, 33.0, 40.0, 33.0, 45.0, 39.0, 38.0, 45.0, 45.0, 45.0, 42.0, 37.0, 45.0, 28.0, 40.0, 43.0, 30.0, 33.0, 24.0, 27.0, 28.0, 14.0, 8.0, 13.0, 14.0, 7.0, 8.0, 6.0, 9.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.677490234375, -23.77685546875, -22.876220703125, -21.9755859375, -21.074951171875, -20.17431640625, -19.273681640625, -18.373046875, -17.472412109375, -16.57177734375, -15.671142578125, -14.7705078125, -13.869873046875, -12.96923828125, -12.068603515625, -11.16796875, -10.267333984375, -9.36669921875, -8.466064453125, -7.5654296875, -6.664794921875, -5.76416015625, -4.863525390625, -3.962890625, -3.062255859375, -2.16162109375, -1.260986328125, -0.3603515625, 0.540283203125, 1.44091796875, 2.341552734375, 3.2421875, 4.142822265625, 5.04345703125, 5.944091796875, 6.8447265625, 7.745361328125, 8.64599609375, 9.546630859375, 10.447265625, 11.347900390625, 12.24853515625, 13.149169921875, 14.0498046875, 14.950439453125, 15.85107421875, 16.751708984375, 17.65234375, 18.552978515625, 19.45361328125, 20.354248046875, 21.2548828125, 22.155517578125, 23.05615234375, 23.956787109375, 24.857421875, 25.758056640625, 26.65869140625, 27.559326171875, 28.4599609375, 29.360595703125, 30.26123046875, 31.161865234375, 32.0625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 13.0, 23.0, 33.0, 46.0, 90.0, 131.0, 181.0, 284.0, 391.0, 583.0, 914.0, 1409.0, 2213.0, 3342.0, 5312.0, 8400.0, 13573.0, 21740.0, 35161.0, 55777.0, 86254.0, 127057.0, 162845.0, 162274.0, 126809.0, 85596.0, 54770.0, 34874.0, 21464.0, 13436.0, 8529.0, 5471.0, 3341.0, 2105.0, 1401.0, 914.0, 602.0, 392.0, 289.0, 170.0, 116.0, 86.0, 40.0, 34.0, 21.0, 19.0, 10.0, 3.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-14.4296875, -13.9923095703125, -13.554931640625, -13.1175537109375, -12.68017578125, -12.2427978515625, -11.805419921875, -11.3680419921875, -10.9306640625, -10.4932861328125, -10.055908203125, -9.6185302734375, -9.18115234375, -8.7437744140625, -8.306396484375, -7.8690185546875, -7.431640625, -6.9942626953125, -6.556884765625, -6.1195068359375, -5.68212890625, -5.2447509765625, -4.807373046875, -4.3699951171875, -3.9326171875, -3.4952392578125, -3.057861328125, -2.6204833984375, -2.18310546875, -1.7457275390625, -1.308349609375, -0.8709716796875, -0.43359375, 0.0037841796875, 0.441162109375, 0.8785400390625, 1.31591796875, 1.7532958984375, 2.190673828125, 2.6280517578125, 3.0654296875, 3.5028076171875, 3.940185546875, 4.3775634765625, 4.81494140625, 5.2523193359375, 5.689697265625, 6.1270751953125, 6.564453125, 7.0018310546875, 7.439208984375, 7.8765869140625, 8.31396484375, 8.7513427734375, 9.188720703125, 9.6260986328125, 10.0634765625, 10.5008544921875, 10.938232421875, 11.3756103515625, 11.81298828125, 12.2503662109375, 12.687744140625, 13.1251220703125, 13.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 6.0, 6.0, 6.0, 13.0, 13.0, 18.0, 21.0, 19.0, 21.0, 16.0, 32.0, 30.0, 17.0, 30.0, 38.0, 32.0, 47.0, 41.0, 37.0, 39.0, 36.0, 37.0, 45.0, 43.0, 33.0, 37.0, 41.0, 25.0, 24.0, 21.0, 22.0, 19.0, 18.0, 22.0, 17.0, 21.0, 8.0, 11.0, 3.0, 6.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.625, -15.108154296875, -14.59130859375, -14.074462890625, -13.5576171875, -13.040771484375, -12.52392578125, -12.007080078125, -11.490234375, -10.973388671875, -10.45654296875, -9.939697265625, -9.4228515625, -8.906005859375, -8.38916015625, -7.872314453125, -7.35546875, -6.838623046875, -6.32177734375, -5.804931640625, -5.2880859375, -4.771240234375, -4.25439453125, -3.737548828125, -3.220703125, -2.703857421875, -2.18701171875, -1.670166015625, -1.1533203125, -0.636474609375, -0.11962890625, 0.397216796875, 0.9140625, 1.430908203125, 1.94775390625, 2.464599609375, 2.9814453125, 3.498291015625, 4.01513671875, 4.531982421875, 5.048828125, 5.565673828125, 6.08251953125, 6.599365234375, 7.1162109375, 7.633056640625, 8.14990234375, 8.666748046875, 9.18359375, 9.700439453125, 10.21728515625, 10.734130859375, 11.2509765625, 11.767822265625, 12.28466796875, 12.801513671875, 13.318359375, 13.835205078125, 14.35205078125, 14.868896484375, 15.3857421875, 15.902587890625, 16.41943359375, 16.936279296875, 17.453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 4.0, 11.0, 7.0, 12.0, 18.0, 40.0, 41.0, 84.0, 116.0, 170.0, 267.0, 324.0, 520.0, 893.0, 1306.0, 2196.0, 3571.0, 6102.0, 10688.0, 18711.0, 33906.0, 62001.0, 113203.0, 185699.0, 221708.0, 167098.0, 97600.0, 53340.0, 29117.0, 16156.0, 9513.0, 5461.0, 3228.0, 2027.0, 1176.0, 721.0, 502.0, 336.0, 201.0, 130.0, 104.0, 73.0, 46.0, 32.0, 22.0, 17.0, 13.0, 9.0, 5.0, 8.0, 8.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-5.28125, -5.11810302734375, -4.9549560546875, -4.79180908203125, -4.628662109375, -4.46551513671875, -4.3023681640625, -4.13922119140625, -3.97607421875, -3.81292724609375, -3.6497802734375, -3.48663330078125, -3.323486328125, -3.16033935546875, -2.9971923828125, -2.83404541015625, -2.6708984375, -2.50775146484375, -2.3446044921875, -2.18145751953125, -2.018310546875, -1.85516357421875, -1.6920166015625, -1.52886962890625, -1.36572265625, -1.20257568359375, -1.0394287109375, -0.87628173828125, -0.713134765625, -0.54998779296875, -0.3868408203125, -0.22369384765625, -0.060546875, 0.10260009765625, 0.2657470703125, 0.42889404296875, 0.592041015625, 0.75518798828125, 0.9183349609375, 1.08148193359375, 1.24462890625, 1.40777587890625, 1.5709228515625, 1.73406982421875, 1.897216796875, 2.06036376953125, 2.2235107421875, 2.38665771484375, 2.5498046875, 2.71295166015625, 2.8760986328125, 3.03924560546875, 3.202392578125, 3.36553955078125, 3.5286865234375, 3.69183349609375, 3.85498046875, 4.01812744140625, 4.1812744140625, 4.34442138671875, 4.507568359375, 4.67071533203125, 4.8338623046875, 4.99700927734375, 5.16015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 4.0, 12.0, 11.0, 18.0, 16.0, 28.0, 31.0, 45.0, 56.0, 63.0, 69.0, 67.0, 66.0, 77.0, 66.0, 72.0, 56.0, 47.0, 33.0, 36.0, 35.0, 14.0, 13.0, 11.0, 10.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000457763671875, -0.000441916286945343, -0.00042606890201568604, -0.00041022151708602905, -0.00039437413215637207, -0.0003785267472267151, -0.0003626793622970581, -0.0003468319773674011, -0.00033098459243774414, -0.00031513720750808716, -0.0002992898225784302, -0.0002834424376487732, -0.0002675950527191162, -0.00025174766778945923, -0.00023590028285980225, -0.00022005289793014526, -0.00020420551300048828, -0.0001883581280708313, -0.00017251074314117432, -0.00015666335821151733, -0.00014081597328186035, -0.00012496858835220337, -0.00010912120342254639, -9.32738184928894e-05, -7.742643356323242e-05, -6.157904863357544e-05, -4.573166370391846e-05, -2.9884278774261475e-05, -1.4036893844604492e-05, 1.8104910850524902e-06, 1.7657876014709473e-05, 3.3505260944366455e-05, 4.935264587402344e-05, 6.520003080368042e-05, 8.10474157333374e-05, 9.689480066299438e-05, 0.00011274218559265137, 0.00012858957052230835, 0.00014443695545196533, 0.00016028434038162231, 0.0001761317253112793, 0.00019197911024093628, 0.00020782649517059326, 0.00022367388010025024, 0.00023952126502990723, 0.0002553686499595642, 0.0002712160348892212, 0.0002870634198188782, 0.00030291080474853516, 0.00031875818967819214, 0.0003346055746078491, 0.0003504529595375061, 0.0003663003444671631, 0.00038214772939682007, 0.00039799511432647705, 0.00041384249925613403, 0.000429689884185791, 0.000445537269115448, 0.000461384654045105, 0.00047723203897476196, 0.0004930794239044189, 0.0005089268088340759, 0.0005247741937637329, 0.0005406215786933899, 0.0005564689636230469]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 8.0, 6.0, 19.0, 14.0, 23.0, 34.0, 59.0, 65.0, 128.0, 159.0, 271.0, 407.0, 554.0, 866.0, 1337.0, 1913.0, 3022.0, 4412.0, 6906.0, 10544.0, 16247.0, 25829.0, 40693.0, 63826.0, 97896.0, 133870.0, 157945.0, 148724.0, 114581.0, 78518.0, 50444.0, 31939.0, 20081.0, 12824.0, 8214.0, 5361.0, 3573.0, 2473.0, 1604.0, 1049.0, 677.0, 479.0, 321.0, 196.0, 155.0, 97.0, 70.0, 39.0, 30.0, 19.0, 6.0, 18.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.49609375, -4.34979248046875, -4.2034912109375, -4.05718994140625, -3.910888671875, -3.76458740234375, -3.6182861328125, -3.47198486328125, -3.32568359375, -3.17938232421875, -3.0330810546875, -2.88677978515625, -2.740478515625, -2.59417724609375, -2.4478759765625, -2.30157470703125, -2.1552734375, -2.00897216796875, -1.8626708984375, -1.71636962890625, -1.570068359375, -1.42376708984375, -1.2774658203125, -1.13116455078125, -0.98486328125, -0.83856201171875, -0.6922607421875, -0.54595947265625, -0.399658203125, -0.25335693359375, -0.1070556640625, 0.03924560546875, 0.185546875, 0.33184814453125, 0.4781494140625, 0.62445068359375, 0.770751953125, 0.91705322265625, 1.0633544921875, 1.20965576171875, 1.35595703125, 1.50225830078125, 1.6485595703125, 1.79486083984375, 1.941162109375, 2.08746337890625, 2.2337646484375, 2.38006591796875, 2.5263671875, 2.67266845703125, 2.8189697265625, 2.96527099609375, 3.111572265625, 3.25787353515625, 3.4041748046875, 3.55047607421875, 3.69677734375, 3.84307861328125, 3.9893798828125, 4.13568115234375, 4.281982421875, 4.42828369140625, 4.5745849609375, 4.72088623046875, 4.8671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 5.0, 7.0, 10.0, 11.0, 10.0, 36.0, 20.0, 25.0, 30.0, 34.0, 41.0, 43.0, 40.0, 58.0, 54.0, 54.0, 49.0, 42.0, 40.0, 49.0, 52.0, 48.0, 38.0, 25.0, 29.0, 25.0, 18.0, 16.0, 12.0, 11.0, 9.0, 11.0, 6.0, 3.0, 1.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6630859375, -1.6056060791015625, -1.548126220703125, -1.4906463623046875, -1.43316650390625, -1.3756866455078125, -1.318206787109375, -1.2607269287109375, -1.2032470703125, -1.1457672119140625, -1.088287353515625, -1.0308074951171875, -0.97332763671875, -0.9158477783203125, -0.858367919921875, -0.8008880615234375, -0.743408203125, -0.6859283447265625, -0.628448486328125, -0.5709686279296875, -0.51348876953125, -0.4560089111328125, -0.398529052734375, -0.3410491943359375, -0.2835693359375, -0.2260894775390625, -0.168609619140625, -0.1111297607421875, -0.05364990234375, 0.0038299560546875, 0.061309814453125, 0.1187896728515625, 0.17626953125, 0.2337493896484375, 0.291229248046875, 0.3487091064453125, 0.40618896484375, 0.4636688232421875, 0.521148681640625, 0.5786285400390625, 0.6361083984375, 0.6935882568359375, 0.751068115234375, 0.8085479736328125, 0.86602783203125, 0.9235076904296875, 0.980987548828125, 1.0384674072265625, 1.095947265625, 1.1534271240234375, 1.210906982421875, 1.2683868408203125, 1.32586669921875, 1.3833465576171875, 1.440826416015625, 1.4983062744140625, 1.5557861328125, 1.6132659912109375, 1.670745849609375, 1.7282257080078125, 1.78570556640625, 1.8431854248046875, 1.900665283203125, 1.9581451416015625, 2.015625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 9.0, 19.0, 19.0, 22.0, 20.0, 30.0, 23.0, 32.0, 32.0, 40.0, 38.0, 40.0, 49.0, 51.0, 57.0, 54.0, 44.0, 44.0, 42.0, 38.0, 31.0, 31.0, 25.0, 32.0, 26.0, 21.0, 20.0, 12.0, 11.0, 9.0, 15.0, 10.0, 6.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.013689041137695, -29.141399383544922, -28.269107818603516, -27.396818161010742, -26.52452850341797, -25.652236938476562, -24.77994728088379, -23.907657623291016, -23.03536605834961, -22.163076400756836, -21.29078483581543, -20.418495178222656, -19.546205520629883, -18.67391586303711, -17.801624298095703, -16.92933464050293, -16.057044982910156, -15.184754371643066, -14.312464714050293, -13.440174102783203, -12.56788444519043, -11.69559383392334, -10.82330322265625, -9.951013565063477, -9.078722953796387, -8.206432342529297, -7.334142684936523, -6.461852073669434, -5.589561939239502, -4.71727180480957, -3.8449811935424805, -2.972691059112549, -2.1003990173339844, -1.2281087636947632, -0.355818510055542, 0.5164718627929688, 1.3887619972229004, 2.261052131652832, 3.133342742919922, 4.0056328773498535, 4.877923011779785, 5.750213146209717, 6.622503280639648, 7.494793891906738, 8.367084503173828, 9.239374160766602, 10.111664772033691, 10.983955383300781, 11.856245040893555, 12.728535652160645, 13.600825309753418, 14.473115921020508, 15.345405578613281, 16.217697143554688, 17.08998680114746, 17.962276458740234, 18.83456802368164, 19.706857681274414, 20.57914924621582, 21.451438903808594, 22.323728561401367, 23.19601821899414, 24.068309783935547, 24.94059944152832, 25.812889099121094]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 3.0, 6.0, 3.0, 10.0, 11.0, 10.0, 11.0, 13.0, 17.0, 31.0, 21.0, 38.0, 32.0, 47.0, 25.0, 34.0, 28.0, 33.0, 38.0, 49.0, 48.0, 45.0, 35.0, 44.0, 38.0, 43.0, 33.0, 31.0, 30.0, 29.0, 26.0, 19.0, 17.0, 16.0, 17.0, 7.0, 17.0, 6.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.278066635131836, -22.437660217285156, -21.597253799438477, -20.756847381591797, -19.916440963745117, -19.076034545898438, -18.235626220703125, -17.395219802856445, -16.554813385009766, -15.714406967163086, -14.874000549316406, -14.033594131469727, -13.19318675994873, -12.35278034210205, -11.512373924255371, -10.671966552734375, -9.831561088562012, -8.991154670715332, -8.150748252868652, -7.3103413581848145, -6.469934463500977, -5.629528045654297, -4.789121627807617, -3.9487147331237793, -3.1083083152770996, -2.267901659011841, -1.4274951219558716, -0.5870885848999023, 0.25331807136535645, 1.0937247276306152, 1.934131145477295, 2.774538040161133, 3.6149444580078125, 4.455350875854492, 5.29575777053833, 6.13616418838501, 6.976571083068848, 7.816977500915527, 8.657383918762207, 9.497791290283203, 10.338197708129883, 11.178604125976562, 12.019010543823242, 12.859416961669922, 13.699824333190918, 14.540230751037598, 15.380637168884277, 16.221044540405273, 17.061450958251953, 17.901857376098633, 18.742263793945312, 19.582670211791992, 20.423076629638672, 21.263484954833984, 22.10388946533203, 22.944297790527344, 23.78470230102539, 24.62510871887207, 25.46551513671875, 26.30592155456543, 27.14632797241211, 27.986736297607422, 28.82714080810547, 29.66754913330078, 30.50795555114746]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 11.0, 11.0, 30.0, 31.0, 54.0, 96.0, 131.0, 187.0, 304.0, 373.0, 657.0, 974.0, 1557.0, 2340.0, 3601.0, 5438.0, 8408.0, 12676.0, 19349.0, 28793.0, 42207.0, 59779.0, 79755.0, 101794.0, 117758.0, 121747.0, 112708.0, 94085.0, 72122.0, 52359.0, 36484.0, 24562.0, 16584.0, 11009.0, 7029.0, 4757.0, 3057.0, 1962.0, 1248.0, 888.0, 529.0, 373.0, 248.0, 154.0, 112.0, 77.0, 43.0, 40.0, 19.0, 15.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-20.953125, -20.283935546875, -19.61474609375, -18.945556640625, -18.2763671875, -17.607177734375, -16.93798828125, -16.268798828125, -15.599609375, -14.930419921875, -14.26123046875, -13.592041015625, -12.9228515625, -12.253662109375, -11.58447265625, -10.915283203125, -10.24609375, -9.576904296875, -8.90771484375, -8.238525390625, -7.5693359375, -6.900146484375, -6.23095703125, -5.561767578125, -4.892578125, -4.223388671875, -3.55419921875, -2.885009765625, -2.2158203125, -1.546630859375, -0.87744140625, -0.208251953125, 0.4609375, 1.130126953125, 1.79931640625, 2.468505859375, 3.1376953125, 3.806884765625, 4.47607421875, 5.145263671875, 5.814453125, 6.483642578125, 7.15283203125, 7.822021484375, 8.4912109375, 9.160400390625, 9.82958984375, 10.498779296875, 11.16796875, 11.837158203125, 12.50634765625, 13.175537109375, 13.8447265625, 14.513916015625, 15.18310546875, 15.852294921875, 16.521484375, 17.190673828125, 17.85986328125, 18.529052734375, 19.1982421875, 19.867431640625, 20.53662109375, 21.205810546875, 21.875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 5.0, 11.0, 6.0, 10.0, 8.0, 11.0, 16.0, 17.0, 26.0, 21.0, 28.0, 31.0, 26.0, 33.0, 35.0, 42.0, 41.0, 35.0, 39.0, 38.0, 49.0, 41.0, 41.0, 33.0, 37.0, 40.0, 30.0, 29.0, 29.0, 17.0, 32.0, 17.0, 12.0, 9.0, 16.0, 10.0, 12.0, 17.0, 10.0, 5.0, 7.0, 8.0, 1.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-26.1875, -25.374755859375, -24.56201171875, -23.749267578125, -22.9365234375, -22.123779296875, -21.31103515625, -20.498291015625, -19.685546875, -18.872802734375, -18.06005859375, -17.247314453125, -16.4345703125, -15.621826171875, -14.80908203125, -13.996337890625, -13.18359375, -12.370849609375, -11.55810546875, -10.745361328125, -9.9326171875, -9.119873046875, -8.30712890625, -7.494384765625, -6.681640625, -5.868896484375, -5.05615234375, -4.243408203125, -3.4306640625, -2.617919921875, -1.80517578125, -0.992431640625, -0.1796875, 0.633056640625, 1.44580078125, 2.258544921875, 3.0712890625, 3.884033203125, 4.69677734375, 5.509521484375, 6.322265625, 7.135009765625, 7.94775390625, 8.760498046875, 9.5732421875, 10.385986328125, 11.19873046875, 12.011474609375, 12.82421875, 13.636962890625, 14.44970703125, 15.262451171875, 16.0751953125, 16.887939453125, 17.70068359375, 18.513427734375, 19.326171875, 20.138916015625, 20.95166015625, 21.764404296875, 22.5771484375, 23.389892578125, 24.20263671875, 25.015380859375, 25.828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 10.0, 7.0, 20.0, 19.0, 37.0, 60.0, 119.0, 180.0, 215.0, 388.0, 671.0, 969.0, 1573.0, 2496.0, 3890.0, 6256.0, 9886.0, 15187.0, 23635.0, 37028.0, 56061.0, 80285.0, 106592.0, 127898.0, 134330.0, 123014.0, 100213.0, 74044.0, 50768.0, 33265.0, 21724.0, 13704.0, 8779.0, 5474.0, 3575.0, 2191.0, 1454.0, 900.0, 623.0, 364.0, 228.0, 157.0, 104.0, 54.0, 38.0, 26.0, 24.0, 14.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.90625, -23.119384765625, -22.33251953125, -21.545654296875, -20.7587890625, -19.971923828125, -19.18505859375, -18.398193359375, -17.611328125, -16.824462890625, -16.03759765625, -15.250732421875, -14.4638671875, -13.677001953125, -12.89013671875, -12.103271484375, -11.31640625, -10.529541015625, -9.74267578125, -8.955810546875, -8.1689453125, -7.382080078125, -6.59521484375, -5.808349609375, -5.021484375, -4.234619140625, -3.44775390625, -2.660888671875, -1.8740234375, -1.087158203125, -0.30029296875, 0.486572265625, 1.2734375, 2.060302734375, 2.84716796875, 3.634033203125, 4.4208984375, 5.207763671875, 5.99462890625, 6.781494140625, 7.568359375, 8.355224609375, 9.14208984375, 9.928955078125, 10.7158203125, 11.502685546875, 12.28955078125, 13.076416015625, 13.86328125, 14.650146484375, 15.43701171875, 16.223876953125, 17.0107421875, 17.797607421875, 18.58447265625, 19.371337890625, 20.158203125, 20.945068359375, 21.73193359375, 22.518798828125, 23.3056640625, 24.092529296875, 24.87939453125, 25.666259765625, 26.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 9.0, 9.0, 13.0, 12.0, 13.0, 14.0, 17.0, 18.0, 19.0, 36.0, 26.0, 41.0, 26.0, 41.0, 36.0, 46.0, 38.0, 40.0, 43.0, 49.0, 37.0, 30.0, 43.0, 30.0, 28.0, 23.0, 42.0, 32.0, 34.0, 22.0, 17.0, 16.0, 12.0, 20.0, 4.0, 9.0, 4.0, 13.0, 13.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.90771484375, -15.3623046875, -14.81689453125, -14.271484375, -13.72607421875, -13.1806640625, -12.63525390625, -12.08984375, -11.54443359375, -10.9990234375, -10.45361328125, -9.908203125, -9.36279296875, -8.8173828125, -8.27197265625, -7.7265625, -7.18115234375, -6.6357421875, -6.09033203125, -5.544921875, -4.99951171875, -4.4541015625, -3.90869140625, -3.36328125, -2.81787109375, -2.2724609375, -1.72705078125, -1.181640625, -0.63623046875, -0.0908203125, 0.45458984375, 1.0, 1.54541015625, 2.0908203125, 2.63623046875, 3.181640625, 3.72705078125, 4.2724609375, 4.81787109375, 5.36328125, 5.90869140625, 6.4541015625, 6.99951171875, 7.544921875, 8.09033203125, 8.6357421875, 9.18115234375, 9.7265625, 10.27197265625, 10.8173828125, 11.36279296875, 11.908203125, 12.45361328125, 12.9990234375, 13.54443359375, 14.08984375, 14.63525390625, 15.1806640625, 15.72607421875, 16.271484375, 16.81689453125, 17.3623046875, 17.90771484375, 18.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 16.0, 18.0, 38.0, 58.0, 100.0, 137.0, 217.0, 328.0, 507.0, 779.0, 1182.0, 2007.0, 3199.0, 5327.0, 8828.0, 14994.0, 25055.0, 41885.0, 70284.0, 109687.0, 151469.0, 171555.0, 153119.0, 110887.0, 70846.0, 42945.0, 25304.0, 14851.0, 8771.0, 5312.0, 3378.0, 2009.0, 1227.0, 767.0, 538.0, 286.0, 210.0, 124.0, 87.0, 66.0, 45.0, 23.0, 23.0, 13.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1875, -10.8433837890625, -10.499267578125, -10.1551513671875, -9.81103515625, -9.4669189453125, -9.122802734375, -8.7786865234375, -8.4345703125, -8.0904541015625, -7.746337890625, -7.4022216796875, -7.05810546875, -6.7139892578125, -6.369873046875, -6.0257568359375, -5.681640625, -5.3375244140625, -4.993408203125, -4.6492919921875, -4.30517578125, -3.9610595703125, -3.616943359375, -3.2728271484375, -2.9287109375, -2.5845947265625, -2.240478515625, -1.8963623046875, -1.55224609375, -1.2081298828125, -0.864013671875, -0.5198974609375, -0.17578125, 0.1683349609375, 0.512451171875, 0.8565673828125, 1.20068359375, 1.5447998046875, 1.888916015625, 2.2330322265625, 2.5771484375, 2.9212646484375, 3.265380859375, 3.6094970703125, 3.95361328125, 4.2977294921875, 4.641845703125, 4.9859619140625, 5.330078125, 5.6741943359375, 6.018310546875, 6.3624267578125, 6.70654296875, 7.0506591796875, 7.394775390625, 7.7388916015625, 8.0830078125, 8.4271240234375, 8.771240234375, 9.1153564453125, 9.45947265625, 9.8035888671875, 10.147705078125, 10.4918212890625, 10.8359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 5.0, 5.0, 14.0, 13.0, 23.0, 22.0, 23.0, 30.0, 34.0, 48.0, 60.0, 65.0, 48.0, 73.0, 55.0, 64.0, 64.0, 54.0, 42.0, 36.0, 44.0, 26.0, 26.0, 18.0, 16.0, 21.0, 18.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001064300537109375, -0.0010243356227874756, -0.0009843707084655762, -0.0009444057941436768, -0.0009044408798217773, -0.0008644759654998779, -0.0008245110511779785, -0.0007845461368560791, -0.0007445812225341797, -0.0007046163082122803, -0.0006646513938903809, -0.0006246864795684814, -0.000584721565246582, -0.0005447566509246826, -0.0005047917366027832, -0.0004648268222808838, -0.0004248619079589844, -0.00038489699363708496, -0.00034493207931518555, -0.00030496716499328613, -0.0002650022506713867, -0.0002250373363494873, -0.0001850724220275879, -0.00014510750770568848, -0.00010514259338378906, -6.517767906188965e-05, -2.5212764739990234e-05, 1.475214958190918e-05, 5.4717063903808594e-05, 9.468197822570801e-05, 0.00013464689254760742, 0.00017461180686950684, 0.00021457672119140625, 0.00025454163551330566, 0.0002945065498352051, 0.0003344714641571045, 0.0003744363784790039, 0.0004144012928009033, 0.00045436620712280273, 0.0004943311214447021, 0.0005342960357666016, 0.000574260950088501, 0.0006142258644104004, 0.0006541907787322998, 0.0006941556930541992, 0.0007341206073760986, 0.000774085521697998, 0.0008140504360198975, 0.0008540153503417969, 0.0008939802646636963, 0.0009339451789855957, 0.0009739100933074951, 0.0010138750076293945, 0.001053839921951294, 0.0010938048362731934, 0.0011337697505950928, 0.0011737346649169922, 0.0012136995792388916, 0.001253664493560791, 0.0012936294078826904, 0.0013335943222045898, 0.0013735592365264893, 0.0014135241508483887, 0.001453489065170288, 0.0014934539794921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 10.0, 24.0, 21.0, 36.0, 63.0, 81.0, 121.0, 173.0, 226.0, 400.0, 659.0, 1014.0, 1749.0, 3068.0, 5397.0, 10431.0, 20843.0, 41291.0, 81940.0, 149284.0, 216478.0, 212306.0, 143379.0, 77883.0, 39633.0, 19395.0, 9813.0, 5416.0, 2999.0, 1604.0, 979.0, 631.0, 404.0, 257.0, 184.0, 100.0, 72.0, 59.0, 37.0, 24.0, 24.0, 11.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-16.78125, -16.30126953125, -15.8212890625, -15.34130859375, -14.861328125, -14.38134765625, -13.9013671875, -13.42138671875, -12.94140625, -12.46142578125, -11.9814453125, -11.50146484375, -11.021484375, -10.54150390625, -10.0615234375, -9.58154296875, -9.1015625, -8.62158203125, -8.1416015625, -7.66162109375, -7.181640625, -6.70166015625, -6.2216796875, -5.74169921875, -5.26171875, -4.78173828125, -4.3017578125, -3.82177734375, -3.341796875, -2.86181640625, -2.3818359375, -1.90185546875, -1.421875, -0.94189453125, -0.4619140625, 0.01806640625, 0.498046875, 0.97802734375, 1.4580078125, 1.93798828125, 2.41796875, 2.89794921875, 3.3779296875, 3.85791015625, 4.337890625, 4.81787109375, 5.2978515625, 5.77783203125, 6.2578125, 6.73779296875, 7.2177734375, 7.69775390625, 8.177734375, 8.65771484375, 9.1376953125, 9.61767578125, 10.09765625, 10.57763671875, 11.0576171875, 11.53759765625, 12.017578125, 12.49755859375, 12.9775390625, 13.45751953125, 13.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 3.0, 13.0, 11.0, 13.0, 20.0, 22.0, 26.0, 38.0, 38.0, 58.0, 68.0, 58.0, 55.0, 62.0, 76.0, 73.0, 63.0, 61.0, 53.0, 36.0, 38.0, 20.0, 24.0, 13.0, 13.0, 11.0, 11.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4324951171875, -4.267333984375, -4.1021728515625, -3.93701171875, -3.7718505859375, -3.606689453125, -3.4415283203125, -3.2763671875, -3.1112060546875, -2.946044921875, -2.7808837890625, -2.61572265625, -2.4505615234375, -2.285400390625, -2.1202392578125, -1.955078125, -1.7899169921875, -1.624755859375, -1.4595947265625, -1.29443359375, -1.1292724609375, -0.964111328125, -0.7989501953125, -0.6337890625, -0.4686279296875, -0.303466796875, -0.1383056640625, 0.02685546875, 0.1920166015625, 0.357177734375, 0.5223388671875, 0.6875, 0.8526611328125, 1.017822265625, 1.1829833984375, 1.34814453125, 1.5133056640625, 1.678466796875, 1.8436279296875, 2.0087890625, 2.1739501953125, 2.339111328125, 2.5042724609375, 2.66943359375, 2.8345947265625, 2.999755859375, 3.1649169921875, 3.330078125, 3.4952392578125, 3.660400390625, 3.8255615234375, 3.99072265625, 4.1558837890625, 4.321044921875, 4.4862060546875, 4.6513671875, 4.8165283203125, 4.981689453125, 5.1468505859375, 5.31201171875, 5.4771728515625, 5.642333984375, 5.8074951171875, 5.97265625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 7.0, 15.0, 12.0, 10.0, 15.0, 15.0, 14.0, 20.0, 15.0, 31.0, 27.0, 27.0, 29.0, 33.0, 32.0, 56.0, 46.0, 52.0, 52.0, 46.0, 45.0, 54.0, 35.0, 31.0, 21.0, 35.0, 41.0, 30.0, 27.0, 22.0, 26.0, 11.0, 8.0, 14.0, 7.0, 2.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-28.05633544921875, -27.192575454711914, -26.328815460205078, -25.465055465698242, -24.601295471191406, -23.73753547668457, -22.873775482177734, -22.0100154876709, -21.146255493164062, -20.282495498657227, -19.41873550415039, -18.554975509643555, -17.69121551513672, -16.827455520629883, -15.963695526123047, -15.099935531616211, -14.236175537109375, -13.372415542602539, -12.508655548095703, -11.644895553588867, -10.781135559082031, -9.917375564575195, -9.05361557006836, -8.189855575561523, -7.3260955810546875, -6.462335586547852, -5.598575592041016, -4.73481559753418, -3.8710556030273438, -3.007295608520508, -2.143535614013672, -1.279775619506836, -0.416015625, 0.44774436950683594, 1.3115043640136719, 2.175264358520508, 3.0390243530273438, 3.9027843475341797, 4.766544342041016, 5.630304336547852, 6.4940643310546875, 7.357824325561523, 8.22158432006836, 9.085344314575195, 9.949104309082031, 10.812864303588867, 11.676624298095703, 12.540384292602539, 13.404144287109375, 14.267904281616211, 15.131664276123047, 15.995424270629883, 16.85918426513672, 17.722944259643555, 18.58670425415039, 19.450464248657227, 20.314224243164062, 21.1779842376709, 22.041744232177734, 22.90550422668457, 23.769264221191406, 24.633024215698242, 25.496784210205078, 26.360544204711914, 27.22430419921875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 5.0, 8.0, 10.0, 9.0, 12.0, 19.0, 16.0, 28.0, 32.0, 29.0, 31.0, 24.0, 37.0, 32.0, 38.0, 31.0, 46.0, 39.0, 57.0, 25.0, 28.0, 48.0, 43.0, 22.0, 39.0, 32.0, 30.0, 30.0, 20.0, 18.0, 18.0, 17.0, 24.0, 22.0, 6.0, 10.0, 9.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.508243560791016, -22.67460060119629, -21.84095573425293, -21.007312774658203, -20.173667907714844, -19.340024948120117, -18.50638198852539, -17.67273712158203, -16.839092254638672, -16.005449295043945, -15.171804428100586, -14.33816146850586, -13.5045166015625, -12.670873641967773, -11.83722972869873, -11.003585815429688, -10.169942855834961, -9.336298942565918, -8.502655029296875, -7.66901159286499, -6.835367679595947, -6.001723766326904, -5.1680803298950195, -4.334436416625977, -3.5007925033569336, -2.6671485900878906, -1.8335049152374268, -0.9998612403869629, -0.16621732711791992, 0.667426586151123, 1.5010700225830078, 2.334713935852051, 3.1683578491210938, 4.002001762390137, 4.83564567565918, 5.6692891120910645, 6.502933025360107, 7.33657693862915, 8.170220375061035, 9.003864288330078, 9.837508201599121, 10.671152114868164, 11.504796028137207, 12.33843994140625, 13.172082901000977, 14.005727767944336, 14.839370727539062, 15.673014640808105, 16.50665855407715, 17.340301513671875, 18.173946380615234, 19.00758934020996, 19.84123420715332, 20.674877166748047, 21.508522033691406, 22.342164993286133, 23.17580795288086, 24.009450912475586, 24.843095779418945, 25.676738739013672, 26.51038360595703, 27.344026565551758, 28.177669525146484, 29.011314392089844, 29.844959259033203]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 11.0, 6.0, 28.0, 25.0, 30.0, 47.0, 89.0, 124.0, 175.0, 258.0, 439.0, 701.0, 1063.0, 1808.0, 2848.0, 4463.0, 7490.0, 12447.0, 21131.0, 36270.0, 63995.0, 117180.0, 218846.0, 409481.0, 690896.0, 873440.0, 737718.0, 453561.0, 243820.0, 129071.0, 70805.0, 39356.0, 22495.0, 13257.0, 8118.0, 4877.0, 2984.0, 1783.0, 1213.0, 711.0, 461.0, 293.0, 192.0, 95.0, 76.0, 45.0, 27.0, 18.0, 5.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.6513671875, -31.583984375, -30.5166015625, -29.44921875, -28.3818359375, -27.314453125, -26.2470703125, -25.1796875, -24.1123046875, -23.044921875, -21.9775390625, -20.91015625, -19.8427734375, -18.775390625, -17.7080078125, -16.640625, -15.5732421875, -14.505859375, -13.4384765625, -12.37109375, -11.3037109375, -10.236328125, -9.1689453125, -8.1015625, -7.0341796875, -5.966796875, -4.8994140625, -3.83203125, -2.7646484375, -1.697265625, -0.6298828125, 0.4375, 1.5048828125, 2.572265625, 3.6396484375, 4.70703125, 5.7744140625, 6.841796875, 7.9091796875, 8.9765625, 10.0439453125, 11.111328125, 12.1787109375, 13.24609375, 14.3134765625, 15.380859375, 16.4482421875, 17.515625, 18.5830078125, 19.650390625, 20.7177734375, 21.78515625, 22.8525390625, 23.919921875, 24.9873046875, 26.0546875, 27.1220703125, 28.189453125, 29.2568359375, 30.32421875, 31.3916015625, 32.458984375, 33.5263671875, 34.59375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 11.0, 6.0, 13.0, 12.0, 11.0, 15.0, 26.0, 18.0, 25.0, 28.0, 25.0, 27.0, 25.0, 29.0, 44.0, 26.0, 55.0, 33.0, 36.0, 36.0, 39.0, 35.0, 31.0, 38.0, 39.0, 40.0, 29.0, 24.0, 26.0, 30.0, 24.0, 13.0, 23.0, 15.0, 8.0, 17.0, 8.0, 14.0, 3.0, 4.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-20.765625, -20.0712890625, -19.376953125, -18.6826171875, -17.98828125, -17.2939453125, -16.599609375, -15.9052734375, -15.2109375, -14.5166015625, -13.822265625, -13.1279296875, -12.43359375, -11.7392578125, -11.044921875, -10.3505859375, -9.65625, -8.9619140625, -8.267578125, -7.5732421875, -6.87890625, -6.1845703125, -5.490234375, -4.7958984375, -4.1015625, -3.4072265625, -2.712890625, -2.0185546875, -1.32421875, -0.6298828125, 0.064453125, 0.7587890625, 1.453125, 2.1474609375, 2.841796875, 3.5361328125, 4.23046875, 4.9248046875, 5.619140625, 6.3134765625, 7.0078125, 7.7021484375, 8.396484375, 9.0908203125, 9.78515625, 10.4794921875, 11.173828125, 11.8681640625, 12.5625, 13.2568359375, 13.951171875, 14.6455078125, 15.33984375, 16.0341796875, 16.728515625, 17.4228515625, 18.1171875, 18.8115234375, 19.505859375, 20.2001953125, 20.89453125, 21.5888671875, 22.283203125, 22.9775390625, 23.671875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 14.0, 16.0, 26.0, 45.0, 85.0, 112.0, 155.0, 287.0, 381.0, 587.0, 810.0, 1321.0, 2055.0, 3351.0, 5532.0, 8945.0, 14398.0, 24690.0, 42834.0, 74499.0, 131410.0, 229468.0, 392967.0, 611923.0, 769843.0, 701108.0, 486135.0, 293294.0, 169287.0, 95570.0, 53972.0, 31570.0, 18558.0, 11072.0, 6691.0, 4102.0, 2618.0, 1624.0, 1034.0, 640.0, 443.0, 260.0, 169.0, 126.0, 82.0, 50.0, 36.0, 28.0, 22.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0], "bins": [-37.65625, -36.53955078125, -35.4228515625, -34.30615234375, -33.189453125, -32.07275390625, -30.9560546875, -29.83935546875, -28.72265625, -27.60595703125, -26.4892578125, -25.37255859375, -24.255859375, -23.13916015625, -22.0224609375, -20.90576171875, -19.7890625, -18.67236328125, -17.5556640625, -16.43896484375, -15.322265625, -14.20556640625, -13.0888671875, -11.97216796875, -10.85546875, -9.73876953125, -8.6220703125, -7.50537109375, -6.388671875, -5.27197265625, -4.1552734375, -3.03857421875, -1.921875, -0.80517578125, 0.3115234375, 1.42822265625, 2.544921875, 3.66162109375, 4.7783203125, 5.89501953125, 7.01171875, 8.12841796875, 9.2451171875, 10.36181640625, 11.478515625, 12.59521484375, 13.7119140625, 14.82861328125, 15.9453125, 17.06201171875, 18.1787109375, 19.29541015625, 20.412109375, 21.52880859375, 22.6455078125, 23.76220703125, 24.87890625, 25.99560546875, 27.1123046875, 28.22900390625, 29.345703125, 30.46240234375, 31.5791015625, 32.69580078125, 33.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 8.0, 10.0, 8.0, 19.0, 27.0, 28.0, 35.0, 59.0, 60.0, 83.0, 131.0, 111.0, 167.0, 157.0, 191.0, 223.0, 247.0, 252.0, 268.0, 262.0, 264.0, 220.0, 193.0, 180.0, 190.0, 117.0, 116.0, 103.0, 63.0, 58.0, 46.0, 42.0, 33.0, 15.0, 27.0, 19.0, 10.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9375, -12.489013671875, -12.04052734375, -11.592041015625, -11.1435546875, -10.695068359375, -10.24658203125, -9.798095703125, -9.349609375, -8.901123046875, -8.45263671875, -8.004150390625, -7.5556640625, -7.107177734375, -6.65869140625, -6.210205078125, -5.76171875, -5.313232421875, -4.86474609375, -4.416259765625, -3.9677734375, -3.519287109375, -3.07080078125, -2.622314453125, -2.173828125, -1.725341796875, -1.27685546875, -0.828369140625, -0.3798828125, 0.068603515625, 0.51708984375, 0.965576171875, 1.4140625, 1.862548828125, 2.31103515625, 2.759521484375, 3.2080078125, 3.656494140625, 4.10498046875, 4.553466796875, 5.001953125, 5.450439453125, 5.89892578125, 6.347412109375, 6.7958984375, 7.244384765625, 7.69287109375, 8.141357421875, 8.58984375, 9.038330078125, 9.48681640625, 9.935302734375, 10.3837890625, 10.832275390625, 11.28076171875, 11.729248046875, 12.177734375, 12.626220703125, 13.07470703125, 13.523193359375, 13.9716796875, 14.420166015625, 14.86865234375, 15.317138671875, 15.765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 4.0, 8.0, 9.0, 11.0, 20.0, 19.0, 17.0, 21.0, 32.0, 38.0, 33.0, 45.0, 52.0, 52.0, 53.0, 53.0, 46.0, 60.0, 63.0, 61.0, 44.0, 35.0, 37.0, 28.0, 28.0, 26.0, 18.0, 21.0, 9.0, 13.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28080177307129, -30.171932220458984, -29.063060760498047, -27.95418930053711, -26.845319747924805, -25.7364501953125, -24.627578735351562, -23.518707275390625, -22.40983772277832, -21.300968170166016, -20.192096710205078, -19.08322525024414, -17.974355697631836, -16.86548614501953, -15.756614685058594, -14.647744178771973, -13.538873672485352, -12.43000316619873, -11.32113265991211, -10.212262153625488, -9.103391647338867, -7.994521141052246, -6.885650634765625, -5.776780128479004, -4.667909622192383, -3.5590391159057617, -2.4501686096191406, -1.3412981033325195, -0.23242759704589844, 0.8764429092407227, 1.9853134155273438, 3.094183921813965, 4.203052520751953, 5.311923027038574, 6.420793533325195, 7.529664039611816, 8.638534545898438, 9.747405052185059, 10.85627555847168, 11.9651460647583, 13.074016571044922, 14.182887077331543, 15.291757583618164, 16.40062713623047, 17.509498596191406, 18.618370056152344, 19.72723960876465, 20.836109161376953, 21.94498062133789, 23.053852081298828, 24.162721633911133, 25.271591186523438, 26.380462646484375, 27.489334106445312, 28.598203659057617, 29.707073211669922, 30.81594467163086, 31.924816131591797, 33.03368377685547, 34.142555236816406, 35.251426696777344, 36.36029815673828, 37.46916961669922, 38.57803726196289, 39.68690872192383]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 10.0, 11.0, 9.0, 15.0, 14.0, 17.0, 14.0, 20.0, 22.0, 29.0, 34.0, 41.0, 24.0, 30.0, 37.0, 40.0, 44.0, 40.0, 43.0, 42.0, 40.0, 32.0, 42.0, 34.0, 36.0, 23.0, 27.0, 27.0, 26.0, 19.0, 20.0, 20.0, 15.0, 19.0, 14.0, 12.0, 10.0, 7.0, 5.0, 7.0, 3.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.141315460205078, -23.274580001831055, -22.4078426361084, -21.541107177734375, -20.67436981201172, -19.807634353637695, -18.940898895263672, -18.074161529541016, -17.207426071166992, -16.34069061279297, -15.473953247070312, -14.607217788696289, -13.74048137664795, -12.87374496459961, -12.007009506225586, -11.140273094177246, -10.273536682128906, -9.406800270080566, -8.540063858032227, -7.673328399658203, -6.806591987609863, -5.939855575561523, -5.073119640350342, -4.20638370513916, -3.3396472930908203, -2.4729111194610596, -1.6061749458312988, -0.7394387722015381, 0.12729740142822266, 0.9940338134765625, 1.8607697486877441, 2.727505683898926, 3.5942440032958984, 4.460980415344238, 5.32771635055542, 6.194452285766602, 7.061188697814941, 7.927925109863281, 8.794660568237305, 9.661396980285645, 10.528133392333984, 11.394869804382324, 12.261606216430664, 13.128341674804688, 13.995078086853027, 14.861814498901367, 15.72854995727539, 16.595287322998047, 17.46202278137207, 18.328758239746094, 19.19549560546875, 20.062231063842773, 20.928966522216797, 21.795703887939453, 22.662439346313477, 23.5291748046875, 24.395912170410156, 25.26264762878418, 26.129384994506836, 26.99612045288086, 27.862857818603516, 28.72959327697754, 29.596328735351562, 30.46306610107422, 31.329801559448242]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 10.0, 6.0, 14.0, 17.0, 32.0, 61.0, 99.0, 143.0, 251.0, 397.0, 616.0, 1010.0, 1519.0, 2480.0, 4005.0, 6454.0, 10236.0, 16321.0, 26168.0, 40478.0, 62945.0, 93117.0, 127314.0, 149838.0, 146896.0, 118220.0, 84724.0, 56357.0, 36307.0, 23522.0, 14625.0, 9029.0, 5785.0, 3569.0, 2211.0, 1434.0, 875.0, 557.0, 314.0, 210.0, 134.0, 100.0, 54.0, 32.0, 23.0, 15.0, 14.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-13.265625, -12.88525390625, -12.5048828125, -12.12451171875, -11.744140625, -11.36376953125, -10.9833984375, -10.60302734375, -10.22265625, -9.84228515625, -9.4619140625, -9.08154296875, -8.701171875, -8.32080078125, -7.9404296875, -7.56005859375, -7.1796875, -6.79931640625, -6.4189453125, -6.03857421875, -5.658203125, -5.27783203125, -4.8974609375, -4.51708984375, -4.13671875, -3.75634765625, -3.3759765625, -2.99560546875, -2.615234375, -2.23486328125, -1.8544921875, -1.47412109375, -1.09375, -0.71337890625, -0.3330078125, 0.04736328125, 0.427734375, 0.80810546875, 1.1884765625, 1.56884765625, 1.94921875, 2.32958984375, 2.7099609375, 3.09033203125, 3.470703125, 3.85107421875, 4.2314453125, 4.61181640625, 4.9921875, 5.37255859375, 5.7529296875, 6.13330078125, 6.513671875, 6.89404296875, 7.2744140625, 7.65478515625, 8.03515625, 8.41552734375, 8.7958984375, 9.17626953125, 9.556640625, 9.93701171875, 10.3173828125, 10.69775390625, 11.078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 6.0, 8.0, 14.0, 15.0, 20.0, 14.0, 17.0, 23.0, 16.0, 19.0, 32.0, 33.0, 38.0, 29.0, 31.0, 36.0, 50.0, 44.0, 53.0, 42.0, 46.0, 42.0, 37.0, 32.0, 26.0, 22.0, 34.0, 25.0, 32.0, 31.0, 11.0, 20.0, 19.0, 14.0, 6.0, 14.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.03125, -28.0986328125, -27.166015625, -26.2333984375, -25.30078125, -24.3681640625, -23.435546875, -22.5029296875, -21.5703125, -20.6376953125, -19.705078125, -18.7724609375, -17.83984375, -16.9072265625, -15.974609375, -15.0419921875, -14.109375, -13.1767578125, -12.244140625, -11.3115234375, -10.37890625, -9.4462890625, -8.513671875, -7.5810546875, -6.6484375, -5.7158203125, -4.783203125, -3.8505859375, -2.91796875, -1.9853515625, -1.052734375, -0.1201171875, 0.8125, 1.7451171875, 2.677734375, 3.6103515625, 4.54296875, 5.4755859375, 6.408203125, 7.3408203125, 8.2734375, 9.2060546875, 10.138671875, 11.0712890625, 12.00390625, 12.9365234375, 13.869140625, 14.8017578125, 15.734375, 16.6669921875, 17.599609375, 18.5322265625, 19.46484375, 20.3974609375, 21.330078125, 22.2626953125, 23.1953125, 24.1279296875, 25.060546875, 25.9931640625, 26.92578125, 27.8583984375, 28.791015625, 29.7236328125, 30.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 2.0, 5.0, 16.0, 29.0, 27.0, 59.0, 85.0, 121.0, 193.0, 338.0, 506.0, 821.0, 1347.0, 2411.0, 4081.0, 7361.0, 13245.0, 23959.0, 43790.0, 79309.0, 137206.0, 199946.0, 202919.0, 142915.0, 84028.0, 46146.0, 25478.0, 14027.0, 7680.0, 4234.0, 2529.0, 1480.0, 869.0, 535.0, 315.0, 182.0, 125.0, 77.0, 53.0, 29.0, 26.0, 13.0, 18.0, 10.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.319091796875, -18.71630859375, -18.113525390625, -17.5107421875, -16.907958984375, -16.30517578125, -15.702392578125, -15.099609375, -14.496826171875, -13.89404296875, -13.291259765625, -12.6884765625, -12.085693359375, -11.48291015625, -10.880126953125, -10.27734375, -9.674560546875, -9.07177734375, -8.468994140625, -7.8662109375, -7.263427734375, -6.66064453125, -6.057861328125, -5.455078125, -4.852294921875, -4.24951171875, -3.646728515625, -3.0439453125, -2.441162109375, -1.83837890625, -1.235595703125, -0.6328125, -0.030029296875, 0.57275390625, 1.175537109375, 1.7783203125, 2.381103515625, 2.98388671875, 3.586669921875, 4.189453125, 4.792236328125, 5.39501953125, 5.997802734375, 6.6005859375, 7.203369140625, 7.80615234375, 8.408935546875, 9.01171875, 9.614501953125, 10.21728515625, 10.820068359375, 11.4228515625, 12.025634765625, 12.62841796875, 13.231201171875, 13.833984375, 14.436767578125, 15.03955078125, 15.642333984375, 16.2451171875, 16.847900390625, 17.45068359375, 18.053466796875, 18.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 8.0, 11.0, 14.0, 17.0, 24.0, 28.0, 28.0, 36.0, 27.0, 43.0, 37.0, 29.0, 48.0, 48.0, 52.0, 52.0, 42.0, 42.0, 45.0, 38.0, 33.0, 28.0, 31.0, 31.0, 34.0, 22.0, 21.0, 20.0, 8.0, 20.0, 13.0, 6.0, 5.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -20.039306640625, -19.40673828125, -18.774169921875, -18.1416015625, -17.509033203125, -16.87646484375, -16.243896484375, -15.611328125, -14.978759765625, -14.34619140625, -13.713623046875, -13.0810546875, -12.448486328125, -11.81591796875, -11.183349609375, -10.55078125, -9.918212890625, -9.28564453125, -8.653076171875, -8.0205078125, -7.387939453125, -6.75537109375, -6.122802734375, -5.490234375, -4.857666015625, -4.22509765625, -3.592529296875, -2.9599609375, -2.327392578125, -1.69482421875, -1.062255859375, -0.4296875, 0.202880859375, 0.83544921875, 1.468017578125, 2.1005859375, 2.733154296875, 3.36572265625, 3.998291015625, 4.630859375, 5.263427734375, 5.89599609375, 6.528564453125, 7.1611328125, 7.793701171875, 8.42626953125, 9.058837890625, 9.69140625, 10.323974609375, 10.95654296875, 11.589111328125, 12.2216796875, 12.854248046875, 13.48681640625, 14.119384765625, 14.751953125, 15.384521484375, 16.01708984375, 16.649658203125, 17.2822265625, 17.914794921875, 18.54736328125, 19.179931640625, 19.8125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 12.0, 19.0, 30.0, 32.0, 53.0, 88.0, 136.0, 196.0, 301.0, 485.0, 763.0, 1116.0, 1781.0, 3004.0, 5258.0, 9735.0, 18323.0, 36722.0, 74546.0, 146512.0, 237381.0, 230927.0, 138135.0, 69470.0, 34235.0, 17292.0, 9153.0, 4993.0, 2883.0, 1824.0, 1089.0, 706.0, 460.0, 287.0, 199.0, 118.0, 77.0, 58.0, 46.0, 31.0, 21.0, 11.0, 6.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8795166015625, -5.669189453125, -5.4588623046875, -5.24853515625, -5.0382080078125, -4.827880859375, -4.6175537109375, -4.4072265625, -4.1968994140625, -3.986572265625, -3.7762451171875, -3.56591796875, -3.3555908203125, -3.145263671875, -2.9349365234375, -2.724609375, -2.5142822265625, -2.303955078125, -2.0936279296875, -1.88330078125, -1.6729736328125, -1.462646484375, -1.2523193359375, -1.0419921875, -0.8316650390625, -0.621337890625, -0.4110107421875, -0.20068359375, 0.0096435546875, 0.219970703125, 0.4302978515625, 0.640625, 0.8509521484375, 1.061279296875, 1.2716064453125, 1.48193359375, 1.6922607421875, 1.902587890625, 2.1129150390625, 2.3232421875, 2.5335693359375, 2.743896484375, 2.9542236328125, 3.16455078125, 3.3748779296875, 3.585205078125, 3.7955322265625, 4.005859375, 4.2161865234375, 4.426513671875, 4.6368408203125, 4.84716796875, 5.0574951171875, 5.267822265625, 5.4781494140625, 5.6884765625, 5.8988037109375, 6.109130859375, 6.3194580078125, 6.52978515625, 6.7401123046875, 6.950439453125, 7.1607666015625, 7.37109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 12.0, 13.0, 22.0, 25.0, 30.0, 49.0, 42.0, 52.0, 56.0, 68.0, 76.0, 70.0, 71.0, 57.0, 57.0, 73.0, 42.0, 34.0, 34.0, 25.0, 20.0, 14.0, 8.0, 10.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003371909260749817, -0.0003200918436050415, -0.0003029927611351013, -0.00028589367866516113, -0.00026879459619522095, -0.00025169551372528076, -0.00023459643125534058, -0.0002174973487854004, -0.0002003982663154602, -0.00018329918384552002, -0.00016620010137557983, -0.00014910101890563965, -0.00013200193643569946, -0.00011490285396575928, -9.780377149581909e-05, -8.07046890258789e-05, -6.360560655593872e-05, -4.6506524085998535e-05, -2.940744161605835e-05, -1.2308359146118164e-05, 4.7907233238220215e-06, 2.1889805793762207e-05, 3.898888826370239e-05, 5.608797073364258e-05, 7.318705320358276e-05, 9.028613567352295e-05, 0.00010738521814346313, 0.00012448430061340332, 0.0001415833830833435, 0.0001586824655532837, 0.00017578154802322388, 0.00019288063049316406, 0.00020997971296310425, 0.00022707879543304443, 0.0002441778779029846, 0.0002612769603729248, 0.000278376042842865, 0.0002954751253128052, 0.00031257420778274536, 0.00032967329025268555, 0.00034677237272262573, 0.0003638714551925659, 0.0003809705376625061, 0.0003980696201324463, 0.0004151687026023865, 0.00043226778507232666, 0.00044936686754226685, 0.00046646595001220703, 0.0004835650324821472, 0.0005006641149520874, 0.0005177631974220276, 0.0005348622798919678, 0.000551961362361908, 0.0005690604448318481, 0.0005861595273017883, 0.0006032586097717285, 0.0006203576922416687, 0.0006374567747116089, 0.0006545558571815491, 0.0006716549396514893, 0.0006887540221214294, 0.0007058531045913696, 0.0007229521870613098, 0.00074005126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 5.0, 7.0, 13.0, 12.0, 23.0, 54.0, 72.0, 90.0, 151.0, 234.0, 349.0, 581.0, 966.0, 1426.0, 2559.0, 4383.0, 7695.0, 13723.0, 25453.0, 48065.0, 91723.0, 159932.0, 219959.0, 198534.0, 125128.0, 67763.0, 35777.0, 19133.0, 10463.0, 5755.0, 3326.0, 1954.0, 1220.0, 763.0, 442.0, 300.0, 159.0, 132.0, 75.0, 44.0, 34.0, 25.0, 17.0, 13.0, 11.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.1953125, -6.96142578125, -6.7275390625, -6.49365234375, -6.259765625, -6.02587890625, -5.7919921875, -5.55810546875, -5.32421875, -5.09033203125, -4.8564453125, -4.62255859375, -4.388671875, -4.15478515625, -3.9208984375, -3.68701171875, -3.453125, -3.21923828125, -2.9853515625, -2.75146484375, -2.517578125, -2.28369140625, -2.0498046875, -1.81591796875, -1.58203125, -1.34814453125, -1.1142578125, -0.88037109375, -0.646484375, -0.41259765625, -0.1787109375, 0.05517578125, 0.2890625, 0.52294921875, 0.7568359375, 0.99072265625, 1.224609375, 1.45849609375, 1.6923828125, 1.92626953125, 2.16015625, 2.39404296875, 2.6279296875, 2.86181640625, 3.095703125, 3.32958984375, 3.5634765625, 3.79736328125, 4.03125, 4.26513671875, 4.4990234375, 4.73291015625, 4.966796875, 5.20068359375, 5.4345703125, 5.66845703125, 5.90234375, 6.13623046875, 6.3701171875, 6.60400390625, 6.837890625, 7.07177734375, 7.3056640625, 7.53955078125, 7.7734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 7.0, 8.0, 16.0, 18.0, 21.0, 27.0, 20.0, 32.0, 27.0, 45.0, 51.0, 61.0, 57.0, 52.0, 64.0, 71.0, 65.0, 61.0, 51.0, 42.0, 34.0, 28.0, 25.0, 23.0, 27.0, 4.0, 7.0, 8.0, 4.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.938934326171875, -1.86614990234375, -1.793365478515625, -1.7205810546875, -1.647796630859375, -1.57501220703125, -1.502227783203125, -1.429443359375, -1.356658935546875, -1.28387451171875, -1.211090087890625, -1.1383056640625, -1.065521240234375, -0.99273681640625, -0.919952392578125, -0.84716796875, -0.774383544921875, -0.70159912109375, -0.628814697265625, -0.5560302734375, -0.483245849609375, -0.41046142578125, -0.337677001953125, -0.264892578125, -0.192108154296875, -0.11932373046875, -0.046539306640625, 0.0262451171875, 0.099029541015625, 0.17181396484375, 0.244598388671875, 0.3173828125, 0.390167236328125, 0.46295166015625, 0.535736083984375, 0.6085205078125, 0.681304931640625, 0.75408935546875, 0.826873779296875, 0.899658203125, 0.972442626953125, 1.04522705078125, 1.118011474609375, 1.1907958984375, 1.263580322265625, 1.33636474609375, 1.409149169921875, 1.48193359375, 1.554718017578125, 1.62750244140625, 1.700286865234375, 1.7730712890625, 1.845855712890625, 1.91864013671875, 1.991424560546875, 2.064208984375, 2.136993408203125, 2.20977783203125, 2.282562255859375, 2.3553466796875, 2.428131103515625, 2.50091552734375, 2.573699951171875, 2.646484375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 9.0, 9.0, 7.0, 9.0, 16.0, 18.0, 21.0, 25.0, 28.0, 34.0, 32.0, 43.0, 50.0, 50.0, 53.0, 42.0, 51.0, 51.0, 61.0, 56.0, 45.0, 54.0, 39.0, 22.0, 30.0, 23.0, 18.0, 27.0, 14.0, 15.0, 9.0, 4.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.657066345214844, -29.584033966064453, -28.51099967956543, -27.43796730041504, -26.364933013916016, -25.291900634765625, -24.218868255615234, -23.145835876464844, -22.07280158996582, -20.99976921081543, -19.926734924316406, -18.853702545166016, -17.780670166015625, -16.7076358795166, -15.634603500366211, -14.561570167541504, -13.488536834716797, -12.41550350189209, -11.342470169067383, -10.269437789916992, -9.196404457092285, -8.123371124267578, -7.050338268280029, -5.9773054122924805, -4.904272079467773, -3.8312389850616455, -2.7582058906555176, -1.6851727962493896, -0.6121397018432617, 0.4608936309814453, 1.5339264869689941, 2.606959342956543, 3.67999267578125, 4.753026008605957, 5.826058864593506, 6.899091720581055, 7.972125053405762, 9.045158386230469, 10.11819076538086, 11.191224098205566, 12.264257431030273, 13.33729076385498, 14.410324096679688, 15.483356475830078, 16.55638885498047, 17.629423141479492, 18.702455520629883, 19.775489807128906, 20.848522186279297, 21.921554565429688, 22.99458885192871, 24.0676212310791, 25.140655517578125, 26.213687896728516, 27.286720275878906, 28.359752655029297, 29.43278694152832, 30.50581932067871, 31.578853607177734, 32.651885986328125, 33.724918365478516, 34.797950744628906, 35.87098693847656, 36.94401931762695, 38.017051696777344]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 15.0, 7.0, 16.0, 19.0, 11.0, 15.0, 22.0, 26.0, 23.0, 41.0, 33.0, 28.0, 22.0, 47.0, 42.0, 42.0, 39.0, 46.0, 32.0, 46.0, 34.0, 37.0, 36.0, 35.0, 18.0, 32.0, 28.0, 26.0, 18.0, 15.0, 27.0, 18.0, 16.0, 14.0, 14.0, 5.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.079010009765625, -23.21695899963379, -22.354907989501953, -21.492855072021484, -20.63080406188965, -19.768753051757812, -18.906700134277344, -18.044649124145508, -17.182598114013672, -16.320547103881836, -15.458495140075684, -14.596443176269531, -13.734392166137695, -12.87234115600586, -12.010289192199707, -11.148237228393555, -10.286186218261719, -9.424135208129883, -8.56208324432373, -7.700031757354736, -6.837980270385742, -5.975928783416748, -5.113877296447754, -4.25182580947876, -3.3897743225097656, -2.5277228355407715, -1.6656713485717773, -0.8036198616027832, 0.05843162536621094, 0.9204831123352051, 1.7825345993041992, 2.6445860862731934, 3.5066356658935547, 4.368687152862549, 5.230738639831543, 6.092790126800537, 6.954841613769531, 7.816893100738525, 8.67894458770752, 9.540996551513672, 10.403047561645508, 11.265098571777344, 12.127150535583496, 12.989202499389648, 13.851253509521484, 14.71330451965332, 15.575356483459473, 16.437408447265625, 17.29945945739746, 18.161510467529297, 19.023563385009766, 19.8856143951416, 20.747665405273438, 21.609716415405273, 22.47176742553711, 23.333820343017578, 24.195871353149414, 25.05792236328125, 25.91997528076172, 26.782026290893555, 27.64407730102539, 28.506128311157227, 29.368179321289062, 30.23023223876953, 31.092283248901367]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 10.0, 13.0, 15.0, 24.0, 45.0, 72.0, 113.0, 169.0, 276.0, 423.0, 762.0, 1170.0, 1865.0, 3025.0, 4969.0, 7816.0, 12895.0, 20396.0, 32089.0, 48856.0, 70667.0, 96276.0, 119186.0, 131807.0, 127548.0, 109689.0, 85341.0, 60900.0, 41384.0, 26314.0, 16795.0, 10452.0, 6560.0, 4015.0, 2520.0, 1552.0, 966.0, 590.0, 398.0, 205.0, 129.0, 90.0, 62.0, 34.0, 20.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 0.0, 5.0, 1.0], "bins": [-26.59375, -25.806640625, -25.01953125, -24.232421875, -23.4453125, -22.658203125, -21.87109375, -21.083984375, -20.296875, -19.509765625, -18.72265625, -17.935546875, -17.1484375, -16.361328125, -15.57421875, -14.787109375, -14.0, -13.212890625, -12.42578125, -11.638671875, -10.8515625, -10.064453125, -9.27734375, -8.490234375, -7.703125, -6.916015625, -6.12890625, -5.341796875, -4.5546875, -3.767578125, -2.98046875, -2.193359375, -1.40625, -0.619140625, 0.16796875, 0.955078125, 1.7421875, 2.529296875, 3.31640625, 4.103515625, 4.890625, 5.677734375, 6.46484375, 7.251953125, 8.0390625, 8.826171875, 9.61328125, 10.400390625, 11.1875, 11.974609375, 12.76171875, 13.548828125, 14.3359375, 15.123046875, 15.91015625, 16.697265625, 17.484375, 18.271484375, 19.05859375, 19.845703125, 20.6328125, 21.419921875, 22.20703125, 22.994140625, 23.78125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 6.0, 7.0, 8.0, 10.0, 11.0, 22.0, 20.0, 20.0, 16.0, 27.0, 29.0, 34.0, 32.0, 34.0, 36.0, 35.0, 50.0, 55.0, 46.0, 45.0, 34.0, 38.0, 39.0, 31.0, 40.0, 36.0, 30.0, 31.0, 25.0, 17.0, 17.0, 14.0, 12.0, 25.0, 8.0, 12.0, 9.0, 9.0, 3.0, 2.0, 9.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.921875, -26.969970703125, -26.01806640625, -25.066162109375, -24.1142578125, -23.162353515625, -22.21044921875, -21.258544921875, -20.306640625, -19.354736328125, -18.40283203125, -17.450927734375, -16.4990234375, -15.547119140625, -14.59521484375, -13.643310546875, -12.69140625, -11.739501953125, -10.78759765625, -9.835693359375, -8.8837890625, -7.931884765625, -6.97998046875, -6.028076171875, -5.076171875, -4.124267578125, -3.17236328125, -2.220458984375, -1.2685546875, -0.316650390625, 0.63525390625, 1.587158203125, 2.5390625, 3.490966796875, 4.44287109375, 5.394775390625, 6.3466796875, 7.298583984375, 8.25048828125, 9.202392578125, 10.154296875, 11.106201171875, 12.05810546875, 13.010009765625, 13.9619140625, 14.913818359375, 15.86572265625, 16.817626953125, 17.76953125, 18.721435546875, 19.67333984375, 20.625244140625, 21.5771484375, 22.529052734375, 23.48095703125, 24.432861328125, 25.384765625, 26.336669921875, 27.28857421875, 28.240478515625, 29.1923828125, 30.144287109375, 31.09619140625, 32.048095703125, 33.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 8.0, 18.0, 35.0, 30.0, 63.0, 116.0, 139.0, 234.0, 362.0, 601.0, 816.0, 1368.0, 2044.0, 3183.0, 4690.0, 7318.0, 10934.0, 16577.0, 24619.0, 35975.0, 50840.0, 68961.0, 89580.0, 107172.0, 116673.0, 115262.0, 102211.0, 82839.0, 62634.0, 46066.0, 32059.0, 21728.0, 14693.0, 9750.0, 6495.0, 4323.0, 2854.0, 1880.0, 1187.0, 839.0, 515.0, 311.0, 209.0, 128.0, 73.0, 55.0, 37.0, 18.0, 11.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.453125, -23.708740234375, -22.96435546875, -22.219970703125, -21.4755859375, -20.731201171875, -19.98681640625, -19.242431640625, -18.498046875, -17.753662109375, -17.00927734375, -16.264892578125, -15.5205078125, -14.776123046875, -14.03173828125, -13.287353515625, -12.54296875, -11.798583984375, -11.05419921875, -10.309814453125, -9.5654296875, -8.821044921875, -8.07666015625, -7.332275390625, -6.587890625, -5.843505859375, -5.09912109375, -4.354736328125, -3.6103515625, -2.865966796875, -2.12158203125, -1.377197265625, -0.6328125, 0.111572265625, 0.85595703125, 1.600341796875, 2.3447265625, 3.089111328125, 3.83349609375, 4.577880859375, 5.322265625, 6.066650390625, 6.81103515625, 7.555419921875, 8.2998046875, 9.044189453125, 9.78857421875, 10.532958984375, 11.27734375, 12.021728515625, 12.76611328125, 13.510498046875, 14.2548828125, 14.999267578125, 15.74365234375, 16.488037109375, 17.232421875, 17.976806640625, 18.72119140625, 19.465576171875, 20.2099609375, 20.954345703125, 21.69873046875, 22.443115234375, 23.1875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 5.0, 5.0, 17.0, 11.0, 18.0, 19.0, 19.0, 22.0, 29.0, 26.0, 22.0, 32.0, 34.0, 43.0, 35.0, 51.0, 35.0, 35.0, 40.0, 47.0, 40.0, 33.0, 49.0, 31.0, 19.0, 34.0, 38.0, 24.0, 30.0, 22.0, 14.0, 21.0, 7.0, 18.0, 9.0, 10.0, 11.0, 6.0, 5.0, 2.0, 8.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.9375, -18.323974609375, -17.71044921875, -17.096923828125, -16.4833984375, -15.869873046875, -15.25634765625, -14.642822265625, -14.029296875, -13.415771484375, -12.80224609375, -12.188720703125, -11.5751953125, -10.961669921875, -10.34814453125, -9.734619140625, -9.12109375, -8.507568359375, -7.89404296875, -7.280517578125, -6.6669921875, -6.053466796875, -5.43994140625, -4.826416015625, -4.212890625, -3.599365234375, -2.98583984375, -2.372314453125, -1.7587890625, -1.145263671875, -0.53173828125, 0.081787109375, 0.6953125, 1.308837890625, 1.92236328125, 2.535888671875, 3.1494140625, 3.762939453125, 4.37646484375, 4.989990234375, 5.603515625, 6.217041015625, 6.83056640625, 7.444091796875, 8.0576171875, 8.671142578125, 9.28466796875, 9.898193359375, 10.51171875, 11.125244140625, 11.73876953125, 12.352294921875, 12.9658203125, 13.579345703125, 14.19287109375, 14.806396484375, 15.419921875, 16.033447265625, 16.64697265625, 17.260498046875, 17.8740234375, 18.487548828125, 19.10107421875, 19.714599609375, 20.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 25.0, 22.0, 45.0, 42.0, 83.0, 139.0, 229.0, 339.0, 555.0, 916.0, 1414.0, 2304.0, 3792.0, 6081.0, 10002.0, 16363.0, 26099.0, 41179.0, 63170.0, 92091.0, 123227.0, 144334.0, 143115.0, 119675.0, 88760.0, 60372.0, 39006.0, 24737.0, 15421.0, 9517.0, 5947.0, 3634.0, 2295.0, 1338.0, 857.0, 528.0, 323.0, 207.0, 125.0, 82.0, 52.0, 37.0, 19.0, 14.0, 12.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-10.7734375, -10.4560546875, -10.138671875, -9.8212890625, -9.50390625, -9.1865234375, -8.869140625, -8.5517578125, -8.234375, -7.9169921875, -7.599609375, -7.2822265625, -6.96484375, -6.6474609375, -6.330078125, -6.0126953125, -5.6953125, -5.3779296875, -5.060546875, -4.7431640625, -4.42578125, -4.1083984375, -3.791015625, -3.4736328125, -3.15625, -2.8388671875, -2.521484375, -2.2041015625, -1.88671875, -1.5693359375, -1.251953125, -0.9345703125, -0.6171875, -0.2998046875, 0.017578125, 0.3349609375, 0.65234375, 0.9697265625, 1.287109375, 1.6044921875, 1.921875, 2.2392578125, 2.556640625, 2.8740234375, 3.19140625, 3.5087890625, 3.826171875, 4.1435546875, 4.4609375, 4.7783203125, 5.095703125, 5.4130859375, 5.73046875, 6.0478515625, 6.365234375, 6.6826171875, 7.0, 7.3173828125, 7.634765625, 7.9521484375, 8.26953125, 8.5869140625, 8.904296875, 9.2216796875, 9.5390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 7.0, 5.0, 7.0, 15.0, 21.0, 21.0, 17.0, 27.0, 27.0, 37.0, 35.0, 36.0, 42.0, 37.0, 51.0, 47.0, 46.0, 64.0, 63.0, 43.0, 43.0, 61.0, 34.0, 29.0, 26.0, 20.0, 22.0, 24.0, 16.0, 12.0, 8.0, 7.0, 9.0, 5.0, 3.0, 9.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0010843276977539062, -0.0010512620210647583, -0.0010181963443756104, -0.0009851306676864624, -0.0009520649909973145, -0.0009189993143081665, -0.0008859336376190186, -0.0008528679609298706, -0.0008198022842407227, -0.0007867366075515747, -0.0007536709308624268, -0.0007206052541732788, -0.0006875395774841309, -0.0006544739007949829, -0.000621408224105835, -0.000588342547416687, -0.0005552768707275391, -0.0005222111940383911, -0.0004891455173492432, -0.0004560798406600952, -0.00042301416397094727, -0.0003899484872817993, -0.00035688281059265137, -0.0003238171339035034, -0.00029075145721435547, -0.0002576857805252075, -0.00022462010383605957, -0.00019155442714691162, -0.00015848875045776367, -0.00012542307376861572, -9.235739707946777e-05, -5.9291720390319824e-05, -2.6226043701171875e-05, 6.839632987976074e-06, 3.9905309677124023e-05, 7.297098636627197e-05, 0.00010603666305541992, 0.00013910233974456787, 0.00017216801643371582, 0.00020523369312286377, 0.00023829936981201172, 0.00027136504650115967, 0.0003044307231903076, 0.00033749639987945557, 0.0003705620765686035, 0.00040362775325775146, 0.0004366934299468994, 0.00046975910663604736, 0.0005028247833251953, 0.0005358904600143433, 0.0005689561367034912, 0.0006020218133926392, 0.0006350874900817871, 0.0006681531667709351, 0.000701218843460083, 0.000734284520149231, 0.0007673501968383789, 0.0008004158735275269, 0.0008334815502166748, 0.0008665472269058228, 0.0008996129035949707, 0.0009326785802841187, 0.0009657442569732666, 0.0009988099336624146, 0.0010318756103515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 8.0, 13.0, 25.0, 34.0, 50.0, 58.0, 124.0, 156.0, 307.0, 449.0, 740.0, 1185.0, 1897.0, 3183.0, 5313.0, 9142.0, 15879.0, 26876.0, 46308.0, 78085.0, 119635.0, 161447.0, 174194.0, 147110.0, 102110.0, 64039.0, 37500.0, 21846.0, 12484.0, 7372.0, 4285.0, 2636.0, 1522.0, 1000.0, 561.0, 362.0, 237.0, 138.0, 103.0, 50.0, 38.0, 18.0, 14.0, 7.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2584228515625, -10.860595703125, -10.4627685546875, -10.06494140625, -9.6671142578125, -9.269287109375, -8.8714599609375, -8.4736328125, -8.0758056640625, -7.677978515625, -7.2801513671875, -6.88232421875, -6.4844970703125, -6.086669921875, -5.6888427734375, -5.291015625, -4.8931884765625, -4.495361328125, -4.0975341796875, -3.69970703125, -3.3018798828125, -2.904052734375, -2.5062255859375, -2.1083984375, -1.7105712890625, -1.312744140625, -0.9149169921875, -0.51708984375, -0.1192626953125, 0.278564453125, 0.6763916015625, 1.07421875, 1.4720458984375, 1.869873046875, 2.2677001953125, 2.66552734375, 3.0633544921875, 3.461181640625, 3.8590087890625, 4.2568359375, 4.6546630859375, 5.052490234375, 5.4503173828125, 5.84814453125, 6.2459716796875, 6.643798828125, 7.0416259765625, 7.439453125, 7.8372802734375, 8.235107421875, 8.6329345703125, 9.03076171875, 9.4285888671875, 9.826416015625, 10.2242431640625, 10.6220703125, 11.0198974609375, 11.417724609375, 11.8155517578125, 12.21337890625, 12.6112060546875, 13.009033203125, 13.4068603515625, 13.8046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 9.0, 10.0, 13.0, 14.0, 22.0, 24.0, 27.0, 40.0, 33.0, 39.0, 34.0, 54.0, 44.0, 58.0, 56.0, 59.0, 46.0, 40.0, 45.0, 53.0, 36.0, 31.0, 28.0, 22.0, 24.0, 24.0, 15.0, 18.0, 16.0, 10.0, 5.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0], "bins": [-5.0234375, -4.891815185546875, -4.76019287109375, -4.628570556640625, -4.4969482421875, -4.365325927734375, -4.23370361328125, -4.102081298828125, -3.970458984375, -3.838836669921875, -3.70721435546875, -3.575592041015625, -3.4439697265625, -3.312347412109375, -3.18072509765625, -3.049102783203125, -2.91748046875, -2.785858154296875, -2.65423583984375, -2.522613525390625, -2.3909912109375, -2.259368896484375, -2.12774658203125, -1.996124267578125, -1.864501953125, -1.732879638671875, -1.60125732421875, -1.469635009765625, -1.3380126953125, -1.206390380859375, -1.07476806640625, -0.943145751953125, -0.8115234375, -0.679901123046875, -0.54827880859375, -0.416656494140625, -0.2850341796875, -0.153411865234375, -0.02178955078125, 0.109832763671875, 0.241455078125, 0.373077392578125, 0.50469970703125, 0.636322021484375, 0.7679443359375, 0.899566650390625, 1.03118896484375, 1.162811279296875, 1.29443359375, 1.426055908203125, 1.55767822265625, 1.689300537109375, 1.8209228515625, 1.952545166015625, 2.08416748046875, 2.215789794921875, 2.347412109375, 2.479034423828125, 2.61065673828125, 2.742279052734375, 2.8739013671875, 3.005523681640625, 3.13714599609375, 3.268768310546875, 3.400390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 10.0, 4.0, 6.0, 13.0, 19.0, 23.0, 23.0, 26.0, 29.0, 37.0, 45.0, 49.0, 37.0, 50.0, 52.0, 48.0, 54.0, 49.0, 55.0, 45.0, 37.0, 45.0, 31.0, 33.0, 22.0, 29.0, 21.0, 25.0, 8.0, 17.0, 6.0, 8.0, 0.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.262115478515625, -30.227493286132812, -29.192869186401367, -28.158246994018555, -27.12362289428711, -26.089000701904297, -25.054378509521484, -24.01975440979004, -22.985130310058594, -21.95050811767578, -20.915884017944336, -19.881261825561523, -18.846637725830078, -17.812015533447266, -16.777393341064453, -15.742769241333008, -14.708147048950195, -13.673523902893066, -12.638900756835938, -11.604278564453125, -10.56965446472168, -9.535032272338867, -8.500409126281738, -7.465785980224609, -6.4311628341674805, -5.396539688110352, -4.361916542053223, -3.327293872833252, -2.292670726776123, -1.2580475807189941, -0.22342491149902344, 0.8111982345581055, 1.8458213806152344, 2.8804445266723633, 3.915067434310913, 4.949690341949463, 5.984313488006592, 7.018936634063721, 8.053559303283691, 9.08818244934082, 10.12280559539795, 11.157428741455078, 12.192051887512207, 13.226675033569336, 14.261297225952148, 15.295921325683594, 16.330543518066406, 17.36516571044922, 18.399789810180664, 19.434412002563477, 20.469036102294922, 21.503658294677734, 22.53828239440918, 23.572904586791992, 24.607528686523438, 25.64215087890625, 26.676773071289062, 27.711395263671875, 28.74601936340332, 29.780641555786133, 30.815265655517578, 31.84988784790039, 32.8845100402832, 33.91913604736328, 34.953758239746094]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 12.0, 14.0, 8.0, 8.0, 21.0, 25.0, 18.0, 20.0, 34.0, 26.0, 29.0, 29.0, 44.0, 46.0, 34.0, 42.0, 34.0, 43.0, 37.0, 42.0, 44.0, 51.0, 35.0, 35.0, 29.0, 25.0, 27.0, 31.0, 16.0, 23.0, 21.0, 21.0, 9.0, 17.0, 7.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.238452911376953, -26.227962493896484, -25.217472076416016, -24.206981658935547, -23.196491241455078, -22.18600082397461, -21.175508499145508, -20.16501808166504, -19.15452766418457, -18.1440372467041, -17.133546829223633, -16.123056411743164, -15.112565040588379, -14.10207462310791, -13.091583251953125, -12.081092834472656, -11.070602416992188, -10.060111999511719, -9.04962158203125, -8.039130210876465, -7.028639793395996, -6.018149375915527, -5.0076584815979, -3.9971675872802734, -2.9866771697998047, -1.9761865139007568, -0.965695858001709, 0.04479479789733887, 1.0552854537963867, 2.0657758712768555, 3.0762667655944824, 4.086757659912109, 5.097251892089844, 6.1077423095703125, 7.1182332038879395, 8.128724098205566, 9.139214515686035, 10.149704933166504, 11.160196304321289, 12.170686721801758, 13.181177139282227, 14.191667556762695, 15.202157974243164, 16.212648391723633, 17.223140716552734, 18.233631134033203, 19.244121551513672, 20.25461196899414, 21.26510238647461, 22.275592803955078, 23.286083221435547, 24.296573638916016, 25.307064056396484, 26.317554473876953, 27.328046798706055, 28.338537216186523, 29.349027633666992, 30.35951805114746, 31.37000846862793, 32.38050079345703, 33.3909912109375, 34.40148162841797, 35.41197204589844, 36.422462463378906, 37.432952880859375]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 23.0, 26.0, 36.0, 43.0, 82.0, 107.0, 149.0, 215.0, 338.0, 476.0, 773.0, 1091.0, 1595.0, 2556.0, 3781.0, 5682.0, 8661.0, 13766.0, 21694.0, 34854.0, 56978.0, 95607.0, 164450.0, 284842.0, 470361.0, 676256.0, 750231.0, 610170.0, 397805.0, 236959.0, 138951.0, 82312.0, 49204.0, 30625.0, 19037.0, 12027.0, 7706.0, 5052.0, 3289.0, 2138.0, 1408.0, 964.0, 657.0, 424.0, 305.0, 180.0, 139.0, 90.0, 49.0, 37.0, 27.0, 15.0, 17.0, 5.0, 11.0, 5.0, 2.0], "bins": [-35.65625, -34.58642578125, -33.5166015625, -32.44677734375, -31.376953125, -30.30712890625, -29.2373046875, -28.16748046875, -27.09765625, -26.02783203125, -24.9580078125, -23.88818359375, -22.818359375, -21.74853515625, -20.6787109375, -19.60888671875, -18.5390625, -17.46923828125, -16.3994140625, -15.32958984375, -14.259765625, -13.18994140625, -12.1201171875, -11.05029296875, -9.98046875, -8.91064453125, -7.8408203125, -6.77099609375, -5.701171875, -4.63134765625, -3.5615234375, -2.49169921875, -1.421875, -0.35205078125, 0.7177734375, 1.78759765625, 2.857421875, 3.92724609375, 4.9970703125, 6.06689453125, 7.13671875, 8.20654296875, 9.2763671875, 10.34619140625, 11.416015625, 12.48583984375, 13.5556640625, 14.62548828125, 15.6953125, 16.76513671875, 17.8349609375, 18.90478515625, 19.974609375, 21.04443359375, 22.1142578125, 23.18408203125, 24.25390625, 25.32373046875, 26.3935546875, 27.46337890625, 28.533203125, 29.60302734375, 30.6728515625, 31.74267578125, 32.8125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 12.0, 16.0, 10.0, 17.0, 23.0, 18.0, 20.0, 27.0, 37.0, 25.0, 34.0, 38.0, 36.0, 46.0, 44.0, 45.0, 39.0, 49.0, 36.0, 48.0, 46.0, 40.0, 31.0, 24.0, 40.0, 22.0, 28.0, 23.0, 27.0, 20.0, 14.0, 13.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.706787109375, -24.74169921875, -23.776611328125, -22.8115234375, -21.846435546875, -20.88134765625, -19.916259765625, -18.951171875, -17.986083984375, -17.02099609375, -16.055908203125, -15.0908203125, -14.125732421875, -13.16064453125, -12.195556640625, -11.23046875, -10.265380859375, -9.30029296875, -8.335205078125, -7.3701171875, -6.405029296875, -5.43994140625, -4.474853515625, -3.509765625, -2.544677734375, -1.57958984375, -0.614501953125, 0.3505859375, 1.315673828125, 2.28076171875, 3.245849609375, 4.2109375, 5.176025390625, 6.14111328125, 7.106201171875, 8.0712890625, 9.036376953125, 10.00146484375, 10.966552734375, 11.931640625, 12.896728515625, 13.86181640625, 14.826904296875, 15.7919921875, 16.757080078125, 17.72216796875, 18.687255859375, 19.65234375, 20.617431640625, 21.58251953125, 22.547607421875, 23.5126953125, 24.477783203125, 25.44287109375, 26.407958984375, 27.373046875, 28.338134765625, 29.30322265625, 30.268310546875, 31.2333984375, 32.198486328125, 33.16357421875, 34.128662109375, 35.09375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 9.0, 11.0, 26.0, 35.0, 70.0, 129.0, 223.0, 504.0, 879.0, 1756.0, 3392.0, 7017.0, 14461.0, 31880.0, 73262.0, 174591.0, 415794.0, 871343.0, 1163478.0, 797461.0, 367344.0, 152677.0, 64043.0, 28093.0, 13169.0, 6317.0, 3066.0, 1513.0, 829.0, 426.0, 204.0, 104.0, 69.0, 38.0, 23.0, 13.0, 6.0, 3.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.03125, -55.98974609375, -53.9482421875, -51.90673828125, -49.865234375, -47.82373046875, -45.7822265625, -43.74072265625, -41.69921875, -39.65771484375, -37.6162109375, -35.57470703125, -33.533203125, -31.49169921875, -29.4501953125, -27.40869140625, -25.3671875, -23.32568359375, -21.2841796875, -19.24267578125, -17.201171875, -15.15966796875, -13.1181640625, -11.07666015625, -9.03515625, -6.99365234375, -4.9521484375, -2.91064453125, -0.869140625, 1.17236328125, 3.2138671875, 5.25537109375, 7.296875, 9.33837890625, 11.3798828125, 13.42138671875, 15.462890625, 17.50439453125, 19.5458984375, 21.58740234375, 23.62890625, 25.67041015625, 27.7119140625, 29.75341796875, 31.794921875, 33.83642578125, 35.8779296875, 37.91943359375, 39.9609375, 42.00244140625, 44.0439453125, 46.08544921875, 48.126953125, 50.16845703125, 52.2099609375, 54.25146484375, 56.29296875, 58.33447265625, 60.3759765625, 62.41748046875, 64.458984375, 66.50048828125, 68.5419921875, 70.58349609375, 72.625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 9.0, 9.0, 20.0, 20.0, 31.0, 25.0, 39.0, 44.0, 75.0, 80.0, 75.0, 105.0, 126.0, 131.0, 189.0, 186.0, 227.0, 224.0, 259.0, 254.0, 259.0, 212.0, 203.0, 180.0, 190.0, 151.0, 155.0, 98.0, 101.0, 72.0, 54.0, 58.0, 54.0, 35.0, 38.0, 18.0, 11.0, 14.0, 12.0, 10.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.71875, -14.2255859375, -13.732421875, -13.2392578125, -12.74609375, -12.2529296875, -11.759765625, -11.2666015625, -10.7734375, -10.2802734375, -9.787109375, -9.2939453125, -8.80078125, -8.3076171875, -7.814453125, -7.3212890625, -6.828125, -6.3349609375, -5.841796875, -5.3486328125, -4.85546875, -4.3623046875, -3.869140625, -3.3759765625, -2.8828125, -2.3896484375, -1.896484375, -1.4033203125, -0.91015625, -0.4169921875, 0.076171875, 0.5693359375, 1.0625, 1.5556640625, 2.048828125, 2.5419921875, 3.03515625, 3.5283203125, 4.021484375, 4.5146484375, 5.0078125, 5.5009765625, 5.994140625, 6.4873046875, 6.98046875, 7.4736328125, 7.966796875, 8.4599609375, 8.953125, 9.4462890625, 9.939453125, 10.4326171875, 10.92578125, 11.4189453125, 11.912109375, 12.4052734375, 12.8984375, 13.3916015625, 13.884765625, 14.3779296875, 14.87109375, 15.3642578125, 15.857421875, 16.3505859375, 16.84375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 3.0, 4.0, 10.0, 9.0, 11.0, 16.0, 16.0, 18.0, 33.0, 44.0, 49.0, 38.0, 50.0, 48.0, 58.0, 47.0, 64.0, 55.0, 61.0, 58.0, 52.0, 47.0, 42.0, 38.0, 24.0, 16.0, 24.0, 12.0, 13.0, 6.0, 8.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.733158111572266, -41.240211486816406, -39.74726104736328, -38.25431442260742, -36.7613639831543, -35.26841735839844, -33.77546691894531, -32.28252029418945, -30.789573669433594, -29.2966251373291, -27.80367660522461, -26.31072998046875, -24.817781448364258, -23.324832916259766, -21.831884384155273, -20.33893585205078, -18.84598731994629, -17.353038787841797, -15.860091209411621, -14.367142677307129, -12.874195098876953, -11.381246566772461, -9.888298034667969, -8.395350456237793, -6.902401924133301, -5.409453868865967, -3.9165055751800537, -2.4235572814941406, -0.9306092262268066, 0.5623388290405273, 2.0552873611450195, 3.5482349395751953, 5.0411834716796875, 6.5341315269470215, 8.027079582214355, 9.520028114318848, 11.012975692749023, 12.505924224853516, 13.998872756958008, 15.491820335388184, 16.98476791381836, 18.47771644592285, 19.970664978027344, 21.463611602783203, 22.956560134887695, 24.449508666992188, 25.94245719909668, 27.435405731201172, 28.928354263305664, 30.421302795410156, 31.91425132751465, 33.40719985961914, 34.900146484375, 36.393096923828125, 37.886043548583984, 39.378990173339844, 40.87194061279297, 42.36488723754883, 43.85783767700195, 45.35078430175781, 46.84373474121094, 48.3366813659668, 49.829627990722656, 51.32257843017578, 52.81552505493164]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 5.0, 14.0, 8.0, 7.0, 19.0, 19.0, 14.0, 22.0, 27.0, 38.0, 40.0, 32.0, 39.0, 39.0, 43.0, 60.0, 48.0, 46.0, 37.0, 43.0, 47.0, 36.0, 36.0, 41.0, 40.0, 21.0, 40.0, 28.0, 15.0, 19.0, 21.0, 12.0, 10.0, 7.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.154190063476562, -28.934864044189453, -27.715539932250977, -26.496213912963867, -25.27688980102539, -24.05756378173828, -22.838237762451172, -21.618911743164062, -20.399587631225586, -19.180261611938477, -17.9609375, -16.74161148071289, -15.522286415100098, -14.302961349487305, -13.083635330200195, -11.864310264587402, -10.64498519897461, -9.425660133361816, -8.206335067749023, -6.987009048461914, -5.767683982849121, -4.548358917236328, -3.329033374786377, -2.109707832336426, -0.8903827667236328, 0.32894253730773926, 1.5482678413391113, 2.7675931453704834, 3.9869184494018555, 5.206243515014648, 6.4255690574646, 7.644894599914551, 8.86422348022461, 10.083548545837402, 11.302873611450195, 12.522199630737305, 13.741524696350098, 14.96084976196289, 16.18017578125, 17.39950180053711, 18.618825912475586, 19.838151931762695, 21.057476043701172, 22.27680206298828, 23.49612808227539, 24.715452194213867, 25.934778213500977, 27.154102325439453, 28.373428344726562, 29.592754364013672, 30.81207847595215, 32.031402587890625, 33.250728607177734, 34.470054626464844, 35.68938064575195, 36.90870666503906, 38.128028869628906, 39.347354888916016, 40.566680908203125, 41.78600311279297, 43.00532913208008, 44.22465515136719, 45.4439811706543, 46.663307189941406, 47.882633209228516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 9.0, 6.0, 16.0, 28.0, 53.0, 71.0, 81.0, 146.0, 271.0, 350.0, 571.0, 906.0, 1372.0, 2118.0, 3424.0, 5461.0, 8747.0, 14234.0, 23135.0, 36757.0, 58280.0, 89490.0, 126508.0, 156072.0, 155709.0, 124866.0, 87631.0, 56808.0, 35975.0, 22326.0, 13826.0, 8765.0, 5314.0, 3379.0, 2092.0, 1358.0, 812.0, 575.0, 361.0, 225.0, 158.0, 90.0, 71.0, 38.0, 23.0, 15.0, 11.0, 10.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.34375, -14.8638916015625, -14.384033203125, -13.9041748046875, -13.42431640625, -12.9444580078125, -12.464599609375, -11.9847412109375, -11.5048828125, -11.0250244140625, -10.545166015625, -10.0653076171875, -9.58544921875, -9.1055908203125, -8.625732421875, -8.1458740234375, -7.666015625, -7.1861572265625, -6.706298828125, -6.2264404296875, -5.74658203125, -5.2667236328125, -4.786865234375, -4.3070068359375, -3.8271484375, -3.3472900390625, -2.867431640625, -2.3875732421875, -1.90771484375, -1.4278564453125, -0.947998046875, -0.4681396484375, 0.01171875, 0.4915771484375, 0.971435546875, 1.4512939453125, 1.93115234375, 2.4110107421875, 2.890869140625, 3.3707275390625, 3.8505859375, 4.3304443359375, 4.810302734375, 5.2901611328125, 5.77001953125, 6.2498779296875, 6.729736328125, 7.2095947265625, 7.689453125, 8.1693115234375, 8.649169921875, 9.1290283203125, 9.60888671875, 10.0887451171875, 10.568603515625, 11.0484619140625, 11.5283203125, 12.0081787109375, 12.488037109375, 12.9678955078125, 13.44775390625, 13.9276123046875, 14.407470703125, 14.8873291015625, 15.3671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 9.0, 9.0, 11.0, 15.0, 21.0, 19.0, 21.0, 19.0, 30.0, 39.0, 34.0, 38.0, 39.0, 39.0, 52.0, 52.0, 51.0, 38.0, 48.0, 57.0, 43.0, 39.0, 45.0, 34.0, 22.0, 30.0, 33.0, 23.0, 21.0, 17.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.28125, -30.93359375, -29.5859375, -28.23828125, -26.890625, -25.54296875, -24.1953125, -22.84765625, -21.5, -20.15234375, -18.8046875, -17.45703125, -16.109375, -14.76171875, -13.4140625, -12.06640625, -10.71875, -9.37109375, -8.0234375, -6.67578125, -5.328125, -3.98046875, -2.6328125, -1.28515625, 0.0625, 1.41015625, 2.7578125, 4.10546875, 5.453125, 6.80078125, 8.1484375, 9.49609375, 10.84375, 12.19140625, 13.5390625, 14.88671875, 16.234375, 17.58203125, 18.9296875, 20.27734375, 21.625, 22.97265625, 24.3203125, 25.66796875, 27.015625, 28.36328125, 29.7109375, 31.05859375, 32.40625, 33.75390625, 35.1015625, 36.44921875, 37.796875, 39.14453125, 40.4921875, 41.83984375, 43.1875, 44.53515625, 45.8828125, 47.23046875, 48.578125, 49.92578125, 51.2734375, 52.62109375, 53.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 20.0, 20.0, 23.0, 42.0, 51.0, 89.0, 124.0, 207.0, 323.0, 493.0, 741.0, 1156.0, 1830.0, 2720.0, 4375.0, 7144.0, 11327.0, 18440.0, 30400.0, 48974.0, 78881.0, 121628.0, 164321.0, 172690.0, 138461.0, 92586.0, 58047.0, 35375.0, 22070.0, 13357.0, 8120.0, 5201.0, 3346.0, 2087.0, 1414.0, 889.0, 513.0, 338.0, 228.0, 159.0, 96.0, 77.0, 64.0, 29.0, 34.0, 11.0, 10.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-18.8125, -18.227783203125, -17.64306640625, -17.058349609375, -16.4736328125, -15.888916015625, -15.30419921875, -14.719482421875, -14.134765625, -13.550048828125, -12.96533203125, -12.380615234375, -11.7958984375, -11.211181640625, -10.62646484375, -10.041748046875, -9.45703125, -8.872314453125, -8.28759765625, -7.702880859375, -7.1181640625, -6.533447265625, -5.94873046875, -5.364013671875, -4.779296875, -4.194580078125, -3.60986328125, -3.025146484375, -2.4404296875, -1.855712890625, -1.27099609375, -0.686279296875, -0.1015625, 0.483154296875, 1.06787109375, 1.652587890625, 2.2373046875, 2.822021484375, 3.40673828125, 3.991455078125, 4.576171875, 5.160888671875, 5.74560546875, 6.330322265625, 6.9150390625, 7.499755859375, 8.08447265625, 8.669189453125, 9.25390625, 9.838623046875, 10.42333984375, 11.008056640625, 11.5927734375, 12.177490234375, 12.76220703125, 13.346923828125, 13.931640625, 14.516357421875, 15.10107421875, 15.685791015625, 16.2705078125, 16.855224609375, 17.43994140625, 18.024658203125, 18.609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 14.0, 12.0, 16.0, 21.0, 14.0, 23.0, 25.0, 21.0, 36.0, 38.0, 30.0, 36.0, 38.0, 42.0, 35.0, 36.0, 46.0, 48.0, 48.0, 52.0, 36.0, 44.0, 34.0, 21.0, 25.0, 36.0, 20.0, 20.0, 18.0, 12.0, 6.0, 13.0, 11.0, 5.0, 7.0, 4.0, 9.0, 2.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.921630859375, -21.21826171875, -20.514892578125, -19.8115234375, -19.108154296875, -18.40478515625, -17.701416015625, -16.998046875, -16.294677734375, -15.59130859375, -14.887939453125, -14.1845703125, -13.481201171875, -12.77783203125, -12.074462890625, -11.37109375, -10.667724609375, -9.96435546875, -9.260986328125, -8.5576171875, -7.854248046875, -7.15087890625, -6.447509765625, -5.744140625, -5.040771484375, -4.33740234375, -3.634033203125, -2.9306640625, -2.227294921875, -1.52392578125, -0.820556640625, -0.1171875, 0.586181640625, 1.28955078125, 1.992919921875, 2.6962890625, 3.399658203125, 4.10302734375, 4.806396484375, 5.509765625, 6.213134765625, 6.91650390625, 7.619873046875, 8.3232421875, 9.026611328125, 9.72998046875, 10.433349609375, 11.13671875, 11.840087890625, 12.54345703125, 13.246826171875, 13.9501953125, 14.653564453125, 15.35693359375, 16.060302734375, 16.763671875, 17.467041015625, 18.17041015625, 18.873779296875, 19.5771484375, 20.280517578125, 20.98388671875, 21.687255859375, 22.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 15.0, 13.0, 23.0, 43.0, 58.0, 73.0, 110.0, 186.0, 278.0, 392.0, 694.0, 1094.0, 1858.0, 3420.0, 6007.0, 11303.0, 22388.0, 44726.0, 87633.0, 160392.0, 233847.0, 210787.0, 127219.0, 65914.0, 33187.0, 16715.0, 8698.0, 4686.0, 2554.0, 1591.0, 952.0, 641.0, 346.0, 233.0, 169.0, 85.0, 55.0, 49.0, 32.0, 20.0, 19.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-7.328125, -7.11749267578125, -6.9068603515625, -6.69622802734375, -6.485595703125, -6.27496337890625, -6.0643310546875, -5.85369873046875, -5.64306640625, -5.43243408203125, -5.2218017578125, -5.01116943359375, -4.800537109375, -4.58990478515625, -4.3792724609375, -4.16864013671875, -3.9580078125, -3.74737548828125, -3.5367431640625, -3.32611083984375, -3.115478515625, -2.90484619140625, -2.6942138671875, -2.48358154296875, -2.27294921875, -2.06231689453125, -1.8516845703125, -1.64105224609375, -1.430419921875, -1.21978759765625, -1.0091552734375, -0.79852294921875, -0.587890625, -0.37725830078125, -0.1666259765625, 0.04400634765625, 0.254638671875, 0.46527099609375, 0.6759033203125, 0.88653564453125, 1.09716796875, 1.30780029296875, 1.5184326171875, 1.72906494140625, 1.939697265625, 2.15032958984375, 2.3609619140625, 2.57159423828125, 2.7822265625, 2.99285888671875, 3.2034912109375, 3.41412353515625, 3.624755859375, 3.83538818359375, 4.0460205078125, 4.25665283203125, 4.46728515625, 4.67791748046875, 4.8885498046875, 5.09918212890625, 5.309814453125, 5.52044677734375, 5.7310791015625, 5.94171142578125, 6.15234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 8.0, 15.0, 11.0, 13.0, 23.0, 38.0, 40.0, 47.0, 49.0, 35.0, 49.0, 57.0, 61.0, 54.0, 51.0, 47.0, 46.0, 55.0, 46.0, 39.0, 35.0, 26.0, 22.0, 23.0, 17.0, 12.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004603862762451172, -0.0004449225962162018, -0.0004294589161872864, -0.00041399523615837097, -0.00039853155612945557, -0.00038306787610054016, -0.00036760419607162476, -0.00035214051604270935, -0.00033667683601379395, -0.00032121315598487854, -0.00030574947595596313, -0.00029028579592704773, -0.0002748221158981323, -0.0002593584358692169, -0.00024389475584030151, -0.0002284310758113861, -0.0002129673957824707, -0.0001975037157535553, -0.0001820400357246399, -0.0001665763556957245, -0.00015111267566680908, -0.00013564899563789368, -0.00012018531560897827, -0.00010472163558006287, -8.925795555114746e-05, -7.379427552223206e-05, -5.833059549331665e-05, -4.2866915464401245e-05, -2.740323543548584e-05, -1.1939555406570435e-05, 3.5241246223449707e-06, 1.8987804651260376e-05, 3.445148468017578e-05, 4.9915164709091187e-05, 6.537884473800659e-05, 8.0842524766922e-05, 9.63062047958374e-05, 0.00011176988482475281, 0.0001272335648536682, 0.00014269724488258362, 0.00015816092491149902, 0.00017362460494041443, 0.00018908828496932983, 0.00020455196499824524, 0.00022001564502716064, 0.00023547932505607605, 0.00025094300508499146, 0.00026640668511390686, 0.00028187036514282227, 0.00029733404517173767, 0.0003127977252006531, 0.0003282614052295685, 0.0003437250852584839, 0.0003591887652873993, 0.0003746524453163147, 0.0003901161253452301, 0.0004055798053741455, 0.0004210434854030609, 0.0004365071654319763, 0.0004519708454608917, 0.00046743452548980713, 0.00048289820551872253, 0.0004983618855476379, 0.0005138255655765533, 0.0005292892456054688]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 17.0, 24.0, 34.0, 51.0, 89.0, 156.0, 282.0, 529.0, 967.0, 1910.0, 3870.0, 8171.0, 17947.0, 41519.0, 97837.0, 205482.0, 285722.0, 207269.0, 100305.0, 42075.0, 18024.0, 8261.0, 3882.0, 1848.0, 1032.0, 542.0, 274.0, 171.0, 76.0, 59.0, 41.0, 20.0, 14.0, 10.0, 12.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.740234375, -9.41015625, -9.080078125, -8.75, -8.419921875, -8.08984375, -7.759765625, -7.4296875, -7.099609375, -6.76953125, -6.439453125, -6.109375, -5.779296875, -5.44921875, -5.119140625, -4.7890625, -4.458984375, -4.12890625, -3.798828125, -3.46875, -3.138671875, -2.80859375, -2.478515625, -2.1484375, -1.818359375, -1.48828125, -1.158203125, -0.828125, -0.498046875, -0.16796875, 0.162109375, 0.4921875, 0.822265625, 1.15234375, 1.482421875, 1.8125, 2.142578125, 2.47265625, 2.802734375, 3.1328125, 3.462890625, 3.79296875, 4.123046875, 4.453125, 4.783203125, 5.11328125, 5.443359375, 5.7734375, 6.103515625, 6.43359375, 6.763671875, 7.09375, 7.423828125, 7.75390625, 8.083984375, 8.4140625, 8.744140625, 9.07421875, 9.404296875, 9.734375, 10.064453125, 10.39453125, 10.724609375, 11.0546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 10.0, 9.0, 18.0, 19.0, 26.0, 25.0, 44.0, 37.0, 35.0, 56.0, 79.0, 63.0, 78.0, 64.0, 69.0, 46.0, 61.0, 51.0, 47.0, 32.0, 35.0, 15.0, 13.0, 16.0, 7.0, 14.0, 2.0, 8.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -2.994964599609375, -2.89617919921875, -2.797393798828125, -2.6986083984375, -2.599822998046875, -2.50103759765625, -2.402252197265625, -2.303466796875, -2.204681396484375, -2.10589599609375, -2.007110595703125, -1.9083251953125, -1.809539794921875, -1.71075439453125, -1.611968994140625, -1.51318359375, -1.414398193359375, -1.31561279296875, -1.216827392578125, -1.1180419921875, -1.019256591796875, -0.92047119140625, -0.821685791015625, -0.722900390625, -0.624114990234375, -0.52532958984375, -0.426544189453125, -0.3277587890625, -0.228973388671875, -0.13018798828125, -0.031402587890625, 0.0673828125, 0.166168212890625, 0.26495361328125, 0.363739013671875, 0.4625244140625, 0.561309814453125, 0.66009521484375, 0.758880615234375, 0.857666015625, 0.956451416015625, 1.05523681640625, 1.154022216796875, 1.2528076171875, 1.351593017578125, 1.45037841796875, 1.549163818359375, 1.64794921875, 1.746734619140625, 1.84552001953125, 1.944305419921875, 2.0430908203125, 2.141876220703125, 2.24066162109375, 2.339447021484375, 2.438232421875, 2.537017822265625, 2.63580322265625, 2.734588623046875, 2.8333740234375, 2.932159423828125, 3.03094482421875, 3.129730224609375, 3.228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 4.0, 11.0, 13.0, 18.0, 18.0, 33.0, 44.0, 40.0, 45.0, 50.0, 55.0, 63.0, 56.0, 63.0, 64.0, 58.0, 60.0, 58.0, 53.0, 28.0, 38.0, 25.0, 24.0, 14.0, 11.0, 10.0, 13.0, 6.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.611724853515625, -44.01176071166992, -42.41179275512695, -40.81182861328125, -39.21186065673828, -37.61189651489258, -36.011932373046875, -34.411964416503906, -32.8120002746582, -31.212034225463867, -29.61206817626953, -28.012104034423828, -26.412137985229492, -24.812171936035156, -23.21220588684082, -21.612239837646484, -20.01227378845215, -18.412307739257812, -16.812341690063477, -15.212376594543457, -13.612411499023438, -12.012445449829102, -10.412479400634766, -8.812514305114746, -7.21254825592041, -5.612582683563232, -4.012617111206055, -2.4126510620117188, -0.812685489654541, 0.7872800827026367, 2.3872461318969727, 3.987211227416992, 5.587177276611328, 7.187142848968506, 8.787108421325684, 10.38707447052002, 11.987039566040039, 13.587005615234375, 15.186971664428711, 16.786937713623047, 18.38690185546875, 19.986867904663086, 21.586833953857422, 23.186798095703125, 24.78676414489746, 26.386730194091797, 27.986696243286133, 29.58666229248047, 31.186628341674805, 32.78659439086914, 34.386558532714844, 35.98652648925781, 37.586490631103516, 39.18645477294922, 40.78642272949219, 42.38638687133789, 43.98635482788086, 45.58631896972656, 47.18628692626953, 48.786251068115234, 50.3862190246582, 51.986183166503906, 53.586151123046875, 55.18611526489258, 56.78607940673828]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 10.0, 13.0, 17.0, 21.0, 13.0, 20.0, 29.0, 40.0, 32.0, 36.0, 46.0, 31.0, 52.0, 52.0, 53.0, 37.0, 46.0, 49.0, 36.0, 41.0, 40.0, 37.0, 34.0, 26.0, 37.0, 25.0, 13.0, 23.0, 21.0, 10.0, 9.0, 7.0, 5.0, 6.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.726268768310547, -28.51274871826172, -27.29922866821289, -26.085708618164062, -24.872188568115234, -23.658668518066406, -22.445148468017578, -21.23162841796875, -20.018108367919922, -18.804588317871094, -17.591068267822266, -16.377548217773438, -15.16402816772461, -13.950508117675781, -12.736988067626953, -11.523468017578125, -10.309947967529297, -9.096427917480469, -7.882907867431641, -6.6693878173828125, -5.455867767333984, -4.242347717285156, -3.028827667236328, -1.8153076171875, -0.6017875671386719, 0.6117324829101562, 1.8252525329589844, 3.0387725830078125, 4.252292633056641, 5.465812683105469, 6.679332733154297, 7.892852783203125, 9.106372833251953, 10.319892883300781, 11.53341293334961, 12.746932983398438, 13.960453033447266, 15.173973083496094, 16.387493133544922, 17.60101318359375, 18.814533233642578, 20.028053283691406, 21.241573333740234, 22.455093383789062, 23.66861343383789, 24.88213348388672, 26.095653533935547, 27.309173583984375, 28.522693634033203, 29.73621368408203, 30.94973373413086, 32.16325378417969, 33.376773834228516, 34.590293884277344, 35.80381393432617, 37.017333984375, 38.23085403442383, 39.444374084472656, 40.657894134521484, 41.87141418457031, 43.08493423461914, 44.29845428466797, 45.5119743347168, 46.725494384765625, 47.93901443481445]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 16.0, 28.0, 39.0, 53.0, 64.0, 111.0, 175.0, 220.0, 356.0, 547.0, 841.0, 1271.0, 1850.0, 2868.0, 4395.0, 6670.0, 10028.0, 15175.0, 22286.0, 32666.0, 46639.0, 62924.0, 82274.0, 100262.0, 111837.0, 114269.0, 105514.0, 89426.0, 70010.0, 51820.0, 36792.0, 25574.0, 17281.0, 11591.0, 7809.0, 5094.0, 3375.0, 2165.0, 1414.0, 941.0, 624.0, 410.0, 271.0, 181.0, 130.0, 89.0, 46.0, 43.0, 30.0, 22.0, 14.0, 5.0, 3.0, 1.0, 3.0, 5.0], "bins": [-27.125, -26.307373046875, -25.48974609375, -24.672119140625, -23.8544921875, -23.036865234375, -22.21923828125, -21.401611328125, -20.583984375, -19.766357421875, -18.94873046875, -18.131103515625, -17.3134765625, -16.495849609375, -15.67822265625, -14.860595703125, -14.04296875, -13.225341796875, -12.40771484375, -11.590087890625, -10.7724609375, -9.954833984375, -9.13720703125, -8.319580078125, -7.501953125, -6.684326171875, -5.86669921875, -5.049072265625, -4.2314453125, -3.413818359375, -2.59619140625, -1.778564453125, -0.9609375, -0.143310546875, 0.67431640625, 1.491943359375, 2.3095703125, 3.127197265625, 3.94482421875, 4.762451171875, 5.580078125, 6.397705078125, 7.21533203125, 8.032958984375, 8.8505859375, 9.668212890625, 10.48583984375, 11.303466796875, 12.12109375, 12.938720703125, 13.75634765625, 14.573974609375, 15.3916015625, 16.209228515625, 17.02685546875, 17.844482421875, 18.662109375, 19.479736328125, 20.29736328125, 21.114990234375, 21.9326171875, 22.750244140625, 23.56787109375, 24.385498046875, 25.203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 6.0, 1.0, 10.0, 4.0, 4.0, 17.0, 15.0, 19.0, 19.0, 25.0, 32.0, 43.0, 30.0, 35.0, 41.0, 41.0, 49.0, 63.0, 36.0, 41.0, 48.0, 43.0, 39.0, 46.0, 37.0, 51.0, 40.0, 29.0, 29.0, 24.0, 21.0, 14.0, 15.0, 10.0, 4.0, 11.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -29.909423828125, -28.58447265625, -27.259521484375, -25.9345703125, -24.609619140625, -23.28466796875, -21.959716796875, -20.634765625, -19.309814453125, -17.98486328125, -16.659912109375, -15.3349609375, -14.010009765625, -12.68505859375, -11.360107421875, -10.03515625, -8.710205078125, -7.38525390625, -6.060302734375, -4.7353515625, -3.410400390625, -2.08544921875, -0.760498046875, 0.564453125, 1.889404296875, 3.21435546875, 4.539306640625, 5.8642578125, 7.189208984375, 8.51416015625, 9.839111328125, 11.1640625, 12.489013671875, 13.81396484375, 15.138916015625, 16.4638671875, 17.788818359375, 19.11376953125, 20.438720703125, 21.763671875, 23.088623046875, 24.41357421875, 25.738525390625, 27.0634765625, 28.388427734375, 29.71337890625, 31.038330078125, 32.36328125, 33.688232421875, 35.01318359375, 36.338134765625, 37.6630859375, 38.988037109375, 40.31298828125, 41.637939453125, 42.962890625, 44.287841796875, 45.61279296875, 46.937744140625, 48.2626953125, 49.587646484375, 50.91259765625, 52.237548828125, 53.5625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 13.0, 24.0, 39.0, 52.0, 70.0, 119.0, 198.0, 317.0, 447.0, 702.0, 1040.0, 1613.0, 2563.0, 4092.0, 6248.0, 9350.0, 14500.0, 21899.0, 32878.0, 46898.0, 65816.0, 86611.0, 105228.0, 117219.0, 117992.0, 106768.0, 88636.0, 67468.0, 49321.0, 34036.0, 23194.0, 15209.0, 9909.0, 6283.0, 4194.0, 2595.0, 1802.0, 1128.0, 719.0, 482.0, 295.0, 212.0, 128.0, 78.0, 60.0, 36.0, 25.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.609375, -27.716796875, -26.82421875, -25.931640625, -25.0390625, -24.146484375, -23.25390625, -22.361328125, -21.46875, -20.576171875, -19.68359375, -18.791015625, -17.8984375, -17.005859375, -16.11328125, -15.220703125, -14.328125, -13.435546875, -12.54296875, -11.650390625, -10.7578125, -9.865234375, -8.97265625, -8.080078125, -7.1875, -6.294921875, -5.40234375, -4.509765625, -3.6171875, -2.724609375, -1.83203125, -0.939453125, -0.046875, 0.845703125, 1.73828125, 2.630859375, 3.5234375, 4.416015625, 5.30859375, 6.201171875, 7.09375, 7.986328125, 8.87890625, 9.771484375, 10.6640625, 11.556640625, 12.44921875, 13.341796875, 14.234375, 15.126953125, 16.01953125, 16.912109375, 17.8046875, 18.697265625, 19.58984375, 20.482421875, 21.375, 22.267578125, 23.16015625, 24.052734375, 24.9453125, 25.837890625, 26.73046875, 27.623046875, 28.515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 10.0, 4.0, 6.0, 4.0, 5.0, 8.0, 15.0, 18.0, 9.0, 20.0, 20.0, 30.0, 19.0, 31.0, 35.0, 35.0, 33.0, 33.0, 35.0, 50.0, 41.0, 43.0, 44.0, 45.0, 30.0, 42.0, 49.0, 27.0, 42.0, 30.0, 35.0, 30.0, 22.0, 15.0, 21.0, 14.0, 15.0, 11.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.660400390625, -21.91455078125, -21.168701171875, -20.4228515625, -19.677001953125, -18.93115234375, -18.185302734375, -17.439453125, -16.693603515625, -15.94775390625, -15.201904296875, -14.4560546875, -13.710205078125, -12.96435546875, -12.218505859375, -11.47265625, -10.726806640625, -9.98095703125, -9.235107421875, -8.4892578125, -7.743408203125, -6.99755859375, -6.251708984375, -5.505859375, -4.760009765625, -4.01416015625, -3.268310546875, -2.5224609375, -1.776611328125, -1.03076171875, -0.284912109375, 0.4609375, 1.206787109375, 1.95263671875, 2.698486328125, 3.4443359375, 4.190185546875, 4.93603515625, 5.681884765625, 6.427734375, 7.173583984375, 7.91943359375, 8.665283203125, 9.4111328125, 10.156982421875, 10.90283203125, 11.648681640625, 12.39453125, 13.140380859375, 13.88623046875, 14.632080078125, 15.3779296875, 16.123779296875, 16.86962890625, 17.615478515625, 18.361328125, 19.107177734375, 19.85302734375, 20.598876953125, 21.3447265625, 22.090576171875, 22.83642578125, 23.582275390625, 24.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 11.0, 15.0, 20.0, 28.0, 31.0, 60.0, 60.0, 104.0, 131.0, 197.0, 307.0, 462.0, 740.0, 1250.0, 2163.0, 4125.0, 8078.0, 16903.0, 37039.0, 81309.0, 163529.0, 247860.0, 229338.0, 134230.0, 63351.0, 28850.0, 13549.0, 6567.0, 3379.0, 1866.0, 1064.0, 645.0, 391.0, 259.0, 179.0, 124.0, 96.0, 70.0, 48.0, 36.0, 29.0, 18.0, 11.0, 6.0, 6.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.420654296875, -21.66943359375, -20.918212890625, -20.1669921875, -19.415771484375, -18.66455078125, -17.913330078125, -17.162109375, -16.410888671875, -15.65966796875, -14.908447265625, -14.1572265625, -13.406005859375, -12.65478515625, -11.903564453125, -11.15234375, -10.401123046875, -9.64990234375, -8.898681640625, -8.1474609375, -7.396240234375, -6.64501953125, -5.893798828125, -5.142578125, -4.391357421875, -3.64013671875, -2.888916015625, -2.1376953125, -1.386474609375, -0.63525390625, 0.115966796875, 0.8671875, 1.618408203125, 2.36962890625, 3.120849609375, 3.8720703125, 4.623291015625, 5.37451171875, 6.125732421875, 6.876953125, 7.628173828125, 8.37939453125, 9.130615234375, 9.8818359375, 10.633056640625, 11.38427734375, 12.135498046875, 12.88671875, 13.637939453125, 14.38916015625, 15.140380859375, 15.8916015625, 16.642822265625, 17.39404296875, 18.145263671875, 18.896484375, 19.647705078125, 20.39892578125, 21.150146484375, 21.9013671875, 22.652587890625, 23.40380859375, 24.155029296875, 24.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 12.0, 31.0, 28.0, 51.0, 74.0, 83.0, 95.0, 103.0, 99.0, 95.0, 68.0, 64.0, 41.0, 38.0, 28.0, 16.0, 15.0, 8.0, 6.0, 4.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0021762847900390625, -0.0020858049392700195, -0.0019953250885009766, -0.0019048452377319336, -0.0018143653869628906, -0.0017238855361938477, -0.0016334056854248047, -0.0015429258346557617, -0.0014524459838867188, -0.0013619661331176758, -0.0012714862823486328, -0.0011810064315795898, -0.0010905265808105469, -0.001000046730041504, -0.0009095668792724609, -0.000819087028503418, -0.000728607177734375, -0.000638127326965332, -0.0005476474761962891, -0.0004571676254272461, -0.0003666877746582031, -0.00027620792388916016, -0.0001857280731201172, -9.524822235107422e-05, -4.76837158203125e-06, 8.571147918701172e-05, 0.0001761913299560547, 0.00026667118072509766, 0.0003571510314941406, 0.0004476308822631836, 0.0005381107330322266, 0.0006285905838012695, 0.0007190704345703125, 0.0008095502853393555, 0.0009000301361083984, 0.0009905099868774414, 0.0010809898376464844, 0.0011714696884155273, 0.0012619495391845703, 0.0013524293899536133, 0.0014429092407226562, 0.0015333890914916992, 0.0016238689422607422, 0.0017143487930297852, 0.0018048286437988281, 0.001895308494567871, 0.001985788345336914, 0.002076268196105957, 0.002166748046875, 0.002257227897644043, 0.002347707748413086, 0.002438187599182129, 0.002528667449951172, 0.002619147300720215, 0.002709627151489258, 0.0028001070022583008, 0.0028905868530273438, 0.0029810667037963867, 0.0030715465545654297, 0.0031620264053344727, 0.0032525062561035156, 0.0033429861068725586, 0.0034334659576416016, 0.0035239458084106445, 0.0036144256591796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 11.0, 6.0, 11.0, 16.0, 16.0, 25.0, 31.0, 46.0, 58.0, 85.0, 132.0, 182.0, 283.0, 376.0, 547.0, 825.0, 1264.0, 2140.0, 3704.0, 6627.0, 12501.0, 24432.0, 50253.0, 102209.0, 184205.0, 239875.0, 194689.0, 111331.0, 55137.0, 26482.0, 13400.0, 7098.0, 4047.0, 2319.0, 1474.0, 858.0, 574.0, 408.0, 265.0, 184.0, 131.0, 93.0, 55.0, 39.0, 39.0, 21.0, 17.0, 13.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0], "bins": [-25.71875, -24.974609375, -24.23046875, -23.486328125, -22.7421875, -21.998046875, -21.25390625, -20.509765625, -19.765625, -19.021484375, -18.27734375, -17.533203125, -16.7890625, -16.044921875, -15.30078125, -14.556640625, -13.8125, -13.068359375, -12.32421875, -11.580078125, -10.8359375, -10.091796875, -9.34765625, -8.603515625, -7.859375, -7.115234375, -6.37109375, -5.626953125, -4.8828125, -4.138671875, -3.39453125, -2.650390625, -1.90625, -1.162109375, -0.41796875, 0.326171875, 1.0703125, 1.814453125, 2.55859375, 3.302734375, 4.046875, 4.791015625, 5.53515625, 6.279296875, 7.0234375, 7.767578125, 8.51171875, 9.255859375, 10.0, 10.744140625, 11.48828125, 12.232421875, 12.9765625, 13.720703125, 14.46484375, 15.208984375, 15.953125, 16.697265625, 17.44140625, 18.185546875, 18.9296875, 19.673828125, 20.41796875, 21.162109375, 21.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 4.0, 1.0, 11.0, 12.0, 8.0, 26.0, 14.0, 27.0, 34.0, 38.0, 47.0, 49.0, 50.0, 74.0, 64.0, 63.0, 61.0, 56.0, 51.0, 51.0, 55.0, 33.0, 26.0, 44.0, 19.0, 14.0, 8.0, 10.0, 13.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86883544921875, -5.6478271484375, -5.42681884765625, -5.205810546875, -4.98480224609375, -4.7637939453125, -4.54278564453125, -4.32177734375, -4.10076904296875, -3.8797607421875, -3.65875244140625, -3.437744140625, -3.21673583984375, -2.9957275390625, -2.77471923828125, -2.5537109375, -2.33270263671875, -2.1116943359375, -1.89068603515625, -1.669677734375, -1.44866943359375, -1.2276611328125, -1.00665283203125, -0.78564453125, -0.56463623046875, -0.3436279296875, -0.12261962890625, 0.098388671875, 0.31939697265625, 0.5404052734375, 0.76141357421875, 0.982421875, 1.20343017578125, 1.4244384765625, 1.64544677734375, 1.866455078125, 2.08746337890625, 2.3084716796875, 2.52947998046875, 2.75048828125, 2.97149658203125, 3.1925048828125, 3.41351318359375, 3.634521484375, 3.85552978515625, 4.0765380859375, 4.29754638671875, 4.5185546875, 4.73956298828125, 4.9605712890625, 5.18157958984375, 5.402587890625, 5.62359619140625, 5.8446044921875, 6.06561279296875, 6.28662109375, 6.50762939453125, 6.7286376953125, 6.94964599609375, 7.170654296875, 7.39166259765625, 7.6126708984375, 7.83367919921875, 8.0546875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 19.0, 15.0, 14.0, 20.0, 40.0, 42.0, 50.0, 54.0, 58.0, 38.0, 52.0, 55.0, 59.0, 56.0, 64.0, 69.0, 38.0, 38.0, 32.0, 35.0, 26.0, 21.0, 21.0, 12.0, 14.0, 10.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.97416687011719, -51.42745590209961, -49.88074493408203, -48.33403396606445, -46.787322998046875, -45.24061584472656, -43.69390106201172, -42.147193908691406, -40.60048294067383, -39.05377197265625, -37.50706100463867, -35.960350036621094, -34.413639068603516, -32.86692810058594, -31.320219039916992, -29.773509979248047, -28.226797103881836, -26.680086135864258, -25.13337516784668, -23.586666107177734, -22.039955139160156, -20.493244171142578, -18.946533203125, -17.399822235107422, -15.85311222076416, -14.306401252746582, -12.75969123840332, -11.212980270385742, -9.666269302368164, -8.119559288024902, -6.572848320007324, -5.0261383056640625, -3.4794273376464844, -1.932716727256775, -0.38600611686706543, 1.1607046127319336, 2.7074151039123535, 4.254125595092773, 5.800836563110352, 7.347546577453613, 8.894257545471191, 10.44096851348877, 11.987678527832031, 13.53438949584961, 15.081100463867188, 16.627811431884766, 18.174522399902344, 19.72123146057129, 21.267942428588867, 22.814653396606445, 24.361364364624023, 25.90807342529297, 27.454784393310547, 29.001495361328125, 30.548206329345703, 32.09491729736328, 33.64162826538086, 35.18833923339844, 36.735050201416016, 38.281761169433594, 39.82847213745117, 41.37518310546875, 42.92189025878906, 44.46860122680664, 46.01531219482422]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 8.0, 9.0, 14.0, 18.0, 19.0, 19.0, 36.0, 20.0, 24.0, 34.0, 40.0, 38.0, 43.0, 32.0, 41.0, 46.0, 43.0, 48.0, 35.0, 33.0, 58.0, 29.0, 29.0, 30.0, 45.0, 30.0, 21.0, 32.0, 22.0, 14.0, 10.0, 11.0, 7.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.671630859375, -38.380489349365234, -37.0893440246582, -35.79820251464844, -34.507057189941406, -33.21591567993164, -31.924774169921875, -30.633630752563477, -29.342487335205078, -28.05134391784668, -26.76020050048828, -25.469058990478516, -24.177915573120117, -22.88677215576172, -21.595630645751953, -20.304487228393555, -19.013343811035156, -17.722200393676758, -16.43105697631836, -15.139915466308594, -13.848772048950195, -12.557628631591797, -11.266486167907715, -9.975343704223633, -8.684200286865234, -7.393057346343994, -6.101914405822754, -4.810771465301514, -3.5196285247802734, -2.228485584259033, -0.937342643737793, 0.35379981994628906, 1.6449432373046875, 2.9360861778259277, 4.227229118347168, 5.518372058868408, 6.809514999389648, 8.100658416748047, 9.391800880432129, 10.682943344116211, 11.97408676147461, 13.265230178833008, 14.55637264251709, 15.847515106201172, 17.13865852355957, 18.42980194091797, 19.720943450927734, 21.012086868286133, 22.30323028564453, 23.59437370300293, 24.885517120361328, 26.176658630371094, 27.467802047729492, 28.75894546508789, 30.050086975097656, 31.341230392456055, 32.63237380981445, 33.92351531982422, 35.21466064453125, 36.505802154541016, 37.79694366455078, 39.08808898925781, 40.37923049926758, 41.670372009277344, 42.961517333984375]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 0.0, 8.0, 6.0, 14.0, 20.0, 34.0, 48.0, 74.0, 107.0, 149.0, 230.0, 319.0, 531.0, 753.0, 1080.0, 1700.0, 2606.0, 3996.0, 6274.0, 9928.0, 16452.0, 27497.0, 46182.0, 81533.0, 146895.0, 268107.0, 469185.0, 720660.0, 822909.0, 652902.0, 401128.0, 223087.0, 121946.0, 68014.0, 38915.0, 22700.0, 13830.0, 8545.0, 5571.0, 3493.0, 2350.0, 1469.0, 1006.0, 650.0, 461.0, 333.0, 184.0, 154.0, 102.0, 53.0, 36.0, 19.0, 13.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0], "bins": [-49.96875, -48.423828125, -46.87890625, -45.333984375, -43.7890625, -42.244140625, -40.69921875, -39.154296875, -37.609375, -36.064453125, -34.51953125, -32.974609375, -31.4296875, -29.884765625, -28.33984375, -26.794921875, -25.25, -23.705078125, -22.16015625, -20.615234375, -19.0703125, -17.525390625, -15.98046875, -14.435546875, -12.890625, -11.345703125, -9.80078125, -8.255859375, -6.7109375, -5.166015625, -3.62109375, -2.076171875, -0.53125, 1.013671875, 2.55859375, 4.103515625, 5.6484375, 7.193359375, 8.73828125, 10.283203125, 11.828125, 13.373046875, 14.91796875, 16.462890625, 18.0078125, 19.552734375, 21.09765625, 22.642578125, 24.1875, 25.732421875, 27.27734375, 28.822265625, 30.3671875, 31.912109375, 33.45703125, 35.001953125, 36.546875, 38.091796875, 39.63671875, 41.181640625, 42.7265625, 44.271484375, 45.81640625, 47.361328125, 48.90625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 11.0, 12.0, 12.0, 20.0, 20.0, 15.0, 18.0, 22.0, 28.0, 42.0, 30.0, 40.0, 32.0, 36.0, 37.0, 39.0, 38.0, 46.0, 34.0, 42.0, 42.0, 42.0, 30.0, 32.0, 26.0, 38.0, 28.0, 36.0, 16.0, 25.0, 14.0, 11.0, 17.0, 9.0, 5.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.828125, -30.668212890625, -29.50830078125, -28.348388671875, -27.1884765625, -26.028564453125, -24.86865234375, -23.708740234375, -22.548828125, -21.388916015625, -20.22900390625, -19.069091796875, -17.9091796875, -16.749267578125, -15.58935546875, -14.429443359375, -13.26953125, -12.109619140625, -10.94970703125, -9.789794921875, -8.6298828125, -7.469970703125, -6.31005859375, -5.150146484375, -3.990234375, -2.830322265625, -1.67041015625, -0.510498046875, 0.6494140625, 1.809326171875, 2.96923828125, 4.129150390625, 5.2890625, 6.448974609375, 7.60888671875, 8.768798828125, 9.9287109375, 11.088623046875, 12.24853515625, 13.408447265625, 14.568359375, 15.728271484375, 16.88818359375, 18.048095703125, 19.2080078125, 20.367919921875, 21.52783203125, 22.687744140625, 23.84765625, 25.007568359375, 26.16748046875, 27.327392578125, 28.4873046875, 29.647216796875, 30.80712890625, 31.967041015625, 33.126953125, 34.286865234375, 35.44677734375, 36.606689453125, 37.7666015625, 38.926513671875, 40.08642578125, 41.246337890625, 42.40625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 12.0, 16.0, 44.0, 35.0, 63.0, 96.0, 145.0, 194.0, 303.0, 450.0, 683.0, 1046.0, 1460.0, 2396.0, 3542.0, 5780.0, 9231.0, 15165.0, 25463.0, 43901.0, 78367.0, 143495.0, 264683.0, 471872.0, 739594.0, 845637.0, 654338.0, 394083.0, 217299.0, 117321.0, 64934.0, 36254.0, 21615.0, 12874.0, 8021.0, 4873.0, 3071.0, 2060.0, 1264.0, 884.0, 605.0, 387.0, 248.0, 179.0, 104.0, 56.0, 39.0, 38.0, 29.0, 15.0, 9.0, 5.0, 1.0, 6.0, 0.0, 0.0, 1.0], "bins": [-63.15625, -61.203125, -59.25, -57.296875, -55.34375, -53.390625, -51.4375, -49.484375, -47.53125, -45.578125, -43.625, -41.671875, -39.71875, -37.765625, -35.8125, -33.859375, -31.90625, -29.953125, -28.0, -26.046875, -24.09375, -22.140625, -20.1875, -18.234375, -16.28125, -14.328125, -12.375, -10.421875, -8.46875, -6.515625, -4.5625, -2.609375, -0.65625, 1.296875, 3.25, 5.203125, 7.15625, 9.109375, 11.0625, 13.015625, 14.96875, 16.921875, 18.875, 20.828125, 22.78125, 24.734375, 26.6875, 28.640625, 30.59375, 32.546875, 34.5, 36.453125, 38.40625, 40.359375, 42.3125, 44.265625, 46.21875, 48.171875, 50.125, 52.078125, 54.03125, 55.984375, 57.9375, 59.890625, 61.84375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 13.0, 14.0, 22.0, 20.0, 38.0, 45.0, 47.0, 45.0, 53.0, 94.0, 110.0, 129.0, 148.0, 150.0, 176.0, 195.0, 185.0, 226.0, 200.0, 208.0, 208.0, 218.0, 197.0, 178.0, 169.0, 144.0, 124.0, 119.0, 111.0, 111.0, 60.0, 47.0, 42.0, 35.0, 30.0, 32.0, 32.0, 17.0, 19.0, 9.0, 10.0, 8.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.46875, -18.857666015625, -18.24658203125, -17.635498046875, -17.0244140625, -16.413330078125, -15.80224609375, -15.191162109375, -14.580078125, -13.968994140625, -13.35791015625, -12.746826171875, -12.1357421875, -11.524658203125, -10.91357421875, -10.302490234375, -9.69140625, -9.080322265625, -8.46923828125, -7.858154296875, -7.2470703125, -6.635986328125, -6.02490234375, -5.413818359375, -4.802734375, -4.191650390625, -3.58056640625, -2.969482421875, -2.3583984375, -1.747314453125, -1.13623046875, -0.525146484375, 0.0859375, 0.697021484375, 1.30810546875, 1.919189453125, 2.5302734375, 3.141357421875, 3.75244140625, 4.363525390625, 4.974609375, 5.585693359375, 6.19677734375, 6.807861328125, 7.4189453125, 8.030029296875, 8.64111328125, 9.252197265625, 9.86328125, 10.474365234375, 11.08544921875, 11.696533203125, 12.3076171875, 12.918701171875, 13.52978515625, 14.140869140625, 14.751953125, 15.363037109375, 15.97412109375, 16.585205078125, 17.1962890625, 17.807373046875, 18.41845703125, 19.029541015625, 19.640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 8.0, 17.0, 13.0, 18.0, 17.0, 33.0, 43.0, 56.0, 53.0, 69.0, 85.0, 83.0, 85.0, 88.0, 65.0, 58.0, 44.0, 33.0, 25.0, 31.0, 22.0, 7.0, 13.0, 11.0, 3.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.51981353759766, -94.56147003173828, -91.6031265258789, -88.644775390625, -85.68643188476562, -82.72808837890625, -79.76974487304688, -76.8114013671875, -73.85305786132812, -70.89471435546875, -67.93637084960938, -64.97802734375, -62.019676208496094, -59.06133270263672, -56.102989196777344, -53.14464569091797, -50.18629455566406, -47.22795104980469, -44.26960372924805, -41.31126022338867, -38.35291290283203, -35.394569396972656, -32.43622589111328, -29.477880477905273, -26.519535064697266, -23.561189651489258, -20.60284423828125, -17.644500732421875, -14.686155319213867, -11.72780990600586, -8.769466400146484, -5.811120986938477, -2.8527679443359375, 0.10557699203491211, 3.0639219284057617, 6.022266387939453, 8.980611801147461, 11.938957214355469, 14.897300720214844, 17.85564613342285, 20.81399154663086, 23.772336959838867, 26.730682373046875, 29.68902587890625, 32.647369384765625, 35.605716705322266, 38.56406021118164, 41.52240753173828, 44.480751037597656, 47.43909454345703, 50.39744186401367, 53.35578536987305, 56.31413269042969, 59.27247619628906, 62.23081970214844, 65.18916320800781, 68.14750671386719, 71.10585021972656, 74.06419372558594, 77.02253723144531, 79.98088836669922, 82.9392318725586, 85.89757537841797, 88.85591888427734, 91.81427001953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 10.0, 4.0, 11.0, 6.0, 11.0, 11.0, 10.0, 14.0, 17.0, 13.0, 18.0, 23.0, 29.0, 21.0, 23.0, 23.0, 42.0, 27.0, 29.0, 31.0, 44.0, 32.0, 42.0, 38.0, 38.0, 30.0, 31.0, 26.0, 40.0, 31.0, 27.0, 30.0, 24.0, 21.0, 31.0, 16.0, 20.0, 16.0, 12.0, 12.0, 17.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-40.53941345214844, -39.245582580566406, -37.951751708984375, -36.657920837402344, -35.36408996582031, -34.07026290893555, -32.776432037353516, -31.482601165771484, -30.188770294189453, -28.894939422607422, -27.60110855102539, -26.307279586791992, -25.01344871520996, -23.71961784362793, -22.42578887939453, -21.1319580078125, -19.83812713623047, -18.544296264648438, -17.250465393066406, -15.956636428833008, -14.662805557250977, -13.368974685668945, -12.07514476776123, -10.781314849853516, -9.487483978271484, -8.193653106689453, -6.899823188781738, -5.605992794036865, -4.312162399291992, -3.018332004547119, -1.724501609802246, -0.43067169189453125, 0.8631553649902344, 2.1569857597351074, 3.4508161544799805, 4.7446465492248535, 6.038476943969727, 7.3323073387146, 8.626137733459473, 9.919967651367188, 11.213798522949219, 12.50762939453125, 13.801459312438965, 15.09528923034668, 16.38912010192871, 17.682950973510742, 18.97677993774414, 20.270610809326172, 21.564441680908203, 22.858272552490234, 24.152103424072266, 25.445932388305664, 26.739763259887695, 28.033594131469727, 29.327423095703125, 30.621253967285156, 31.915084838867188, 33.20891571044922, 34.50274658203125, 35.79657745361328, 37.09040832519531, 38.38423538208008, 39.67806625366211, 40.97189712524414, 42.26572799682617]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 11.0, 8.0, 15.0, 13.0, 20.0, 36.0, 57.0, 102.0, 125.0, 181.0, 297.0, 506.0, 662.0, 1099.0, 1706.0, 2487.0, 4000.0, 6228.0, 9919.0, 15032.0, 23844.0, 38063.0, 60035.0, 90514.0, 128363.0, 158068.0, 154238.0, 121040.0, 83026.0, 54070.0, 34386.0, 21792.0, 13651.0, 8933.0, 5620.0, 3670.0, 2349.0, 1485.0, 988.0, 618.0, 445.0, 242.0, 189.0, 153.0, 97.0, 59.0, 38.0, 37.0, 18.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-23.15625, -22.43017578125, -21.7041015625, -20.97802734375, -20.251953125, -19.52587890625, -18.7998046875, -18.07373046875, -17.34765625, -16.62158203125, -15.8955078125, -15.16943359375, -14.443359375, -13.71728515625, -12.9912109375, -12.26513671875, -11.5390625, -10.81298828125, -10.0869140625, -9.36083984375, -8.634765625, -7.90869140625, -7.1826171875, -6.45654296875, -5.73046875, -5.00439453125, -4.2783203125, -3.55224609375, -2.826171875, -2.10009765625, -1.3740234375, -0.64794921875, 0.078125, 0.80419921875, 1.5302734375, 2.25634765625, 2.982421875, 3.70849609375, 4.4345703125, 5.16064453125, 5.88671875, 6.61279296875, 7.3388671875, 8.06494140625, 8.791015625, 9.51708984375, 10.2431640625, 10.96923828125, 11.6953125, 12.42138671875, 13.1474609375, 13.87353515625, 14.599609375, 15.32568359375, 16.0517578125, 16.77783203125, 17.50390625, 18.22998046875, 18.9560546875, 19.68212890625, 20.408203125, 21.13427734375, 21.8603515625, 22.58642578125, 23.3125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 11.0, 13.0, 21.0, 19.0, 19.0, 25.0, 31.0, 26.0, 28.0, 32.0, 29.0, 49.0, 33.0, 37.0, 39.0, 50.0, 44.0, 41.0, 53.0, 43.0, 32.0, 34.0, 38.0, 28.0, 33.0, 18.0, 30.0, 22.0, 20.0, 14.0, 13.0, 4.0, 13.0, 12.0, 5.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.15625, -42.45556640625, -40.7548828125, -39.05419921875, -37.353515625, -35.65283203125, -33.9521484375, -32.25146484375, -30.55078125, -28.85009765625, -27.1494140625, -25.44873046875, -23.748046875, -22.04736328125, -20.3466796875, -18.64599609375, -16.9453125, -15.24462890625, -13.5439453125, -11.84326171875, -10.142578125, -8.44189453125, -6.7412109375, -5.04052734375, -3.33984375, -1.63916015625, 0.0615234375, 1.76220703125, 3.462890625, 5.16357421875, 6.8642578125, 8.56494140625, 10.265625, 11.96630859375, 13.6669921875, 15.36767578125, 17.068359375, 18.76904296875, 20.4697265625, 22.17041015625, 23.87109375, 25.57177734375, 27.2724609375, 28.97314453125, 30.673828125, 32.37451171875, 34.0751953125, 35.77587890625, 37.4765625, 39.17724609375, 40.8779296875, 42.57861328125, 44.279296875, 45.97998046875, 47.6806640625, 49.38134765625, 51.08203125, 52.78271484375, 54.4833984375, 56.18408203125, 57.884765625, 59.58544921875, 61.2861328125, 62.98681640625, 64.6875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 9.0, 13.0, 25.0, 39.0, 44.0, 62.0, 95.0, 140.0, 213.0, 316.0, 525.0, 791.0, 1137.0, 1833.0, 3110.0, 5152.0, 8703.0, 14567.0, 25149.0, 43391.0, 75283.0, 128126.0, 190683.0, 199891.0, 143617.0, 86605.0, 49394.0, 28484.0, 16455.0, 9662.0, 5662.0, 3376.0, 2170.0, 1313.0, 887.0, 533.0, 344.0, 241.0, 167.0, 98.0, 74.0, 48.0, 31.0, 24.0, 18.0, 12.0, 5.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-30.703125, -29.716552734375, -28.72998046875, -27.743408203125, -26.7568359375, -25.770263671875, -24.78369140625, -23.797119140625, -22.810546875, -21.823974609375, -20.83740234375, -19.850830078125, -18.8642578125, -17.877685546875, -16.89111328125, -15.904541015625, -14.91796875, -13.931396484375, -12.94482421875, -11.958251953125, -10.9716796875, -9.985107421875, -8.99853515625, -8.011962890625, -7.025390625, -6.038818359375, -5.05224609375, -4.065673828125, -3.0791015625, -2.092529296875, -1.10595703125, -0.119384765625, 0.8671875, 1.853759765625, 2.84033203125, 3.826904296875, 4.8134765625, 5.800048828125, 6.78662109375, 7.773193359375, 8.759765625, 9.746337890625, 10.73291015625, 11.719482421875, 12.7060546875, 13.692626953125, 14.67919921875, 15.665771484375, 16.65234375, 17.638916015625, 18.62548828125, 19.612060546875, 20.5986328125, 21.585205078125, 22.57177734375, 23.558349609375, 24.544921875, 25.531494140625, 26.51806640625, 27.504638671875, 28.4912109375, 29.477783203125, 30.46435546875, 31.450927734375, 32.4375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 13.0, 12.0, 17.0, 12.0, 15.0, 15.0, 26.0, 21.0, 33.0, 31.0, 41.0, 28.0, 43.0, 41.0, 48.0, 48.0, 44.0, 44.0, 47.0, 36.0, 42.0, 44.0, 29.0, 24.0, 32.0, 29.0, 36.0, 27.0, 26.0, 10.0, 18.0, 15.0, 10.0, 8.0, 6.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.875, -32.78955078125, -31.7041015625, -30.61865234375, -29.533203125, -28.44775390625, -27.3623046875, -26.27685546875, -25.19140625, -24.10595703125, -23.0205078125, -21.93505859375, -20.849609375, -19.76416015625, -18.6787109375, -17.59326171875, -16.5078125, -15.42236328125, -14.3369140625, -13.25146484375, -12.166015625, -11.08056640625, -9.9951171875, -8.90966796875, -7.82421875, -6.73876953125, -5.6533203125, -4.56787109375, -3.482421875, -2.39697265625, -1.3115234375, -0.22607421875, 0.859375, 1.94482421875, 3.0302734375, 4.11572265625, 5.201171875, 6.28662109375, 7.3720703125, 8.45751953125, 9.54296875, 10.62841796875, 11.7138671875, 12.79931640625, 13.884765625, 14.97021484375, 16.0556640625, 17.14111328125, 18.2265625, 19.31201171875, 20.3974609375, 21.48291015625, 22.568359375, 23.65380859375, 24.7392578125, 25.82470703125, 26.91015625, 27.99560546875, 29.0810546875, 30.16650390625, 31.251953125, 32.33740234375, 33.4228515625, 34.50830078125, 35.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 19.0, 27.0, 37.0, 54.0, 93.0, 125.0, 198.0, 301.0, 446.0, 636.0, 934.0, 1472.0, 2182.0, 3644.0, 5605.0, 8975.0, 14483.0, 23600.0, 39109.0, 63970.0, 104936.0, 158950.0, 191547.0, 158177.0, 104125.0, 63822.0, 38399.0, 23383.0, 14341.0, 8945.0, 5696.0, 3557.0, 2291.0, 1477.0, 1014.0, 645.0, 437.0, 282.0, 186.0, 136.0, 83.0, 60.0, 48.0, 32.0, 14.0, 12.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-8.78125, -8.50244140625, -8.2236328125, -7.94482421875, -7.666015625, -7.38720703125, -7.1083984375, -6.82958984375, -6.55078125, -6.27197265625, -5.9931640625, -5.71435546875, -5.435546875, -5.15673828125, -4.8779296875, -4.59912109375, -4.3203125, -4.04150390625, -3.7626953125, -3.48388671875, -3.205078125, -2.92626953125, -2.6474609375, -2.36865234375, -2.08984375, -1.81103515625, -1.5322265625, -1.25341796875, -0.974609375, -0.69580078125, -0.4169921875, -0.13818359375, 0.140625, 0.41943359375, 0.6982421875, 0.97705078125, 1.255859375, 1.53466796875, 1.8134765625, 2.09228515625, 2.37109375, 2.64990234375, 2.9287109375, 3.20751953125, 3.486328125, 3.76513671875, 4.0439453125, 4.32275390625, 4.6015625, 4.88037109375, 5.1591796875, 5.43798828125, 5.716796875, 5.99560546875, 6.2744140625, 6.55322265625, 6.83203125, 7.11083984375, 7.3896484375, 7.66845703125, 7.947265625, 8.22607421875, 8.5048828125, 8.78369140625, 9.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 10.0, 8.0, 6.0, 7.0, 10.0, 19.0, 32.0, 44.0, 30.0, 57.0, 42.0, 63.0, 81.0, 98.0, 69.0, 82.0, 76.0, 57.0, 40.0, 43.0, 26.0, 26.0, 16.0, 16.0, 9.0, 11.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012483596801757812, -0.0012136027216911316, -0.001178845763206482, -0.0011440888047218323, -0.0011093318462371826, -0.001074574887752533, -0.0010398179292678833, -0.0010050609707832336, -0.000970304012298584, -0.0009355470538139343, -0.0009007900953292847, -0.000866033136844635, -0.0008312761783599854, -0.0007965192198753357, -0.000761762261390686, -0.0007270053029060364, -0.0006922483444213867, -0.0006574913859367371, -0.0006227344274520874, -0.0005879774689674377, -0.0005532205104827881, -0.0005184635519981384, -0.00048370659351348877, -0.0004489496350288391, -0.00041419267654418945, -0.0003794357180595398, -0.00034467875957489014, -0.0003099218010902405, -0.0002751648426055908, -0.00024040788412094116, -0.0002056509256362915, -0.00017089396715164185, -0.0001361370086669922, -0.00010138005018234253, -6.662309169769287e-05, -3.186613321304321e-05, 2.8908252716064453e-06, 3.7647783756256104e-05, 7.240474224090576e-05, 0.00010716170072555542, 0.00014191865921020508, 0.00017667561769485474, 0.0002114325761795044, 0.00024618953466415405, 0.0002809464931488037, 0.00031570345163345337, 0.00035046041011810303, 0.0003852173686027527, 0.00041997432708740234, 0.000454731285572052, 0.0004894882440567017, 0.0005242452025413513, 0.000559002161026001, 0.0005937591195106506, 0.0006285160779953003, 0.00066327303647995, 0.0006980299949645996, 0.0007327869534492493, 0.0007675439119338989, 0.0008023008704185486, 0.0008370578289031982, 0.0008718147873878479, 0.0009065717458724976, 0.0009413287043571472, 0.0009760856628417969]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 13.0, 17.0, 20.0, 35.0, 71.0, 107.0, 166.0, 227.0, 333.0, 545.0, 813.0, 1375.0, 2061.0, 3314.0, 5441.0, 9064.0, 15507.0, 26782.0, 46910.0, 82158.0, 142163.0, 208682.0, 199166.0, 129089.0, 73300.0, 41726.0, 24062.0, 13899.0, 8214.0, 5050.0, 3006.0, 1896.0, 1217.0, 749.0, 443.0, 318.0, 204.0, 126.0, 102.0, 54.0, 35.0, 30.0, 22.0, 15.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.381591796875, -10.95849609375, -10.535400390625, -10.1123046875, -9.689208984375, -9.26611328125, -8.843017578125, -8.419921875, -7.996826171875, -7.57373046875, -7.150634765625, -6.7275390625, -6.304443359375, -5.88134765625, -5.458251953125, -5.03515625, -4.612060546875, -4.18896484375, -3.765869140625, -3.3427734375, -2.919677734375, -2.49658203125, -2.073486328125, -1.650390625, -1.227294921875, -0.80419921875, -0.381103515625, 0.0419921875, 0.465087890625, 0.88818359375, 1.311279296875, 1.734375, 2.157470703125, 2.58056640625, 3.003662109375, 3.4267578125, 3.849853515625, 4.27294921875, 4.696044921875, 5.119140625, 5.542236328125, 5.96533203125, 6.388427734375, 6.8115234375, 7.234619140625, 7.65771484375, 8.080810546875, 8.50390625, 8.927001953125, 9.35009765625, 9.773193359375, 10.1962890625, 10.619384765625, 11.04248046875, 11.465576171875, 11.888671875, 12.311767578125, 12.73486328125, 13.157958984375, 13.5810546875, 14.004150390625, 14.42724609375, 14.850341796875, 15.2734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 17.0, 22.0, 18.0, 24.0, 26.0, 38.0, 44.0, 40.0, 48.0, 57.0, 63.0, 61.0, 60.0, 60.0, 56.0, 60.0, 43.0, 31.0, 29.0, 26.0, 14.0, 24.0, 25.0, 25.0, 10.0, 11.0, 7.0, 2.0, 2.0, 7.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.92657470703125, -3.7750244140625, -3.62347412109375, -3.471923828125, -3.32037353515625, -3.1688232421875, -3.01727294921875, -2.86572265625, -2.71417236328125, -2.5626220703125, -2.41107177734375, -2.259521484375, -2.10797119140625, -1.9564208984375, -1.80487060546875, -1.6533203125, -1.50177001953125, -1.3502197265625, -1.19866943359375, -1.047119140625, -0.89556884765625, -0.7440185546875, -0.59246826171875, -0.44091796875, -0.28936767578125, -0.1378173828125, 0.01373291015625, 0.165283203125, 0.31683349609375, 0.4683837890625, 0.61993408203125, 0.771484375, 0.92303466796875, 1.0745849609375, 1.22613525390625, 1.377685546875, 1.52923583984375, 1.6807861328125, 1.83233642578125, 1.98388671875, 2.13543701171875, 2.2869873046875, 2.43853759765625, 2.590087890625, 2.74163818359375, 2.8931884765625, 3.04473876953125, 3.1962890625, 3.34783935546875, 3.4993896484375, 3.65093994140625, 3.802490234375, 3.95404052734375, 4.1055908203125, 4.25714111328125, 4.40869140625, 4.56024169921875, 4.7117919921875, 4.86334228515625, 5.014892578125, 5.16644287109375, 5.3179931640625, 5.46954345703125, 5.62109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 5.0, 16.0, 17.0, 18.0, 20.0, 36.0, 50.0, 54.0, 66.0, 76.0, 76.0, 92.0, 92.0, 78.0, 53.0, 58.0, 34.0, 28.0, 33.0, 27.0, 10.0, 14.0, 10.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.11541748046875, -97.12666320800781, -94.13790893554688, -91.1491470336914, -88.16039276123047, -85.17163848876953, -82.18287658691406, -79.19412231445312, -76.20536804199219, -73.21661376953125, -70.22785949707031, -67.23909759521484, -64.2503433227539, -61.26158905029297, -58.272830963134766, -55.28407287597656, -52.295318603515625, -49.30656433105469, -46.317806243896484, -43.32904815673828, -40.340293884277344, -37.351539611816406, -34.3627815246582, -31.374025344848633, -28.385269165039062, -25.396512985229492, -22.407756805419922, -19.41900062561035, -16.43024444580078, -13.441488265991211, -10.45273208618164, -7.46397590637207, -4.475227355957031, -1.486471176147461, 1.5022850036621094, 4.49104118347168, 7.47979736328125, 10.46855354309082, 13.45730972290039, 16.44606590270996, 19.43482208251953, 22.4235782623291, 25.412334442138672, 28.401090621948242, 31.389846801757812, 34.37860107421875, 37.36735916137695, 40.356117248535156, 43.344871520996094, 46.33362579345703, 49.322383880615234, 52.31114196777344, 55.299896240234375, 58.28865051269531, 61.277408599853516, 64.26616668701172, 67.25492095947266, 70.2436752319336, 73.23243713378906, 76.22119140625, 79.20994567871094, 82.19869995117188, 85.18745422363281, 88.17621612548828, 91.16497039794922]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 10.0, 8.0, 10.0, 11.0, 10.0, 14.0, 13.0, 20.0, 18.0, 21.0, 27.0, 31.0, 22.0, 22.0, 31.0, 33.0, 30.0, 31.0, 29.0, 48.0, 41.0, 37.0, 35.0, 34.0, 38.0, 34.0, 29.0, 33.0, 26.0, 20.0, 23.0, 28.0, 18.0, 24.0, 20.0, 14.0, 16.0, 15.0, 10.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-38.84930419921875, -37.54950714111328, -36.24971389770508, -34.94991683959961, -33.650123596191406, -32.35032653808594, -31.050533294677734, -29.750736236572266, -28.450942993164062, -27.151147842407227, -25.85135269165039, -24.551557540893555, -23.25176239013672, -21.951967239379883, -20.652172088623047, -19.352375030517578, -18.052579879760742, -16.752784729003906, -15.45298957824707, -14.153194427490234, -12.853399276733398, -11.553604125976562, -10.25380802154541, -8.954012870788574, -7.654217720031738, -6.354422569274902, -5.054627418518066, -3.7548317909240723, -2.4550366401672363, -1.1552414894104004, 0.14455413818359375, 1.4443492889404297, 2.7441444396972656, 4.043939590454102, 5.3437347412109375, 6.643530368804932, 7.943325519561768, 9.243120193481445, 10.542916297912598, 11.842711448669434, 13.14250659942627, 14.442301750183105, 15.742096900939941, 17.041893005371094, 18.34168815612793, 19.641483306884766, 20.9412784576416, 22.241073608398438, 23.540868759155273, 24.84066390991211, 26.140459060668945, 27.44025421142578, 28.740049362182617, 30.039844512939453, 31.339641571044922, 32.639434814453125, 33.939231872558594, 35.23902893066406, 36.538822174072266, 37.838619232177734, 39.13841247558594, 40.438209533691406, 41.73800277709961, 43.03779983520508, 44.33759307861328]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 1.0, 9.0, 13.0, 16.0, 11.0, 27.0, 28.0, 51.0, 70.0, 87.0, 144.0, 254.0, 386.0, 550.0, 875.0, 1523.0, 2426.0, 4042.0, 7000.0, 11859.0, 20724.0, 36180.0, 62275.0, 101615.0, 146099.0, 174355.0, 163199.0, 122250.0, 79526.0, 47484.0, 27548.0, 15570.0, 9018.0, 5272.0, 3043.0, 1844.0, 1137.0, 704.0, 448.0, 311.0, 219.0, 145.0, 74.0, 48.0, 34.0, 21.0, 15.0, 9.0, 8.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-61.46875, -59.64697265625, -57.8251953125, -56.00341796875, -54.181640625, -52.35986328125, -50.5380859375, -48.71630859375, -46.89453125, -45.07275390625, -43.2509765625, -41.42919921875, -39.607421875, -37.78564453125, -35.9638671875, -34.14208984375, -32.3203125, -30.49853515625, -28.6767578125, -26.85498046875, -25.033203125, -23.21142578125, -21.3896484375, -19.56787109375, -17.74609375, -15.92431640625, -14.1025390625, -12.28076171875, -10.458984375, -8.63720703125, -6.8154296875, -4.99365234375, -3.171875, -1.35009765625, 0.4716796875, 2.29345703125, 4.115234375, 5.93701171875, 7.7587890625, 9.58056640625, 11.40234375, 13.22412109375, 15.0458984375, 16.86767578125, 18.689453125, 20.51123046875, 22.3330078125, 24.15478515625, 25.9765625, 27.79833984375, 29.6201171875, 31.44189453125, 33.263671875, 35.08544921875, 36.9072265625, 38.72900390625, 40.55078125, 42.37255859375, 44.1943359375, 46.01611328125, 47.837890625, 49.65966796875, 51.4814453125, 53.30322265625, 55.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 7.0, 8.0, 12.0, 13.0, 11.0, 15.0, 10.0, 14.0, 20.0, 23.0, 22.0, 32.0, 21.0, 38.0, 25.0, 25.0, 34.0, 36.0, 37.0, 29.0, 40.0, 39.0, 52.0, 36.0, 40.0, 43.0, 27.0, 30.0, 34.0, 24.0, 19.0, 28.0, 25.0, 25.0, 14.0, 18.0, 15.0, 12.0, 9.0, 9.0, 1.0, 3.0, 7.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.5625, -41.16552734375, -39.7685546875, -38.37158203125, -36.974609375, -35.57763671875, -34.1806640625, -32.78369140625, -31.38671875, -29.98974609375, -28.5927734375, -27.19580078125, -25.798828125, -24.40185546875, -23.0048828125, -21.60791015625, -20.2109375, -18.81396484375, -17.4169921875, -16.02001953125, -14.623046875, -13.22607421875, -11.8291015625, -10.43212890625, -9.03515625, -7.63818359375, -6.2412109375, -4.84423828125, -3.447265625, -2.05029296875, -0.6533203125, 0.74365234375, 2.140625, 3.53759765625, 4.9345703125, 6.33154296875, 7.728515625, 9.12548828125, 10.5224609375, 11.91943359375, 13.31640625, 14.71337890625, 16.1103515625, 17.50732421875, 18.904296875, 20.30126953125, 21.6982421875, 23.09521484375, 24.4921875, 25.88916015625, 27.2861328125, 28.68310546875, 30.080078125, 31.47705078125, 32.8740234375, 34.27099609375, 35.66796875, 37.06494140625, 38.4619140625, 39.85888671875, 41.255859375, 42.65283203125, 44.0498046875, 45.44677734375, 46.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 11.0, 14.0, 19.0, 20.0, 26.0, 36.0, 35.0, 58.0, 85.0, 135.0, 151.0, 212.0, 358.0, 553.0, 1035.0, 1752.0, 3632.0, 7836.0, 19177.0, 49595.0, 128129.0, 265434.0, 295772.0, 163987.0, 65408.0, 25157.0, 10024.0, 4603.0, 2195.0, 1169.0, 655.0, 403.0, 246.0, 181.0, 109.0, 80.0, 63.0, 50.0, 39.0, 21.0, 21.0, 9.0, 11.0, 7.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-124.875, -120.865234375, -116.85546875, -112.845703125, -108.8359375, -104.826171875, -100.81640625, -96.806640625, -92.796875, -88.787109375, -84.77734375, -80.767578125, -76.7578125, -72.748046875, -68.73828125, -64.728515625, -60.71875, -56.708984375, -52.69921875, -48.689453125, -44.6796875, -40.669921875, -36.66015625, -32.650390625, -28.640625, -24.630859375, -20.62109375, -16.611328125, -12.6015625, -8.591796875, -4.58203125, -0.572265625, 3.4375, 7.447265625, 11.45703125, 15.466796875, 19.4765625, 23.486328125, 27.49609375, 31.505859375, 35.515625, 39.525390625, 43.53515625, 47.544921875, 51.5546875, 55.564453125, 59.57421875, 63.583984375, 67.59375, 71.603515625, 75.61328125, 79.623046875, 83.6328125, 87.642578125, 91.65234375, 95.662109375, 99.671875, 103.681640625, 107.69140625, 111.701171875, 115.7109375, 119.720703125, 123.73046875, 127.740234375, 131.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 12.0, 12.0, 13.0, 9.0, 10.0, 11.0, 16.0, 20.0, 17.0, 22.0, 30.0, 35.0, 29.0, 34.0, 44.0, 32.0, 41.0, 38.0, 37.0, 48.0, 30.0, 45.0, 39.0, 38.0, 38.0, 47.0, 39.0, 36.0, 25.0, 23.0, 14.0, 29.0, 12.0, 7.0, 14.0, 12.0, 10.0, 2.0, 6.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.859375, -30.812744140625, -29.76611328125, -28.719482421875, -27.6728515625, -26.626220703125, -25.57958984375, -24.532958984375, -23.486328125, -22.439697265625, -21.39306640625, -20.346435546875, -19.2998046875, -18.253173828125, -17.20654296875, -16.159912109375, -15.11328125, -14.066650390625, -13.02001953125, -11.973388671875, -10.9267578125, -9.880126953125, -8.83349609375, -7.786865234375, -6.740234375, -5.693603515625, -4.64697265625, -3.600341796875, -2.5537109375, -1.507080078125, -0.46044921875, 0.586181640625, 1.6328125, 2.679443359375, 3.72607421875, 4.772705078125, 5.8193359375, 6.865966796875, 7.91259765625, 8.959228515625, 10.005859375, 11.052490234375, 12.09912109375, 13.145751953125, 14.1923828125, 15.239013671875, 16.28564453125, 17.332275390625, 18.37890625, 19.425537109375, 20.47216796875, 21.518798828125, 22.5654296875, 23.612060546875, 24.65869140625, 25.705322265625, 26.751953125, 27.798583984375, 28.84521484375, 29.891845703125, 30.9384765625, 31.985107421875, 33.03173828125, 34.078369140625, 35.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 15.0, 12.0, 31.0, 27.0, 49.0, 55.0, 92.0, 123.0, 197.0, 251.0, 424.0, 649.0, 1056.0, 1655.0, 2674.0, 4333.0, 7024.0, 11948.0, 20372.0, 35896.0, 64035.0, 108222.0, 165380.0, 195544.0, 165541.0, 109967.0, 64609.0, 36510.0, 20760.0, 12074.0, 7236.0, 4381.0, 2578.0, 1718.0, 1084.0, 695.0, 478.0, 267.0, 189.0, 122.0, 85.0, 58.0, 37.0, 22.0, 24.0, 12.0, 8.0, 11.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.576171875, -31.43359375, -30.291015625, -29.1484375, -28.005859375, -26.86328125, -25.720703125, -24.578125, -23.435546875, -22.29296875, -21.150390625, -20.0078125, -18.865234375, -17.72265625, -16.580078125, -15.4375, -14.294921875, -13.15234375, -12.009765625, -10.8671875, -9.724609375, -8.58203125, -7.439453125, -6.296875, -5.154296875, -4.01171875, -2.869140625, -1.7265625, -0.583984375, 0.55859375, 1.701171875, 2.84375, 3.986328125, 5.12890625, 6.271484375, 7.4140625, 8.556640625, 9.69921875, 10.841796875, 11.984375, 13.126953125, 14.26953125, 15.412109375, 16.5546875, 17.697265625, 18.83984375, 19.982421875, 21.125, 22.267578125, 23.41015625, 24.552734375, 25.6953125, 26.837890625, 27.98046875, 29.123046875, 30.265625, 31.408203125, 32.55078125, 33.693359375, 34.8359375, 35.978515625, 37.12109375, 38.263671875, 39.40625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 10.0, 19.0, 24.0, 32.0, 42.0, 58.0, 90.0, 105.0, 113.0, 122.0, 93.0, 62.0, 68.0, 41.0, 33.0, 19.0, 13.0, 10.0, 8.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004047393798828125, -0.003861725330352783, -0.0036760568618774414, -0.0034903883934020996, -0.003304719924926758, -0.003119051456451416, -0.0029333829879760742, -0.0027477145195007324, -0.0025620460510253906, -0.002376377582550049, -0.002190709114074707, -0.0020050406455993652, -0.0018193721771240234, -0.0016337037086486816, -0.0014480352401733398, -0.001262366771697998, -0.0010766983032226562, -0.0008910298347473145, -0.0007053613662719727, -0.0005196928977966309, -0.00033402442932128906, -0.00014835596084594727, 3.731250762939453e-05, 0.00022298097610473633, 0.0004086494445800781, 0.0005943179130554199, 0.0007799863815307617, 0.0009656548500061035, 0.0011513233184814453, 0.0013369917869567871, 0.001522660255432129, 0.0017083287239074707, 0.0018939971923828125, 0.0020796656608581543, 0.002265334129333496, 0.002451002597808838, 0.0026366710662841797, 0.0028223395347595215, 0.0030080080032348633, 0.003193676471710205, 0.003379344940185547, 0.0035650134086608887, 0.0037506818771362305, 0.003936350345611572, 0.004122018814086914, 0.004307687282562256, 0.004493355751037598, 0.0046790242195129395, 0.004864692687988281, 0.005050361156463623, 0.005236029624938965, 0.005421698093414307, 0.0056073665618896484, 0.00579303503036499, 0.005978703498840332, 0.006164371967315674, 0.006350040435791016, 0.006535708904266357, 0.006721377372741699, 0.006907045841217041, 0.007092714309692383, 0.007278382778167725, 0.007464051246643066, 0.007649719715118408, 0.00783538818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 16.0, 16.0, 20.0, 39.0, 58.0, 60.0, 115.0, 148.0, 246.0, 379.0, 578.0, 925.0, 1427.0, 2145.0, 3564.0, 5609.0, 8796.0, 14250.0, 23277.0, 39551.0, 65415.0, 107063.0, 159320.0, 186933.0, 158346.0, 105937.0, 63938.0, 38792.0, 23280.0, 14159.0, 8843.0, 5523.0, 3604.0, 2212.0, 1401.0, 873.0, 608.0, 371.0, 242.0, 165.0, 100.0, 65.0, 47.0, 27.0, 18.0, 22.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.5625, -33.46484375, -32.3671875, -31.26953125, -30.171875, -29.07421875, -27.9765625, -26.87890625, -25.78125, -24.68359375, -23.5859375, -22.48828125, -21.390625, -20.29296875, -19.1953125, -18.09765625, -17.0, -15.90234375, -14.8046875, -13.70703125, -12.609375, -11.51171875, -10.4140625, -9.31640625, -8.21875, -7.12109375, -6.0234375, -4.92578125, -3.828125, -2.73046875, -1.6328125, -0.53515625, 0.5625, 1.66015625, 2.7578125, 3.85546875, 4.953125, 6.05078125, 7.1484375, 8.24609375, 9.34375, 10.44140625, 11.5390625, 12.63671875, 13.734375, 14.83203125, 15.9296875, 17.02734375, 18.125, 19.22265625, 20.3203125, 21.41796875, 22.515625, 23.61328125, 24.7109375, 25.80859375, 26.90625, 28.00390625, 29.1015625, 30.19921875, 31.296875, 32.39453125, 33.4921875, 34.58984375, 35.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 9.0, 14.0, 12.0, 17.0, 15.0, 10.0, 22.0, 28.0, 30.0, 35.0, 36.0, 36.0, 37.0, 38.0, 51.0, 58.0, 44.0, 43.0, 47.0, 55.0, 43.0, 43.0, 28.0, 31.0, 26.0, 27.0, 31.0, 18.0, 18.0, 11.0, 16.0, 10.0, 14.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.8046875, -9.4984130859375, -9.192138671875, -8.8858642578125, -8.57958984375, -8.2733154296875, -7.967041015625, -7.6607666015625, -7.3544921875, -7.0482177734375, -6.741943359375, -6.4356689453125, -6.12939453125, -5.8231201171875, -5.516845703125, -5.2105712890625, -4.904296875, -4.5980224609375, -4.291748046875, -3.9854736328125, -3.67919921875, -3.3729248046875, -3.066650390625, -2.7603759765625, -2.4541015625, -2.1478271484375, -1.841552734375, -1.5352783203125, -1.22900390625, -0.9227294921875, -0.616455078125, -0.3101806640625, -0.00390625, 0.3023681640625, 0.608642578125, 0.9149169921875, 1.22119140625, 1.5274658203125, 1.833740234375, 2.1400146484375, 2.4462890625, 2.7525634765625, 3.058837890625, 3.3651123046875, 3.67138671875, 3.9776611328125, 4.283935546875, 4.5902099609375, 4.896484375, 5.2027587890625, 5.509033203125, 5.8153076171875, 6.12158203125, 6.4278564453125, 6.734130859375, 7.0404052734375, 7.3466796875, 7.6529541015625, 7.959228515625, 8.2655029296875, 8.57177734375, 8.8780517578125, 9.184326171875, 9.4906005859375, 9.796875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 16.0, 15.0, 17.0, 24.0, 34.0, 55.0, 39.0, 46.0, 69.0, 62.0, 86.0, 73.0, 70.0, 76.0, 58.0, 53.0, 33.0, 37.0, 26.0, 21.0, 21.0, 13.0, 12.0, 12.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.44152069091797, -102.274658203125, -99.10779571533203, -95.94093322753906, -92.77406311035156, -89.6072006225586, -86.44033813476562, -83.27347564697266, -80.10661315917969, -76.93975067138672, -73.77288818359375, -70.60601806640625, -67.43915557861328, -64.27229309082031, -61.105430603027344, -57.938568115234375, -54.771697998046875, -51.604835510253906, -48.43796920776367, -45.2711067199707, -42.10424041748047, -38.9373779296875, -35.77051544189453, -32.60365295410156, -29.436786651611328, -26.269922256469727, -23.103057861328125, -19.936195373535156, -16.769330978393555, -13.602466583251953, -10.435604095458984, -7.268739700317383, -4.1018829345703125, -0.9350190162658691, 2.231844902038574, 5.398708343505859, 8.565572738647461, 11.732437133789062, 14.899299621582031, 18.066164016723633, 21.233028411865234, 24.399892807006836, 27.566757202148438, 30.733619689941406, 33.900482177734375, 37.06734848022461, 40.23421096801758, 43.40107727050781, 46.56793975830078, 49.73480224609375, 52.901668548583984, 56.06853103637695, 59.23539733886719, 62.402259826660156, 65.56912231445312, 68.7359848022461, 71.90284729003906, 75.06970977783203, 78.236572265625, 81.4034423828125, 84.57030487060547, 87.73716735839844, 90.9040298461914, 94.07089233398438, 97.23776245117188]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 7.0, 12.0, 9.0, 10.0, 20.0, 20.0, 12.0, 19.0, 23.0, 21.0, 32.0, 25.0, 21.0, 31.0, 30.0, 29.0, 32.0, 44.0, 45.0, 45.0, 34.0, 41.0, 29.0, 43.0, 36.0, 36.0, 30.0, 26.0, 22.0, 27.0, 26.0, 17.0, 20.0, 17.0, 14.0, 8.0, 11.0, 9.0, 10.0, 12.0, 8.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.89430236816406, -50.25565719604492, -48.61701583862305, -46.978370666503906, -45.339725494384766, -43.701080322265625, -42.06243896484375, -40.42379379272461, -38.78514862060547, -37.14650344848633, -35.50786209106445, -33.86921691894531, -32.23057174682617, -30.591928482055664, -28.953285217285156, -27.314640045166016, -25.675996780395508, -24.037353515625, -22.39870834350586, -20.76006507873535, -19.12141990661621, -17.482776641845703, -15.844132423400879, -14.205488204956055, -12.56684398651123, -10.928199768066406, -9.289555549621582, -7.650911808013916, -6.012267589569092, -4.373623847961426, -2.7349796295166016, -1.0963354110717773, 0.5423088073730469, 2.180953025817871, 3.819597005844116, 5.458240985870361, 7.0968852043151855, 8.735528945922852, 10.374173164367676, 12.0128173828125, 13.651461601257324, 15.290105819702148, 16.928749084472656, 18.567394256591797, 20.206037521362305, 21.844680786132812, 23.483325958251953, 25.121971130371094, 26.7606143951416, 28.39925765991211, 30.03790283203125, 31.676546096801758, 33.315189361572266, 34.953834533691406, 36.59247970581055, 38.23112487792969, 39.86976623535156, 41.5084114074707, 43.14705276489258, 44.78569793701172, 46.42434310913086, 48.06298828125, 49.701629638671875, 51.340274810791016, 52.978919982910156]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 6.0, 6.0, 7.0, 4.0, 12.0, 10.0, 12.0, 17.0, 18.0, 26.0, 27.0, 30.0, 52.0, 43.0, 74.0, 73.0, 104.0, 130.0, 204.0, 280.0, 387.0, 661.0, 1000.0, 1715.0, 1039945.0, 1977.0, 1232.0, 757.0, 510.0, 330.0, 210.0, 146.0, 136.0, 82.0, 68.0, 70.0, 54.0, 39.0, 27.0, 21.0, 20.0, 13.0, 17.0, 17.0, 11.0, 8.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1530.567626953125, -1483.7633056640625, -1436.958984375, -1390.1546630859375, -1343.350341796875, -1296.546142578125, -1249.7418212890625, -1202.9375, -1156.1331787109375, -1109.328857421875, -1062.5245361328125, -1015.7202758789062, -968.9159545898438, -922.1116333007812, -875.307373046875, -828.5030517578125, -781.69873046875, -734.8944091796875, -688.090087890625, -641.2858276367188, -594.4815063476562, -547.6771850585938, -500.8728942871094, -454.068603515625, -407.2642822265625, -360.4599609375, -313.6556701660156, -266.85137939453125, -220.04705810546875, -173.2427520751953, -126.43844604492188, -79.6341552734375, -32.8299560546875, 13.974349975585938, 60.778656005859375, 107.58296203613281, 154.38726806640625, 201.1915740966797, 247.99588012695312, 294.8001708984375, 341.6044921875, 388.4088134765625, 435.2131042480469, 482.01739501953125, 528.8217163085938, 575.6260375976562, 622.4302978515625, 669.234619140625, 716.0389404296875, 762.84326171875, 809.6475830078125, 856.4518432617188, 903.2561645507812, 950.0604858398438, 996.86474609375, 1043.6690673828125, 1090.473388671875, 1137.2777099609375, 1184.08203125, 1230.8863525390625, 1277.690673828125, 1324.494873046875, 1371.2991943359375, 1418.103515625, 1464.9078369140625]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 5.0, 15.0, 8.0, 12.0, 10.0, 18.0, 23.0, 28.0, 28.0, 40.0, 54.0, 73.0, 118.0, 126.0, 184.0, 297.0, 437.0, 916.0, 1993.0, 4100.0, 8268.0, 51412228.0, 28069.0, 7004.0, 3467.0, 1603.0, 772.0, 422.0, 279.0, 172.0, 134.0, 98.0, 70.0, 53.0, 27.0, 33.0, 26.0, 15.0, 22.0, 11.0, 16.0, 9.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-1515.934814453125, -1472.479736328125, -1429.024658203125, -1385.569580078125, -1342.114501953125, -1298.659423828125, -1255.204345703125, -1211.7491455078125, -1168.2940673828125, -1124.8389892578125, -1081.3839111328125, -1037.9288330078125, -994.4736938476562, -951.0186157226562, -907.5635375976562, -864.1083984375, -820.6533813476562, -777.1983032226562, -733.7432250976562, -690.2880859375, -646.8330078125, -603.3779296875, -559.9228515625, -516.4677734375, -473.0126647949219, -429.5575866699219, -386.10247802734375, -342.64739990234375, -299.19232177734375, -255.73721313476562, -212.28213500976562, -168.8270263671875, -125.3719482421875, -81.91685485839844, -38.461769104003906, 4.993316650390625, 48.44841003417969, 91.90350341796875, 135.35858154296875, 178.81369018554688, 222.26876831054688, 265.7238464355469, 309.178955078125, 352.634033203125, 396.089111328125, 439.5442199707031, 482.9992980957031, 526.4544067382812, 569.9094848632812, 613.3645629882812, 656.8196411132812, 700.2747802734375, 743.7298583984375, 787.1849365234375, 830.6400146484375, 874.0950927734375, 917.5501708984375, 961.0052490234375, 1004.4603271484375, 1047.9154052734375, 1091.3704833984375, 1134.82568359375, 1178.28076171875, 1221.73583984375, 1265.19091796875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 10.0, 12.0, 15.0, 22.0, 42.0, 53.0, 84.0, 126.0, 194.0, 272.0, 412.0, 635.0, 1024.0, 1691.0, 2587.0, 4134.0, 6605.0, 11239.0, 19040.0, 32331.0, 54701.0, 92916.0, 160370.0, 275128.0, 504898.0, 1070135.0, 1816356.0, 1065625.0, 503003.0, 275678.0, 160882.0, 94058.0, 55076.0, 32460.0, 19455.0, 11479.0, 6920.0, 4250.0, 2854.0, 1663.0, 1045.0, 637.0, 468.0, 301.0, 185.0, 132.0, 76.0, 58.0, 40.0, 24.0, 19.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-38.5, -37.3154296875, -36.130859375, -34.9462890625, -33.76171875, -32.5771484375, -31.392578125, -30.2080078125, -29.0234375, -27.8388671875, -26.654296875, -25.4697265625, -24.28515625, -23.1005859375, -21.916015625, -20.7314453125, -19.546875, -18.3623046875, -17.177734375, -15.9931640625, -14.80859375, -13.6240234375, -12.439453125, -11.2548828125, -10.0703125, -8.8857421875, -7.701171875, -6.5166015625, -5.33203125, -4.1474609375, -2.962890625, -1.7783203125, -0.59375, 0.5908203125, 1.775390625, 2.9599609375, 4.14453125, 5.3291015625, 6.513671875, 7.6982421875, 8.8828125, 10.0673828125, 11.251953125, 12.4365234375, 13.62109375, 14.8056640625, 15.990234375, 17.1748046875, 18.359375, 19.5439453125, 20.728515625, 21.9130859375, 23.09765625, 24.2822265625, 25.466796875, 26.6513671875, 27.8359375, 29.0205078125, 30.205078125, 31.3896484375, 32.57421875, 33.7587890625, 34.943359375, 36.1279296875, 37.3125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 11.0, 6.0, 6.0, 9.0, 7.0, 11.0, 23.0, 22.0, 21.0, 25.0, 26.0, 26.0, 31.0, 51.0, 46.0, 64.0, 75.0, 139.0, 151.0, 197.0, 232.0, 184.0, 145.0, 111.0, 74.0, 51.0, 51.0, 40.0, 24.0, 26.0, 29.0, 19.0, 22.0, 23.0, 9.0, 9.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.046875, -28.935302734375, -27.82373046875, -26.712158203125, -25.6005859375, -24.489013671875, -23.37744140625, -22.265869140625, -21.154296875, -20.042724609375, -18.93115234375, -17.819580078125, -16.7080078125, -15.596435546875, -14.48486328125, -13.373291015625, -12.26171875, -11.150146484375, -10.03857421875, -8.927001953125, -7.8154296875, -6.703857421875, -5.59228515625, -4.480712890625, -3.369140625, -2.257568359375, -1.14599609375, -0.034423828125, 1.0771484375, 2.188720703125, 3.30029296875, 4.411865234375, 5.5234375, 6.635009765625, 7.74658203125, 8.858154296875, 9.9697265625, 11.081298828125, 12.19287109375, 13.304443359375, 14.416015625, 15.527587890625, 16.63916015625, 17.750732421875, 18.8623046875, 19.973876953125, 21.08544921875, 22.197021484375, 23.30859375, 24.420166015625, 25.53173828125, 26.643310546875, 27.7548828125, 28.866455078125, 29.97802734375, 31.089599609375, 32.201171875, 33.312744140625, 34.42431640625, 35.535888671875, 36.6474609375, 37.759033203125, 38.87060546875, 39.982177734375, 41.09375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 7.0, 8.0, 20.0, 27.0, 26.0, 28.0, 54.0, 71.0, 123.0, 195.0, 283.0, 456.0, 758.0, 1173.0, 1792.0, 2958.0, 4594.0, 7335.0, 11349.0, 17795.0, 28212.0, 43169.0, 66884.0, 100937.0, 150691.0, 221127.0, 333687.0, 617002.0, 1534858.0, 1532828.0, 617541.0, 332572.0, 221285.0, 151711.0, 101630.0, 66651.0, 43880.0, 28260.0, 18393.0, 11548.0, 7169.0, 4473.0, 2847.0, 1866.0, 1165.0, 711.0, 455.0, 304.0, 183.0, 126.0, 84.0, 49.0, 36.0, 27.0, 14.0, 8.0, 5.0, 2.0], "bins": [-22.5, -21.857177734375, -21.21435546875, -20.571533203125, -19.9287109375, -19.285888671875, -18.64306640625, -18.000244140625, -17.357421875, -16.714599609375, -16.07177734375, -15.428955078125, -14.7861328125, -14.143310546875, -13.50048828125, -12.857666015625, -12.21484375, -11.572021484375, -10.92919921875, -10.286376953125, -9.6435546875, -9.000732421875, -8.35791015625, -7.715087890625, -7.072265625, -6.429443359375, -5.78662109375, -5.143798828125, -4.5009765625, -3.858154296875, -3.21533203125, -2.572509765625, -1.9296875, -1.286865234375, -0.64404296875, -0.001220703125, 0.6416015625, 1.284423828125, 1.92724609375, 2.570068359375, 3.212890625, 3.855712890625, 4.49853515625, 5.141357421875, 5.7841796875, 6.427001953125, 7.06982421875, 7.712646484375, 8.35546875, 8.998291015625, 9.64111328125, 10.283935546875, 10.9267578125, 11.569580078125, 12.21240234375, 12.855224609375, 13.498046875, 14.140869140625, 14.78369140625, 15.426513671875, 16.0693359375, 16.712158203125, 17.35498046875, 17.997802734375, 18.640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 3.0, 8.0, 11.0, 7.0, 13.0, 22.0, 24.0, 20.0, 21.0, 21.0, 23.0, 42.0, 29.0, 47.0, 61.0, 120.0, 201.0, 268.0, 249.0, 203.0, 141.0, 94.0, 74.0, 48.0, 50.0, 45.0, 40.0, 21.0, 18.0, 19.0, 15.0, 10.0, 7.0, 8.0, 8.0, 4.0, 8.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0625, -45.671875, -44.28125, -42.890625, -41.5, -40.109375, -38.71875, -37.328125, -35.9375, -34.546875, -33.15625, -31.765625, -30.375, -28.984375, -27.59375, -26.203125, -24.8125, -23.421875, -22.03125, -20.640625, -19.25, -17.859375, -16.46875, -15.078125, -13.6875, -12.296875, -10.90625, -9.515625, -8.125, -6.734375, -5.34375, -3.953125, -2.5625, -1.171875, 0.21875, 1.609375, 3.0, 4.390625, 5.78125, 7.171875, 8.5625, 9.953125, 11.34375, 12.734375, 14.125, 15.515625, 16.90625, 18.296875, 19.6875, 21.078125, 22.46875, 23.859375, 25.25, 26.640625, 28.03125, 29.421875, 30.8125, 32.203125, 33.59375, 34.984375, 36.375, 37.765625, 39.15625, 40.546875, 41.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 8.0, 13.0, 18.0, 24.0, 21.0, 24.0, 35.0, 48.0, 80.0, 116.0, 170.0, 222.0, 350.0, 483.0, 734.0, 1093.0, 1702.0, 2868.0, 4655.0, 7860.0, 13593.0, 24329.0, 44171.0, 84179.0, 237345.0, 5545320.0, 162984.0, 70204.0, 37916.0, 21103.0, 11831.0, 6826.0, 4006.0, 2447.0, 1531.0, 954.0, 678.0, 443.0, 340.0, 217.0, 141.0, 107.0, 80.0, 50.0, 33.0, 26.0, 21.0, 17.0, 3.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.5625, -60.357421875, -58.15234375, -55.947265625, -53.7421875, -51.537109375, -49.33203125, -47.126953125, -44.921875, -42.716796875, -40.51171875, -38.306640625, -36.1015625, -33.896484375, -31.69140625, -29.486328125, -27.28125, -25.076171875, -22.87109375, -20.666015625, -18.4609375, -16.255859375, -14.05078125, -11.845703125, -9.640625, -7.435546875, -5.23046875, -3.025390625, -0.8203125, 1.384765625, 3.58984375, 5.794921875, 8.0, 10.205078125, 12.41015625, 14.615234375, 16.8203125, 19.025390625, 21.23046875, 23.435546875, 25.640625, 27.845703125, 30.05078125, 32.255859375, 34.4609375, 36.666015625, 38.87109375, 41.076171875, 43.28125, 45.486328125, 47.69140625, 49.896484375, 52.1015625, 54.306640625, 56.51171875, 58.716796875, 60.921875, 63.126953125, 65.33203125, 67.537109375, 69.7421875, 71.947265625, 74.15234375, 76.357421875, 78.5625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 6.0, 6.0, 7.0, 5.0, 9.0, 6.0, 12.0, 15.0, 10.0, 20.0, 29.0, 29.0, 33.0, 32.0, 21.0, 34.0, 38.0, 37.0, 43.0, 70.0, 154.0, 326.0, 348.0, 209.0, 106.0, 74.0, 47.0, 42.0, 42.0, 32.0, 26.0, 25.0, 29.0, 19.0, 18.0, 11.0, 10.0, 7.0, 10.0, 11.0, 5.0, 2.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-65.0, -63.0791015625, -61.158203125, -59.2373046875, -57.31640625, -55.3955078125, -53.474609375, -51.5537109375, -49.6328125, -47.7119140625, -45.791015625, -43.8701171875, -41.94921875, -40.0283203125, -38.107421875, -36.1865234375, -34.265625, -32.3447265625, -30.423828125, -28.5029296875, -26.58203125, -24.6611328125, -22.740234375, -20.8193359375, -18.8984375, -16.9775390625, -15.056640625, -13.1357421875, -11.21484375, -9.2939453125, -7.373046875, -5.4521484375, -3.53125, -1.6103515625, 0.310546875, 2.2314453125, 4.15234375, 6.0732421875, 7.994140625, 9.9150390625, 11.8359375, 13.7568359375, 15.677734375, 17.5986328125, 19.51953125, 21.4404296875, 23.361328125, 25.2822265625, 27.203125, 29.1240234375, 31.044921875, 32.9658203125, 34.88671875, 36.8076171875, 38.728515625, 40.6494140625, 42.5703125, 44.4912109375, 46.412109375, 48.3330078125, 50.25390625, 52.1748046875, 54.095703125, 56.0166015625, 57.9375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 18.0, 21.0, 38.0, 50.0, 92.0, 211.0, 239.0, 108.0, 73.0, 50.0, 34.0, 21.0, 17.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3444.7783203125, -3358.5693359375, -3272.3603515625, -3186.1513671875, -3099.9423828125, -3013.7333984375, -2927.5244140625, -2841.315185546875, -2755.106201171875, -2668.897216796875, -2582.688232421875, -2496.479248046875, -2410.270263671875, -2324.06103515625, -2237.85205078125, -2151.64306640625, -2065.43408203125, -1979.22509765625, -1893.01611328125, -1806.80712890625, -1720.5980224609375, -1634.3890380859375, -1548.1800537109375, -1461.970947265625, -1375.76220703125, -1289.55322265625, -1203.34423828125, -1117.13525390625, -1030.9261474609375, -944.7171630859375, -858.5081787109375, -772.2991333007812, -686.090087890625, -599.881103515625, -513.6720581054688, -427.46307373046875, -341.2540588378906, -255.0450439453125, -168.8360595703125, -82.62701416015625, 3.58197021484375, 89.79097747802734, 175.99998474121094, 262.208984375, 348.4179992675781, 434.62701416015625, 520.8359985351562, 607.0450439453125, 693.2540283203125, 779.4630126953125, 865.6720581054688, 951.8810424804688, 1038.090087890625, 1124.299072265625, 1210.508056640625, 1296.717041015625, 1382.926025390625, 1469.135009765625, 1555.343994140625, 1641.552978515625, 1727.7620849609375, 1813.9710693359375, 1900.1800537109375, 1986.38916015625, 2072.59814453125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 0.0, 11.0, 10.0, 10.0, 20.0, 24.0, 13.0, 22.0, 19.0, 28.0, 38.0, 30.0, 34.0, 38.0, 59.0, 64.0, 94.0, 77.0, 69.0, 57.0, 45.0, 31.0, 24.0, 33.0, 19.0, 15.0, 16.0, 24.0, 14.0, 11.0, 7.0, 2.0, 7.0, 5.0, 6.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1230.11181640625, -1193.7510986328125, -1157.3905029296875, -1121.02978515625, -1084.6690673828125, -1048.308349609375, -1011.94775390625, -975.5870361328125, -939.2263793945312, -902.86572265625, -866.5050048828125, -830.1443481445312, -793.78369140625, -757.4229736328125, -721.0623168945312, -684.70166015625, -648.3409423828125, -611.9802856445312, -575.6195678710938, -539.2589111328125, -502.8982238769531, -466.53753662109375, -430.1768798828125, -393.8161926269531, -357.45550537109375, -321.0948181152344, -284.734130859375, -248.37347412109375, -212.01278686523438, -175.652099609375, -139.2914276123047, -102.93075561523438, -66.5699462890625, -30.209266662597656, 6.1514129638671875, 42.51209259033203, 78.87277221679688, 115.23345947265625, 151.59413146972656, 187.95480346679688, 224.31549072265625, 260.6761779785156, 297.036865234375, 333.39752197265625, 369.7582092285156, 406.118896484375, 442.47955322265625, 478.8402404785156, 515.200927734375, 551.5615844726562, 587.9223022460938, 624.282958984375, 660.6436767578125, 697.0043334960938, 733.364990234375, 769.7257080078125, 806.0863647460938, 842.447021484375, 878.8077392578125, 915.1683959960938, 951.529052734375, 987.8897705078125, 1024.25048828125, 1060.611083984375, 1096.9718017578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 4.0, 7.0, 12.0, 11.0, 21.0, 25.0, 43.0, 53.0, 86.0, 117.0, 150.0, 280.0, 403.0, 590.0, 882.0, 1382.0, 2260.0, 3812.0, 6884.0, 13081.0, 28109.0, 83543.0, 673410.0, 3135990.0, 161814.0, 43203.0, 17774.0, 8875.0, 4716.0, 2756.0, 1552.0, 919.0, 550.0, 354.0, 236.0, 136.0, 102.0, 42.0, 29.0, 21.0, 8.0, 8.0, 11.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.2734375, -12.8963623046875, -12.519287109375, -12.1422119140625, -11.76513671875, -11.3880615234375, -11.010986328125, -10.6339111328125, -10.2568359375, -9.8797607421875, -9.502685546875, -9.1256103515625, -8.74853515625, -8.3714599609375, -7.994384765625, -7.6173095703125, -7.240234375, -6.8631591796875, -6.486083984375, -6.1090087890625, -5.73193359375, -5.3548583984375, -4.977783203125, -4.6007080078125, -4.2236328125, -3.8465576171875, -3.469482421875, -3.0924072265625, -2.71533203125, -2.3382568359375, -1.961181640625, -1.5841064453125, -1.20703125, -0.8299560546875, -0.452880859375, -0.0758056640625, 0.30126953125, 0.6783447265625, 1.055419921875, 1.4324951171875, 1.8095703125, 2.1866455078125, 2.563720703125, 2.9407958984375, 3.31787109375, 3.6949462890625, 4.072021484375, 4.4490966796875, 4.826171875, 5.2032470703125, 5.580322265625, 5.9573974609375, 6.33447265625, 6.7115478515625, 7.088623046875, 7.4656982421875, 7.8427734375, 8.2198486328125, 8.596923828125, 8.9739990234375, 9.35107421875, 9.7281494140625, 10.105224609375, 10.4822998046875, 10.859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 4.0, 9.0, 4.0, 15.0, 13.0, 22.0, 39.0, 71.0, 113.0, 166.0, 169.0, 111.0, 69.0, 63.0, 27.0, 16.0, 13.0, 10.0, 6.0, 6.0, 9.0, 3.0, 3.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.623046875, -1.5742034912109375, -1.525360107421875, -1.4765167236328125, -1.42767333984375, -1.3788299560546875, -1.329986572265625, -1.2811431884765625, -1.2322998046875, -1.1834564208984375, -1.134613037109375, -1.0857696533203125, -1.03692626953125, -0.9880828857421875, -0.939239501953125, -0.8903961181640625, -0.841552734375, -0.7927093505859375, -0.743865966796875, -0.6950225830078125, -0.64617919921875, -0.5973358154296875, -0.548492431640625, -0.4996490478515625, -0.4508056640625, -0.4019622802734375, -0.353118896484375, -0.3042755126953125, -0.25543212890625, -0.2065887451171875, -0.157745361328125, -0.1089019775390625, -0.06005859375, -0.0112152099609375, 0.037628173828125, 0.0864715576171875, 0.13531494140625, 0.1841583251953125, 0.233001708984375, 0.2818450927734375, 0.3306884765625, 0.3795318603515625, 0.428375244140625, 0.4772186279296875, 0.52606201171875, 0.5749053955078125, 0.623748779296875, 0.6725921630859375, 0.721435546875, 0.7702789306640625, 0.819122314453125, 0.8679656982421875, 0.91680908203125, 0.9656524658203125, 1.014495849609375, 1.0633392333984375, 1.1121826171875, 1.1610260009765625, 1.209869384765625, 1.2587127685546875, 1.30755615234375, 1.3563995361328125, 1.405242919921875, 1.4540863037109375, 1.5029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 20.0, 14.0, 17.0, 29.0, 57.0, 84.0, 128.0, 188.0, 308.0, 591.0, 966.0, 1770.0, 3525.0, 7153.0, 15691.0, 36742.0, 97680.0, 289428.0, 1101566.0, 1952229.0, 454527.0, 141475.0, 51096.0, 20443.0, 9134.0, 4302.0, 2146.0, 1168.0, 682.0, 397.0, 255.0, 149.0, 103.0, 76.0, 34.0, 31.0, 21.0, 17.0, 12.0, 5.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.803955078125, -7.54541015625, -7.286865234375, -7.0283203125, -6.769775390625, -6.51123046875, -6.252685546875, -5.994140625, -5.735595703125, -5.47705078125, -5.218505859375, -4.9599609375, -4.701416015625, -4.44287109375, -4.184326171875, -3.92578125, -3.667236328125, -3.40869140625, -3.150146484375, -2.8916015625, -2.633056640625, -2.37451171875, -2.115966796875, -1.857421875, -1.598876953125, -1.34033203125, -1.081787109375, -0.8232421875, -0.564697265625, -0.30615234375, -0.047607421875, 0.2109375, 0.469482421875, 0.72802734375, 0.986572265625, 1.2451171875, 1.503662109375, 1.76220703125, 2.020751953125, 2.279296875, 2.537841796875, 2.79638671875, 3.054931640625, 3.3134765625, 3.572021484375, 3.83056640625, 4.089111328125, 4.34765625, 4.606201171875, 4.86474609375, 5.123291015625, 5.3818359375, 5.640380859375, 5.89892578125, 6.157470703125, 6.416015625, 6.674560546875, 6.93310546875, 7.191650390625, 7.4501953125, 7.708740234375, 7.96728515625, 8.225830078125, 8.484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 14.0, 13.0, 16.0, 33.0, 32.0, 43.0, 59.0, 94.0, 110.0, 125.0, 160.0, 209.0, 326.0, 473.0, 699.0, 462.0, 300.0, 243.0, 159.0, 123.0, 103.0, 64.0, 57.0, 42.0, 24.0, 19.0, 16.0, 11.0, 11.0, 6.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.120208740234375, -3.01776123046875, -2.915313720703125, -2.8128662109375, -2.710418701171875, -2.60797119140625, -2.505523681640625, -2.403076171875, -2.300628662109375, -2.19818115234375, -2.095733642578125, -1.9932861328125, -1.890838623046875, -1.78839111328125, -1.685943603515625, -1.58349609375, -1.481048583984375, -1.37860107421875, -1.276153564453125, -1.1737060546875, -1.071258544921875, -0.96881103515625, -0.866363525390625, -0.763916015625, -0.661468505859375, -0.55902099609375, -0.456573486328125, -0.3541259765625, -0.251678466796875, -0.14923095703125, -0.046783447265625, 0.0556640625, 0.158111572265625, 0.26055908203125, 0.363006591796875, 0.4654541015625, 0.567901611328125, 0.67034912109375, 0.772796630859375, 0.875244140625, 0.977691650390625, 1.08013916015625, 1.182586669921875, 1.2850341796875, 1.387481689453125, 1.48992919921875, 1.592376708984375, 1.69482421875, 1.797271728515625, 1.89971923828125, 2.002166748046875, 2.1046142578125, 2.207061767578125, 2.30950927734375, 2.411956787109375, 2.514404296875, 2.616851806640625, 2.71929931640625, 2.821746826171875, 2.9241943359375, 3.026641845703125, 3.12908935546875, 3.231536865234375, 3.333984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 19.0, 44.0, 104.0, 155.0, 282.0, 192.0, 111.0, 48.0, 9.0, 18.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.88779067993164, -51.938392639160156, -49.988990783691406, -48.039588928222656, -46.09019088745117, -44.14079284667969, -42.19139099121094, -40.24198913574219, -38.2925910949707, -36.34319305419922, -34.39379119873047, -32.44438934326172, -30.494991302490234, -28.545591354370117, -26.59619140625, -24.646791458129883, -22.697391510009766, -20.74799156188965, -18.79859161376953, -16.849191665649414, -14.899791717529297, -12.95039176940918, -11.000991821289062, -9.051591873168945, -7.102191925048828, -5.152791976928711, -3.2033920288085938, -1.2539920806884766, 0.6954078674316406, 2.644807815551758, 4.594207763671875, 6.543607711791992, 8.493011474609375, 10.442411422729492, 12.39181137084961, 14.341211318969727, 16.290611267089844, 18.24001121520996, 20.189411163330078, 22.138811111450195, 24.088211059570312, 26.03761100769043, 27.987010955810547, 29.936410903930664, 31.88581085205078, 33.83521270751953, 35.784610748291016, 37.7340087890625, 39.68341064453125, 41.6328125, 43.582210540771484, 45.53160858154297, 47.48101043701172, 49.43041229248047, 51.37981033325195, 53.32920837402344, 55.27861022949219, 57.22801208496094, 59.17741012573242, 61.126808166503906, 63.076210021972656, 65.0256118774414, 66.97500610351562, 68.92440795898438, 70.87380981445312]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 12.0, 15.0, 14.0, 11.0, 20.0, 20.0, 26.0, 26.0, 44.0, 36.0, 45.0, 47.0, 55.0, 52.0, 56.0, 64.0, 56.0, 52.0, 52.0, 46.0, 41.0, 29.0, 32.0, 44.0, 22.0, 12.0, 16.0, 14.0, 12.0, 8.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.651752471923828, -22.992904663085938, -22.334056854248047, -21.675209045410156, -21.016361236572266, -20.357513427734375, -19.698665618896484, -19.039817810058594, -18.380970001220703, -17.722122192382812, -17.063274383544922, -16.40442657470703, -15.74557876586914, -15.08673095703125, -14.427884101867676, -13.769036293029785, -13.110189437866211, -12.45134162902832, -11.79249382019043, -11.133646011352539, -10.474798202514648, -9.815950393676758, -9.157103538513184, -8.498255729675293, -7.839407920837402, -7.180560111999512, -6.521712303161621, -5.862864971160889, -5.204017162322998, -4.545169353485107, -3.886321783065796, -3.2274742126464844, -2.5686264038085938, -1.9097787141799927, -1.2509310245513916, -0.5920833349227905, 0.06676435470581055, 0.7256121635437012, 1.3844597339630127, 2.043307304382324, 2.702155113220215, 3.3610029220581055, 4.019850730895996, 4.6786980628967285, 5.337545871734619, 5.99639368057251, 6.655241012573242, 7.314088821411133, 7.972936630249023, 8.631784439086914, 9.290632247924805, 9.949480056762695, 10.608327865600586, 11.267175674438477, 11.92602252960205, 12.584870338439941, 13.243718147277832, 13.902565956115723, 14.561413764953613, 15.220261573791504, 15.879108428955078, 16.53795623779297, 17.19680404663086, 17.85565185546875, 18.51449966430664]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 10.0, 9.0, 20.0, 27.0, 44.0, 60.0, 68.0, 111.0, 174.0, 189.0, 337.0, 482.0, 706.0, 1092.0, 1661.0, 2791.0, 4574.0, 8528.0, 17941.0, 49323.0, 216750.0, 542234.0, 133400.0, 35682.0, 14409.0, 7172.0, 4018.0, 2299.0, 1492.0, 940.0, 605.0, 431.0, 281.0, 181.0, 171.0, 109.0, 66.0, 57.0, 30.0, 26.0, 14.0, 16.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.68524169921875, -5.4915771484375, -5.29791259765625, -5.104248046875, -4.91058349609375, -4.7169189453125, -4.52325439453125, -4.32958984375, -4.13592529296875, -3.9422607421875, -3.74859619140625, -3.554931640625, -3.36126708984375, -3.1676025390625, -2.97393798828125, -2.7802734375, -2.58660888671875, -2.3929443359375, -2.19927978515625, -2.005615234375, -1.81195068359375, -1.6182861328125, -1.42462158203125, -1.23095703125, -1.03729248046875, -0.8436279296875, -0.64996337890625, -0.456298828125, -0.26263427734375, -0.0689697265625, 0.12469482421875, 0.318359375, 0.51202392578125, 0.7056884765625, 0.89935302734375, 1.093017578125, 1.28668212890625, 1.4803466796875, 1.67401123046875, 1.86767578125, 2.06134033203125, 2.2550048828125, 2.44866943359375, 2.642333984375, 2.83599853515625, 3.0296630859375, 3.22332763671875, 3.4169921875, 3.61065673828125, 3.8043212890625, 3.99798583984375, 4.191650390625, 4.38531494140625, 4.5789794921875, 4.77264404296875, 4.96630859375, 5.15997314453125, 5.3536376953125, 5.54730224609375, 5.740966796875, 5.93463134765625, 6.1282958984375, 6.32196044921875, 6.515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 8.0, 6.0, 19.0, 16.0, 27.0, 37.0, 65.0, 96.0, 130.0, 111.0, 133.0, 95.0, 72.0, 46.0, 35.0, 16.0, 8.0, 12.0, 12.0, 5.0, 11.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.7221832275390625, -1.666046142578125, -1.6099090576171875, -1.55377197265625, -1.4976348876953125, -1.441497802734375, -1.3853607177734375, -1.3292236328125, -1.2730865478515625, -1.216949462890625, -1.1608123779296875, -1.10467529296875, -1.0485382080078125, -0.992401123046875, -0.9362640380859375, -0.880126953125, -0.8239898681640625, -0.767852783203125, -0.7117156982421875, -0.65557861328125, -0.5994415283203125, -0.543304443359375, -0.4871673583984375, -0.4310302734375, -0.3748931884765625, -0.318756103515625, -0.2626190185546875, -0.20648193359375, -0.1503448486328125, -0.094207763671875, -0.0380706787109375, 0.01806640625, 0.0742034912109375, 0.130340576171875, 0.1864776611328125, 0.24261474609375, 0.2987518310546875, 0.354888916015625, 0.4110260009765625, 0.4671630859375, 0.5233001708984375, 0.579437255859375, 0.6355743408203125, 0.69171142578125, 0.7478485107421875, 0.803985595703125, 0.8601226806640625, 0.916259765625, 0.9723968505859375, 1.028533935546875, 1.0846710205078125, 1.14080810546875, 1.1969451904296875, 1.253082275390625, 1.3092193603515625, 1.3653564453125, 1.4214935302734375, 1.477630615234375, 1.5337677001953125, 1.58990478515625, 1.6460418701171875, 1.702178955078125, 1.7583160400390625, 1.814453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 13.0, 8.0, 14.0, 22.0, 35.0, 52.0, 55.0, 104.0, 173.0, 290.0, 434.0, 699.0, 1196.0, 2123.0, 3775.0, 6974.0, 14037.0, 30301.0, 70669.0, 182590.0, 377685.0, 209412.0, 80527.0, 34206.0, 15716.0, 7763.0, 4029.0, 2263.0, 1294.0, 794.0, 471.0, 306.0, 199.0, 102.0, 85.0, 48.0, 26.0, 15.0, 23.0, 11.0, 1.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.26171875, -6.0751953125, -5.888671875, -5.7021484375, -5.515625, -5.3291015625, -5.142578125, -4.9560546875, -4.76953125, -4.5830078125, -4.396484375, -4.2099609375, -4.0234375, -3.8369140625, -3.650390625, -3.4638671875, -3.27734375, -3.0908203125, -2.904296875, -2.7177734375, -2.53125, -2.3447265625, -2.158203125, -1.9716796875, -1.78515625, -1.5986328125, -1.412109375, -1.2255859375, -1.0390625, -0.8525390625, -0.666015625, -0.4794921875, -0.29296875, -0.1064453125, 0.080078125, 0.2666015625, 0.453125, 0.6396484375, 0.826171875, 1.0126953125, 1.19921875, 1.3857421875, 1.572265625, 1.7587890625, 1.9453125, 2.1318359375, 2.318359375, 2.5048828125, 2.69140625, 2.8779296875, 3.064453125, 3.2509765625, 3.4375, 3.6240234375, 3.810546875, 3.9970703125, 4.18359375, 4.3701171875, 4.556640625, 4.7431640625, 4.9296875, 5.1162109375, 5.302734375, 5.4892578125, 5.67578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 11.0, 8.0, 9.0, 21.0, 27.0, 15.0, 18.0, 31.0, 33.0, 38.0, 27.0, 38.0, 37.0, 46.0, 47.0, 47.0, 42.0, 43.0, 48.0, 41.0, 42.0, 43.0, 37.0, 23.0, 28.0, 21.0, 34.0, 27.0, 19.0, 12.0, 22.0, 8.0, 10.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.94140625, -6.73748779296875, -6.5335693359375, -6.32965087890625, -6.125732421875, -5.92181396484375, -5.7178955078125, -5.51397705078125, -5.31005859375, -5.10614013671875, -4.9022216796875, -4.69830322265625, -4.494384765625, -4.29046630859375, -4.0865478515625, -3.88262939453125, -3.6787109375, -3.47479248046875, -3.2708740234375, -3.06695556640625, -2.863037109375, -2.65911865234375, -2.4552001953125, -2.25128173828125, -2.04736328125, -1.84344482421875, -1.6395263671875, -1.43560791015625, -1.231689453125, -1.02777099609375, -0.8238525390625, -0.61993408203125, -0.416015625, -0.21209716796875, -0.0081787109375, 0.19573974609375, 0.399658203125, 0.60357666015625, 0.8074951171875, 1.01141357421875, 1.21533203125, 1.41925048828125, 1.6231689453125, 1.82708740234375, 2.031005859375, 2.23492431640625, 2.4388427734375, 2.64276123046875, 2.8466796875, 3.05059814453125, 3.2545166015625, 3.45843505859375, 3.662353515625, 3.86627197265625, 4.0701904296875, 4.27410888671875, 4.47802734375, 4.68194580078125, 4.8858642578125, 5.08978271484375, 5.293701171875, 5.49761962890625, 5.7015380859375, 5.90545654296875, 6.109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 10.0, 4.0, 12.0, 12.0, 23.0, 40.0, 88.0, 104.0, 190.0, 362.0, 879.0, 2517.0, 8543.0, 46495.0, 590464.0, 359009.0, 30068.0, 6287.0, 1973.0, 700.0, 334.0, 167.0, 90.0, 53.0, 39.0, 22.0, 19.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.203125, -7.8980712890625, -7.593017578125, -7.2879638671875, -6.98291015625, -6.6778564453125, -6.372802734375, -6.0677490234375, -5.7626953125, -5.4576416015625, -5.152587890625, -4.8475341796875, -4.54248046875, -4.2374267578125, -3.932373046875, -3.6273193359375, -3.322265625, -3.0172119140625, -2.712158203125, -2.4071044921875, -2.10205078125, -1.7969970703125, -1.491943359375, -1.1868896484375, -0.8818359375, -0.5767822265625, -0.271728515625, 0.0333251953125, 0.33837890625, 0.6434326171875, 0.948486328125, 1.2535400390625, 1.55859375, 1.8636474609375, 2.168701171875, 2.4737548828125, 2.77880859375, 3.0838623046875, 3.388916015625, 3.6939697265625, 3.9990234375, 4.3040771484375, 4.609130859375, 4.9141845703125, 5.21923828125, 5.5242919921875, 5.829345703125, 6.1343994140625, 6.439453125, 6.7445068359375, 7.049560546875, 7.3546142578125, 7.65966796875, 7.9647216796875, 8.269775390625, 8.5748291015625, 8.8798828125, 9.1849365234375, 9.489990234375, 9.7950439453125, 10.10009765625, 10.4051513671875, 10.710205078125, 11.0152587890625, 11.3203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 8.0, 12.0, 10.0, 21.0, 21.0, 29.0, 30.0, 47.0, 63.0, 80.0, 63.0, 81.0, 94.0, 87.0, 66.0, 56.0, 50.0, 40.0, 32.0, 22.0, 16.0, 11.0, 6.0, 9.0, 10.0, 12.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00039005279541015625, -0.0003782510757446289, -0.00036644935607910156, -0.0003546476364135742, -0.0003428459167480469, -0.00033104419708251953, -0.0003192424774169922, -0.00030744075775146484, -0.0002956390380859375, -0.00028383731842041016, -0.0002720355987548828, -0.00026023387908935547, -0.0002484321594238281, -0.00023663043975830078, -0.00022482872009277344, -0.0002130270004272461, -0.00020122528076171875, -0.0001894235610961914, -0.00017762184143066406, -0.00016582012176513672, -0.00015401840209960938, -0.00014221668243408203, -0.0001304149627685547, -0.00011861324310302734, -0.0001068115234375, -9.500980377197266e-05, -8.320808410644531e-05, -7.140636444091797e-05, -5.9604644775390625e-05, -4.780292510986328e-05, -3.600120544433594e-05, -2.4199485778808594e-05, -1.239776611328125e-05, -5.960464477539062e-07, 1.1205673217773438e-05, 2.300739288330078e-05, 3.4809112548828125e-05, 4.661083221435547e-05, 5.841255187988281e-05, 7.021427154541016e-05, 8.20159912109375e-05, 9.381771087646484e-05, 0.00010561943054199219, 0.00011742115020751953, 0.00012922286987304688, 0.00014102458953857422, 0.00015282630920410156, 0.0001646280288696289, 0.00017642974853515625, 0.0001882314682006836, 0.00020003318786621094, 0.00021183490753173828, 0.00022363662719726562, 0.00023543834686279297, 0.0002472400665283203, 0.00025904178619384766, 0.000270843505859375, 0.00028264522552490234, 0.0002944469451904297, 0.00030624866485595703, 0.0003180503845214844, 0.0003298521041870117, 0.00034165382385253906, 0.0003534555435180664, 0.00036525726318359375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 9.0, 7.0, 10.0, 23.0, 32.0, 64.0, 84.0, 196.0, 345.0, 808.0, 1731.0, 4599.0, 15024.0, 70573.0, 507174.0, 377188.0, 52037.0, 11952.0, 3777.0, 1521.0, 618.0, 353.0, 166.0, 88.0, 59.0, 42.0, 20.0, 18.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.15625, -8.908203125, -8.66015625, -8.412109375, -8.1640625, -7.916015625, -7.66796875, -7.419921875, -7.171875, -6.923828125, -6.67578125, -6.427734375, -6.1796875, -5.931640625, -5.68359375, -5.435546875, -5.1875, -4.939453125, -4.69140625, -4.443359375, -4.1953125, -3.947265625, -3.69921875, -3.451171875, -3.203125, -2.955078125, -2.70703125, -2.458984375, -2.2109375, -1.962890625, -1.71484375, -1.466796875, -1.21875, -0.970703125, -0.72265625, -0.474609375, -0.2265625, 0.021484375, 0.26953125, 0.517578125, 0.765625, 1.013671875, 1.26171875, 1.509765625, 1.7578125, 2.005859375, 2.25390625, 2.501953125, 2.75, 2.998046875, 3.24609375, 3.494140625, 3.7421875, 3.990234375, 4.23828125, 4.486328125, 4.734375, 4.982421875, 5.23046875, 5.478515625, 5.7265625, 5.974609375, 6.22265625, 6.470703125, 6.71875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 8.0, 10.0, 17.0, 21.0, 46.0, 40.0, 34.0, 56.0, 48.0, 65.0, 78.0, 87.0, 78.0, 84.0, 67.0, 57.0, 54.0, 35.0, 28.0, 12.0, 11.0, 18.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.14617919921875, -3.0189208984375, -2.89166259765625, -2.764404296875, -2.63714599609375, -2.5098876953125, -2.38262939453125, -2.25537109375, -2.12811279296875, -2.0008544921875, -1.87359619140625, -1.746337890625, -1.61907958984375, -1.4918212890625, -1.36456298828125, -1.2373046875, -1.11004638671875, -0.9827880859375, -0.85552978515625, -0.728271484375, -0.60101318359375, -0.4737548828125, -0.34649658203125, -0.21923828125, -0.09197998046875, 0.0352783203125, 0.16253662109375, 0.289794921875, 0.41705322265625, 0.5443115234375, 0.67156982421875, 0.798828125, 0.92608642578125, 1.0533447265625, 1.18060302734375, 1.307861328125, 1.43511962890625, 1.5623779296875, 1.68963623046875, 1.81689453125, 1.94415283203125, 2.0714111328125, 2.19866943359375, 2.325927734375, 2.45318603515625, 2.5804443359375, 2.70770263671875, 2.8349609375, 2.96221923828125, 3.0894775390625, 3.21673583984375, 3.343994140625, 3.47125244140625, 3.5985107421875, 3.72576904296875, 3.85302734375, 3.98028564453125, 4.1075439453125, 4.23480224609375, 4.362060546875, 4.48931884765625, 4.6165771484375, 4.74383544921875, 4.87109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 16.0, 13.0, 30.0, 95.0, 260.0, 346.0, 149.0, 47.0, 15.0, 13.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.5968017578125, -158.52476501464844, -153.45272827148438, -148.3806915283203, -143.30865478515625, -138.2366180419922, -133.16458129882812, -128.09255981445312, -123.02051544189453, -117.94847869873047, -112.8764419555664, -107.80440521240234, -102.73237609863281, -97.66033935546875, -92.58830261230469, -87.51626586914062, -82.44422912597656, -77.3721923828125, -72.30015563964844, -67.22811889648438, -62.15608596801758, -57.084049224853516, -52.01201629638672, -46.939979553222656, -41.867942810058594, -36.79590606689453, -31.7238712310791, -26.651836395263672, -21.57979965209961, -16.507762908935547, -11.435728073120117, -6.3636932373046875, -1.2916717529296875, 3.7803640365600586, 8.852399826049805, 13.92443561553955, 18.996471405029297, 24.06850814819336, 29.14054298400879, 34.21257781982422, 39.28461456298828, 44.356651306152344, 49.428688049316406, 54.5007209777832, 59.572757720947266, 64.64479064941406, 69.71682739257812, 74.78886413574219, 79.86090087890625, 84.93293762207031, 90.00497436523438, 95.07701110839844, 100.1490478515625, 105.22108459472656, 110.2931137084961, 115.36515045166016, 120.43718719482422, 125.50922393798828, 130.5812530517578, 135.65328979492188, 140.72532653808594, 145.79736328125, 150.86940002441406, 155.94143676757812, 161.0134735107422]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 11.0, 17.0, 20.0, 31.0, 57.0, 87.0, 111.0, 144.0, 156.0, 105.0, 85.0, 51.0, 24.0, 14.0, 13.0, 14.0, 10.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.89652252197266, -101.9616928100586, -98.02685546875, -94.09202575683594, -90.15719604492188, -86.22235870361328, -82.28752899169922, -78.35269165039062, -74.41786193847656, -70.4830322265625, -66.5481948852539, -62.613365173339844, -58.678531646728516, -54.74369812011719, -50.808868408203125, -46.8740348815918, -42.93920135498047, -39.00436782836914, -35.06953430175781, -31.13470458984375, -27.199871063232422, -23.265037536621094, -19.3302059173584, -15.395374298095703, -11.460540771484375, -7.525708198547363, -3.5908756256103516, 0.34395694732666016, 4.278789520263672, 8.213623046875, 12.148454666137695, 16.08328628540039, 20.018112182617188, 23.952945709228516, 27.88777732849121, 31.822608947753906, 35.757442474365234, 39.69227600097656, 43.627105712890625, 47.56193923950195, 51.49677276611328, 55.43160629272461, 59.36643981933594, 63.30126953125, 67.23609924316406, 71.17093658447266, 75.10576629638672, 79.04060363769531, 82.97543334960938, 86.91026306152344, 90.84510040283203, 94.7799301147461, 98.71476745605469, 102.64959716796875, 106.58442687988281, 110.51925659179688, 114.45409393310547, 118.38892364501953, 122.32376098632812, 126.25859069824219, 130.19342041015625, 134.12826538085938, 138.06309509277344, 141.9979248046875, 145.93275451660156]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 17.0, 31.0, 35.0, 50.0, 80.0, 172.0, 275.0, 567.0, 1195.0, 3207.0, 10609.0, 65838.0, 3889739.0, 197487.0, 17932.0, 4307.0, 1503.0, 585.0, 276.0, 137.0, 88.0, 48.0, 24.0, 10.0, 15.0, 7.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.9892578125, -33.884765625, -32.7802734375, -31.67578125, -30.5712890625, -29.466796875, -28.3623046875, -27.2578125, -26.1533203125, -25.048828125, -23.9443359375, -22.83984375, -21.7353515625, -20.630859375, -19.5263671875, -18.421875, -17.3173828125, -16.212890625, -15.1083984375, -14.00390625, -12.8994140625, -11.794921875, -10.6904296875, -9.5859375, -8.4814453125, -7.376953125, -6.2724609375, -5.16796875, -4.0634765625, -2.958984375, -1.8544921875, -0.75, 0.3544921875, 1.458984375, 2.5634765625, 3.66796875, 4.7724609375, 5.876953125, 6.9814453125, 8.0859375, 9.1904296875, 10.294921875, 11.3994140625, 12.50390625, 13.6083984375, 14.712890625, 15.8173828125, 16.921875, 18.0263671875, 19.130859375, 20.2353515625, 21.33984375, 22.4443359375, 23.548828125, 24.6533203125, 25.7578125, 26.8623046875, 27.966796875, 29.0712890625, 30.17578125, 31.2802734375, 32.384765625, 33.4892578125, 34.59375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 3.0, 8.0, 14.0, 23.0, 22.0, 32.0, 37.0, 59.0, 79.0, 98.0, 105.0, 105.0, 81.0, 69.0, 62.0, 52.0, 42.0, 20.0, 20.0, 7.0, 12.0, 3.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7509765625, -1.700836181640625, -1.65069580078125, -1.600555419921875, -1.5504150390625, -1.500274658203125, -1.45013427734375, -1.399993896484375, -1.349853515625, -1.299713134765625, -1.24957275390625, -1.199432373046875, -1.1492919921875, -1.099151611328125, -1.04901123046875, -0.998870849609375, -0.94873046875, -0.898590087890625, -0.84844970703125, -0.798309326171875, -0.7481689453125, -0.698028564453125, -0.64788818359375, -0.597747802734375, -0.547607421875, -0.497467041015625, -0.44732666015625, -0.397186279296875, -0.3470458984375, -0.296905517578125, -0.24676513671875, -0.196624755859375, -0.146484375, -0.096343994140625, -0.04620361328125, 0.003936767578125, 0.0540771484375, 0.104217529296875, 0.15435791015625, 0.204498291015625, 0.254638671875, 0.304779052734375, 0.35491943359375, 0.405059814453125, 0.4552001953125, 0.505340576171875, 0.55548095703125, 0.605621337890625, 0.65576171875, 0.705902099609375, 0.75604248046875, 0.806182861328125, 0.8563232421875, 0.906463623046875, 0.95660400390625, 1.006744384765625, 1.056884765625, 1.107025146484375, 1.15716552734375, 1.207305908203125, 1.2574462890625, 1.307586669921875, 1.35772705078125, 1.407867431640625, 1.4580078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 0.0, 8.0, 5.0, 6.0, 12.0, 7.0, 29.0, 42.0, 55.0, 105.0, 163.0, 264.0, 468.0, 802.0, 1577.0, 3340.0, 7869.0, 22192.0, 75325.0, 400789.0, 3233540.0, 346264.0, 68274.0, 19942.0, 7085.0, 3052.0, 1396.0, 737.0, 390.0, 220.0, 114.0, 80.0, 51.0, 29.0, 18.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.083251953125, -16.57275390625, -16.062255859375, -15.5517578125, -15.041259765625, -14.53076171875, -14.020263671875, -13.509765625, -12.999267578125, -12.48876953125, -11.978271484375, -11.4677734375, -10.957275390625, -10.44677734375, -9.936279296875, -9.42578125, -8.915283203125, -8.40478515625, -7.894287109375, -7.3837890625, -6.873291015625, -6.36279296875, -5.852294921875, -5.341796875, -4.831298828125, -4.32080078125, -3.810302734375, -3.2998046875, -2.789306640625, -2.27880859375, -1.768310546875, -1.2578125, -0.747314453125, -0.23681640625, 0.273681640625, 0.7841796875, 1.294677734375, 1.80517578125, 2.315673828125, 2.826171875, 3.336669921875, 3.84716796875, 4.357666015625, 4.8681640625, 5.378662109375, 5.88916015625, 6.399658203125, 6.91015625, 7.420654296875, 7.93115234375, 8.441650390625, 8.9521484375, 9.462646484375, 9.97314453125, 10.483642578125, 10.994140625, 11.504638671875, 12.01513671875, 12.525634765625, 13.0361328125, 13.546630859375, 14.05712890625, 14.567626953125, 15.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 10.0, 4.0, 14.0, 11.0, 16.0, 18.0, 40.0, 54.0, 57.0, 101.0, 146.0, 224.0, 499.0, 1623.0, 525.0, 258.0, 152.0, 94.0, 69.0, 42.0, 34.0, 34.0, 9.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.469146728515625, -2.38555908203125, -2.301971435546875, -2.2183837890625, -2.134796142578125, -2.05120849609375, -1.967620849609375, -1.884033203125, -1.800445556640625, -1.71685791015625, -1.633270263671875, -1.5496826171875, -1.466094970703125, -1.38250732421875, -1.298919677734375, -1.21533203125, -1.131744384765625, -1.04815673828125, -0.964569091796875, -0.8809814453125, -0.797393798828125, -0.71380615234375, -0.630218505859375, -0.546630859375, -0.463043212890625, -0.37945556640625, -0.295867919921875, -0.2122802734375, -0.128692626953125, -0.04510498046875, 0.038482666015625, 0.1220703125, 0.205657958984375, 0.28924560546875, 0.372833251953125, 0.4564208984375, 0.540008544921875, 0.62359619140625, 0.707183837890625, 0.790771484375, 0.874359130859375, 0.95794677734375, 1.041534423828125, 1.1251220703125, 1.208709716796875, 1.29229736328125, 1.375885009765625, 1.45947265625, 1.543060302734375, 1.62664794921875, 1.710235595703125, 1.7938232421875, 1.877410888671875, 1.96099853515625, 2.044586181640625, 2.128173828125, 2.211761474609375, 2.29534912109375, 2.378936767578125, 2.4625244140625, 2.546112060546875, 2.62969970703125, 2.713287353515625, 2.796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 12.0, 18.0, 42.0, 125.0, 210.0, 210.0, 182.0, 96.0, 46.0, 26.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.104042053222656, -33.084327697753906, -32.064613342285156, -31.044897079467773, -30.02518081665039, -29.00546646118164, -27.98575210571289, -26.96603775024414, -25.946321487426758, -24.926607131958008, -23.906890869140625, -22.887176513671875, -21.867462158203125, -20.847745895385742, -19.828031539916992, -18.80831527709961, -17.78860092163086, -16.76888656616211, -15.749170303344727, -14.729455947875977, -13.70974063873291, -12.690025329589844, -11.670310974121094, -10.650595664978027, -9.630880355834961, -8.611165046691895, -7.591450214385986, -6.571735382080078, -5.552020072937012, -4.532304763793945, -3.512589931488037, -2.492875099182129, -1.4731578826904297, -0.4534428119659424, 0.5662722587585449, 1.5859873294830322, 2.6057024002075195, 3.625417709350586, 4.645132541656494, 5.664847373962402, 6.684562683105469, 7.704277992248535, 8.723993301391602, 9.743707656860352, 10.763422966003418, 11.783138275146484, 12.802852630615234, 13.8225679397583, 14.842283248901367, 15.861998558044434, 16.8817138671875, 17.90142822265625, 18.921142578125, 19.940858840942383, 20.960573196411133, 21.980289459228516, 23.000003814697266, 24.019718170166016, 25.0394344329834, 26.05914878845215, 27.07886505126953, 28.09857940673828, 29.11829376220703, 30.13800811767578, 31.157724380493164]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 13.0, 19.0, 19.0, 11.0, 20.0, 24.0, 30.0, 30.0, 38.0, 52.0, 57.0, 70.0, 65.0, 62.0, 78.0, 59.0, 55.0, 52.0, 45.0, 37.0, 28.0, 34.0, 29.0, 17.0, 17.0, 13.0, 13.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.659423828125, -12.290857315063477, -11.922290802001953, -11.55372428894043, -11.185157775878906, -10.816591262817383, -10.44802474975586, -10.079458236694336, -9.710891723632812, -9.342325210571289, -8.973758697509766, -8.605192184448242, -8.236625671386719, -7.868059158325195, -7.499492645263672, -7.130926132202148, -6.762359619140625, -6.393793106079102, -6.025226593017578, -5.656660079956055, -5.288093566894531, -4.919527053833008, -4.550960540771484, -4.182394027709961, -3.8138275146484375, -3.445261001586914, -3.0766944885253906, -2.708127975463867, -2.3395614624023438, -1.9709949493408203, -1.6024284362792969, -1.2338619232177734, -0.8652944564819336, -0.49672794342041016, -0.12816143035888672, 0.24040508270263672, 0.6089715957641602, 0.9775381088256836, 1.346104621887207, 1.7146711349487305, 2.083237648010254, 2.4518041610717773, 2.820370674133301, 3.188937187194824, 3.5575037002563477, 3.926070213317871, 4.2946367263793945, 4.663203239440918, 5.031769752502441, 5.400336265563965, 5.768902778625488, 6.137469291687012, 6.506035804748535, 6.874602317810059, 7.243168830871582, 7.6117353439331055, 7.980301856994629, 8.348868370056152, 8.717434883117676, 9.0860013961792, 9.454567909240723, 9.823134422302246, 10.19170093536377, 10.560267448425293, 10.928833961486816]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 12.0, 9.0, 11.0, 21.0, 39.0, 45.0, 58.0, 78.0, 147.0, 202.0, 299.0, 508.0, 823.0, 1472.0, 2902.0, 6158.0, 16015.0, 52087.0, 226048.0, 520460.0, 158590.0, 39090.0, 12536.0, 5096.0, 2400.0, 1313.0, 739.0, 449.0, 326.0, 188.0, 130.0, 83.0, 66.0, 40.0, 35.0, 15.0, 15.0, 15.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-14.390625, -13.9462890625, -13.501953125, -13.0576171875, -12.61328125, -12.1689453125, -11.724609375, -11.2802734375, -10.8359375, -10.3916015625, -9.947265625, -9.5029296875, -9.05859375, -8.6142578125, -8.169921875, -7.7255859375, -7.28125, -6.8369140625, -6.392578125, -5.9482421875, -5.50390625, -5.0595703125, -4.615234375, -4.1708984375, -3.7265625, -3.2822265625, -2.837890625, -2.3935546875, -1.94921875, -1.5048828125, -1.060546875, -0.6162109375, -0.171875, 0.2724609375, 0.716796875, 1.1611328125, 1.60546875, 2.0498046875, 2.494140625, 2.9384765625, 3.3828125, 3.8271484375, 4.271484375, 4.7158203125, 5.16015625, 5.6044921875, 6.048828125, 6.4931640625, 6.9375, 7.3818359375, 7.826171875, 8.2705078125, 8.71484375, 9.1591796875, 9.603515625, 10.0478515625, 10.4921875, 10.9365234375, 11.380859375, 11.8251953125, 12.26953125, 12.7138671875, 13.158203125, 13.6025390625, 14.046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 13.0, 13.0, 20.0, 28.0, 21.0, 53.0, 46.0, 73.0, 97.0, 92.0, 93.0, 94.0, 67.0, 70.0, 54.0, 45.0, 24.0, 23.0, 16.0, 10.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.609375, -1.5593719482421875, -1.509368896484375, -1.4593658447265625, -1.40936279296875, -1.3593597412109375, -1.309356689453125, -1.2593536376953125, -1.2093505859375, -1.1593475341796875, -1.109344482421875, -1.0593414306640625, -1.00933837890625, -0.9593353271484375, -0.909332275390625, -0.8593292236328125, -0.809326171875, -0.7593231201171875, -0.709320068359375, -0.6593170166015625, -0.60931396484375, -0.5593109130859375, -0.509307861328125, -0.4593048095703125, -0.4093017578125, -0.3592987060546875, -0.309295654296875, -0.2592926025390625, -0.20928955078125, -0.1592864990234375, -0.109283447265625, -0.0592803955078125, -0.00927734375, 0.0407257080078125, 0.090728759765625, 0.1407318115234375, 0.19073486328125, 0.2407379150390625, 0.290740966796875, 0.3407440185546875, 0.3907470703125, 0.4407501220703125, 0.490753173828125, 0.5407562255859375, 0.59075927734375, 0.6407623291015625, 0.690765380859375, 0.7407684326171875, 0.790771484375, 0.8407745361328125, 0.890777587890625, 0.9407806396484375, 0.99078369140625, 1.0407867431640625, 1.090789794921875, 1.1407928466796875, 1.1907958984375, 1.2407989501953125, 1.290802001953125, 1.3408050537109375, 1.39080810546875, 1.4408111572265625, 1.490814208984375, 1.5408172607421875, 1.5908203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 14.0, 16.0, 24.0, 25.0, 37.0, 65.0, 83.0, 134.0, 198.0, 280.0, 480.0, 786.0, 1380.0, 2688.0, 5112.0, 10677.0, 24967.0, 63447.0, 183584.0, 382351.0, 234066.0, 81278.0, 30560.0, 13097.0, 6028.0, 3080.0, 1691.0, 897.0, 490.0, 341.0, 228.0, 136.0, 91.0, 58.0, 42.0, 32.0, 21.0, 18.0, 11.0, 9.0, 7.0, 6.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.93743896484375, -6.7108154296875, -6.48419189453125, -6.257568359375, -6.03094482421875, -5.8043212890625, -5.57769775390625, -5.35107421875, -5.12445068359375, -4.8978271484375, -4.67120361328125, -4.444580078125, -4.21795654296875, -3.9913330078125, -3.76470947265625, -3.5380859375, -3.31146240234375, -3.0848388671875, -2.85821533203125, -2.631591796875, -2.40496826171875, -2.1783447265625, -1.95172119140625, -1.72509765625, -1.49847412109375, -1.2718505859375, -1.04522705078125, -0.818603515625, -0.59197998046875, -0.3653564453125, -0.13873291015625, 0.087890625, 0.31451416015625, 0.5411376953125, 0.76776123046875, 0.994384765625, 1.22100830078125, 1.4476318359375, 1.67425537109375, 1.90087890625, 2.12750244140625, 2.3541259765625, 2.58074951171875, 2.807373046875, 3.03399658203125, 3.2606201171875, 3.48724365234375, 3.7138671875, 3.94049072265625, 4.1671142578125, 4.39373779296875, 4.620361328125, 4.84698486328125, 5.0736083984375, 5.30023193359375, 5.52685546875, 5.75347900390625, 5.9801025390625, 6.20672607421875, 6.433349609375, 6.65997314453125, 6.8865966796875, 7.11322021484375, 7.33984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 11.0, 1.0, 10.0, 16.0, 16.0, 24.0, 13.0, 20.0, 27.0, 29.0, 21.0, 33.0, 33.0, 49.0, 39.0, 34.0, 53.0, 40.0, 36.0, 53.0, 40.0, 48.0, 42.0, 43.0, 43.0, 33.0, 19.0, 26.0, 29.0, 24.0, 13.0, 10.0, 10.0, 11.0, 12.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.6435546875, -3.501953125, -3.3603515625, -3.21875, -3.0771484375, -2.935546875, -2.7939453125, -2.65234375, -2.5107421875, -2.369140625, -2.2275390625, -2.0859375, -1.9443359375, -1.802734375, -1.6611328125, -1.51953125, -1.3779296875, -1.236328125, -1.0947265625, -0.953125, -0.8115234375, -0.669921875, -0.5283203125, -0.38671875, -0.2451171875, -0.103515625, 0.0380859375, 0.1796875, 0.3212890625, 0.462890625, 0.6044921875, 0.74609375, 0.8876953125, 1.029296875, 1.1708984375, 1.3125, 1.4541015625, 1.595703125, 1.7373046875, 1.87890625, 2.0205078125, 2.162109375, 2.3037109375, 2.4453125, 2.5869140625, 2.728515625, 2.8701171875, 3.01171875, 3.1533203125, 3.294921875, 3.4365234375, 3.578125, 3.7197265625, 3.861328125, 4.0029296875, 4.14453125, 4.2861328125, 4.427734375, 4.5693359375, 4.7109375, 4.8525390625, 4.994140625, 5.1357421875, 5.27734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 13.0, 19.0, 18.0, 33.0, 78.0, 109.0, 230.0, 476.0, 1281.0, 3836.0, 16504.0, 118623.0, 681952.0, 193888.0, 23582.0, 5123.0, 1595.0, 639.0, 253.0, 119.0, 62.0, 43.0, 29.0, 16.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9609375, -14.3985595703125, -13.836181640625, -13.2738037109375, -12.71142578125, -12.1490478515625, -11.586669921875, -11.0242919921875, -10.4619140625, -9.8995361328125, -9.337158203125, -8.7747802734375, -8.21240234375, -7.6500244140625, -7.087646484375, -6.5252685546875, -5.962890625, -5.4005126953125, -4.838134765625, -4.2757568359375, -3.71337890625, -3.1510009765625, -2.588623046875, -2.0262451171875, -1.4638671875, -0.9014892578125, -0.339111328125, 0.2232666015625, 0.78564453125, 1.3480224609375, 1.910400390625, 2.4727783203125, 3.03515625, 3.5975341796875, 4.159912109375, 4.7222900390625, 5.28466796875, 5.8470458984375, 6.409423828125, 6.9718017578125, 7.5341796875, 8.0965576171875, 8.658935546875, 9.2213134765625, 9.78369140625, 10.3460693359375, 10.908447265625, 11.4708251953125, 12.033203125, 12.5955810546875, 13.157958984375, 13.7203369140625, 14.28271484375, 14.8450927734375, 15.407470703125, 15.9698486328125, 16.5322265625, 17.0946044921875, 17.656982421875, 18.2193603515625, 18.78173828125, 19.3441162109375, 19.906494140625, 20.4688720703125, 21.03125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 10.0, 18.0, 23.0, 51.0, 113.0, 168.0, 211.0, 170.0, 100.0, 51.0, 27.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018330961465835571, -0.0017826855182647705, -0.0017322748899459839, -0.0016818642616271973, -0.0016314536333084106, -0.001581043004989624, -0.0015306323766708374, -0.0014802217483520508, -0.0014298111200332642, -0.0013794004917144775, -0.001328989863395691, -0.0012785792350769043, -0.0012281686067581177, -0.001177757978439331, -0.0011273473501205444, -0.0010769367218017578, -0.0010265260934829712, -0.0009761154651641846, -0.000925704836845398, -0.0008752942085266113, -0.0008248835802078247, -0.0007744729518890381, -0.0007240623235702515, -0.0006736516952514648, -0.0006232410669326782, -0.0005728304386138916, -0.000522419810295105, -0.00047200918197631836, -0.00042159855365753174, -0.0003711879253387451, -0.0003207772970199585, -0.0002703666687011719, -0.00021995604038238525, -0.00016954541206359863, -0.00011913478374481201, -6.872415542602539e-05, -1.831352710723877e-05, 3.209710121154785e-05, 8.250772953033447e-05, 0.0001329183578491211, 0.00018332898616790771, 0.00023373961448669434, 0.00028415024280548096, 0.0003345608711242676, 0.0003849714994430542, 0.0004353821277618408, 0.00048579275608062744, 0.0005362033843994141, 0.0005866140127182007, 0.0006370246410369873, 0.0006874352693557739, 0.0007378458976745605, 0.0007882565259933472, 0.0008386671543121338, 0.0008890777826309204, 0.000939488410949707, 0.0009898990392684937, 0.0010403096675872803, 0.001090720295906067, 0.0011411309242248535, 0.0011915415525436401, 0.0012419521808624268, 0.0012923628091812134, 0.0013427734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 15.0, 17.0, 22.0, 34.0, 62.0, 75.0, 132.0, 196.0, 336.0, 577.0, 1057.0, 1986.0, 4257.0, 9796.0, 26024.0, 85984.0, 296461.0, 409349.0, 145188.0, 41003.0, 14199.0, 5888.0, 2693.0, 1362.0, 754.0, 430.0, 244.0, 153.0, 85.0, 55.0, 45.0, 25.0, 19.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4246826171875, -8.114990234375, -7.8052978515625, -7.49560546875, -7.1859130859375, -6.876220703125, -6.5665283203125, -6.2568359375, -5.9471435546875, -5.637451171875, -5.3277587890625, -5.01806640625, -4.7083740234375, -4.398681640625, -4.0889892578125, -3.779296875, -3.4696044921875, -3.159912109375, -2.8502197265625, -2.54052734375, -2.2308349609375, -1.921142578125, -1.6114501953125, -1.3017578125, -0.9920654296875, -0.682373046875, -0.3726806640625, -0.06298828125, 0.2467041015625, 0.556396484375, 0.8660888671875, 1.17578125, 1.4854736328125, 1.795166015625, 2.1048583984375, 2.41455078125, 2.7242431640625, 3.033935546875, 3.3436279296875, 3.6533203125, 3.9630126953125, 4.272705078125, 4.5823974609375, 4.89208984375, 5.2017822265625, 5.511474609375, 5.8211669921875, 6.130859375, 6.4405517578125, 6.750244140625, 7.0599365234375, 7.36962890625, 7.6793212890625, 7.989013671875, 8.2987060546875, 8.6083984375, 8.9180908203125, 9.227783203125, 9.5374755859375, 9.84716796875, 10.1568603515625, 10.466552734375, 10.7762451171875, 11.0859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 14.0, 24.0, 24.0, 51.0, 38.0, 58.0, 60.0, 83.0, 91.0, 94.0, 93.0, 76.0, 54.0, 53.0, 33.0, 28.0, 19.0, 14.0, 8.0, 7.0, 12.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.149658203125, -5.95166015625, -5.753662109375, -5.5556640625, -5.357666015625, -5.15966796875, -4.961669921875, -4.763671875, -4.565673828125, -4.36767578125, -4.169677734375, -3.9716796875, -3.773681640625, -3.57568359375, -3.377685546875, -3.1796875, -2.981689453125, -2.78369140625, -2.585693359375, -2.3876953125, -2.189697265625, -1.99169921875, -1.793701171875, -1.595703125, -1.397705078125, -1.19970703125, -1.001708984375, -0.8037109375, -0.605712890625, -0.40771484375, -0.209716796875, -0.01171875, 0.186279296875, 0.38427734375, 0.582275390625, 0.7802734375, 0.978271484375, 1.17626953125, 1.374267578125, 1.572265625, 1.770263671875, 1.96826171875, 2.166259765625, 2.3642578125, 2.562255859375, 2.76025390625, 2.958251953125, 3.15625, 3.354248046875, 3.55224609375, 3.750244140625, 3.9482421875, 4.146240234375, 4.34423828125, 4.542236328125, 4.740234375, 4.938232421875, 5.13623046875, 5.334228515625, 5.5322265625, 5.730224609375, 5.92822265625, 6.126220703125, 6.32421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 5.0, 4.0, 7.0, 8.0, 27.0, 56.0, 124.0, 214.0, 277.0, 155.0, 70.0, 35.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.39089965820312, -119.12557983398438, -115.8602523803711, -112.59493255615234, -109.32960510253906, -106.06428527832031, -102.79896545410156, -99.53364562988281, -96.26831817626953, -93.00299835205078, -89.7376708984375, -86.47235107421875, -83.20703125, -79.94170379638672, -76.67638397216797, -73.41105651855469, -70.14573669433594, -66.88041687011719, -63.615089416503906, -60.349769592285156, -57.08444595336914, -53.819122314453125, -50.553802490234375, -47.28847885131836, -44.023155212402344, -40.75783157348633, -37.49250793457031, -34.22718811035156, -30.961864471435547, -27.69654083251953, -24.43121910095215, -21.165897369384766, -17.90058135986328, -14.635258674621582, -11.369935989379883, -8.104613304138184, -4.839290618896484, -1.5739669799804688, 1.691354751586914, 4.956676483154297, 8.222000122070312, 11.487322807312012, 14.752645492553711, 18.017967224121094, 21.28329086303711, 24.548614501953125, 27.813936233520508, 31.07925796508789, 34.344581604003906, 37.60990524291992, 40.87522888183594, 44.14054870605469, 47.4058723449707, 50.67119598388672, 53.93651580810547, 57.201839447021484, 60.4671630859375, 63.732486724853516, 66.99781036376953, 70.26313018798828, 73.52845764160156, 76.79377746582031, 80.05909729003906, 83.32441711425781, 86.5897445678711]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 6.0, 9.0, 20.0, 21.0, 31.0, 45.0, 39.0, 56.0, 64.0, 61.0, 82.0, 77.0, 67.0, 83.0, 69.0, 55.0, 45.0, 36.0, 25.0, 16.0, 22.0, 10.0, 6.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.96773147583008, -39.429840087890625, -37.89194869995117, -36.35405731201172, -34.81616973876953, -33.27827835083008, -31.740386962890625, -30.202495574951172, -28.66460609436035, -27.1267147064209, -25.588825225830078, -24.050933837890625, -22.513042449951172, -20.97515296936035, -19.4372615814209, -17.899372100830078, -16.361480712890625, -14.823590278625488, -13.285699844360352, -11.747808456420898, -10.209918022155762, -8.672027587890625, -7.134136199951172, -5.596245765686035, -4.058355331420898, -2.5204646587371826, -0.9825739860534668, 0.5553169250488281, 2.093207359313965, 3.6310977935791016, 5.168989181518555, 6.706879615783691, 8.244773864746094, 9.78266429901123, 11.320554733276367, 12.85844612121582, 14.396336555480957, 15.934226989746094, 17.472118377685547, 19.010009765625, 20.54789924621582, 22.085790634155273, 23.623680114746094, 25.161571502685547, 26.699462890625, 28.23735237121582, 29.775243759155273, 31.313133239746094, 32.85102462768555, 34.388916015625, 35.92680740356445, 37.464698791503906, 39.002586364746094, 40.54047775268555, 42.078369140625, 43.61626052856445, 45.154151916503906, 46.69204330444336, 48.22993469238281, 49.767822265625, 51.30571365356445, 52.843605041503906, 54.38149642944336, 55.91938781738281, 57.457275390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 17.0, 27.0, 33.0, 41.0, 67.0, 94.0, 138.0, 232.0, 317.0, 553.0, 950.0, 1862.0, 3941.0, 9819.0, 31282.0, 171358.0, 3517087.0, 385072.0, 49199.0, 13354.0, 4814.0, 1901.0, 939.0, 477.0, 256.0, 157.0, 109.0, 65.0, 33.0, 21.0, 14.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.405029296875, -33.46630859375, -32.527587890625, -31.5888671875, -30.650146484375, -29.71142578125, -28.772705078125, -27.833984375, -26.895263671875, -25.95654296875, -25.017822265625, -24.0791015625, -23.140380859375, -22.20166015625, -21.262939453125, -20.32421875, -19.385498046875, -18.44677734375, -17.508056640625, -16.5693359375, -15.630615234375, -14.69189453125, -13.753173828125, -12.814453125, -11.875732421875, -10.93701171875, -9.998291015625, -9.0595703125, -8.120849609375, -7.18212890625, -6.243408203125, -5.3046875, -4.365966796875, -3.42724609375, -2.488525390625, -1.5498046875, -0.611083984375, 0.32763671875, 1.266357421875, 2.205078125, 3.143798828125, 4.08251953125, 5.021240234375, 5.9599609375, 6.898681640625, 7.83740234375, 8.776123046875, 9.71484375, 10.653564453125, 11.59228515625, 12.531005859375, 13.4697265625, 14.408447265625, 15.34716796875, 16.285888671875, 17.224609375, 18.163330078125, 19.10205078125, 20.040771484375, 20.9794921875, 21.918212890625, 22.85693359375, 23.795654296875, 24.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 6.0, 10.0, 22.0, 21.0, 35.0, 50.0, 54.0, 71.0, 59.0, 88.0, 98.0, 91.0, 83.0, 55.0, 51.0, 38.0, 42.0, 35.0, 27.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.5342864990234375, -1.485565185546875, -1.4368438720703125, -1.38812255859375, -1.3394012451171875, -1.290679931640625, -1.2419586181640625, -1.1932373046875, -1.1445159912109375, -1.095794677734375, -1.0470733642578125, -0.99835205078125, -0.9496307373046875, -0.900909423828125, -0.8521881103515625, -0.803466796875, -0.7547454833984375, -0.706024169921875, -0.6573028564453125, -0.60858154296875, -0.5598602294921875, -0.511138916015625, -0.4624176025390625, -0.4136962890625, -0.3649749755859375, -0.316253662109375, -0.2675323486328125, -0.21881103515625, -0.1700897216796875, -0.121368408203125, -0.0726470947265625, -0.02392578125, 0.0247955322265625, 0.073516845703125, 0.1222381591796875, 0.17095947265625, 0.2196807861328125, 0.268402099609375, 0.3171234130859375, 0.3658447265625, 0.4145660400390625, 0.463287353515625, 0.5120086669921875, 0.56072998046875, 0.6094512939453125, 0.658172607421875, 0.7068939208984375, 0.755615234375, 0.8043365478515625, 0.853057861328125, 0.9017791748046875, 0.95050048828125, 0.9992218017578125, 1.047943115234375, 1.0966644287109375, 1.1453857421875, 1.1941070556640625, 1.242828369140625, 1.2915496826171875, 1.34027099609375, 1.3889923095703125, 1.437713623046875, 1.4864349365234375, 1.53515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 13.0, 8.0, 15.0, 22.0, 40.0, 51.0, 73.0, 135.0, 262.0, 851.0, 5637.0, 125621.0, 3939726.0, 114882.0, 5384.0, 862.0, 287.0, 162.0, 63.0, 55.0, 47.0, 30.0, 23.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-78.5625, -76.6689453125, -74.775390625, -72.8818359375, -70.98828125, -69.0947265625, -67.201171875, -65.3076171875, -63.4140625, -61.5205078125, -59.626953125, -57.7333984375, -55.83984375, -53.9462890625, -52.052734375, -50.1591796875, -48.265625, -46.3720703125, -44.478515625, -42.5849609375, -40.69140625, -38.7978515625, -36.904296875, -35.0107421875, -33.1171875, -31.2236328125, -29.330078125, -27.4365234375, -25.54296875, -23.6494140625, -21.755859375, -19.8623046875, -17.96875, -16.0751953125, -14.181640625, -12.2880859375, -10.39453125, -8.5009765625, -6.607421875, -4.7138671875, -2.8203125, -0.9267578125, 0.966796875, 2.8603515625, 4.75390625, 6.6474609375, 8.541015625, 10.4345703125, 12.328125, 14.2216796875, 16.115234375, 18.0087890625, 19.90234375, 21.7958984375, 23.689453125, 25.5830078125, 27.4765625, 29.3701171875, 31.263671875, 33.1572265625, 35.05078125, 36.9443359375, 38.837890625, 40.7314453125, 42.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 2.0, 3.0, 14.0, 20.0, 41.0, 32.0, 48.0, 85.0, 105.0, 182.0, 299.0, 478.0, 1160.0, 681.0, 336.0, 191.0, 120.0, 73.0, 63.0, 33.0, 36.0, 14.0, 14.0, 15.0, 6.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1331787109375, -2.012451171875, -1.8917236328125, -1.77099609375, -1.6502685546875, -1.529541015625, -1.4088134765625, -1.2880859375, -1.1673583984375, -1.046630859375, -0.9259033203125, -0.80517578125, -0.6844482421875, -0.563720703125, -0.4429931640625, -0.322265625, -0.2015380859375, -0.080810546875, 0.0399169921875, 0.16064453125, 0.2813720703125, 0.402099609375, 0.5228271484375, 0.6435546875, 0.7642822265625, 0.885009765625, 1.0057373046875, 1.12646484375, 1.2471923828125, 1.367919921875, 1.4886474609375, 1.609375, 1.7301025390625, 1.850830078125, 1.9715576171875, 2.09228515625, 2.2130126953125, 2.333740234375, 2.4544677734375, 2.5751953125, 2.6959228515625, 2.816650390625, 2.9373779296875, 3.05810546875, 3.1788330078125, 3.299560546875, 3.4202880859375, 3.541015625, 3.6617431640625, 3.782470703125, 3.9031982421875, 4.02392578125, 4.1446533203125, 4.265380859375, 4.3861083984375, 4.5068359375, 4.6275634765625, 4.748291015625, 4.8690185546875, 4.98974609375, 5.1104736328125, 5.231201171875, 5.3519287109375, 5.47265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 32.0, 95.0, 195.0, 274.0, 230.0, 99.0, 38.0, 14.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.01563262939453, -65.32146453857422, -63.627296447753906, -61.93312454223633, -60.238956451416016, -58.5447883605957, -56.850616455078125, -55.15644836425781, -53.4622802734375, -51.76811218261719, -50.073944091796875, -48.3797721862793, -46.685604095458984, -44.99143600463867, -43.297264099121094, -41.60309600830078, -39.90892791748047, -38.214759826660156, -36.520591735839844, -34.826419830322266, -33.13225173950195, -31.43808364868164, -29.743913650512695, -28.04974365234375, -26.355575561523438, -24.661407470703125, -22.96723747253418, -21.273067474365234, -19.578899383544922, -17.88473129272461, -16.190561294555664, -14.496392250061035, -12.80221939086914, -11.108050346374512, -9.413881301879883, -7.719712257385254, -6.025543212890625, -4.331374168395996, -2.637205123901367, -0.9430360794067383, 0.7511329650878906, 2.4453020095825195, 4.139471054077148, 5.833640098571777, 7.527809143066406, 9.221978187561035, 10.916147232055664, 12.610316276550293, 14.304485321044922, 15.99865436553955, 17.69282341003418, 19.386993408203125, 21.081161499023438, 22.77532958984375, 24.469499588012695, 26.16366958618164, 27.857837677001953, 29.552005767822266, 31.24617576599121, 32.940345764160156, 34.63451385498047, 36.32868194580078, 38.022850036621094, 39.71702194213867, 41.411190032958984]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 9.0, 5.0, 12.0, 15.0, 23.0, 24.0, 25.0, 28.0, 42.0, 41.0, 54.0, 40.0, 49.0, 49.0, 55.0, 58.0, 53.0, 59.0, 58.0, 38.0, 39.0, 48.0, 41.0, 28.0, 16.0, 24.0, 12.0, 8.0, 10.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.889745712280273, -13.383111000061035, -12.876477241516113, -12.369842529296875, -11.863208770751953, -11.356574058532715, -10.849939346313477, -10.343305587768555, -9.836670875549316, -9.330036163330078, -8.823402404785156, -8.316767692565918, -7.810133457183838, -7.303499221801758, -6.7968645095825195, -6.2902302742004395, -5.783596038818359, -5.276961803436279, -4.770327568054199, -4.263692855834961, -3.757058620452881, -3.250424385070801, -2.7437899112701416, -2.2371554374694824, -1.7305212020874023, -1.2238868474960327, -0.7172524929046631, -0.21061813831329346, 0.29601621627807617, 0.8026504516601562, 1.3092849254608154, 1.8159193992614746, 2.3225536346435547, 2.8291878700256348, 3.335822343826294, 3.842456817626953, 4.349091053009033, 4.855725288391113, 5.362360000610352, 5.868994235992432, 6.375628471374512, 6.882262706756592, 7.388896942138672, 7.89553165435791, 8.402166366577148, 8.90880012512207, 9.415434837341309, 9.922069549560547, 10.428703308105469, 10.935338020324707, 11.441971778869629, 11.948606491088867, 12.455240249633789, 12.961874961853027, 13.468509674072266, 13.975143432617188, 14.481778144836426, 14.988412857055664, 15.495046615600586, 16.001680374145508, 16.508316040039062, 17.014949798583984, 17.521583557128906, 18.02821922302246, 18.534852981567383]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 11.0, 12.0, 15.0, 19.0, 21.0, 36.0, 37.0, 73.0, 82.0, 112.0, 171.0, 248.0, 312.0, 490.0, 813.0, 1337.0, 2583.0, 5392.0, 12289.0, 30722.0, 85097.0, 242379.0, 380915.0, 180528.0, 62449.0, 23179.0, 9411.0, 4290.0, 2110.0, 1172.0, 733.0, 457.0, 286.0, 210.0, 168.0, 107.0, 90.0, 50.0, 39.0, 26.0, 21.0, 18.0, 11.0, 8.0, 9.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.4375, -14.004638671875, -13.57177734375, -13.138916015625, -12.7060546875, -12.273193359375, -11.84033203125, -11.407470703125, -10.974609375, -10.541748046875, -10.10888671875, -9.676025390625, -9.2431640625, -8.810302734375, -8.37744140625, -7.944580078125, -7.51171875, -7.078857421875, -6.64599609375, -6.213134765625, -5.7802734375, -5.347412109375, -4.91455078125, -4.481689453125, -4.048828125, -3.615966796875, -3.18310546875, -2.750244140625, -2.3173828125, -1.884521484375, -1.45166015625, -1.018798828125, -0.5859375, -0.153076171875, 0.27978515625, 0.712646484375, 1.1455078125, 1.578369140625, 2.01123046875, 2.444091796875, 2.876953125, 3.309814453125, 3.74267578125, 4.175537109375, 4.6083984375, 5.041259765625, 5.47412109375, 5.906982421875, 6.33984375, 6.772705078125, 7.20556640625, 7.638427734375, 8.0712890625, 8.504150390625, 8.93701171875, 9.369873046875, 9.802734375, 10.235595703125, 10.66845703125, 11.101318359375, 11.5341796875, 11.967041015625, 12.39990234375, 12.832763671875, 13.265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 10.0, 14.0, 11.0, 13.0, 26.0, 37.0, 55.0, 73.0, 72.0, 89.0, 79.0, 77.0, 87.0, 64.0, 52.0, 53.0, 50.0, 24.0, 32.0, 17.0, 21.0, 12.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.4537811279296875, -1.405609130859375, -1.3574371337890625, -1.30926513671875, -1.2610931396484375, -1.212921142578125, -1.1647491455078125, -1.1165771484375, -1.0684051513671875, -1.020233154296875, -0.9720611572265625, -0.92388916015625, -0.8757171630859375, -0.827545166015625, -0.7793731689453125, -0.731201171875, -0.6830291748046875, -0.634857177734375, -0.5866851806640625, -0.53851318359375, -0.4903411865234375, -0.442169189453125, -0.3939971923828125, -0.3458251953125, -0.2976531982421875, -0.249481201171875, -0.2013092041015625, -0.15313720703125, -0.1049652099609375, -0.056793212890625, -0.0086212158203125, 0.03955078125, 0.0877227783203125, 0.135894775390625, 0.1840667724609375, 0.23223876953125, 0.2804107666015625, 0.328582763671875, 0.3767547607421875, 0.4249267578125, 0.4730987548828125, 0.521270751953125, 0.5694427490234375, 0.61761474609375, 0.6657867431640625, 0.713958740234375, 0.7621307373046875, 0.810302734375, 0.8584747314453125, 0.906646728515625, 0.9548187255859375, 1.00299072265625, 1.0511627197265625, 1.099334716796875, 1.1475067138671875, 1.1956787109375, 1.2438507080078125, 1.292022705078125, 1.3401947021484375, 1.38836669921875, 1.4365386962890625, 1.484710693359375, 1.5328826904296875, 1.5810546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 4.0, 7.0, 11.0, 20.0, 8.0, 29.0, 50.0, 69.0, 91.0, 198.0, 336.0, 632.0, 1410.0, 3288.0, 9417.0, 30370.0, 109789.0, 357170.0, 369956.0, 116744.0, 32311.0, 10053.0, 3612.0, 1472.0, 642.0, 304.0, 197.0, 122.0, 71.0, 43.0, 37.0, 26.0, 11.0, 10.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.15625, -16.6519775390625, -16.147705078125, -15.6434326171875, -15.13916015625, -14.6348876953125, -14.130615234375, -13.6263427734375, -13.1220703125, -12.6177978515625, -12.113525390625, -11.6092529296875, -11.10498046875, -10.6007080078125, -10.096435546875, -9.5921630859375, -9.087890625, -8.5836181640625, -8.079345703125, -7.5750732421875, -7.07080078125, -6.5665283203125, -6.062255859375, -5.5579833984375, -5.0537109375, -4.5494384765625, -4.045166015625, -3.5408935546875, -3.03662109375, -2.5323486328125, -2.028076171875, -1.5238037109375, -1.01953125, -0.5152587890625, -0.010986328125, 0.4932861328125, 0.99755859375, 1.5018310546875, 2.006103515625, 2.5103759765625, 3.0146484375, 3.5189208984375, 4.023193359375, 4.5274658203125, 5.03173828125, 5.5360107421875, 6.040283203125, 6.5445556640625, 7.048828125, 7.5531005859375, 8.057373046875, 8.5616455078125, 9.06591796875, 9.5701904296875, 10.074462890625, 10.5787353515625, 11.0830078125, 11.5872802734375, 12.091552734375, 12.5958251953125, 13.10009765625, 13.6043701171875, 14.108642578125, 14.6129150390625, 15.1171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 9.0, 5.0, 16.0, 14.0, 23.0, 12.0, 20.0, 34.0, 20.0, 32.0, 46.0, 48.0, 52.0, 47.0, 67.0, 51.0, 50.0, 39.0, 58.0, 32.0, 33.0, 46.0, 35.0, 28.0, 19.0, 34.0, 19.0, 17.0, 18.0, 16.0, 5.0, 15.0, 4.0, 5.0, 7.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.7529296875, -6.548828125, -6.3447265625, -6.140625, -5.9365234375, -5.732421875, -5.5283203125, -5.32421875, -5.1201171875, -4.916015625, -4.7119140625, -4.5078125, -4.3037109375, -4.099609375, -3.8955078125, -3.69140625, -3.4873046875, -3.283203125, -3.0791015625, -2.875, -2.6708984375, -2.466796875, -2.2626953125, -2.05859375, -1.8544921875, -1.650390625, -1.4462890625, -1.2421875, -1.0380859375, -0.833984375, -0.6298828125, -0.42578125, -0.2216796875, -0.017578125, 0.1865234375, 0.390625, 0.5947265625, 0.798828125, 1.0029296875, 1.20703125, 1.4111328125, 1.615234375, 1.8193359375, 2.0234375, 2.2275390625, 2.431640625, 2.6357421875, 2.83984375, 3.0439453125, 3.248046875, 3.4521484375, 3.65625, 3.8603515625, 4.064453125, 4.2685546875, 4.47265625, 4.6767578125, 4.880859375, 5.0849609375, 5.2890625, 5.4931640625, 5.697265625, 5.9013671875, 6.10546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 19.0, 27.0, 38.0, 49.0, 87.0, 126.0, 177.0, 360.0, 483.0, 818.0, 1509.0, 2634.0, 5022.0, 10453.0, 24073.0, 63280.0, 213283.0, 460378.0, 172051.0, 53234.0, 20799.0, 9240.0, 4562.0, 2429.0, 1359.0, 777.0, 484.0, 262.0, 154.0, 111.0, 83.0, 47.0, 38.0, 16.0, 20.0, 16.0, 10.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0572509765625, -14.606689453125, -14.1561279296875, -13.70556640625, -13.2550048828125, -12.804443359375, -12.3538818359375, -11.9033203125, -11.4527587890625, -11.002197265625, -10.5516357421875, -10.10107421875, -9.6505126953125, -9.199951171875, -8.7493896484375, -8.298828125, -7.8482666015625, -7.397705078125, -6.9471435546875, -6.49658203125, -6.0460205078125, -5.595458984375, -5.1448974609375, -4.6943359375, -4.2437744140625, -3.793212890625, -3.3426513671875, -2.89208984375, -2.4415283203125, -1.990966796875, -1.5404052734375, -1.08984375, -0.6392822265625, -0.188720703125, 0.2618408203125, 0.71240234375, 1.1629638671875, 1.613525390625, 2.0640869140625, 2.5146484375, 2.9652099609375, 3.415771484375, 3.8663330078125, 4.31689453125, 4.7674560546875, 5.218017578125, 5.6685791015625, 6.119140625, 6.5697021484375, 7.020263671875, 7.4708251953125, 7.92138671875, 8.3719482421875, 8.822509765625, 9.2730712890625, 9.7236328125, 10.1741943359375, 10.624755859375, 11.0753173828125, 11.52587890625, 11.9764404296875, 12.427001953125, 12.8775634765625, 13.328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 4.0, 8.0, 10.0, 13.0, 14.0, 23.0, 30.0, 50.0, 98.0, 143.0, 167.0, 147.0, 89.0, 47.0, 32.0, 26.0, 23.0, 15.0, 8.0, 9.0, 4.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00293731689453125, -0.0028441548347473145, -0.002750992774963379, -0.0026578307151794434, -0.002564668655395508, -0.0024715065956115723, -0.0023783445358276367, -0.002285182476043701, -0.0021920204162597656, -0.00209885835647583, -0.0020056962966918945, -0.001912534236907959, -0.0018193721771240234, -0.0017262101173400879, -0.0016330480575561523, -0.0015398859977722168, -0.0014467239379882812, -0.0013535618782043457, -0.0012603998184204102, -0.0011672377586364746, -0.001074075698852539, -0.0009809136390686035, -0.000887751579284668, -0.0007945895195007324, -0.0007014274597167969, -0.0006082653999328613, -0.0005151033401489258, -0.00042194128036499023, -0.0003287792205810547, -0.00023561716079711914, -0.0001424551010131836, -4.929304122924805e-05, 4.38690185546875e-05, 0.00013703107833862305, 0.0002301931381225586, 0.00032335519790649414, 0.0004165172576904297, 0.0005096793174743652, 0.0006028413772583008, 0.0006960034370422363, 0.0007891654968261719, 0.0008823275566101074, 0.000975489616394043, 0.0010686516761779785, 0.001161813735961914, 0.0012549757957458496, 0.0013481378555297852, 0.0014412999153137207, 0.0015344619750976562, 0.0016276240348815918, 0.0017207860946655273, 0.0018139481544494629, 0.0019071102142333984, 0.002000272274017334, 0.0020934343338012695, 0.002186596393585205, 0.0022797584533691406, 0.002372920513153076, 0.0024660825729370117, 0.0025592446327209473, 0.002652406692504883, 0.0027455687522888184, 0.002838730812072754, 0.0029318928718566895, 0.003025054931640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 7.0, 9.0, 20.0, 34.0, 38.0, 64.0, 89.0, 193.0, 336.0, 791.0, 1666.0, 4231.0, 11995.0, 41794.0, 225980.0, 616219.0, 106668.0, 25193.0, 7857.0, 2916.0, 1208.0, 549.0, 301.0, 137.0, 71.0, 59.0, 29.0, 19.0, 22.0, 5.0, 10.0, 11.0, 8.0, 2.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.953125, -24.1806640625, -23.408203125, -22.6357421875, -21.86328125, -21.0908203125, -20.318359375, -19.5458984375, -18.7734375, -18.0009765625, -17.228515625, -16.4560546875, -15.68359375, -14.9111328125, -14.138671875, -13.3662109375, -12.59375, -11.8212890625, -11.048828125, -10.2763671875, -9.50390625, -8.7314453125, -7.958984375, -7.1865234375, -6.4140625, -5.6416015625, -4.869140625, -4.0966796875, -3.32421875, -2.5517578125, -1.779296875, -1.0068359375, -0.234375, 0.5380859375, 1.310546875, 2.0830078125, 2.85546875, 3.6279296875, 4.400390625, 5.1728515625, 5.9453125, 6.7177734375, 7.490234375, 8.2626953125, 9.03515625, 9.8076171875, 10.580078125, 11.3525390625, 12.125, 12.8974609375, 13.669921875, 14.4423828125, 15.21484375, 15.9873046875, 16.759765625, 17.5322265625, 18.3046875, 19.0771484375, 19.849609375, 20.6220703125, 21.39453125, 22.1669921875, 22.939453125, 23.7119140625, 24.484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 4.0, 6.0, 7.0, 8.0, 12.0, 14.0, 13.0, 20.0, 30.0, 35.0, 48.0, 55.0, 85.0, 89.0, 93.0, 89.0, 85.0, 65.0, 52.0, 38.0, 14.0, 20.0, 19.0, 8.0, 15.0, 9.0, 10.0, 5.0, 4.0, 5.0, 7.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0546875, -9.7437744140625, -9.432861328125, -9.1219482421875, -8.81103515625, -8.5001220703125, -8.189208984375, -7.8782958984375, -7.5673828125, -7.2564697265625, -6.945556640625, -6.6346435546875, -6.32373046875, -6.0128173828125, -5.701904296875, -5.3909912109375, -5.080078125, -4.7691650390625, -4.458251953125, -4.1473388671875, -3.83642578125, -3.5255126953125, -3.214599609375, -2.9036865234375, -2.5927734375, -2.2818603515625, -1.970947265625, -1.6600341796875, -1.34912109375, -1.0382080078125, -0.727294921875, -0.4163818359375, -0.10546875, 0.2054443359375, 0.516357421875, 0.8272705078125, 1.13818359375, 1.4490966796875, 1.760009765625, 2.0709228515625, 2.3818359375, 2.6927490234375, 3.003662109375, 3.3145751953125, 3.62548828125, 3.9364013671875, 4.247314453125, 4.5582275390625, 4.869140625, 5.1800537109375, 5.490966796875, 5.8018798828125, 6.11279296875, 6.4237060546875, 6.734619140625, 7.0455322265625, 7.3564453125, 7.6673583984375, 7.978271484375, 8.2891845703125, 8.60009765625, 8.9110107421875, 9.221923828125, 9.5328369140625, 9.84375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 27.0, 123.0, 387.0, 342.0, 103.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.44189453125, -143.41519165039062, -131.3885040283203, -119.36180114746094, -107.3351058959961, -95.30841064453125, -83.28170776367188, -71.25501251220703, -59.22831726074219, -47.201622009277344, -35.174922943115234, -23.148223876953125, -11.121528625488281, 0.9051666259765625, 12.931869506835938, 24.95856475830078, 36.985260009765625, 49.01195526123047, 61.03865432739258, 73.06535339355469, 85.09204864501953, 97.11874389648438, 109.14544677734375, 121.1721420288086, 133.19883728027344, 145.2255401611328, 157.25222778320312, 169.2789306640625, 181.30563354492188, 193.3323211669922, 205.35902404785156, 217.38571166992188, 229.41241455078125, 241.43911743164062, 253.46580505371094, 265.49249267578125, 277.5191955566406, 289.5458984375, 301.5726013183594, 313.59930419921875, 325.6259765625, 337.6526794433594, 349.67938232421875, 361.7060546875, 373.7327575683594, 385.75946044921875, 397.7861633300781, 409.8128662109375, 421.8395690917969, 433.86627197265625, 445.8929748535156, 457.919677734375, 469.94635009765625, 481.9730529785156, 493.999755859375, 506.0264587402344, 518.0531616210938, 530.079833984375, 542.1065673828125, 554.1332397460938, 566.1599731445312, 578.1866455078125, 590.21337890625, 602.2400512695312, 614.2667236328125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 8.0, 10.0, 14.0, 19.0, 17.0, 29.0, 22.0, 45.0, 36.0, 41.0, 52.0, 63.0, 73.0, 59.0, 58.0, 60.0, 56.0, 61.0, 49.0, 39.0, 19.0, 41.0, 28.0, 23.0, 20.0, 12.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.74826431274414, -60.60056686401367, -58.45287322998047, -56.30517578125, -54.15747833251953, -52.00978088378906, -49.862083435058594, -47.71438980102539, -45.56669235229492, -43.41899490356445, -41.27130126953125, -39.12360382080078, -36.97590637207031, -34.828208923339844, -32.680511474609375, -30.532817840576172, -28.385120391845703, -26.237422943115234, -24.0897274017334, -21.942031860351562, -19.794334411621094, -17.646636962890625, -15.498941421508789, -13.351244926452637, -11.203548431396484, -9.055851936340332, -6.90815544128418, -4.760458946228027, -2.612762451171875, -0.46506595611572266, 1.6826305389404297, 3.830327033996582, 5.978019714355469, 8.125716209411621, 10.273412704467773, 12.421109199523926, 14.568805694580078, 16.716503143310547, 18.864198684692383, 21.01189422607422, 23.159591674804688, 25.307289123535156, 27.454984664916992, 29.602680206298828, 31.750377655029297, 33.898075103759766, 36.04576873779297, 38.19346618652344, 40.341163635253906, 42.488861083984375, 44.636558532714844, 46.78425216674805, 48.931949615478516, 51.079647064208984, 53.22734069824219, 55.375038146972656, 57.522735595703125, 59.670433044433594, 61.81813049316406, 63.965824127197266, 66.113525390625, 68.26121520996094, 70.4089126586914, 72.55661010742188, 74.70430755615234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 14.0, 16.0, 14.0, 30.0, 37.0, 37.0, 51.0, 63.0, 91.0, 119.0, 163.0, 245.0, 349.0, 552.0, 828.0, 1403.0, 2474.0, 4924.0, 11049.0, 29564.0, 102348.0, 641936.0, 3088973.0, 221380.0, 54306.0, 18161.0, 7491.0, 3423.0, 1734.0, 956.0, 589.0, 318.0, 213.0, 123.0, 84.0, 67.0, 31.0, 38.0, 17.0, 18.0, 7.0, 10.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.578125, -26.817138671875, -26.05615234375, -25.295166015625, -24.5341796875, -23.773193359375, -23.01220703125, -22.251220703125, -21.490234375, -20.729248046875, -19.96826171875, -19.207275390625, -18.4462890625, -17.685302734375, -16.92431640625, -16.163330078125, -15.40234375, -14.641357421875, -13.88037109375, -13.119384765625, -12.3583984375, -11.597412109375, -10.83642578125, -10.075439453125, -9.314453125, -8.553466796875, -7.79248046875, -7.031494140625, -6.2705078125, -5.509521484375, -4.74853515625, -3.987548828125, -3.2265625, -2.465576171875, -1.70458984375, -0.943603515625, -0.1826171875, 0.578369140625, 1.33935546875, 2.100341796875, 2.861328125, 3.622314453125, 4.38330078125, 5.144287109375, 5.9052734375, 6.666259765625, 7.42724609375, 8.188232421875, 8.94921875, 9.710205078125, 10.47119140625, 11.232177734375, 11.9931640625, 12.754150390625, 13.51513671875, 14.276123046875, 15.037109375, 15.798095703125, 16.55908203125, 17.320068359375, 18.0810546875, 18.842041015625, 19.60302734375, 20.364013671875, 21.125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 16.0, 16.0, 21.0, 16.0, 31.0, 40.0, 48.0, 46.0, 56.0, 73.0, 80.0, 68.0, 76.0, 66.0, 57.0, 54.0, 55.0, 42.0, 29.0, 26.0, 19.0, 10.0, 6.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.048828125, -1.99273681640625, -1.9366455078125, -1.88055419921875, -1.824462890625, -1.76837158203125, -1.7122802734375, -1.65618896484375, -1.60009765625, -1.54400634765625, -1.4879150390625, -1.43182373046875, -1.375732421875, -1.31964111328125, -1.2635498046875, -1.20745849609375, -1.1513671875, -1.09527587890625, -1.0391845703125, -0.98309326171875, -0.927001953125, -0.87091064453125, -0.8148193359375, -0.75872802734375, -0.70263671875, -0.64654541015625, -0.5904541015625, -0.53436279296875, -0.478271484375, -0.42218017578125, -0.3660888671875, -0.30999755859375, -0.25390625, -0.19781494140625, -0.1417236328125, -0.08563232421875, -0.029541015625, 0.02655029296875, 0.0826416015625, 0.13873291015625, 0.19482421875, 0.25091552734375, 0.3070068359375, 0.36309814453125, 0.419189453125, 0.47528076171875, 0.5313720703125, 0.58746337890625, 0.6435546875, 0.69964599609375, 0.7557373046875, 0.81182861328125, 0.867919921875, 0.92401123046875, 0.9801025390625, 1.03619384765625, 1.09228515625, 1.14837646484375, 1.2044677734375, 1.26055908203125, 1.316650390625, 1.37274169921875, 1.4288330078125, 1.48492431640625, 1.541015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 18.0, 21.0, 31.0, 42.0, 74.0, 133.0, 181.0, 342.0, 619.0, 1351.0, 3009.0, 7840.0, 22922.0, 84524.0, 462288.0, 3030754.0, 458895.0, 84499.0, 23118.0, 7654.0, 3055.0, 1325.0, 672.0, 329.0, 221.0, 110.0, 67.0, 53.0, 31.0, 27.0, 18.0, 10.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.578125, -23.7978515625, -23.017578125, -22.2373046875, -21.45703125, -20.6767578125, -19.896484375, -19.1162109375, -18.3359375, -17.5556640625, -16.775390625, -15.9951171875, -15.21484375, -14.4345703125, -13.654296875, -12.8740234375, -12.09375, -11.3134765625, -10.533203125, -9.7529296875, -8.97265625, -8.1923828125, -7.412109375, -6.6318359375, -5.8515625, -5.0712890625, -4.291015625, -3.5107421875, -2.73046875, -1.9501953125, -1.169921875, -0.3896484375, 0.390625, 1.1708984375, 1.951171875, 2.7314453125, 3.51171875, 4.2919921875, 5.072265625, 5.8525390625, 6.6328125, 7.4130859375, 8.193359375, 8.9736328125, 9.75390625, 10.5341796875, 11.314453125, 12.0947265625, 12.875, 13.6552734375, 14.435546875, 15.2158203125, 15.99609375, 16.7763671875, 17.556640625, 18.3369140625, 19.1171875, 19.8974609375, 20.677734375, 21.4580078125, 22.23828125, 23.0185546875, 23.798828125, 24.5791015625, 25.359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 13.0, 19.0, 28.0, 38.0, 50.0, 65.0, 130.0, 165.0, 343.0, 602.0, 1345.0, 492.0, 303.0, 143.0, 88.0, 84.0, 40.0, 36.0, 17.0, 21.0, 11.0, 6.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.260009765625, -5.07470703125, -4.889404296875, -4.7041015625, -4.518798828125, -4.33349609375, -4.148193359375, -3.962890625, -3.777587890625, -3.59228515625, -3.406982421875, -3.2216796875, -3.036376953125, -2.85107421875, -2.665771484375, -2.48046875, -2.295166015625, -2.10986328125, -1.924560546875, -1.7392578125, -1.553955078125, -1.36865234375, -1.183349609375, -0.998046875, -0.812744140625, -0.62744140625, -0.442138671875, -0.2568359375, -0.071533203125, 0.11376953125, 0.299072265625, 0.484375, 0.669677734375, 0.85498046875, 1.040283203125, 1.2255859375, 1.410888671875, 1.59619140625, 1.781494140625, 1.966796875, 2.152099609375, 2.33740234375, 2.522705078125, 2.7080078125, 2.893310546875, 3.07861328125, 3.263916015625, 3.44921875, 3.634521484375, 3.81982421875, 4.005126953125, 4.1904296875, 4.375732421875, 4.56103515625, 4.746337890625, 4.931640625, 5.116943359375, 5.30224609375, 5.487548828125, 5.6728515625, 5.858154296875, 6.04345703125, 6.228759765625, 6.4140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 14.0, 35.0, 116.0, 288.0, 342.0, 154.0, 43.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.66848754882812, -188.0599365234375, -184.45138549804688, -180.84283447265625, -177.23426818847656, -173.62571716308594, -170.0171661376953, -166.4086151123047, -162.80006408691406, -159.19151306152344, -155.5829620361328, -151.97439575195312, -148.3658447265625, -144.75729370117188, -141.14874267578125, -137.54019165039062, -133.931640625, -130.32308959960938, -126.71453094482422, -123.1059799194336, -119.49742889404297, -115.88887023925781, -112.28031921386719, -108.67176818847656, -105.06320190429688, -101.45465087890625, -97.8460922241211, -94.23754119873047, -90.62899017333984, -87.02043151855469, -83.41188049316406, -79.80332946777344, -76.19478607177734, -72.58623504638672, -68.97767639160156, -65.36912536621094, -61.76057434082031, -58.15201950073242, -54.54346466064453, -50.934913635253906, -47.326358795166016, -43.717803955078125, -40.1092529296875, -36.50069808959961, -32.89214324951172, -29.283592224121094, -25.675037384033203, -22.066484451293945, -18.457931518554688, -14.84937858581543, -11.240824699401855, -7.632270812988281, -4.023717880249023, -0.4151649475097656, 3.193389892578125, 6.801942825317383, 10.41049575805664, 14.019048690795898, 17.627601623535156, 21.236156463623047, 24.844709396362305, 28.453262329101562, 32.06181716918945, 35.670372009277344, 39.27892303466797]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 15.0, 23.0, 17.0, 25.0, 37.0, 22.0, 32.0, 35.0, 43.0, 40.0, 43.0, 51.0, 50.0, 55.0, 64.0, 70.0, 52.0, 44.0, 39.0, 33.0, 38.0, 41.0, 29.0, 17.0, 21.0, 16.0, 12.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.077171325683594, -25.220531463623047, -24.3638916015625, -23.507251739501953, -22.650611877441406, -21.79397201538086, -20.937332153320312, -20.080692291259766, -19.22405242919922, -18.367412567138672, -17.510772705078125, -16.654132843017578, -15.797492980957031, -14.940853118896484, -14.084214210510254, -13.227574348449707, -12.370935440063477, -11.51429557800293, -10.657655715942383, -9.801015853881836, -8.944375991821289, -8.087736129760742, -7.231097221374512, -6.374457359313965, -5.517817497253418, -4.661177635192871, -3.8045380115509033, -2.9478983879089355, -2.0912585258483887, -1.2346186637878418, -0.3779792785644531, 0.47866058349609375, 1.3353004455566406, 2.1919403076171875, 3.0485799312591553, 3.905219554901123, 4.76185941696167, 5.618499279022217, 6.4751386642456055, 7.331778526306152, 8.1884183883667, 9.045058250427246, 9.901698112487793, 10.758337020874023, 11.61497688293457, 12.471616744995117, 13.328256607055664, 14.184896469116211, 15.041536331176758, 15.898176193237305, 16.75481605529785, 17.6114559173584, 18.468095779418945, 19.324735641479492, 20.181373596191406, 21.038013458251953, 21.8946533203125, 22.751293182373047, 23.607933044433594, 24.46457290649414, 25.321212768554688, 26.177852630615234, 27.03449249267578, 27.891132354736328, 28.747772216796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 11.0, 17.0, 30.0, 45.0, 52.0, 77.0, 111.0, 136.0, 216.0, 301.0, 443.0, 665.0, 1079.0, 1789.0, 3345.0, 6502.0, 13703.0, 30325.0, 67256.0, 144290.0, 259193.0, 254869.0, 140649.0, 65510.0, 29774.0, 13625.0, 6406.0, 3168.0, 1839.0, 1021.0, 648.0, 454.0, 292.0, 221.0, 125.0, 98.0, 62.0, 56.0, 36.0, 22.0, 20.0, 16.0, 9.0, 5.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.060791015625, -10.69189453125, -10.322998046875, -9.9541015625, -9.585205078125, -9.21630859375, -8.847412109375, -8.478515625, -8.109619140625, -7.74072265625, -7.371826171875, -7.0029296875, -6.634033203125, -6.26513671875, -5.896240234375, -5.52734375, -5.158447265625, -4.78955078125, -4.420654296875, -4.0517578125, -3.682861328125, -3.31396484375, -2.945068359375, -2.576171875, -2.207275390625, -1.83837890625, -1.469482421875, -1.1005859375, -0.731689453125, -0.36279296875, 0.006103515625, 0.375, 0.743896484375, 1.11279296875, 1.481689453125, 1.8505859375, 2.219482421875, 2.58837890625, 2.957275390625, 3.326171875, 3.695068359375, 4.06396484375, 4.432861328125, 4.8017578125, 5.170654296875, 5.53955078125, 5.908447265625, 6.27734375, 6.646240234375, 7.01513671875, 7.384033203125, 7.7529296875, 8.121826171875, 8.49072265625, 8.859619140625, 9.228515625, 9.597412109375, 9.96630859375, 10.335205078125, 10.7041015625, 11.072998046875, 11.44189453125, 11.810791015625, 12.1796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 13.0, 11.0, 17.0, 25.0, 30.0, 24.0, 38.0, 41.0, 42.0, 56.0, 70.0, 69.0, 69.0, 65.0, 74.0, 47.0, 59.0, 38.0, 39.0, 42.0, 28.0, 30.0, 12.0, 14.0, 11.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609375, -1.896820068359375, -1.83270263671875, -1.768585205078125, -1.7044677734375, -1.640350341796875, -1.57623291015625, -1.512115478515625, -1.447998046875, -1.383880615234375, -1.31976318359375, -1.255645751953125, -1.1915283203125, -1.127410888671875, -1.06329345703125, -0.999176025390625, -0.93505859375, -0.870941162109375, -0.80682373046875, -0.742706298828125, -0.6785888671875, -0.614471435546875, -0.55035400390625, -0.486236572265625, -0.422119140625, -0.358001708984375, -0.29388427734375, -0.229766845703125, -0.1656494140625, -0.101531982421875, -0.03741455078125, 0.026702880859375, 0.0908203125, 0.154937744140625, 0.21905517578125, 0.283172607421875, 0.3472900390625, 0.411407470703125, 0.47552490234375, 0.539642333984375, 0.603759765625, 0.667877197265625, 0.73199462890625, 0.796112060546875, 0.8602294921875, 0.924346923828125, 0.98846435546875, 1.052581787109375, 1.11669921875, 1.180816650390625, 1.24493408203125, 1.309051513671875, 1.3731689453125, 1.437286376953125, 1.50140380859375, 1.565521240234375, 1.629638671875, 1.693756103515625, 1.75787353515625, 1.821990966796875, 1.8861083984375, 1.950225830078125, 2.01434326171875, 2.078460693359375, 2.142578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 13.0, 11.0, 18.0, 21.0, 25.0, 41.0, 74.0, 88.0, 153.0, 245.0, 361.0, 667.0, 1269.0, 2703.0, 5892.0, 14957.0, 42767.0, 129026.0, 354167.0, 322037.0, 112547.0, 37888.0, 13226.0, 5278.0, 2305.0, 1156.0, 641.0, 337.0, 227.0, 140.0, 88.0, 57.0, 39.0, 17.0, 23.0, 16.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.375, -19.80810546875, -19.2412109375, -18.67431640625, -18.107421875, -17.54052734375, -16.9736328125, -16.40673828125, -15.83984375, -15.27294921875, -14.7060546875, -14.13916015625, -13.572265625, -13.00537109375, -12.4384765625, -11.87158203125, -11.3046875, -10.73779296875, -10.1708984375, -9.60400390625, -9.037109375, -8.47021484375, -7.9033203125, -7.33642578125, -6.76953125, -6.20263671875, -5.6357421875, -5.06884765625, -4.501953125, -3.93505859375, -3.3681640625, -2.80126953125, -2.234375, -1.66748046875, -1.1005859375, -0.53369140625, 0.033203125, 0.60009765625, 1.1669921875, 1.73388671875, 2.30078125, 2.86767578125, 3.4345703125, 4.00146484375, 4.568359375, 5.13525390625, 5.7021484375, 6.26904296875, 6.8359375, 7.40283203125, 7.9697265625, 8.53662109375, 9.103515625, 9.67041015625, 10.2373046875, 10.80419921875, 11.37109375, 11.93798828125, 12.5048828125, 13.07177734375, 13.638671875, 14.20556640625, 14.7724609375, 15.33935546875, 15.90625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 9.0, 1.0, 11.0, 9.0, 12.0, 13.0, 12.0, 20.0, 22.0, 37.0, 32.0, 32.0, 34.0, 30.0, 57.0, 55.0, 56.0, 48.0, 49.0, 51.0, 48.0, 49.0, 30.0, 40.0, 41.0, 36.0, 33.0, 23.0, 23.0, 13.0, 12.0, 7.0, 9.0, 7.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.3955078125, -10.064453125, -9.7333984375, -9.40234375, -9.0712890625, -8.740234375, -8.4091796875, -8.078125, -7.7470703125, -7.416015625, -7.0849609375, -6.75390625, -6.4228515625, -6.091796875, -5.7607421875, -5.4296875, -5.0986328125, -4.767578125, -4.4365234375, -4.10546875, -3.7744140625, -3.443359375, -3.1123046875, -2.78125, -2.4501953125, -2.119140625, -1.7880859375, -1.45703125, -1.1259765625, -0.794921875, -0.4638671875, -0.1328125, 0.1982421875, 0.529296875, 0.8603515625, 1.19140625, 1.5224609375, 1.853515625, 2.1845703125, 2.515625, 2.8466796875, 3.177734375, 3.5087890625, 3.83984375, 4.1708984375, 4.501953125, 4.8330078125, 5.1640625, 5.4951171875, 5.826171875, 6.1572265625, 6.48828125, 6.8193359375, 7.150390625, 7.4814453125, 7.8125, 8.1435546875, 8.474609375, 8.8056640625, 9.13671875, 9.4677734375, 9.798828125, 10.1298828125, 10.4609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 14.0, 15.0, 25.0, 47.0, 89.0, 146.0, 299.0, 617.0, 1197.0, 2877.0, 6556.0, 16159.0, 45645.0, 162947.0, 544793.0, 187025.0, 49784.0, 17621.0, 6957.0, 3144.0, 1333.0, 633.0, 313.0, 144.0, 68.0, 42.0, 23.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9921875, -14.4669189453125, -13.941650390625, -13.4163818359375, -12.89111328125, -12.3658447265625, -11.840576171875, -11.3153076171875, -10.7900390625, -10.2647705078125, -9.739501953125, -9.2142333984375, -8.68896484375, -8.1636962890625, -7.638427734375, -7.1131591796875, -6.587890625, -6.0626220703125, -5.537353515625, -5.0120849609375, -4.48681640625, -3.9615478515625, -3.436279296875, -2.9110107421875, -2.3857421875, -1.8604736328125, -1.335205078125, -0.8099365234375, -0.28466796875, 0.2406005859375, 0.765869140625, 1.2911376953125, 1.81640625, 2.3416748046875, 2.866943359375, 3.3922119140625, 3.91748046875, 4.4427490234375, 4.968017578125, 5.4932861328125, 6.0185546875, 6.5438232421875, 7.069091796875, 7.5943603515625, 8.11962890625, 8.6448974609375, 9.170166015625, 9.6954345703125, 10.220703125, 10.7459716796875, 11.271240234375, 11.7965087890625, 12.32177734375, 12.8470458984375, 13.372314453125, 13.8975830078125, 14.4228515625, 14.9481201171875, 15.473388671875, 15.9986572265625, 16.52392578125, 17.0491943359375, 17.574462890625, 18.0997314453125, 18.625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 5.0, 13.0, 22.0, 19.0, 29.0, 54.0, 46.0, 78.0, 148.0, 173.0, 101.0, 84.0, 43.0, 38.0, 27.0, 22.0, 19.0, 12.0, 14.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00264739990234375, -0.0025568604469299316, -0.0024663209915161133, -0.002375781536102295, -0.0022852420806884766, -0.002194702625274658, -0.00210416316986084, -0.0020136237144470215, -0.0019230842590332031, -0.0018325448036193848, -0.0017420053482055664, -0.001651465892791748, -0.0015609264373779297, -0.0014703869819641113, -0.001379847526550293, -0.0012893080711364746, -0.0011987686157226562, -0.0011082291603088379, -0.0010176897048950195, -0.0009271502494812012, -0.0008366107940673828, -0.0007460713386535645, -0.0006555318832397461, -0.0005649924278259277, -0.0004744529724121094, -0.000383913516998291, -0.00029337406158447266, -0.0002028346061706543, -0.00011229515075683594, -2.1755695343017578e-05, 6.878376007080078e-05, 0.00015932321548461914, 0.0002498626708984375, 0.00034040212631225586, 0.0004309415817260742, 0.0005214810371398926, 0.0006120204925537109, 0.0007025599479675293, 0.0007930994033813477, 0.000883638858795166, 0.0009741783142089844, 0.0010647177696228027, 0.001155257225036621, 0.0012457966804504395, 0.0013363361358642578, 0.0014268755912780762, 0.0015174150466918945, 0.0016079545021057129, 0.0016984939575195312, 0.0017890334129333496, 0.001879572868347168, 0.0019701123237609863, 0.0020606517791748047, 0.002151191234588623, 0.0022417306900024414, 0.0023322701454162598, 0.002422809600830078, 0.0025133490562438965, 0.002603888511657715, 0.002694427967071533, 0.0027849674224853516, 0.00287550687789917, 0.0029660463333129883, 0.0030565857887268066, 0.003147125244140625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 13.0, 9.0, 21.0, 28.0, 37.0, 48.0, 62.0, 109.0, 144.0, 250.0, 436.0, 720.0, 1305.0, 2488.0, 5363.0, 12350.0, 32295.0, 104711.0, 503557.0, 280780.0, 64186.0, 21913.0, 9015.0, 4054.0, 2079.0, 1057.0, 578.0, 323.0, 197.0, 124.0, 82.0, 61.0, 42.0, 31.0, 16.0, 14.0, 12.0, 8.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.259033203125, -15.67431640625, -15.089599609375, -14.5048828125, -13.920166015625, -13.33544921875, -12.750732421875, -12.166015625, -11.581298828125, -10.99658203125, -10.411865234375, -9.8271484375, -9.242431640625, -8.65771484375, -8.072998046875, -7.48828125, -6.903564453125, -6.31884765625, -5.734130859375, -5.1494140625, -4.564697265625, -3.97998046875, -3.395263671875, -2.810546875, -2.225830078125, -1.64111328125, -1.056396484375, -0.4716796875, 0.113037109375, 0.69775390625, 1.282470703125, 1.8671875, 2.451904296875, 3.03662109375, 3.621337890625, 4.2060546875, 4.790771484375, 5.37548828125, 5.960205078125, 6.544921875, 7.129638671875, 7.71435546875, 8.299072265625, 8.8837890625, 9.468505859375, 10.05322265625, 10.637939453125, 11.22265625, 11.807373046875, 12.39208984375, 12.976806640625, 13.5615234375, 14.146240234375, 14.73095703125, 15.315673828125, 15.900390625, 16.485107421875, 17.06982421875, 17.654541015625, 18.2392578125, 18.823974609375, 19.40869140625, 19.993408203125, 20.578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 4.0, 10.0, 3.0, 9.0, 12.0, 9.0, 17.0, 18.0, 22.0, 26.0, 37.0, 52.0, 69.0, 107.0, 113.0, 100.0, 74.0, 63.0, 48.0, 40.0, 28.0, 16.0, 14.0, 12.0, 20.0, 16.0, 5.0, 6.0, 6.0, 2.0, 8.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.29345703125, -9.9462890625, -9.59912109375, -9.251953125, -8.90478515625, -8.5576171875, -8.21044921875, -7.86328125, -7.51611328125, -7.1689453125, -6.82177734375, -6.474609375, -6.12744140625, -5.7802734375, -5.43310546875, -5.0859375, -4.73876953125, -4.3916015625, -4.04443359375, -3.697265625, -3.35009765625, -3.0029296875, -2.65576171875, -2.30859375, -1.96142578125, -1.6142578125, -1.26708984375, -0.919921875, -0.57275390625, -0.2255859375, 0.12158203125, 0.46875, 0.81591796875, 1.1630859375, 1.51025390625, 1.857421875, 2.20458984375, 2.5517578125, 2.89892578125, 3.24609375, 3.59326171875, 3.9404296875, 4.28759765625, 4.634765625, 4.98193359375, 5.3291015625, 5.67626953125, 6.0234375, 6.37060546875, 6.7177734375, 7.06494140625, 7.412109375, 7.75927734375, 8.1064453125, 8.45361328125, 8.80078125, 9.14794921875, 9.4951171875, 9.84228515625, 10.189453125, 10.53662109375, 10.8837890625, 11.23095703125, 11.578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 10.0, 11.0, 21.0, 49.0, 61.0, 116.0, 167.0, 160.0, 140.0, 123.0, 63.0, 24.0, 19.0, 11.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-184.5086669921875, -178.6202392578125, -172.7318115234375, -166.84336853027344, -160.95494079589844, -155.06651306152344, -149.17808532714844, -143.28964233398438, -137.40121459960938, -131.51278686523438, -125.62435150146484, -119.73592376708984, -113.84748840332031, -107.95906066894531, -102.07063293457031, -96.18219757080078, -90.29376983642578, -84.40534210205078, -78.51690673828125, -72.62847900390625, -66.74004364013672, -60.85161590576172, -54.96318435668945, -49.07475280761719, -43.18632125854492, -37.297889709472656, -31.40945816040039, -25.521028518676758, -19.632596969604492, -13.744165420532227, -7.855735778808594, -1.9673042297363281, 3.9211273193359375, 9.809558868408203, 15.697989463806152, 21.5864200592041, 27.474851608276367, 33.36328125, 39.251712799072266, 45.14014434814453, 51.0285758972168, 56.91700744628906, 62.80543899536133, 68.6938705444336, 74.5822982788086, 80.47073364257812, 86.35916137695312, 92.24758911132812, 98.13602447509766, 104.02445220947266, 109.91288757324219, 115.80131530761719, 121.68975067138672, 127.57817840576172, 133.46661376953125, 139.35504150390625, 145.24346923828125, 151.13189697265625, 157.02032470703125, 162.9087677001953, 168.7971954345703, 174.6856231689453, 180.5740509033203, 186.46249389648438, 192.35092163085938]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 9.0, 12.0, 7.0, 9.0, 12.0, 10.0, 10.0, 24.0, 18.0, 29.0, 31.0, 34.0, 40.0, 46.0, 42.0, 49.0, 56.0, 46.0, 49.0, 42.0, 32.0, 45.0, 29.0, 48.0, 51.0, 35.0, 27.0, 36.0, 18.0, 13.0, 15.0, 17.0, 13.0, 7.0, 9.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.49825286865234, -75.96744537353516, -73.43663024902344, -70.90582275390625, -68.37500762939453, -65.84420013427734, -63.31338882446289, -60.78257751464844, -58.251766204833984, -55.72095489501953, -53.19014358520508, -50.659332275390625, -48.12852478027344, -45.59770965576172, -43.06690216064453, -40.53609085083008, -38.005279541015625, -35.47446823120117, -32.94365692138672, -30.4128475189209, -27.882036209106445, -25.351224899291992, -22.820415496826172, -20.28960418701172, -17.758792877197266, -15.227981567382812, -12.697171211242676, -10.166360855102539, -7.635549545288086, -5.104738235473633, -2.573927879333496, -0.043117523193359375, 2.487701416015625, 5.01851224899292, 7.549323081970215, 10.080133438110352, 12.610944747924805, 15.141756057739258, 17.672565460205078, 20.20337677001953, 22.734188079833984, 25.264999389648438, 27.79581069946289, 30.32662010192871, 32.85742950439453, 35.38824462890625, 37.91905212402344, 40.44986343383789, 42.980674743652344, 45.5114860534668, 48.04229736328125, 50.5731086730957, 53.103919982910156, 55.634727478027344, 58.1655387878418, 60.69635009765625, 63.2271614074707, 65.75797271728516, 68.28878021240234, 70.81959533691406, 73.35040283203125, 75.88121795654297, 78.41202545166016, 80.94284057617188, 83.47364807128906]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 13.0, 8.0, 10.0, 27.0, 35.0, 41.0, 47.0, 91.0, 150.0, 291.0, 465.0, 962.0, 2151.0, 6124.0, 23506.0, 136392.0, 3568000.0, 392146.0, 47293.0, 10747.0, 3299.0, 1213.0, 549.0, 295.0, 140.0, 97.0, 60.0, 38.0, 29.0, 18.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.02001953125, -30.9775390625, -29.93505859375, -28.892578125, -27.85009765625, -26.8076171875, -25.76513671875, -24.72265625, -23.68017578125, -22.6376953125, -21.59521484375, -20.552734375, -19.51025390625, -18.4677734375, -17.42529296875, -16.3828125, -15.34033203125, -14.2978515625, -13.25537109375, -12.212890625, -11.17041015625, -10.1279296875, -9.08544921875, -8.04296875, -7.00048828125, -5.9580078125, -4.91552734375, -3.873046875, -2.83056640625, -1.7880859375, -0.74560546875, 0.296875, 1.33935546875, 2.3818359375, 3.42431640625, 4.466796875, 5.50927734375, 6.5517578125, 7.59423828125, 8.63671875, 9.67919921875, 10.7216796875, 11.76416015625, 12.806640625, 13.84912109375, 14.8916015625, 15.93408203125, 16.9765625, 18.01904296875, 19.0615234375, 20.10400390625, 21.146484375, 22.18896484375, 23.2314453125, 24.27392578125, 25.31640625, 26.35888671875, 27.4013671875, 28.44384765625, 29.486328125, 30.52880859375, 31.5712890625, 32.61376953125, 33.65625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 17.0, 18.0, 16.0, 26.0, 36.0, 40.0, 44.0, 47.0, 61.0, 64.0, 54.0, 63.0, 57.0, 62.0, 66.0, 46.0, 44.0, 50.0, 40.0, 24.0, 27.0, 9.0, 14.0, 15.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.309539794921875, -2.22845458984375, -2.147369384765625, -2.0662841796875, -1.985198974609375, -1.90411376953125, -1.823028564453125, -1.741943359375, -1.660858154296875, -1.57977294921875, -1.498687744140625, -1.4176025390625, -1.336517333984375, -1.25543212890625, -1.174346923828125, -1.09326171875, -1.012176513671875, -0.93109130859375, -0.850006103515625, -0.7689208984375, -0.687835693359375, -0.60675048828125, -0.525665283203125, -0.444580078125, -0.363494873046875, -0.28240966796875, -0.201324462890625, -0.1202392578125, -0.039154052734375, 0.04193115234375, 0.123016357421875, 0.2041015625, 0.285186767578125, 0.36627197265625, 0.447357177734375, 0.5284423828125, 0.609527587890625, 0.69061279296875, 0.771697998046875, 0.852783203125, 0.933868408203125, 1.01495361328125, 1.096038818359375, 1.1771240234375, 1.258209228515625, 1.33929443359375, 1.420379638671875, 1.50146484375, 1.582550048828125, 1.66363525390625, 1.744720458984375, 1.8258056640625, 1.906890869140625, 1.98797607421875, 2.069061279296875, 2.150146484375, 2.231231689453125, 2.31231689453125, 2.393402099609375, 2.4744873046875, 2.555572509765625, 2.63665771484375, 2.717742919921875, 2.798828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 13.0, 16.0, 13.0, 26.0, 42.0, 82.0, 107.0, 170.0, 278.0, 439.0, 740.0, 1224.0, 2252.0, 4085.0, 7735.0, 16924.0, 40053.0, 113493.0, 419286.0, 2838692.0, 527776.0, 134266.0, 46969.0, 19549.0, 9013.0, 4648.0, 2541.0, 1443.0, 875.0, 555.0, 349.0, 195.0, 133.0, 89.0, 55.0, 39.0, 27.0, 25.0, 13.0, 9.0, 11.0, 7.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.828125, -18.283447265625, -17.73876953125, -17.194091796875, -16.6494140625, -16.104736328125, -15.56005859375, -15.015380859375, -14.470703125, -13.926025390625, -13.38134765625, -12.836669921875, -12.2919921875, -11.747314453125, -11.20263671875, -10.657958984375, -10.11328125, -9.568603515625, -9.02392578125, -8.479248046875, -7.9345703125, -7.389892578125, -6.84521484375, -6.300537109375, -5.755859375, -5.211181640625, -4.66650390625, -4.121826171875, -3.5771484375, -3.032470703125, -2.48779296875, -1.943115234375, -1.3984375, -0.853759765625, -0.30908203125, 0.235595703125, 0.7802734375, 1.324951171875, 1.86962890625, 2.414306640625, 2.958984375, 3.503662109375, 4.04833984375, 4.593017578125, 5.1376953125, 5.682373046875, 6.22705078125, 6.771728515625, 7.31640625, 7.861083984375, 8.40576171875, 8.950439453125, 9.4951171875, 10.039794921875, 10.58447265625, 11.129150390625, 11.673828125, 12.218505859375, 12.76318359375, 13.307861328125, 13.8525390625, 14.397216796875, 14.94189453125, 15.486572265625, 16.03125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 10.0, 8.0, 9.0, 20.0, 19.0, 30.0, 40.0, 63.0, 97.0, 112.0, 178.0, 305.0, 767.0, 1257.0, 399.0, 225.0, 142.0, 104.0, 66.0, 56.0, 38.0, 24.0, 19.0, 22.0, 9.0, 9.0, 7.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.390625, -5.21746826171875, -5.0443115234375, -4.87115478515625, -4.697998046875, -4.52484130859375, -4.3516845703125, -4.17852783203125, -4.00537109375, -3.83221435546875, -3.6590576171875, -3.48590087890625, -3.312744140625, -3.13958740234375, -2.9664306640625, -2.79327392578125, -2.6201171875, -2.44696044921875, -2.2738037109375, -2.10064697265625, -1.927490234375, -1.75433349609375, -1.5811767578125, -1.40802001953125, -1.23486328125, -1.06170654296875, -0.8885498046875, -0.71539306640625, -0.542236328125, -0.36907958984375, -0.1959228515625, -0.02276611328125, 0.150390625, 0.32354736328125, 0.4967041015625, 0.66986083984375, 0.843017578125, 1.01617431640625, 1.1893310546875, 1.36248779296875, 1.53564453125, 1.70880126953125, 1.8819580078125, 2.05511474609375, 2.228271484375, 2.40142822265625, 2.5745849609375, 2.74774169921875, 2.9208984375, 3.09405517578125, 3.2672119140625, 3.44036865234375, 3.613525390625, 3.78668212890625, 3.9598388671875, 4.13299560546875, 4.30615234375, 4.47930908203125, 4.6524658203125, 4.82562255859375, 4.998779296875, 5.17193603515625, 5.3450927734375, 5.51824951171875, 5.69140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 18.0, 34.0, 42.0, 66.0, 119.0, 132.0, 125.0, 175.0, 104.0, 69.0, 45.0, 28.0, 14.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.661224365234375, -53.9853401184082, -52.30945587158203, -50.633575439453125, -48.95769119262695, -47.28180694580078, -45.60592269897461, -43.93003845214844, -42.25415802001953, -40.57827377319336, -38.90238952636719, -37.22650909423828, -35.55062484741211, -33.87474060058594, -32.198856353759766, -30.522974014282227, -28.847089767456055, -27.171205520629883, -25.495323181152344, -23.819438934326172, -22.143556594848633, -20.46767234802246, -18.791790008544922, -17.11590576171875, -15.440022468566895, -13.764139175415039, -12.088255882263184, -10.412372589111328, -8.736488342285156, -7.060605049133301, -5.384721755981445, -3.70883846282959, -2.0329551696777344, -0.35707175731658936, 1.3188116550445557, 2.9946951866149902, 4.670578479766846, 6.346462249755859, 8.022345542907715, 9.69822883605957, 11.374112129211426, 13.049995422363281, 14.725878715515137, 16.401762008666992, 18.077646255493164, 19.753528594970703, 21.429412841796875, 23.105297088623047, 24.781179428100586, 26.457063674926758, 28.132946014404297, 29.80883026123047, 31.484712600708008, 33.16059875488281, 34.83647918701172, 36.51236343383789, 38.18824768066406, 39.864131927490234, 41.540016174316406, 43.21589660644531, 44.891780853271484, 46.567665100097656, 48.24354934692383, 49.91943359375, 51.595314025878906]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 5.0, 3.0, 5.0, 9.0, 12.0, 12.0, 9.0, 29.0, 28.0, 28.0, 26.0, 37.0, 29.0, 57.0, 36.0, 35.0, 35.0, 46.0, 52.0, 51.0, 45.0, 40.0, 37.0, 54.0, 38.0, 29.0, 26.0, 32.0, 24.0, 23.0, 26.0, 15.0, 13.0, 14.0, 6.0, 6.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.908897399902344, -19.228694915771484, -18.548490524291992, -17.868288040161133, -17.18808364868164, -16.50788116455078, -15.827676773071289, -15.14747428894043, -14.467269897460938, -13.787066459655762, -13.106863021850586, -12.42665958404541, -11.746456146240234, -11.066252708435059, -10.386049270629883, -9.705846786499023, -9.025643348693848, -8.345439910888672, -7.665236473083496, -6.98503303527832, -6.3048295974731445, -5.624626159667969, -4.944423198699951, -4.264219760894775, -3.5840163230895996, -2.903812885284424, -2.223609447479248, -1.5434062480926514, -0.8632028102874756, -0.1829993724822998, 0.4972038269042969, 1.1774072647094727, 1.8576107025146484, 2.537814140319824, 3.218017578125, 3.8982207775115967, 4.578424453735352, 5.258627891540527, 5.938830852508545, 6.619034290313721, 7.2992377281188965, 7.979441165924072, 8.65964412689209, 9.339847564697266, 10.020051002502441, 10.700254440307617, 11.380457878112793, 12.060661315917969, 12.740864753723145, 13.42106819152832, 14.101271629333496, 14.781475067138672, 15.461678504943848, 16.141881942749023, 16.822084426879883, 17.502288818359375, 18.182491302490234, 18.862693786621094, 19.542898178100586, 20.223100662231445, 20.903305053710938, 21.583507537841797, 22.26371192932129, 22.94391441345215, 23.62411880493164]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 26.0, 30.0, 43.0, 72.0, 116.0, 257.0, 461.0, 925.0, 1835.0, 4292.0, 9609.0, 24647.0, 63961.0, 162715.0, 315785.0, 267359.0, 119378.0, 46058.0, 17642.0, 7184.0, 3045.0, 1495.0, 770.0, 366.0, 203.0, 108.0, 64.0, 36.0, 23.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8984375, -14.4580078125, -14.017578125, -13.5771484375, -13.13671875, -12.6962890625, -12.255859375, -11.8154296875, -11.375, -10.9345703125, -10.494140625, -10.0537109375, -9.61328125, -9.1728515625, -8.732421875, -8.2919921875, -7.8515625, -7.4111328125, -6.970703125, -6.5302734375, -6.08984375, -5.6494140625, -5.208984375, -4.7685546875, -4.328125, -3.8876953125, -3.447265625, -3.0068359375, -2.56640625, -2.1259765625, -1.685546875, -1.2451171875, -0.8046875, -0.3642578125, 0.076171875, 0.5166015625, 0.95703125, 1.3974609375, 1.837890625, 2.2783203125, 2.71875, 3.1591796875, 3.599609375, 4.0400390625, 4.48046875, 4.9208984375, 5.361328125, 5.8017578125, 6.2421875, 6.6826171875, 7.123046875, 7.5634765625, 8.00390625, 8.4443359375, 8.884765625, 9.3251953125, 9.765625, 10.2060546875, 10.646484375, 11.0869140625, 11.52734375, 11.9677734375, 12.408203125, 12.8486328125, 13.2890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 9.0, 5.0, 2.0, 13.0, 7.0, 21.0, 17.0, 20.0, 23.0, 41.0, 38.0, 36.0, 38.0, 42.0, 42.0, 47.0, 62.0, 57.0, 44.0, 62.0, 58.0, 44.0, 29.0, 32.0, 38.0, 29.0, 25.0, 25.0, 20.0, 16.0, 12.0, 9.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.162109375, -2.091339111328125, -2.02056884765625, -1.949798583984375, -1.8790283203125, -1.808258056640625, -1.73748779296875, -1.666717529296875, -1.595947265625, -1.525177001953125, -1.45440673828125, -1.383636474609375, -1.3128662109375, -1.242095947265625, -1.17132568359375, -1.100555419921875, -1.02978515625, -0.959014892578125, -0.88824462890625, -0.817474365234375, -0.7467041015625, -0.675933837890625, -0.60516357421875, -0.534393310546875, -0.463623046875, -0.392852783203125, -0.32208251953125, -0.251312255859375, -0.1805419921875, -0.109771728515625, -0.03900146484375, 0.031768798828125, 0.1025390625, 0.173309326171875, 0.24407958984375, 0.314849853515625, 0.3856201171875, 0.456390380859375, 0.52716064453125, 0.597930908203125, 0.668701171875, 0.739471435546875, 0.81024169921875, 0.881011962890625, 0.9517822265625, 1.022552490234375, 1.09332275390625, 1.164093017578125, 1.23486328125, 1.305633544921875, 1.37640380859375, 1.447174072265625, 1.5179443359375, 1.588714599609375, 1.65948486328125, 1.730255126953125, 1.801025390625, 1.871795654296875, 1.94256591796875, 2.013336181640625, 2.0841064453125, 2.154876708984375, 2.22564697265625, 2.296417236328125, 2.3671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 18.0, 18.0, 31.0, 54.0, 85.0, 107.0, 190.0, 297.0, 457.0, 799.0, 1414.0, 2571.0, 5031.0, 11144.0, 24637.0, 59792.0, 142180.0, 289654.0, 277916.0, 132978.0, 55606.0, 23001.0, 10043.0, 4844.0, 2365.0, 1317.0, 774.0, 454.0, 278.0, 157.0, 98.0, 74.0, 47.0, 37.0, 23.0, 13.0, 15.0, 9.0, 3.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.6484375, -14.2039794921875, -13.759521484375, -13.3150634765625, -12.87060546875, -12.4261474609375, -11.981689453125, -11.5372314453125, -11.0927734375, -10.6483154296875, -10.203857421875, -9.7593994140625, -9.31494140625, -8.8704833984375, -8.426025390625, -7.9815673828125, -7.537109375, -7.0926513671875, -6.648193359375, -6.2037353515625, -5.75927734375, -5.3148193359375, -4.870361328125, -4.4259033203125, -3.9814453125, -3.5369873046875, -3.092529296875, -2.6480712890625, -2.20361328125, -1.7591552734375, -1.314697265625, -0.8702392578125, -0.42578125, 0.0186767578125, 0.463134765625, 0.9075927734375, 1.35205078125, 1.7965087890625, 2.240966796875, 2.6854248046875, 3.1298828125, 3.5743408203125, 4.018798828125, 4.4632568359375, 4.90771484375, 5.3521728515625, 5.796630859375, 6.2410888671875, 6.685546875, 7.1300048828125, 7.574462890625, 8.0189208984375, 8.46337890625, 8.9078369140625, 9.352294921875, 9.7967529296875, 10.2412109375, 10.6856689453125, 11.130126953125, 11.5745849609375, 12.01904296875, 12.4635009765625, 12.907958984375, 13.3524169921875, 13.796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 7.0, 14.0, 18.0, 22.0, 27.0, 18.0, 32.0, 31.0, 35.0, 40.0, 36.0, 40.0, 52.0, 40.0, 45.0, 40.0, 45.0, 32.0, 42.0, 31.0, 46.0, 37.0, 31.0, 31.0, 33.0, 22.0, 24.0, 21.0, 8.0, 13.0, 14.0, 12.0, 5.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.30322265625, -10.9189453125, -10.53466796875, -10.150390625, -9.76611328125, -9.3818359375, -8.99755859375, -8.61328125, -8.22900390625, -7.8447265625, -7.46044921875, -7.076171875, -6.69189453125, -6.3076171875, -5.92333984375, -5.5390625, -5.15478515625, -4.7705078125, -4.38623046875, -4.001953125, -3.61767578125, -3.2333984375, -2.84912109375, -2.46484375, -2.08056640625, -1.6962890625, -1.31201171875, -0.927734375, -0.54345703125, -0.1591796875, 0.22509765625, 0.609375, 0.99365234375, 1.3779296875, 1.76220703125, 2.146484375, 2.53076171875, 2.9150390625, 3.29931640625, 3.68359375, 4.06787109375, 4.4521484375, 4.83642578125, 5.220703125, 5.60498046875, 5.9892578125, 6.37353515625, 6.7578125, 7.14208984375, 7.5263671875, 7.91064453125, 8.294921875, 8.67919921875, 9.0634765625, 9.44775390625, 9.83203125, 10.21630859375, 10.6005859375, 10.98486328125, 11.369140625, 11.75341796875, 12.1376953125, 12.52197265625, 12.90625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 12.0, 10.0, 22.0, 20.0, 33.0, 32.0, 61.0, 72.0, 105.0, 167.0, 275.0, 393.0, 689.0, 1223.0, 2217.0, 4261.0, 9038.0, 20786.0, 56581.0, 185108.0, 434892.0, 221172.0, 67129.0, 23685.0, 9980.0, 4736.0, 2441.0, 1312.0, 730.0, 484.0, 292.0, 183.0, 108.0, 67.0, 47.0, 44.0, 31.0, 26.0, 21.0, 19.0, 13.0, 4.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.765625, -9.4658203125, -9.166015625, -8.8662109375, -8.56640625, -8.2666015625, -7.966796875, -7.6669921875, -7.3671875, -7.0673828125, -6.767578125, -6.4677734375, -6.16796875, -5.8681640625, -5.568359375, -5.2685546875, -4.96875, -4.6689453125, -4.369140625, -4.0693359375, -3.76953125, -3.4697265625, -3.169921875, -2.8701171875, -2.5703125, -2.2705078125, -1.970703125, -1.6708984375, -1.37109375, -1.0712890625, -0.771484375, -0.4716796875, -0.171875, 0.1279296875, 0.427734375, 0.7275390625, 1.02734375, 1.3271484375, 1.626953125, 1.9267578125, 2.2265625, 2.5263671875, 2.826171875, 3.1259765625, 3.42578125, 3.7255859375, 4.025390625, 4.3251953125, 4.625, 4.9248046875, 5.224609375, 5.5244140625, 5.82421875, 6.1240234375, 6.423828125, 6.7236328125, 7.0234375, 7.3232421875, 7.623046875, 7.9228515625, 8.22265625, 8.5224609375, 8.822265625, 9.1220703125, 9.421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 8.0, 14.0, 24.0, 24.0, 30.0, 50.0, 61.0, 94.0, 150.0, 140.0, 126.0, 75.0, 51.0, 36.0, 27.0, 14.0, 11.0, 14.0, 7.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027599334716796875, -0.00267106294631958, -0.0025821924209594727, -0.0024933218955993652, -0.002404451370239258, -0.0023155808448791504, -0.002226710319519043, -0.0021378397941589355, -0.002048969268798828, -0.0019600987434387207, -0.0018712282180786133, -0.0017823576927185059, -0.0016934871673583984, -0.001604616641998291, -0.0015157461166381836, -0.0014268755912780762, -0.0013380050659179688, -0.0012491345405578613, -0.001160264015197754, -0.0010713934898376465, -0.000982522964477539, -0.0008936524391174316, -0.0008047819137573242, -0.0007159113883972168, -0.0006270408630371094, -0.000538170337677002, -0.00044929981231689453, -0.0003604292869567871, -0.0002715587615966797, -0.00018268823623657227, -9.381771087646484e-05, -4.947185516357422e-06, 8.392333984375e-05, 0.00017279386520385742, 0.00026166439056396484, 0.00035053491592407227, 0.0004394054412841797, 0.0005282759666442871, 0.0006171464920043945, 0.000706017017364502, 0.0007948875427246094, 0.0008837580680847168, 0.0009726285934448242, 0.0010614991188049316, 0.001150369644165039, 0.0012392401695251465, 0.001328110694885254, 0.0014169812202453613, 0.0015058517456054688, 0.0015947222709655762, 0.0016835927963256836, 0.001772463321685791, 0.0018613338470458984, 0.0019502043724060059, 0.0020390748977661133, 0.0021279454231262207, 0.002216815948486328, 0.0023056864738464355, 0.002394556999206543, 0.0024834275245666504, 0.002572298049926758, 0.0026611685752868652, 0.0027500391006469727, 0.00283890962600708, 0.0029277801513671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 13.0, 11.0, 25.0, 28.0, 36.0, 70.0, 100.0, 125.0, 231.0, 367.0, 568.0, 995.0, 1770.0, 3477.0, 7434.0, 16208.0, 41422.0, 135768.0, 478727.0, 251137.0, 65740.0, 23933.0, 10176.0, 4637.0, 2368.0, 1274.0, 692.0, 412.0, 264.0, 169.0, 106.0, 73.0, 48.0, 44.0, 22.0, 27.0, 12.0, 10.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.640625, -11.2615966796875, -10.882568359375, -10.5035400390625, -10.12451171875, -9.7454833984375, -9.366455078125, -8.9874267578125, -8.6083984375, -8.2293701171875, -7.850341796875, -7.4713134765625, -7.09228515625, -6.7132568359375, -6.334228515625, -5.9552001953125, -5.576171875, -5.1971435546875, -4.818115234375, -4.4390869140625, -4.06005859375, -3.6810302734375, -3.302001953125, -2.9229736328125, -2.5439453125, -2.1649169921875, -1.785888671875, -1.4068603515625, -1.02783203125, -0.6488037109375, -0.269775390625, 0.1092529296875, 0.48828125, 0.8673095703125, 1.246337890625, 1.6253662109375, 2.00439453125, 2.3834228515625, 2.762451171875, 3.1414794921875, 3.5205078125, 3.8995361328125, 4.278564453125, 4.6575927734375, 5.03662109375, 5.4156494140625, 5.794677734375, 6.1737060546875, 6.552734375, 6.9317626953125, 7.310791015625, 7.6898193359375, 8.06884765625, 8.4478759765625, 8.826904296875, 9.2059326171875, 9.5849609375, 9.9639892578125, 10.343017578125, 10.7220458984375, 11.10107421875, 11.4801025390625, 11.859130859375, 12.2381591796875, 12.6171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 10.0, 20.0, 27.0, 29.0, 33.0, 43.0, 63.0, 115.0, 104.0, 120.0, 96.0, 95.0, 49.0, 46.0, 24.0, 20.0, 15.0, 8.0, 15.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.448974609375, -10.10107421875, -9.753173828125, -9.4052734375, -9.057373046875, -8.70947265625, -8.361572265625, -8.013671875, -7.665771484375, -7.31787109375, -6.969970703125, -6.6220703125, -6.274169921875, -5.92626953125, -5.578369140625, -5.23046875, -4.882568359375, -4.53466796875, -4.186767578125, -3.8388671875, -3.490966796875, -3.14306640625, -2.795166015625, -2.447265625, -2.099365234375, -1.75146484375, -1.403564453125, -1.0556640625, -0.707763671875, -0.35986328125, -0.011962890625, 0.3359375, 0.683837890625, 1.03173828125, 1.379638671875, 1.7275390625, 2.075439453125, 2.42333984375, 2.771240234375, 3.119140625, 3.467041015625, 3.81494140625, 4.162841796875, 4.5107421875, 4.858642578125, 5.20654296875, 5.554443359375, 5.90234375, 6.250244140625, 6.59814453125, 6.946044921875, 7.2939453125, 7.641845703125, 7.98974609375, 8.337646484375, 8.685546875, 9.033447265625, 9.38134765625, 9.729248046875, 10.0771484375, 10.425048828125, 10.77294921875, 11.120849609375, 11.46875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 7.0, 21.0, 31.0, 56.0, 79.0, 106.0, 120.0, 151.0, 123.0, 112.0, 70.0, 50.0, 31.0, 18.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.38300323486328, -92.82000732421875, -88.25701904296875, -83.69402313232422, -79.13102722167969, -74.56803894042969, -70.00504302978516, -65.44204711914062, -60.87905502319336, -56.316062927246094, -51.75306701660156, -47.1900749206543, -42.62708282470703, -38.0640869140625, -33.501094818115234, -28.938100814819336, -24.375106811523438, -19.81211280822754, -15.249119758605957, -10.686126708984375, -6.123132705688477, -1.5601387023925781, 3.0028533935546875, 7.565847396850586, 12.128841400146484, 16.691835403442383, 21.25482940673828, 25.817821502685547, 30.380815505981445, 34.943809509277344, 39.50680160522461, 44.069793701171875, 48.63279724121094, 53.1957893371582, 57.758785247802734, 62.32177734375, 66.88477325439453, 71.44776916503906, 76.01075744628906, 80.5737533569336, 85.13674926757812, 89.69974517822266, 94.26273345947266, 98.82572937011719, 103.38872528076172, 107.95172119140625, 112.51470947265625, 117.07770538330078, 121.64069366455078, 126.20368957519531, 130.7666778564453, 135.32968139648438, 139.89266967773438, 144.45565795898438, 149.01864624023438, 153.58164978027344, 158.14463806152344, 162.70762634277344, 167.2706298828125, 171.8336181640625, 176.3966064453125, 180.95960998535156, 185.52259826660156, 190.08558654785156, 194.64859008789062]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 4.0, 3.0, 12.0, 8.0, 10.0, 13.0, 16.0, 20.0, 27.0, 42.0, 48.0, 31.0, 43.0, 45.0, 56.0, 51.0, 55.0, 50.0, 54.0, 53.0, 56.0, 47.0, 43.0, 37.0, 39.0, 19.0, 26.0, 23.0, 13.0, 11.0, 11.0, 7.0, 6.0, 10.0, 2.0, 8.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.67121887207031, -68.75943756103516, -65.84766387939453, -62.935882568359375, -60.024105072021484, -57.112327575683594, -54.20054626464844, -51.28876876831055, -48.376991271972656, -45.465213775634766, -42.553436279296875, -39.64165496826172, -36.72987747192383, -33.81809997558594, -30.906320571899414, -27.99454116821289, -25.082763671875, -22.17098617553711, -19.259206771850586, -16.347427368164062, -13.435649871826172, -10.523871421813965, -7.612092971801758, -4.700313568115234, -1.7885360717773438, 1.1232423782348633, 4.03502082824707, 6.946799278259277, 9.858577728271484, 12.770356178283691, 15.682134628295898, 18.593914031982422, 21.50568389892578, 24.417461395263672, 27.329240798950195, 30.24102020263672, 33.15279769897461, 36.0645751953125, 38.976356506347656, 41.88813400268555, 44.79991149902344, 47.71168899536133, 50.62346649169922, 53.535247802734375, 56.447025299072266, 59.358802795410156, 62.27058410644531, 65.18235778808594, 68.0941390991211, 71.00592041015625, 73.91769409179688, 76.82947540283203, 79.74125671386719, 82.65303039550781, 85.56481170654297, 88.47659301757812, 91.38836669921875, 94.3001480102539, 97.21192169189453, 100.12370300292969, 103.03547668457031, 105.94725799560547, 108.85903930664062, 111.77081298828125, 114.6825942993164]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 25.0, 37.0, 111.0, 210.0, 537.0, 1372.0, 4244.0, 16696.0, 105932.0, 3849198.0, 183662.0, 23444.0, 5670.0, 1867.0, 647.0, 280.0, 116.0, 77.0, 31.0, 28.0, 25.0, 12.0, 8.0, 9.0, 0.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.39501953125, -18.3525390625, -17.31005859375, -16.267578125, -15.22509765625, -14.1826171875, -13.14013671875, -12.09765625, -11.05517578125, -10.0126953125, -8.97021484375, -7.927734375, -6.88525390625, -5.8427734375, -4.80029296875, -3.7578125, -2.71533203125, -1.6728515625, -0.63037109375, 0.412109375, 1.45458984375, 2.4970703125, 3.53955078125, 4.58203125, 5.62451171875, 6.6669921875, 7.70947265625, 8.751953125, 9.79443359375, 10.8369140625, 11.87939453125, 12.921875, 13.96435546875, 15.0068359375, 16.04931640625, 17.091796875, 18.13427734375, 19.1767578125, 20.21923828125, 21.26171875, 22.30419921875, 23.3466796875, 24.38916015625, 25.431640625, 26.47412109375, 27.5166015625, 28.55908203125, 29.6015625, 30.64404296875, 31.6865234375, 32.72900390625, 33.771484375, 34.81396484375, 35.8564453125, 36.89892578125, 37.94140625, 38.98388671875, 40.0263671875, 41.06884765625, 42.111328125, 43.15380859375, 44.1962890625, 45.23876953125, 46.28125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 9.0, 18.0, 10.0, 18.0, 14.0, 22.0, 29.0, 45.0, 50.0, 78.0, 61.0, 68.0, 56.0, 75.0, 53.0, 62.0, 53.0, 62.0, 34.0, 40.0, 32.0, 21.0, 28.0, 18.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.01751708984375, -1.9178466796875, -1.81817626953125, -1.718505859375, -1.61883544921875, -1.5191650390625, -1.41949462890625, -1.31982421875, -1.22015380859375, -1.1204833984375, -1.02081298828125, -0.921142578125, -0.82147216796875, -0.7218017578125, -0.62213134765625, -0.5224609375, -0.42279052734375, -0.3231201171875, -0.22344970703125, -0.123779296875, -0.02410888671875, 0.0755615234375, 0.17523193359375, 0.27490234375, 0.37457275390625, 0.4742431640625, 0.57391357421875, 0.673583984375, 0.77325439453125, 0.8729248046875, 0.97259521484375, 1.072265625, 1.17193603515625, 1.2716064453125, 1.37127685546875, 1.470947265625, 1.57061767578125, 1.6702880859375, 1.76995849609375, 1.86962890625, 1.96929931640625, 2.0689697265625, 2.16864013671875, 2.268310546875, 2.36798095703125, 2.4676513671875, 2.56732177734375, 2.6669921875, 2.76666259765625, 2.8663330078125, 2.96600341796875, 3.065673828125, 3.16534423828125, 3.2650146484375, 3.36468505859375, 3.46435546875, 3.56402587890625, 3.6636962890625, 3.76336669921875, 3.863037109375, 3.96270751953125, 4.0623779296875, 4.16204833984375, 4.26171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 13.0, 28.0, 34.0, 52.0, 61.0, 96.0, 169.0, 266.0, 505.0, 858.0, 1800.0, 3854.0, 9124.0, 24787.0, 83885.0, 466710.0, 3273951.0, 241555.0, 54833.0, 17875.0, 7165.0, 3067.0, 1499.0, 792.0, 471.0, 300.0, 183.0, 112.0, 79.0, 43.0, 35.0, 16.0, 14.0, 6.0, 11.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0], "bins": [-25.640625, -24.971923828125, -24.30322265625, -23.634521484375, -22.9658203125, -22.297119140625, -21.62841796875, -20.959716796875, -20.291015625, -19.622314453125, -18.95361328125, -18.284912109375, -17.6162109375, -16.947509765625, -16.27880859375, -15.610107421875, -14.94140625, -14.272705078125, -13.60400390625, -12.935302734375, -12.2666015625, -11.597900390625, -10.92919921875, -10.260498046875, -9.591796875, -8.923095703125, -8.25439453125, -7.585693359375, -6.9169921875, -6.248291015625, -5.57958984375, -4.910888671875, -4.2421875, -3.573486328125, -2.90478515625, -2.236083984375, -1.5673828125, -0.898681640625, -0.22998046875, 0.438720703125, 1.107421875, 1.776123046875, 2.44482421875, 3.113525390625, 3.7822265625, 4.450927734375, 5.11962890625, 5.788330078125, 6.45703125, 7.125732421875, 7.79443359375, 8.463134765625, 9.1318359375, 9.800537109375, 10.46923828125, 11.137939453125, 11.806640625, 12.475341796875, 13.14404296875, 13.812744140625, 14.4814453125, 15.150146484375, 15.81884765625, 16.487548828125, 17.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 13.0, 14.0, 14.0, 38.0, 52.0, 74.0, 143.0, 218.0, 491.0, 1956.0, 507.0, 199.0, 113.0, 72.0, 42.0, 32.0, 16.0, 13.0, 13.0, 14.0, 5.0, 10.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.6171875, -8.38739013671875, -8.1575927734375, -7.92779541015625, -7.697998046875, -7.46820068359375, -7.2384033203125, -7.00860595703125, -6.77880859375, -6.54901123046875, -6.3192138671875, -6.08941650390625, -5.859619140625, -5.62982177734375, -5.4000244140625, -5.17022705078125, -4.9404296875, -4.71063232421875, -4.4808349609375, -4.25103759765625, -4.021240234375, -3.79144287109375, -3.5616455078125, -3.33184814453125, -3.10205078125, -2.87225341796875, -2.6424560546875, -2.41265869140625, -2.182861328125, -1.95306396484375, -1.7232666015625, -1.49346923828125, -1.263671875, -1.03387451171875, -0.8040771484375, -0.57427978515625, -0.344482421875, -0.11468505859375, 0.1151123046875, 0.34490966796875, 0.57470703125, 0.80450439453125, 1.0343017578125, 1.26409912109375, 1.493896484375, 1.72369384765625, 1.9534912109375, 2.18328857421875, 2.4130859375, 2.64288330078125, 2.8726806640625, 3.10247802734375, 3.332275390625, 3.56207275390625, 3.7918701171875, 4.02166748046875, 4.25146484375, 4.48126220703125, 4.7110595703125, 4.94085693359375, 5.170654296875, 5.40045166015625, 5.6302490234375, 5.86004638671875, 6.08984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 19.0, 99.0, 236.0, 336.0, 203.0, 81.0, 23.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.80752563476562, -172.45155334472656, -169.09559631347656, -165.7396240234375, -162.3836669921875, -159.02769470214844, -155.67172241210938, -152.31576538085938, -148.9597930908203, -145.60382080078125, -142.24786376953125, -138.8918914794922, -135.53591918945312, -132.17996215820312, -128.82398986816406, -125.46802520751953, -122.112060546875, -118.75609588623047, -115.40013122558594, -112.04415893554688, -108.68819427490234, -105.33222961425781, -101.97625732421875, -98.62029266357422, -95.26432800292969, -91.90836334228516, -88.55239868164062, -85.19642639160156, -81.84046173095703, -78.4844970703125, -75.12852478027344, -71.7725601196289, -68.41658782958984, -65.06062316894531, -61.704654693603516, -58.34868621826172, -54.99272155761719, -51.636756896972656, -48.28078842163086, -44.92481994628906, -41.56885528564453, -38.212890625, -34.8569221496582, -31.50095558166504, -28.144989013671875, -24.78902244567871, -21.433055877685547, -18.077089309692383, -14.721122741699219, -11.365156173706055, -8.00918960571289, -4.653223037719727, -1.2972564697265625, 2.0587100982666016, 5.414676666259766, 8.77064323425293, 12.126609802246094, 15.482576370239258, 18.838542938232422, 22.194509506225586, 25.55047607421875, 28.906442642211914, 32.26240921020508, 35.618377685546875, 38.974342346191406]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 8.0, 10.0, 10.0, 16.0, 26.0, 26.0, 36.0, 27.0, 52.0, 34.0, 49.0, 60.0, 58.0, 59.0, 56.0, 72.0, 59.0, 51.0, 60.0, 40.0, 34.0, 38.0, 28.0, 21.0, 26.0, 13.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.22268295288086, -26.33050537109375, -25.43832778930664, -24.546152114868164, -23.653974533081055, -22.761796951293945, -21.86962127685547, -20.97744369506836, -20.08526611328125, -19.19308853149414, -18.30091094970703, -17.408735275268555, -16.516557693481445, -15.624380111694336, -14.732203483581543, -13.84002685546875, -12.94784927368164, -12.055671691894531, -11.163495063781738, -10.271318435668945, -9.379140853881836, -8.486963272094727, -7.594786643981934, -6.702609539031982, -5.810432434082031, -4.91825532913208, -4.026078224182129, -3.1339011192321777, -2.2417240142822266, -1.3495469093322754, -0.4573698043823242, 0.43480730056762695, 1.326986312866211, 2.219163417816162, 3.1113405227661133, 4.0035176277160645, 4.895694732666016, 5.787871837615967, 6.680048942565918, 7.572226047515869, 8.46440315246582, 9.35658073425293, 10.248757362365723, 11.140933990478516, 12.033111572265625, 12.925289154052734, 13.817465782165527, 14.70964241027832, 15.60181999206543, 16.49399757385254, 17.386173248291016, 18.278350830078125, 19.170528411865234, 20.062705993652344, 20.954883575439453, 21.84705924987793, 22.73923683166504, 23.63141441345215, 24.523590087890625, 25.415767669677734, 26.307945251464844, 27.200122833251953, 28.092300415039062, 28.98447608947754, 29.87665367126465]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 6.0, 14.0, 12.0, 17.0, 28.0, 41.0, 67.0, 90.0, 125.0, 197.0, 281.0, 448.0, 739.0, 1126.0, 1949.0, 3263.0, 5886.0, 10637.0, 20026.0, 39120.0, 75308.0, 138131.0, 220089.0, 223712.0, 142359.0, 77756.0, 40372.0, 21138.0, 10983.0, 5922.0, 3383.0, 1970.0, 1234.0, 731.0, 472.0, 287.0, 219.0, 140.0, 83.0, 66.0, 41.0, 24.0, 15.0, 18.0, 7.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.625, -10.312744140625, -10.00048828125, -9.688232421875, -9.3759765625, -9.063720703125, -8.75146484375, -8.439208984375, -8.126953125, -7.814697265625, -7.50244140625, -7.190185546875, -6.8779296875, -6.565673828125, -6.25341796875, -5.941162109375, -5.62890625, -5.316650390625, -5.00439453125, -4.692138671875, -4.3798828125, -4.067626953125, -3.75537109375, -3.443115234375, -3.130859375, -2.818603515625, -2.50634765625, -2.194091796875, -1.8818359375, -1.569580078125, -1.25732421875, -0.945068359375, -0.6328125, -0.320556640625, -0.00830078125, 0.303955078125, 0.6162109375, 0.928466796875, 1.24072265625, 1.552978515625, 1.865234375, 2.177490234375, 2.48974609375, 2.802001953125, 3.1142578125, 3.426513671875, 3.73876953125, 4.051025390625, 4.36328125, 4.675537109375, 4.98779296875, 5.300048828125, 5.6123046875, 5.924560546875, 6.23681640625, 6.549072265625, 6.861328125, 7.173583984375, 7.48583984375, 7.798095703125, 8.1103515625, 8.422607421875, 8.73486328125, 9.047119140625, 9.359375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 13.0, 11.0, 10.0, 8.0, 16.0, 12.0, 13.0, 26.0, 23.0, 34.0, 56.0, 49.0, 61.0, 40.0, 62.0, 50.0, 43.0, 48.0, 46.0, 46.0, 41.0, 46.0, 47.0, 29.0, 31.0, 23.0, 24.0, 11.0, 25.0, 11.0, 8.0, 4.0, 7.0, 6.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.2694091796875, -2.187255859375, -2.1051025390625, -2.02294921875, -1.9407958984375, -1.858642578125, -1.7764892578125, -1.6943359375, -1.6121826171875, -1.530029296875, -1.4478759765625, -1.36572265625, -1.2835693359375, -1.201416015625, -1.1192626953125, -1.037109375, -0.9549560546875, -0.872802734375, -0.7906494140625, -0.70849609375, -0.6263427734375, -0.544189453125, -0.4620361328125, -0.3798828125, -0.2977294921875, -0.215576171875, -0.1334228515625, -0.05126953125, 0.0308837890625, 0.113037109375, 0.1951904296875, 0.27734375, 0.3594970703125, 0.441650390625, 0.5238037109375, 0.60595703125, 0.6881103515625, 0.770263671875, 0.8524169921875, 0.9345703125, 1.0167236328125, 1.098876953125, 1.1810302734375, 1.26318359375, 1.3453369140625, 1.427490234375, 1.5096435546875, 1.591796875, 1.6739501953125, 1.756103515625, 1.8382568359375, 1.92041015625, 2.0025634765625, 2.084716796875, 2.1668701171875, 2.2490234375, 2.3311767578125, 2.413330078125, 2.4954833984375, 2.57763671875, 2.6597900390625, 2.741943359375, 2.8240966796875, 2.90625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 5.0, 11.0, 13.0, 23.0, 44.0, 50.0, 82.0, 120.0, 173.0, 311.0, 455.0, 762.0, 1457.0, 2792.0, 5680.0, 12820.0, 30683.0, 76469.0, 183724.0, 325850.0, 232504.0, 101763.0, 40869.0, 16912.0, 7379.0, 3461.0, 1770.0, 946.0, 517.0, 333.0, 195.0, 119.0, 89.0, 52.0, 30.0, 28.0, 14.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-14.625, -14.2030029296875, -13.781005859375, -13.3590087890625, -12.93701171875, -12.5150146484375, -12.093017578125, -11.6710205078125, -11.2490234375, -10.8270263671875, -10.405029296875, -9.9830322265625, -9.56103515625, -9.1390380859375, -8.717041015625, -8.2950439453125, -7.873046875, -7.4510498046875, -7.029052734375, -6.6070556640625, -6.18505859375, -5.7630615234375, -5.341064453125, -4.9190673828125, -4.4970703125, -4.0750732421875, -3.653076171875, -3.2310791015625, -2.80908203125, -2.3870849609375, -1.965087890625, -1.5430908203125, -1.12109375, -0.6990966796875, -0.277099609375, 0.1448974609375, 0.56689453125, 0.9888916015625, 1.410888671875, 1.8328857421875, 2.2548828125, 2.6768798828125, 3.098876953125, 3.5208740234375, 3.94287109375, 4.3648681640625, 4.786865234375, 5.2088623046875, 5.630859375, 6.0528564453125, 6.474853515625, 6.8968505859375, 7.31884765625, 7.7408447265625, 8.162841796875, 8.5848388671875, 9.0068359375, 9.4288330078125, 9.850830078125, 10.2728271484375, 10.69482421875, 11.1168212890625, 11.538818359375, 11.9608154296875, 12.3828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 10.0, 7.0, 12.0, 9.0, 26.0, 11.0, 20.0, 25.0, 19.0, 30.0, 36.0, 24.0, 38.0, 48.0, 35.0, 45.0, 39.0, 40.0, 41.0, 46.0, 45.0, 37.0, 32.0, 32.0, 42.0, 33.0, 33.0, 22.0, 27.0, 27.0, 12.0, 11.0, 11.0, 10.0, 10.0, 16.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.6953125, -10.341064453125, -9.98681640625, -9.632568359375, -9.2783203125, -8.924072265625, -8.56982421875, -8.215576171875, -7.861328125, -7.507080078125, -7.15283203125, -6.798583984375, -6.4443359375, -6.090087890625, -5.73583984375, -5.381591796875, -5.02734375, -4.673095703125, -4.31884765625, -3.964599609375, -3.6103515625, -3.256103515625, -2.90185546875, -2.547607421875, -2.193359375, -1.839111328125, -1.48486328125, -1.130615234375, -0.7763671875, -0.422119140625, -0.06787109375, 0.286376953125, 0.640625, 0.994873046875, 1.34912109375, 1.703369140625, 2.0576171875, 2.411865234375, 2.76611328125, 3.120361328125, 3.474609375, 3.828857421875, 4.18310546875, 4.537353515625, 4.8916015625, 5.245849609375, 5.60009765625, 5.954345703125, 6.30859375, 6.662841796875, 7.01708984375, 7.371337890625, 7.7255859375, 8.079833984375, 8.43408203125, 8.788330078125, 9.142578125, 9.496826171875, 9.85107421875, 10.205322265625, 10.5595703125, 10.913818359375, 11.26806640625, 11.622314453125, 11.9765625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 13.0, 11.0, 29.0, 36.0, 106.0, 213.0, 565.0, 1609.0, 5390.0, 24394.0, 168229.0, 697901.0, 123894.0, 19492.0, 4447.0, 1348.0, 504.0, 196.0, 81.0, 36.0, 21.0, 13.0, 5.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.359375, -20.720458984375, -20.08154296875, -19.442626953125, -18.8037109375, -18.164794921875, -17.52587890625, -16.886962890625, -16.248046875, -15.609130859375, -14.97021484375, -14.331298828125, -13.6923828125, -13.053466796875, -12.41455078125, -11.775634765625, -11.13671875, -10.497802734375, -9.85888671875, -9.219970703125, -8.5810546875, -7.942138671875, -7.30322265625, -6.664306640625, -6.025390625, -5.386474609375, -4.74755859375, -4.108642578125, -3.4697265625, -2.830810546875, -2.19189453125, -1.552978515625, -0.9140625, -0.275146484375, 0.36376953125, 1.002685546875, 1.6416015625, 2.280517578125, 2.91943359375, 3.558349609375, 4.197265625, 4.836181640625, 5.47509765625, 6.114013671875, 6.7529296875, 7.391845703125, 8.03076171875, 8.669677734375, 9.30859375, 9.947509765625, 10.58642578125, 11.225341796875, 11.8642578125, 12.503173828125, 13.14208984375, 13.781005859375, 14.419921875, 15.058837890625, 15.69775390625, 16.336669921875, 16.9755859375, 17.614501953125, 18.25341796875, 18.892333984375, 19.53125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 7.0, 9.0, 15.0, 10.0, 22.0, 24.0, 22.0, 50.0, 68.0, 95.0, 130.0, 134.0, 118.0, 55.0, 53.0, 37.0, 19.0, 32.0, 17.0, 16.0, 10.0, 14.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002506256103515625, -0.002411186695098877, -0.002316117286682129, -0.002221047878265381, -0.002125978469848633, -0.0020309090614318848, -0.0019358396530151367, -0.0018407702445983887, -0.0017457008361816406, -0.0016506314277648926, -0.0015555620193481445, -0.0014604926109313965, -0.0013654232025146484, -0.0012703537940979004, -0.0011752843856811523, -0.0010802149772644043, -0.0009851455688476562, -0.0008900761604309082, -0.0007950067520141602, -0.0006999373435974121, -0.0006048679351806641, -0.000509798526763916, -0.00041472911834716797, -0.0003196597099304199, -0.00022459030151367188, -0.00012952089309692383, -3.445148468017578e-05, 6.0617923736572266e-05, 0.0001556873321533203, 0.00025075674057006836, 0.0003458261489868164, 0.00044089555740356445, 0.0005359649658203125, 0.0006310343742370605, 0.0007261037826538086, 0.0008211731910705566, 0.0009162425994873047, 0.0010113120079040527, 0.0011063814163208008, 0.0012014508247375488, 0.0012965202331542969, 0.001391589641571045, 0.001486659049987793, 0.001581728458404541, 0.001676797866821289, 0.0017718672752380371, 0.0018669366836547852, 0.001962006092071533, 0.0020570755004882812, 0.0021521449089050293, 0.0022472143173217773, 0.0023422837257385254, 0.0024373531341552734, 0.0025324225425720215, 0.0026274919509887695, 0.0027225613594055176, 0.0028176307678222656, 0.0029127001762390137, 0.0030077695846557617, 0.0031028389930725098, 0.003197908401489258, 0.003292977809906006, 0.003388047218322754, 0.003483116626739502, 0.00357818603515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 12.0, 22.0, 24.0, 45.0, 60.0, 111.0, 148.0, 294.0, 460.0, 848.0, 1808.0, 4002.0, 10839.0, 33331.0, 128178.0, 539091.0, 247397.0, 54526.0, 16321.0, 5908.0, 2394.0, 1156.0, 674.0, 328.0, 187.0, 113.0, 93.0, 49.0, 28.0, 26.0, 14.0, 13.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.0760498046875, -14.628662109375, -14.1812744140625, -13.73388671875, -13.2864990234375, -12.839111328125, -12.3917236328125, -11.9443359375, -11.4969482421875, -11.049560546875, -10.6021728515625, -10.15478515625, -9.7073974609375, -9.260009765625, -8.8126220703125, -8.365234375, -7.9178466796875, -7.470458984375, -7.0230712890625, -6.57568359375, -6.1282958984375, -5.680908203125, -5.2335205078125, -4.7861328125, -4.3387451171875, -3.891357421875, -3.4439697265625, -2.99658203125, -2.5491943359375, -2.101806640625, -1.6544189453125, -1.20703125, -0.7596435546875, -0.312255859375, 0.1351318359375, 0.58251953125, 1.0299072265625, 1.477294921875, 1.9246826171875, 2.3720703125, 2.8194580078125, 3.266845703125, 3.7142333984375, 4.16162109375, 4.6090087890625, 5.056396484375, 5.5037841796875, 5.951171875, 6.3985595703125, 6.845947265625, 7.2933349609375, 7.74072265625, 8.1881103515625, 8.635498046875, 9.0828857421875, 9.5302734375, 9.9776611328125, 10.425048828125, 10.8724365234375, 11.31982421875, 11.7672119140625, 12.214599609375, 12.6619873046875, 13.109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 11.0, 13.0, 9.0, 24.0, 31.0, 40.0, 38.0, 49.0, 69.0, 94.0, 87.0, 85.0, 85.0, 92.0, 56.0, 42.0, 41.0, 29.0, 18.0, 22.0, 10.0, 17.0, 8.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.4140625, -11.0989990234375, -10.783935546875, -10.4688720703125, -10.15380859375, -9.8387451171875, -9.523681640625, -9.2086181640625, -8.8935546875, -8.5784912109375, -8.263427734375, -7.9483642578125, -7.63330078125, -7.3182373046875, -7.003173828125, -6.6881103515625, -6.373046875, -6.0579833984375, -5.742919921875, -5.4278564453125, -5.11279296875, -4.7977294921875, -4.482666015625, -4.1676025390625, -3.8525390625, -3.5374755859375, -3.222412109375, -2.9073486328125, -2.59228515625, -2.2772216796875, -1.962158203125, -1.6470947265625, -1.33203125, -1.0169677734375, -0.701904296875, -0.3868408203125, -0.07177734375, 0.2432861328125, 0.558349609375, 0.8734130859375, 1.1884765625, 1.5035400390625, 1.818603515625, 2.1336669921875, 2.44873046875, 2.7637939453125, 3.078857421875, 3.3939208984375, 3.708984375, 4.0240478515625, 4.339111328125, 4.6541748046875, 4.96923828125, 5.2843017578125, 5.599365234375, 5.9144287109375, 6.2294921875, 6.5445556640625, 6.859619140625, 7.1746826171875, 7.48974609375, 7.8048095703125, 8.119873046875, 8.4349365234375, 8.75]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 15.0, 16.0, 32.0, 55.0, 89.0, 114.0, 120.0, 127.0, 130.0, 100.0, 62.0, 45.0, 29.0, 21.0, 9.0, 13.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.07423400878906, -77.1078109741211, -73.14139556884766, -69.17497253417969, -65.20854949951172, -61.242130279541016, -57.27571105957031, -53.309288024902344, -49.342864990234375, -45.37644577026367, -41.4100227355957, -37.443603515625, -33.47718048095703, -29.510761260986328, -25.544340133666992, -21.577919006347656, -17.611499786376953, -13.645078659057617, -9.678657531738281, -5.712237358093262, -1.7458162307739258, 2.2206039428710938, 6.18702507019043, 10.153446197509766, 14.119867324829102, 18.086288452148438, 22.052709579467773, 26.01913070678711, 29.985549926757812, 33.95197296142578, 37.918392181396484, 41.88481140136719, 45.851234436035156, 49.81765365600586, 53.78407669067383, 57.75049591064453, 61.7169189453125, 65.68333435058594, 69.6497573852539, 73.61618041992188, 77.58260345458984, 81.54902648925781, 85.51544189453125, 89.48186492919922, 93.44828796386719, 97.41470336914062, 101.3811264038086, 105.34754943847656, 109.31396484375, 113.28038787841797, 117.2468032836914, 121.21322631835938, 125.17964935302734, 129.1460723876953, 133.11248779296875, 137.07891845703125, 141.0453338623047, 145.01174926757812, 148.97817993164062, 152.94459533691406, 156.9110107421875, 160.87744140625, 164.84385681152344, 168.81027221679688, 172.77670288085938]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 7.0, 3.0, 4.0, 8.0, 4.0, 11.0, 7.0, 6.0, 14.0, 13.0, 17.0, 14.0, 18.0, 25.0, 24.0, 25.0, 43.0, 23.0, 34.0, 38.0, 36.0, 39.0, 36.0, 41.0, 43.0, 42.0, 47.0, 44.0, 46.0, 35.0, 25.0, 29.0, 27.0, 24.0, 31.0, 24.0, 18.0, 9.0, 12.0, 6.0, 4.0, 17.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.22677230834961, -55.3734130859375, -53.520050048828125, -51.666690826416016, -49.81332778930664, -47.95996856689453, -46.106605529785156, -44.25324630737305, -42.39988708496094, -40.54652786254883, -38.69316482543945, -36.839805603027344, -34.98644256591797, -33.13308334350586, -31.279722213745117, -29.426361083984375, -27.572999954223633, -25.71963882446289, -23.86627769470215, -22.012916564941406, -20.159557342529297, -18.306196212768555, -16.452835083007812, -14.599474906921387, -12.746113777160645, -10.892752647399902, -9.039392471313477, -7.186031341552734, -5.33267068862915, -3.4793100357055664, -1.6259489059448242, 0.22741127014160156, 2.0807723999023438, 3.9341330528259277, 5.787493705749512, 7.640854835510254, 9.49421501159668, 11.347576141357422, 13.200937271118164, 15.05429744720459, 16.907657623291016, 18.761018753051758, 20.6143798828125, 22.46773910522461, 24.32110023498535, 26.174461364746094, 28.027822494506836, 29.881183624267578, 31.73454475402832, 33.58790588378906, 35.44126510620117, 37.29462814331055, 39.147987365722656, 41.00135040283203, 42.85470962524414, 44.70806884765625, 46.561431884765625, 48.414791107177734, 50.26815414428711, 52.12151336669922, 53.974876403808594, 55.8282356262207, 57.68159484863281, 59.53495788574219, 61.3883171081543]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 14.0, 20.0, 26.0, 42.0, 62.0, 144.0, 214.0, 539.0, 1267.0, 3401.0, 10565.0, 40396.0, 233463.0, 3555086.0, 283022.0, 46720.0, 12257.0, 4030.0, 1639.0, 642.0, 307.0, 154.0, 92.0, 48.0, 29.0, 13.0, 21.0, 12.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.46875, -20.689208984375, -19.90966796875, -19.130126953125, -18.3505859375, -17.571044921875, -16.79150390625, -16.011962890625, -15.232421875, -14.452880859375, -13.67333984375, -12.893798828125, -12.1142578125, -11.334716796875, -10.55517578125, -9.775634765625, -8.99609375, -8.216552734375, -7.43701171875, -6.657470703125, -5.8779296875, -5.098388671875, -4.31884765625, -3.539306640625, -2.759765625, -1.980224609375, -1.20068359375, -0.421142578125, 0.3583984375, 1.137939453125, 1.91748046875, 2.697021484375, 3.4765625, 4.256103515625, 5.03564453125, 5.815185546875, 6.5947265625, 7.374267578125, 8.15380859375, 8.933349609375, 9.712890625, 10.492431640625, 11.27197265625, 12.051513671875, 12.8310546875, 13.610595703125, 14.39013671875, 15.169677734375, 15.94921875, 16.728759765625, 17.50830078125, 18.287841796875, 19.0673828125, 19.846923828125, 20.62646484375, 21.406005859375, 22.185546875, 22.965087890625, 23.74462890625, 24.524169921875, 25.3037109375, 26.083251953125, 26.86279296875, 27.642333984375, 28.421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 9.0, 6.0, 8.0, 6.0, 16.0, 24.0, 26.0, 24.0, 28.0, 38.0, 35.0, 42.0, 41.0, 48.0, 48.0, 56.0, 47.0, 44.0, 36.0, 51.0, 49.0, 41.0, 34.0, 42.0, 27.0, 31.0, 20.0, 19.0, 15.0, 14.0, 13.0, 7.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.455078125, -2.3778076171875, -2.300537109375, -2.2232666015625, -2.14599609375, -2.0687255859375, -1.991455078125, -1.9141845703125, -1.8369140625, -1.7596435546875, -1.682373046875, -1.6051025390625, -1.52783203125, -1.4505615234375, -1.373291015625, -1.2960205078125, -1.21875, -1.1414794921875, -1.064208984375, -0.9869384765625, -0.90966796875, -0.8323974609375, -0.755126953125, -0.6778564453125, -0.6005859375, -0.5233154296875, -0.446044921875, -0.3687744140625, -0.29150390625, -0.2142333984375, -0.136962890625, -0.0596923828125, 0.017578125, 0.0948486328125, 0.172119140625, 0.2493896484375, 0.32666015625, 0.4039306640625, 0.481201171875, 0.5584716796875, 0.6357421875, 0.7130126953125, 0.790283203125, 0.8675537109375, 0.94482421875, 1.0220947265625, 1.099365234375, 1.1766357421875, 1.25390625, 1.3311767578125, 1.408447265625, 1.4857177734375, 1.56298828125, 1.6402587890625, 1.717529296875, 1.7947998046875, 1.8720703125, 1.9493408203125, 2.026611328125, 2.1038818359375, 2.18115234375, 2.2584228515625, 2.335693359375, 2.4129638671875, 2.490234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 13.0, 20.0, 25.0, 36.0, 44.0, 83.0, 123.0, 167.0, 257.0, 411.0, 746.0, 1258.0, 2272.0, 4536.0, 9860.0, 23357.0, 62969.0, 212381.0, 1544281.0, 1993643.0, 226003.0, 66283.0, 24552.0, 10338.0, 4854.0, 2421.0, 1332.0, 728.0, 465.0, 265.0, 189.0, 114.0, 71.0, 45.0, 30.0, 23.0, 15.0, 14.0, 12.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-17.78125, -17.301025390625, -16.82080078125, -16.340576171875, -15.8603515625, -15.380126953125, -14.89990234375, -14.419677734375, -13.939453125, -13.459228515625, -12.97900390625, -12.498779296875, -12.0185546875, -11.538330078125, -11.05810546875, -10.577880859375, -10.09765625, -9.617431640625, -9.13720703125, -8.656982421875, -8.1767578125, -7.696533203125, -7.21630859375, -6.736083984375, -6.255859375, -5.775634765625, -5.29541015625, -4.815185546875, -4.3349609375, -3.854736328125, -3.37451171875, -2.894287109375, -2.4140625, -1.933837890625, -1.45361328125, -0.973388671875, -0.4931640625, -0.012939453125, 0.46728515625, 0.947509765625, 1.427734375, 1.907958984375, 2.38818359375, 2.868408203125, 3.3486328125, 3.828857421875, 4.30908203125, 4.789306640625, 5.26953125, 5.749755859375, 6.22998046875, 6.710205078125, 7.1904296875, 7.670654296875, 8.15087890625, 8.631103515625, 9.111328125, 9.591552734375, 10.07177734375, 10.552001953125, 11.0322265625, 11.512451171875, 11.99267578125, 12.472900390625, 12.953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 11.0, 14.0, 12.0, 19.0, 21.0, 50.0, 54.0, 74.0, 106.0, 160.0, 258.0, 444.0, 1149.0, 707.0, 366.0, 183.0, 125.0, 88.0, 44.0, 41.0, 38.0, 21.0, 15.0, 13.0, 9.0, 7.0, 8.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.342529296875, -7.11865234375, -6.894775390625, -6.6708984375, -6.447021484375, -6.22314453125, -5.999267578125, -5.775390625, -5.551513671875, -5.32763671875, -5.103759765625, -4.8798828125, -4.656005859375, -4.43212890625, -4.208251953125, -3.984375, -3.760498046875, -3.53662109375, -3.312744140625, -3.0888671875, -2.864990234375, -2.64111328125, -2.417236328125, -2.193359375, -1.969482421875, -1.74560546875, -1.521728515625, -1.2978515625, -1.073974609375, -0.85009765625, -0.626220703125, -0.40234375, -0.178466796875, 0.04541015625, 0.269287109375, 0.4931640625, 0.717041015625, 0.94091796875, 1.164794921875, 1.388671875, 1.612548828125, 1.83642578125, 2.060302734375, 2.2841796875, 2.508056640625, 2.73193359375, 2.955810546875, 3.1796875, 3.403564453125, 3.62744140625, 3.851318359375, 4.0751953125, 4.299072265625, 4.52294921875, 4.746826171875, 4.970703125, 5.194580078125, 5.41845703125, 5.642333984375, 5.8662109375, 6.090087890625, 6.31396484375, 6.537841796875, 6.76171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 18.0, 46.0, 82.0, 119.0, 175.0, 178.0, 160.0, 96.0, 54.0, 33.0, 17.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.79619598388672, -123.09005737304688, -120.38392639160156, -117.67779541015625, -114.9716567993164, -112.26551818847656, -109.55938720703125, -106.85325622558594, -104.1471176147461, -101.44097900390625, -98.73484802246094, -96.02871704101562, -93.32257843017578, -90.61643981933594, -87.91030883789062, -85.20417785644531, -82.49803924560547, -79.79190063476562, -77.08576965332031, -74.379638671875, -71.67350006103516, -68.96736145019531, -66.26123046875, -63.55509567260742, -60.848960876464844, -58.142826080322266, -55.43669128417969, -52.73055648803711, -50.02442169189453, -47.31828689575195, -44.612152099609375, -41.9060173034668, -39.19988250732422, -36.49374771118164, -33.78761291503906, -31.081478118896484, -28.375343322753906, -25.669208526611328, -22.96307373046875, -20.256938934326172, -17.550804138183594, -14.844669342041016, -12.138534545898438, -9.43239974975586, -6.726264953613281, -4.020130157470703, -1.313995361328125, 1.3921394348144531, 4.098274230957031, 6.804409027099609, 9.510543823242188, 12.216678619384766, 14.922813415527344, 17.628948211669922, 20.3350830078125, 23.041217803955078, 25.747352600097656, 28.453487396240234, 31.159622192382812, 33.86575698852539, 36.57189178466797, 39.27802658081055, 41.984161376953125, 44.6902961730957, 47.39643096923828]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 9.0, 14.0, 11.0, 20.0, 21.0, 24.0, 25.0, 41.0, 26.0, 41.0, 29.0, 30.0, 38.0, 34.0, 60.0, 41.0, 36.0, 37.0, 44.0, 41.0, 34.0, 38.0, 34.0, 37.0, 31.0, 30.0, 27.0, 23.0, 23.0, 13.0, 22.0, 8.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.75122833251953, -30.80316734313965, -29.8551082611084, -28.907047271728516, -27.958986282348633, -27.01092529296875, -26.0628662109375, -25.114805221557617, -24.166744232177734, -23.21868324279785, -22.2706241607666, -21.32256317138672, -20.374502182006836, -19.426441192626953, -18.478382110595703, -17.53032112121582, -16.582260131835938, -15.634200096130371, -14.686139106750488, -13.738079071044922, -12.790018081665039, -11.841958045959473, -10.893898010253906, -9.945837020874023, -8.997777938842773, -8.049717903137207, -7.101656913757324, -6.153596878051758, -5.205535888671875, -4.257475852966309, -3.309415340423584, -2.3613548278808594, -1.4132938385009766, -0.46523338556289673, 0.4828270673751831, 1.4308874607086182, 2.3789479732513428, 3.3270082473754883, 4.275068759918213, 5.2231292724609375, 6.171189785003662, 7.119250297546387, 8.067310333251953, 9.015371322631836, 9.963431358337402, 10.911491394042969, 11.859552383422852, 12.807613372802734, 13.7556734085083, 14.703733444213867, 15.65179443359375, 16.599855422973633, 17.547914505004883, 18.495975494384766, 19.44403648376465, 20.39209747314453, 21.34015655517578, 22.288217544555664, 23.236276626586914, 24.184337615966797, 25.13239860534668, 26.080459594726562, 27.028518676757812, 27.976579666137695, 28.924640655517578]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 12.0, 12.0, 15.0, 26.0, 52.0, 105.0, 126.0, 284.0, 659.0, 1494.0, 3815.0, 11180.0, 36224.0, 120401.0, 370121.0, 344716.0, 109478.0, 33264.0, 10379.0, 3485.0, 1457.0, 599.0, 277.0, 149.0, 81.0, 47.0, 27.0, 28.0, 13.0, 10.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.01171875, -23.3046875, -22.59765625, -21.890625, -21.18359375, -20.4765625, -19.76953125, -19.0625, -18.35546875, -17.6484375, -16.94140625, -16.234375, -15.52734375, -14.8203125, -14.11328125, -13.40625, -12.69921875, -11.9921875, -11.28515625, -10.578125, -9.87109375, -9.1640625, -8.45703125, -7.75, -7.04296875, -6.3359375, -5.62890625, -4.921875, -4.21484375, -3.5078125, -2.80078125, -2.09375, -1.38671875, -0.6796875, 0.02734375, 0.734375, 1.44140625, 2.1484375, 2.85546875, 3.5625, 4.26953125, 4.9765625, 5.68359375, 6.390625, 7.09765625, 7.8046875, 8.51171875, 9.21875, 9.92578125, 10.6328125, 11.33984375, 12.046875, 12.75390625, 13.4609375, 14.16796875, 14.875, 15.58203125, 16.2890625, 16.99609375, 17.703125, 18.41015625, 19.1171875, 19.82421875, 20.53125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 17.0, 12.0, 19.0, 25.0, 17.0, 23.0, 28.0, 36.0, 44.0, 49.0, 47.0, 43.0, 46.0, 48.0, 49.0, 44.0, 45.0, 49.0, 41.0, 28.0, 23.0, 32.0, 36.0, 23.0, 23.0, 16.0, 19.0, 20.0, 18.0, 6.0, 7.0, 7.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.47265625, -2.396820068359375, -2.32098388671875, -2.245147705078125, -2.1693115234375, -2.093475341796875, -2.01763916015625, -1.941802978515625, -1.865966796875, -1.790130615234375, -1.71429443359375, -1.638458251953125, -1.5626220703125, -1.486785888671875, -1.41094970703125, -1.335113525390625, -1.25927734375, -1.183441162109375, -1.10760498046875, -1.031768798828125, -0.9559326171875, -0.880096435546875, -0.80426025390625, -0.728424072265625, -0.652587890625, -0.576751708984375, -0.50091552734375, -0.425079345703125, -0.3492431640625, -0.273406982421875, -0.19757080078125, -0.121734619140625, -0.0458984375, 0.029937744140625, 0.10577392578125, 0.181610107421875, 0.2574462890625, 0.333282470703125, 0.40911865234375, 0.484954833984375, 0.560791015625, 0.636627197265625, 0.71246337890625, 0.788299560546875, 0.8641357421875, 0.939971923828125, 1.01580810546875, 1.091644287109375, 1.16748046875, 1.243316650390625, 1.31915283203125, 1.394989013671875, 1.4708251953125, 1.546661376953125, 1.62249755859375, 1.698333740234375, 1.774169921875, 1.850006103515625, 1.92584228515625, 2.001678466796875, 2.0775146484375, 2.153350830078125, 2.22918701171875, 2.305023193359375, 2.380859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 20.0, 11.0, 24.0, 42.0, 67.0, 98.0, 142.0, 209.0, 304.0, 532.0, 813.0, 1454.0, 2584.0, 4666.0, 9083.0, 18618.0, 39371.0, 84179.0, 178231.0, 297148.0, 213470.0, 103597.0, 48248.0, 22349.0, 10796.0, 5445.0, 2886.0, 1630.0, 990.0, 510.0, 342.0, 227.0, 156.0, 81.0, 75.0, 49.0, 27.0, 26.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.0943603515625, -10.719970703125, -10.3455810546875, -9.97119140625, -9.5968017578125, -9.222412109375, -8.8480224609375, -8.4736328125, -8.0992431640625, -7.724853515625, -7.3504638671875, -6.97607421875, -6.6016845703125, -6.227294921875, -5.8529052734375, -5.478515625, -5.1041259765625, -4.729736328125, -4.3553466796875, -3.98095703125, -3.6065673828125, -3.232177734375, -2.8577880859375, -2.4833984375, -2.1090087890625, -1.734619140625, -1.3602294921875, -0.98583984375, -0.6114501953125, -0.237060546875, 0.1373291015625, 0.51171875, 0.8861083984375, 1.260498046875, 1.6348876953125, 2.00927734375, 2.3836669921875, 2.758056640625, 3.1324462890625, 3.5068359375, 3.8812255859375, 4.255615234375, 4.6300048828125, 5.00439453125, 5.3787841796875, 5.753173828125, 6.1275634765625, 6.501953125, 6.8763427734375, 7.250732421875, 7.6251220703125, 7.99951171875, 8.3739013671875, 8.748291015625, 9.1226806640625, 9.4970703125, 9.8714599609375, 10.245849609375, 10.6202392578125, 10.99462890625, 11.3690185546875, 11.743408203125, 12.1177978515625, 12.4921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 8.0, 7.0, 20.0, 20.0, 21.0, 19.0, 35.0, 26.0, 35.0, 42.0, 44.0, 63.0, 47.0, 30.0, 38.0, 45.0, 37.0, 50.0, 47.0, 50.0, 37.0, 33.0, 35.0, 33.0, 22.0, 28.0, 13.0, 15.0, 11.0, 16.0, 6.0, 9.0, 4.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.3203125, -12.9146728515625, -12.509033203125, -12.1033935546875, -11.69775390625, -11.2921142578125, -10.886474609375, -10.4808349609375, -10.0751953125, -9.6695556640625, -9.263916015625, -8.8582763671875, -8.45263671875, -8.0469970703125, -7.641357421875, -7.2357177734375, -6.830078125, -6.4244384765625, -6.018798828125, -5.6131591796875, -5.20751953125, -4.8018798828125, -4.396240234375, -3.9906005859375, -3.5849609375, -3.1793212890625, -2.773681640625, -2.3680419921875, -1.96240234375, -1.5567626953125, -1.151123046875, -0.7454833984375, -0.33984375, 0.0657958984375, 0.471435546875, 0.8770751953125, 1.28271484375, 1.6883544921875, 2.093994140625, 2.4996337890625, 2.9052734375, 3.3109130859375, 3.716552734375, 4.1221923828125, 4.52783203125, 4.9334716796875, 5.339111328125, 5.7447509765625, 6.150390625, 6.5560302734375, 6.961669921875, 7.3673095703125, 7.77294921875, 8.1785888671875, 8.584228515625, 8.9898681640625, 9.3955078125, 9.8011474609375, 10.206787109375, 10.6124267578125, 11.01806640625, 11.4237060546875, 11.829345703125, 12.2349853515625, 12.640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 13.0, 10.0, 26.0, 31.0, 33.0, 58.0, 83.0, 143.0, 232.0, 323.0, 574.0, 881.0, 1577.0, 2716.0, 5274.0, 10403.0, 22957.0, 59866.0, 227940.0, 498978.0, 137863.0, 42821.0, 17596.0, 8113.0, 4256.0, 2289.0, 1328.0, 851.0, 498.0, 281.0, 198.0, 108.0, 78.0, 49.0, 27.0, 22.0, 18.0, 11.0, 12.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-13.9453125, -13.5391845703125, -13.133056640625, -12.7269287109375, -12.32080078125, -11.9146728515625, -11.508544921875, -11.1024169921875, -10.6962890625, -10.2901611328125, -9.884033203125, -9.4779052734375, -9.07177734375, -8.6656494140625, -8.259521484375, -7.8533935546875, -7.447265625, -7.0411376953125, -6.635009765625, -6.2288818359375, -5.82275390625, -5.4166259765625, -5.010498046875, -4.6043701171875, -4.1982421875, -3.7921142578125, -3.385986328125, -2.9798583984375, -2.57373046875, -2.1676025390625, -1.761474609375, -1.3553466796875, -0.94921875, -0.5430908203125, -0.136962890625, 0.2691650390625, 0.67529296875, 1.0814208984375, 1.487548828125, 1.8936767578125, 2.2998046875, 2.7059326171875, 3.112060546875, 3.5181884765625, 3.92431640625, 4.3304443359375, 4.736572265625, 5.1427001953125, 5.548828125, 5.9549560546875, 6.361083984375, 6.7672119140625, 7.17333984375, 7.5794677734375, 7.985595703125, 8.3917236328125, 8.7978515625, 9.2039794921875, 9.610107421875, 10.0162353515625, 10.42236328125, 10.8284912109375, 11.234619140625, 11.6407470703125, 12.046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 8.0, 14.0, 26.0, 33.0, 28.0, 44.0, 85.0, 139.0, 207.0, 141.0, 77.0, 29.0, 38.0, 31.0, 16.0, 15.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034961700439453125, -0.003368884325027466, -0.003241598606109619, -0.0031143128871917725, -0.0029870271682739258, -0.002859741449356079, -0.0027324557304382324, -0.0026051700115203857, -0.002477884292602539, -0.0023505985736846924, -0.0022233128547668457, -0.002096027135848999, -0.0019687414169311523, -0.0018414556980133057, -0.001714169979095459, -0.0015868842601776123, -0.0014595985412597656, -0.001332312822341919, -0.0012050271034240723, -0.0010777413845062256, -0.0009504556655883789, -0.0008231699466705322, -0.0006958842277526855, -0.0005685985088348389, -0.0004413127899169922, -0.0003140270709991455, -0.00018674135208129883, -5.945563316345215e-05, 6.783008575439453e-05, 0.0001951158046722412, 0.0003224015235900879, 0.00044968724250793457, 0.0005769729614257812, 0.0007042586803436279, 0.0008315443992614746, 0.0009588301181793213, 0.001086115837097168, 0.0012134015560150146, 0.0013406872749328613, 0.001467972993850708, 0.0015952587127685547, 0.0017225444316864014, 0.001849830150604248, 0.0019771158695220947, 0.0021044015884399414, 0.002231687307357788, 0.0023589730262756348, 0.0024862587451934814, 0.002613544464111328, 0.002740830183029175, 0.0028681159019470215, 0.002995401620864868, 0.003122687339782715, 0.0032499730587005615, 0.003377258777618408, 0.003504544496536255, 0.0036318302154541016, 0.0037591159343719482, 0.003886401653289795, 0.004013687372207642, 0.004140973091125488, 0.004268258810043335, 0.004395544528961182, 0.004522830247879028, 0.004650115966796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 1.0, 7.0, 6.0, 10.0, 16.0, 23.0, 36.0, 43.0, 69.0, 97.0, 138.0, 234.0, 334.0, 524.0, 926.0, 1413.0, 2392.0, 4330.0, 8102.0, 15262.0, 32345.0, 83943.0, 346653.0, 387688.0, 92949.0, 34666.0, 16392.0, 8612.0, 4600.0, 2687.0, 1515.0, 894.0, 515.0, 348.0, 238.0, 161.0, 115.0, 80.0, 55.0, 35.0, 28.0, 16.0, 17.0, 10.0, 8.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.269775390625, -10.90673828125, -10.543701171875, -10.1806640625, -9.817626953125, -9.45458984375, -9.091552734375, -8.728515625, -8.365478515625, -8.00244140625, -7.639404296875, -7.2763671875, -6.913330078125, -6.55029296875, -6.187255859375, -5.82421875, -5.461181640625, -5.09814453125, -4.735107421875, -4.3720703125, -4.009033203125, -3.64599609375, -3.282958984375, -2.919921875, -2.556884765625, -2.19384765625, -1.830810546875, -1.4677734375, -1.104736328125, -0.74169921875, -0.378662109375, -0.015625, 0.347412109375, 0.71044921875, 1.073486328125, 1.4365234375, 1.799560546875, 2.16259765625, 2.525634765625, 2.888671875, 3.251708984375, 3.61474609375, 3.977783203125, 4.3408203125, 4.703857421875, 5.06689453125, 5.429931640625, 5.79296875, 6.156005859375, 6.51904296875, 6.882080078125, 7.2451171875, 7.608154296875, 7.97119140625, 8.334228515625, 8.697265625, 9.060302734375, 9.42333984375, 9.786376953125, 10.1494140625, 10.512451171875, 10.87548828125, 11.238525390625, 11.6015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 6.0, 9.0, 4.0, 6.0, 13.0, 17.0, 15.0, 19.0, 33.0, 48.0, 55.0, 84.0, 95.0, 129.0, 136.0, 90.0, 56.0, 53.0, 23.0, 24.0, 12.0, 10.0, 11.0, 9.0, 11.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5491943359375, -11.184326171875, -10.8194580078125, -10.45458984375, -10.0897216796875, -9.724853515625, -9.3599853515625, -8.9951171875, -8.6302490234375, -8.265380859375, -7.9005126953125, -7.53564453125, -7.1707763671875, -6.805908203125, -6.4410400390625, -6.076171875, -5.7113037109375, -5.346435546875, -4.9815673828125, -4.61669921875, -4.2518310546875, -3.886962890625, -3.5220947265625, -3.1572265625, -2.7923583984375, -2.427490234375, -2.0626220703125, -1.69775390625, -1.3328857421875, -0.968017578125, -0.6031494140625, -0.23828125, 0.1265869140625, 0.491455078125, 0.8563232421875, 1.22119140625, 1.5860595703125, 1.950927734375, 2.3157958984375, 2.6806640625, 3.0455322265625, 3.410400390625, 3.7752685546875, 4.14013671875, 4.5050048828125, 4.869873046875, 5.2347412109375, 5.599609375, 5.9644775390625, 6.329345703125, 6.6942138671875, 7.05908203125, 7.4239501953125, 7.788818359375, 8.1536865234375, 8.5185546875, 8.8834228515625, 9.248291015625, 9.6131591796875, 9.97802734375, 10.3428955078125, 10.707763671875, 11.0726318359375, 11.4375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 18.0, 57.0, 132.0, 230.0, 243.0, 174.0, 77.0, 40.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-416.04974365234375, -407.0478820800781, -398.0460205078125, -389.044189453125, -380.0423278808594, -371.04046630859375, -362.0386047363281, -353.0367431640625, -344.034912109375, -335.0330505371094, -326.03118896484375, -317.02935791015625, -308.0274963378906, -299.025634765625, -290.0237731933594, -281.02191162109375, -272.0200500488281, -263.0181884765625, -254.01634216308594, -245.0144805908203, -236.01263427734375, -227.01077270507812, -218.0089111328125, -209.00704956054688, -200.0052032470703, -191.0033416748047, -182.00149536132812, -172.9996337890625, -163.99777221679688, -154.9959259033203, -145.9940643310547, -136.99221801757812, -127.99037170410156, -118.98851776123047, -109.98666381835938, -100.98480224609375, -91.98294830322266, -82.98109436035156, -73.97923278808594, -64.97737884521484, -55.97552490234375, -46.973670959472656, -37.9718132019043, -28.96995735168457, -19.968101501464844, -10.96624755859375, -1.9643898010253906, 7.037467956542969, 16.039321899414062, 25.04117774963379, 34.043033599853516, 43.044891357421875, 52.04674530029297, 61.04859924316406, 70.05046081542969, 79.05231475830078, 88.05416870117188, 97.05602264404297, 106.05787658691406, 115.05973815917969, 124.06159210205078, 133.06344604492188, 142.0653076171875, 151.06716918945312, 160.0690155029297]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 8.0, 13.0, 4.0, 10.0, 11.0, 16.0, 14.0, 21.0, 20.0, 29.0, 30.0, 35.0, 29.0, 37.0, 30.0, 39.0, 46.0, 49.0, 53.0, 49.0, 37.0, 35.0, 39.0, 43.0, 30.0, 35.0, 35.0, 23.0, 26.0, 28.0, 18.0, 21.0, 9.0, 14.0, 13.0, 7.0, 5.0, 7.0, 6.0, 3.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.68264770507812, -72.4303970336914, -70.17814636230469, -67.92589569091797, -65.67364501953125, -63.421390533447266, -61.16913604736328, -58.91688537597656, -56.664634704589844, -54.412384033203125, -52.160133361816406, -49.90787887573242, -47.6556282043457, -45.403377532958984, -43.151123046875, -40.89887237548828, -38.64662170410156, -36.394371032714844, -34.142120361328125, -31.88986587524414, -29.637615203857422, -27.385364532470703, -25.13311195373535, -22.880859375, -20.62860870361328, -18.376358032226562, -16.12410545349121, -13.871853828430176, -11.61960220336914, -9.367350578308105, -7.11509895324707, -4.862847328186035, -2.610595703125, -0.35834407806396484, 1.8939075469970703, 4.1461591720581055, 6.398410797119141, 8.650662422180176, 10.902914047241211, 13.155165672302246, 15.407417297363281, 17.65966796875, 19.91192054748535, 22.164173126220703, 24.416423797607422, 26.66867446899414, 28.920927047729492, 31.173179626464844, 33.42543029785156, 35.67768096923828, 37.929931640625, 40.182186126708984, 42.4344367980957, 44.68668746948242, 46.938941955566406, 49.191192626953125, 51.443443298339844, 53.69569396972656, 55.94794464111328, 58.200199127197266, 60.452449798583984, 62.7047004699707, 64.95695495605469, 67.2092056274414, 69.46145629882812]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 13.0, 17.0, 26.0, 71.0, 94.0, 191.0, 437.0, 1054.0, 2893.0, 8800.0, 36381.0, 340907.0, 3686628.0, 91786.0, 17183.0, 4826.0, 1654.0, 664.0, 322.0, 142.0, 68.0, 32.0, 23.0, 16.0, 13.0, 7.0, 8.0, 9.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.16748046875, -25.2412109375, -24.31494140625, -23.388671875, -22.46240234375, -21.5361328125, -20.60986328125, -19.68359375, -18.75732421875, -17.8310546875, -16.90478515625, -15.978515625, -15.05224609375, -14.1259765625, -13.19970703125, -12.2734375, -11.34716796875, -10.4208984375, -9.49462890625, -8.568359375, -7.64208984375, -6.7158203125, -5.78955078125, -4.86328125, -3.93701171875, -3.0107421875, -2.08447265625, -1.158203125, -0.23193359375, 0.6943359375, 1.62060546875, 2.546875, 3.47314453125, 4.3994140625, 5.32568359375, 6.251953125, 7.17822265625, 8.1044921875, 9.03076171875, 9.95703125, 10.88330078125, 11.8095703125, 12.73583984375, 13.662109375, 14.58837890625, 15.5146484375, 16.44091796875, 17.3671875, 18.29345703125, 19.2197265625, 20.14599609375, 21.072265625, 21.99853515625, 22.9248046875, 23.85107421875, 24.77734375, 25.70361328125, 26.6298828125, 27.55615234375, 28.482421875, 29.40869140625, 30.3349609375, 31.26123046875, 32.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 9.0, 14.0, 22.0, 22.0, 27.0, 26.0, 31.0, 29.0, 30.0, 41.0, 46.0, 42.0, 36.0, 42.0, 49.0, 37.0, 45.0, 55.0, 36.0, 33.0, 38.0, 30.0, 33.0, 29.0, 29.0, 14.0, 19.0, 20.0, 17.0, 11.0, 9.0, 8.0, 13.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.3828125, -2.303802490234375, -2.22479248046875, -2.145782470703125, -2.0667724609375, -1.987762451171875, -1.90875244140625, -1.829742431640625, -1.750732421875, -1.671722412109375, -1.59271240234375, -1.513702392578125, -1.4346923828125, -1.355682373046875, -1.27667236328125, -1.197662353515625, -1.11865234375, -1.039642333984375, -0.96063232421875, -0.881622314453125, -0.8026123046875, -0.723602294921875, -0.64459228515625, -0.565582275390625, -0.486572265625, -0.407562255859375, -0.32855224609375, -0.249542236328125, -0.1705322265625, -0.091522216796875, -0.01251220703125, 0.066497802734375, 0.1455078125, 0.224517822265625, 0.30352783203125, 0.382537841796875, 0.4615478515625, 0.540557861328125, 0.61956787109375, 0.698577880859375, 0.777587890625, 0.856597900390625, 0.93560791015625, 1.014617919921875, 1.0936279296875, 1.172637939453125, 1.25164794921875, 1.330657958984375, 1.40966796875, 1.488677978515625, 1.56768798828125, 1.646697998046875, 1.7257080078125, 1.804718017578125, 1.88372802734375, 1.962738037109375, 2.041748046875, 2.120758056640625, 2.19976806640625, 2.278778076171875, 2.3577880859375, 2.436798095703125, 2.51580810546875, 2.594818115234375, 2.673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 11.0, 21.0, 16.0, 28.0, 55.0, 83.0, 129.0, 202.0, 313.0, 539.0, 904.0, 1644.0, 3262.0, 6652.0, 15689.0, 42366.0, 166435.0, 2988183.0, 811267.0, 103378.0, 30452.0, 11558.0, 5073.0, 2682.0, 1362.0, 771.0, 437.0, 262.0, 176.0, 118.0, 54.0, 45.0, 38.0, 29.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.875, -21.208984375, -20.54296875, -19.876953125, -19.2109375, -18.544921875, -17.87890625, -17.212890625, -16.546875, -15.880859375, -15.21484375, -14.548828125, -13.8828125, -13.216796875, -12.55078125, -11.884765625, -11.21875, -10.552734375, -9.88671875, -9.220703125, -8.5546875, -7.888671875, -7.22265625, -6.556640625, -5.890625, -5.224609375, -4.55859375, -3.892578125, -3.2265625, -2.560546875, -1.89453125, -1.228515625, -0.5625, 0.103515625, 0.76953125, 1.435546875, 2.1015625, 2.767578125, 3.43359375, 4.099609375, 4.765625, 5.431640625, 6.09765625, 6.763671875, 7.4296875, 8.095703125, 8.76171875, 9.427734375, 10.09375, 10.759765625, 11.42578125, 12.091796875, 12.7578125, 13.423828125, 14.08984375, 14.755859375, 15.421875, 16.087890625, 16.75390625, 17.419921875, 18.0859375, 18.751953125, 19.41796875, 20.083984375, 20.75]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 6.0, 12.0, 16.0, 23.0, 26.0, 34.0, 60.0, 104.0, 133.0, 259.0, 700.0, 1666.0, 426.0, 218.0, 112.0, 62.0, 45.0, 38.0, 19.0, 19.0, 20.0, 11.0, 11.0, 10.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.23468017578125, -4.9888916015625, -4.74310302734375, -4.497314453125, -4.25152587890625, -4.0057373046875, -3.75994873046875, -3.51416015625, -3.26837158203125, -3.0225830078125, -2.77679443359375, -2.531005859375, -2.28521728515625, -2.0394287109375, -1.79364013671875, -1.5478515625, -1.30206298828125, -1.0562744140625, -0.81048583984375, -0.564697265625, -0.31890869140625, -0.0731201171875, 0.17266845703125, 0.41845703125, 0.66424560546875, 0.9100341796875, 1.15582275390625, 1.401611328125, 1.64739990234375, 1.8931884765625, 2.13897705078125, 2.384765625, 2.63055419921875, 2.8763427734375, 3.12213134765625, 3.367919921875, 3.61370849609375, 3.8594970703125, 4.10528564453125, 4.35107421875, 4.59686279296875, 4.8426513671875, 5.08843994140625, 5.334228515625, 5.58001708984375, 5.8258056640625, 6.07159423828125, 6.3173828125, 6.56317138671875, 6.8089599609375, 7.05474853515625, 7.300537109375, 7.54632568359375, 7.7921142578125, 8.03790283203125, 8.28369140625, 8.52947998046875, 8.7752685546875, 9.02105712890625, 9.266845703125, 9.51263427734375, 9.7584228515625, 10.00421142578125, 10.25]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 11.0, 15.0, 14.0, 32.0, 46.0, 56.0, 67.0, 94.0, 89.0, 109.0, 86.0, 91.0, 76.0, 68.0, 34.0, 32.0, 34.0, 16.0, 6.0, 2.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.06221008300781, -60.53546905517578, -59.008731842041016, -57.481990814208984, -55.95525360107422, -54.42851257324219, -52.901771545410156, -51.375030517578125, -49.84829330444336, -48.32155227661133, -46.79481506347656, -45.26807403564453, -43.7413330078125, -42.214595794677734, -40.6878547668457, -39.16111755371094, -37.634376525878906, -36.107635498046875, -34.58089828491211, -33.05415725708008, -31.52741813659668, -30.00067901611328, -28.47393798828125, -26.94719886779785, -25.420459747314453, -23.893720626831055, -22.366981506347656, -20.840240478515625, -19.313501358032227, -17.786762237548828, -16.260021209716797, -14.733282089233398, -13.20654296875, -11.679803848266602, -10.153063774108887, -8.626323699951172, -7.099584579467773, -5.572844982147217, -4.04610538482666, -2.5193653106689453, -0.9926261901855469, 0.5341134071350098, 2.0608530044555664, 3.587592601776123, 5.11433219909668, 6.641071796417236, 8.167811393737793, 9.694551467895508, 11.221290588378906, 12.748029708862305, 14.27476978302002, 15.801509857177734, 17.328248977661133, 18.85498809814453, 20.381729125976562, 21.90846824645996, 23.43520736694336, 24.961946487426758, 26.488685607910156, 28.015426635742188, 29.542165756225586, 31.068904876708984, 32.595645904541016, 34.12238311767578, 35.64912414550781]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 8.0, 13.0, 17.0, 22.0, 23.0, 36.0, 29.0, 33.0, 36.0, 40.0, 51.0, 42.0, 42.0, 43.0, 50.0, 53.0, 47.0, 37.0, 43.0, 54.0, 32.0, 38.0, 28.0, 29.0, 31.0, 19.0, 16.0, 12.0, 13.0, 9.0, 8.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.675498962402344, -30.72734260559082, -29.77918815612793, -28.831031799316406, -27.882877349853516, -26.934720993041992, -25.98656463623047, -25.038410186767578, -24.090255737304688, -23.142099380493164, -22.193944931030273, -21.24578857421875, -20.29763412475586, -19.349477767944336, -18.401321411132812, -17.453166961669922, -16.5050106048584, -15.556855201721191, -14.608699798583984, -13.660543441772461, -12.71238899230957, -11.764232635498047, -10.81607723236084, -9.867921829223633, -8.919766426086426, -7.971611022949219, -7.023455619812012, -6.0752997398376465, -5.1271443367004395, -4.178988933563232, -3.230833053588867, -2.28267765045166, -1.3345203399658203, -0.38636481761932373, 0.5617907047271729, 1.509946346282959, 2.458101749420166, 3.406257152557373, 4.354413032531738, 5.302568435668945, 6.250723838806152, 7.198879241943359, 8.147034645080566, 9.095190048217773, 10.043346405029297, 10.991500854492188, 11.939657211303711, 12.887812614440918, 13.835968017578125, 14.784123420715332, 15.732278823852539, 16.680435180664062, 17.628589630126953, 18.576745986938477, 19.52490234375, 20.47305679321289, 21.42121124267578, 22.369367599487305, 23.317522048950195, 24.26567840576172, 25.21383285522461, 26.161989212036133, 27.110145568847656, 28.058300018310547, 29.00645637512207]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 8.0, 26.0, 35.0, 51.0, 73.0, 126.0, 206.0, 296.0, 462.0, 764.0, 1311.0, 2301.0, 3905.0, 7098.0, 12875.0, 24889.0, 46846.0, 88059.0, 161587.0, 241891.0, 203603.0, 117416.0, 62538.0, 33349.0, 17510.0, 9180.0, 5109.0, 2826.0, 1652.0, 972.0, 553.0, 357.0, 234.0, 136.0, 95.0, 57.0, 41.0, 24.0, 20.0, 16.0, 9.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.7578125, -11.3485107421875, -10.939208984375, -10.5299072265625, -10.12060546875, -9.7113037109375, -9.302001953125, -8.8927001953125, -8.4833984375, -8.0740966796875, -7.664794921875, -7.2554931640625, -6.84619140625, -6.4368896484375, -6.027587890625, -5.6182861328125, -5.208984375, -4.7996826171875, -4.390380859375, -3.9810791015625, -3.57177734375, -3.1624755859375, -2.753173828125, -2.3438720703125, -1.9345703125, -1.5252685546875, -1.115966796875, -0.7066650390625, -0.29736328125, 0.1119384765625, 0.521240234375, 0.9305419921875, 1.33984375, 1.7491455078125, 2.158447265625, 2.5677490234375, 2.97705078125, 3.3863525390625, 3.795654296875, 4.2049560546875, 4.6142578125, 5.0235595703125, 5.432861328125, 5.8421630859375, 6.25146484375, 6.6607666015625, 7.070068359375, 7.4793701171875, 7.888671875, 8.2979736328125, 8.707275390625, 9.1165771484375, 9.52587890625, 9.9351806640625, 10.344482421875, 10.7537841796875, 11.1630859375, 11.5723876953125, 11.981689453125, 12.3909912109375, 12.80029296875, 13.2095947265625, 13.618896484375, 14.0281982421875, 14.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 14.0, 5.0, 15.0, 6.0, 18.0, 12.0, 23.0, 20.0, 24.0, 30.0, 37.0, 33.0, 47.0, 43.0, 38.0, 35.0, 44.0, 49.0, 34.0, 38.0, 48.0, 49.0, 43.0, 36.0, 41.0, 28.0, 21.0, 26.0, 20.0, 17.0, 22.0, 10.0, 9.0, 11.0, 5.0, 5.0, 9.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.73828125, -2.652679443359375, -2.56707763671875, -2.481475830078125, -2.3958740234375, -2.310272216796875, -2.22467041015625, -2.139068603515625, -2.053466796875, -1.967864990234375, -1.88226318359375, -1.796661376953125, -1.7110595703125, -1.625457763671875, -1.53985595703125, -1.454254150390625, -1.36865234375, -1.283050537109375, -1.19744873046875, -1.111846923828125, -1.0262451171875, -0.940643310546875, -0.85504150390625, -0.769439697265625, -0.683837890625, -0.598236083984375, -0.51263427734375, -0.427032470703125, -0.3414306640625, -0.255828857421875, -0.17022705078125, -0.084625244140625, 0.0009765625, 0.086578369140625, 0.17218017578125, 0.257781982421875, 0.3433837890625, 0.428985595703125, 0.51458740234375, 0.600189208984375, 0.685791015625, 0.771392822265625, 0.85699462890625, 0.942596435546875, 1.0281982421875, 1.113800048828125, 1.19940185546875, 1.285003662109375, 1.37060546875, 1.456207275390625, 1.54180908203125, 1.627410888671875, 1.7130126953125, 1.798614501953125, 1.88421630859375, 1.969818115234375, 2.055419921875, 2.141021728515625, 2.22662353515625, 2.312225341796875, 2.3978271484375, 2.483428955078125, 2.56903076171875, 2.654632568359375, 2.740234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 6.0, 15.0, 21.0, 27.0, 27.0, 41.0, 61.0, 93.0, 124.0, 169.0, 251.0, 329.0, 587.0, 945.0, 1521.0, 2737.0, 5064.0, 9963.0, 19994.0, 40800.0, 85489.0, 177633.0, 295647.0, 208212.0, 101115.0, 48504.0, 23562.0, 11595.0, 6008.0, 3279.0, 1801.0, 991.0, 644.0, 410.0, 275.0, 170.0, 137.0, 97.0, 36.0, 38.0, 39.0, 25.0, 22.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.03515625, -12.609375, -12.18359375, -11.7578125, -11.33203125, -10.90625, -10.48046875, -10.0546875, -9.62890625, -9.203125, -8.77734375, -8.3515625, -7.92578125, -7.5, -7.07421875, -6.6484375, -6.22265625, -5.796875, -5.37109375, -4.9453125, -4.51953125, -4.09375, -3.66796875, -3.2421875, -2.81640625, -2.390625, -1.96484375, -1.5390625, -1.11328125, -0.6875, -0.26171875, 0.1640625, 0.58984375, 1.015625, 1.44140625, 1.8671875, 2.29296875, 2.71875, 3.14453125, 3.5703125, 3.99609375, 4.421875, 4.84765625, 5.2734375, 5.69921875, 6.125, 6.55078125, 6.9765625, 7.40234375, 7.828125, 8.25390625, 8.6796875, 9.10546875, 9.53125, 9.95703125, 10.3828125, 10.80859375, 11.234375, 11.66015625, 12.0859375, 12.51171875, 12.9375, 13.36328125, 13.7890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 10.0, 13.0, 17.0, 16.0, 22.0, 27.0, 14.0, 35.0, 35.0, 31.0, 33.0, 36.0, 40.0, 52.0, 35.0, 40.0, 59.0, 51.0, 34.0, 43.0, 46.0, 37.0, 32.0, 29.0, 30.0, 26.0, 28.0, 24.0, 11.0, 15.0, 9.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.3494873046875, -13.870849609375, -13.3922119140625, -12.91357421875, -12.4349365234375, -11.956298828125, -11.4776611328125, -10.9990234375, -10.5203857421875, -10.041748046875, -9.5631103515625, -9.08447265625, -8.6058349609375, -8.127197265625, -7.6485595703125, -7.169921875, -6.6912841796875, -6.212646484375, -5.7340087890625, -5.25537109375, -4.7767333984375, -4.298095703125, -3.8194580078125, -3.3408203125, -2.8621826171875, -2.383544921875, -1.9049072265625, -1.42626953125, -0.9476318359375, -0.468994140625, 0.0096435546875, 0.48828125, 0.9669189453125, 1.445556640625, 1.9241943359375, 2.40283203125, 2.8814697265625, 3.360107421875, 3.8387451171875, 4.3173828125, 4.7960205078125, 5.274658203125, 5.7532958984375, 6.23193359375, 6.7105712890625, 7.189208984375, 7.6678466796875, 8.146484375, 8.6251220703125, 9.103759765625, 9.5823974609375, 10.06103515625, 10.5396728515625, 11.018310546875, 11.4969482421875, 11.9755859375, 12.4542236328125, 12.932861328125, 13.4114990234375, 13.89013671875, 14.3687744140625, 14.847412109375, 15.3260498046875, 15.8046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 12.0, 11.0, 11.0, 26.0, 39.0, 44.0, 59.0, 104.0, 163.0, 274.0, 474.0, 756.0, 1289.0, 2324.0, 4724.0, 9892.0, 23415.0, 60132.0, 207239.0, 490990.0, 158714.0, 49973.0, 20046.0, 8692.0, 4105.0, 2187.0, 1103.0, 646.0, 419.0, 247.0, 142.0, 99.0, 60.0, 46.0, 29.0, 19.0, 16.0, 8.0, 8.0, 11.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.4765625, -15.0133056640625, -14.550048828125, -14.0867919921875, -13.62353515625, -13.1602783203125, -12.697021484375, -12.2337646484375, -11.7705078125, -11.3072509765625, -10.843994140625, -10.3807373046875, -9.91748046875, -9.4542236328125, -8.990966796875, -8.5277099609375, -8.064453125, -7.6011962890625, -7.137939453125, -6.6746826171875, -6.21142578125, -5.7481689453125, -5.284912109375, -4.8216552734375, -4.3583984375, -3.8951416015625, -3.431884765625, -2.9686279296875, -2.50537109375, -2.0421142578125, -1.578857421875, -1.1156005859375, -0.65234375, -0.1890869140625, 0.274169921875, 0.7374267578125, 1.20068359375, 1.6639404296875, 2.127197265625, 2.5904541015625, 3.0537109375, 3.5169677734375, 3.980224609375, 4.4434814453125, 4.90673828125, 5.3699951171875, 5.833251953125, 6.2965087890625, 6.759765625, 7.2230224609375, 7.686279296875, 8.1495361328125, 8.61279296875, 9.0760498046875, 9.539306640625, 10.0025634765625, 10.4658203125, 10.9290771484375, 11.392333984375, 11.8555908203125, 12.31884765625, 12.7821044921875, 13.245361328125, 13.7086181640625, 14.171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 20.0, 17.0, 26.0, 35.0, 40.0, 49.0, 95.0, 126.0, 168.0, 107.0, 65.0, 46.0, 34.0, 39.0, 33.0, 16.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00421905517578125, -0.00408405065536499, -0.0039490461349487305, -0.0038140416145324707, -0.003679037094116211, -0.003544032573699951, -0.0034090280532836914, -0.0032740235328674316, -0.003139019012451172, -0.003004014492034912, -0.0028690099716186523, -0.0027340054512023926, -0.002599000930786133, -0.002463996410369873, -0.0023289918899536133, -0.0021939873695373535, -0.0020589828491210938, -0.001923978328704834, -0.0017889738082885742, -0.0016539692878723145, -0.0015189647674560547, -0.001383960247039795, -0.0012489557266235352, -0.0011139512062072754, -0.0009789466857910156, -0.0008439421653747559, -0.0007089376449584961, -0.0005739331245422363, -0.00043892860412597656, -0.0003039240837097168, -0.00016891956329345703, -3.3915042877197266e-05, 0.0001010894775390625, 0.00023609399795532227, 0.00037109851837158203, 0.0005061030387878418, 0.0006411075592041016, 0.0007761120796203613, 0.0009111166000366211, 0.0010461211204528809, 0.0011811256408691406, 0.0013161301612854004, 0.0014511346817016602, 0.00158613920211792, 0.0017211437225341797, 0.0018561482429504395, 0.0019911527633666992, 0.002126157283782959, 0.0022611618041992188, 0.0023961663246154785, 0.0025311708450317383, 0.002666175365447998, 0.002801179885864258, 0.0029361844062805176, 0.0030711889266967773, 0.003206193447113037, 0.003341197967529297, 0.0034762024879455566, 0.0036112070083618164, 0.003746211528778076, 0.003881216049194336, 0.004016220569610596, 0.0041512250900268555, 0.004286229610443115, 0.004421234130859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 13.0, 25.0, 22.0, 53.0, 73.0, 109.0, 193.0, 326.0, 642.0, 1273.0, 2502.0, 5511.0, 12860.0, 33892.0, 112896.0, 560409.0, 230413.0, 53543.0, 19067.0, 7695.0, 3439.0, 1716.0, 820.0, 438.0, 237.0, 149.0, 79.0, 51.0, 32.0, 21.0, 8.0, 11.0, 6.0, 3.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.756103515625, -18.19970703125, -17.643310546875, -17.0869140625, -16.530517578125, -15.97412109375, -15.417724609375, -14.861328125, -14.304931640625, -13.74853515625, -13.192138671875, -12.6357421875, -12.079345703125, -11.52294921875, -10.966552734375, -10.41015625, -9.853759765625, -9.29736328125, -8.740966796875, -8.1845703125, -7.628173828125, -7.07177734375, -6.515380859375, -5.958984375, -5.402587890625, -4.84619140625, -4.289794921875, -3.7333984375, -3.177001953125, -2.62060546875, -2.064208984375, -1.5078125, -0.951416015625, -0.39501953125, 0.161376953125, 0.7177734375, 1.274169921875, 1.83056640625, 2.386962890625, 2.943359375, 3.499755859375, 4.05615234375, 4.612548828125, 5.1689453125, 5.725341796875, 6.28173828125, 6.838134765625, 7.39453125, 7.950927734375, 8.50732421875, 9.063720703125, 9.6201171875, 10.176513671875, 10.73291015625, 11.289306640625, 11.845703125, 12.402099609375, 12.95849609375, 13.514892578125, 14.0712890625, 14.627685546875, 15.18408203125, 15.740478515625, 16.296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 11.0, 8.0, 18.0, 22.0, 17.0, 26.0, 29.0, 52.0, 82.0, 100.0, 111.0, 123.0, 80.0, 68.0, 44.0, 29.0, 29.0, 16.0, 17.0, 15.0, 14.0, 8.0, 7.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.71875, -13.32421875, -12.9296875, -12.53515625, -12.140625, -11.74609375, -11.3515625, -10.95703125, -10.5625, -10.16796875, -9.7734375, -9.37890625, -8.984375, -8.58984375, -8.1953125, -7.80078125, -7.40625, -7.01171875, -6.6171875, -6.22265625, -5.828125, -5.43359375, -5.0390625, -4.64453125, -4.25, -3.85546875, -3.4609375, -3.06640625, -2.671875, -2.27734375, -1.8828125, -1.48828125, -1.09375, -0.69921875, -0.3046875, 0.08984375, 0.484375, 0.87890625, 1.2734375, 1.66796875, 2.0625, 2.45703125, 2.8515625, 3.24609375, 3.640625, 4.03515625, 4.4296875, 4.82421875, 5.21875, 5.61328125, 6.0078125, 6.40234375, 6.796875, 7.19140625, 7.5859375, 7.98046875, 8.375, 8.76953125, 9.1640625, 9.55859375, 9.953125, 10.34765625, 10.7421875, 11.13671875, 11.53125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 13.0, 19.0, 34.0, 47.0, 65.0, 87.0, 102.0, 126.0, 127.0, 102.0, 96.0, 62.0, 41.0, 13.0, 22.0, 12.0, 7.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.1421661376953, -171.5607452392578, -165.97933959960938, -160.39791870117188, -154.81649780273438, -149.23507690429688, -143.65365600585938, -138.07225036621094, -132.49082946777344, -126.90940856933594, -121.32799530029297, -115.74658203125, -110.1651611328125, -104.583740234375, -99.00232696533203, -93.42091369628906, -87.83949279785156, -82.25807189941406, -76.6766586303711, -71.09524536132812, -65.51382446289062, -59.93240737915039, -54.350990295410156, -48.76957321166992, -43.18815612792969, -37.60673904418945, -32.02532196044922, -26.443904876708984, -20.86248779296875, -15.281070709228516, -9.699653625488281, -4.118236541748047, 1.46319580078125, 7.044612884521484, 12.626029968261719, 18.207447052001953, 23.788864135742188, 29.370281219482422, 34.951698303222656, 40.53311538696289, 46.114532470703125, 51.69594955444336, 57.277366638183594, 62.85878372192383, 68.44020080566406, 74.02162170410156, 79.60303497314453, 85.1844482421875, 90.765869140625, 96.3472900390625, 101.92870330810547, 107.51011657714844, 113.09153747558594, 118.67295837402344, 124.2543716430664, 129.83578491210938, 135.41720581054688, 140.99862670898438, 146.58004760742188, 152.1614532470703, 157.7428741455078, 163.3242950439453, 168.90570068359375, 174.48712158203125, 180.06854248046875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 7.0, 16.0, 12.0, 18.0, 10.0, 21.0, 23.0, 26.0, 38.0, 33.0, 39.0, 31.0, 35.0, 36.0, 46.0, 47.0, 44.0, 48.0, 36.0, 39.0, 42.0, 25.0, 39.0, 42.0, 35.0, 31.0, 27.0, 27.0, 22.0, 16.0, 18.0, 12.0, 9.0, 7.0, 8.0, 10.0, 3.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-88.88740539550781, -86.19448852539062, -83.50157928466797, -80.80866241455078, -78.11575317382812, -75.42283630371094, -72.72992706298828, -70.0370101928711, -67.34410095214844, -64.65118408203125, -61.958274841308594, -59.26536178588867, -56.57244873046875, -53.87953567504883, -51.186622619628906, -48.49370574951172, -45.8007926940918, -43.107879638671875, -40.41496658325195, -37.72205352783203, -35.02914047241211, -32.33622741699219, -29.643312454223633, -26.95039939880371, -24.25748634338379, -21.564573287963867, -18.871660232543945, -16.17874526977539, -13.485833168029785, -10.792920112609863, -8.100006103515625, -5.407093048095703, -2.7141799926757812, -0.021266698837280273, 2.6716465950012207, 5.364560127258301, 8.057473182678223, 10.750386238098145, 13.443300247192383, 16.136213302612305, 18.829126358032227, 21.52203941345215, 24.21495246887207, 26.907867431640625, 29.600780487060547, 32.29369354248047, 34.98660659790039, 37.67951965332031, 40.372432708740234, 43.065345764160156, 45.75825881958008, 48.451171875, 51.14408493041992, 53.836997985839844, 56.52991485595703, 59.22282409667969, 61.915740966796875, 64.60865783691406, 67.30156707763672, 69.9944839477539, 72.68739318847656, 75.38031005859375, 78.0732192993164, 80.7661361694336, 83.45904541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 12.0, 15.0, 28.0, 36.0, 67.0, 113.0, 183.0, 294.0, 571.0, 1116.0, 2356.0, 4994.0, 12271.0, 34586.0, 126741.0, 2600409.0, 1248922.0, 110593.0, 30738.0, 11240.0, 4628.0, 2102.0, 1025.0, 519.0, 277.0, 159.0, 86.0, 73.0, 45.0, 20.0, 17.0, 10.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.048828125, -15.37890625, -14.708984375, -14.0390625, -13.369140625, -12.69921875, -12.029296875, -11.359375, -10.689453125, -10.01953125, -9.349609375, -8.6796875, -8.009765625, -7.33984375, -6.669921875, -6.0, -5.330078125, -4.66015625, -3.990234375, -3.3203125, -2.650390625, -1.98046875, -1.310546875, -0.640625, 0.029296875, 0.69921875, 1.369140625, 2.0390625, 2.708984375, 3.37890625, 4.048828125, 4.71875, 5.388671875, 6.05859375, 6.728515625, 7.3984375, 8.068359375, 8.73828125, 9.408203125, 10.078125, 10.748046875, 11.41796875, 12.087890625, 12.7578125, 13.427734375, 14.09765625, 14.767578125, 15.4375, 16.107421875, 16.77734375, 17.447265625, 18.1171875, 18.787109375, 19.45703125, 20.126953125, 20.796875, 21.466796875, 22.13671875, 22.806640625, 23.4765625, 24.146484375, 24.81640625, 25.486328125, 26.15625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 18.0, 18.0, 18.0, 18.0, 32.0, 46.0, 28.0, 38.0, 41.0, 48.0, 25.0, 47.0, 51.0, 46.0, 45.0, 57.0, 41.0, 37.0, 34.0, 34.0, 43.0, 33.0, 27.0, 23.0, 20.0, 19.0, 18.0, 16.0, 10.0, 9.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.736328125, -2.638671875, -2.541015625, -2.443359375, -2.345703125, -2.248046875, -2.150390625, -2.052734375, -1.955078125, -1.857421875, -1.759765625, -1.662109375, -1.564453125, -1.466796875, -1.369140625, -1.271484375, -1.173828125, -1.076171875, -0.978515625, -0.880859375, -0.783203125, -0.685546875, -0.587890625, -0.490234375, -0.392578125, -0.294921875, -0.197265625, -0.099609375, -0.001953125, 0.095703125, 0.193359375, 0.291015625, 0.388671875, 0.486328125, 0.583984375, 0.681640625, 0.779296875, 0.876953125, 0.974609375, 1.072265625, 1.169921875, 1.267578125, 1.365234375, 1.462890625, 1.560546875, 1.658203125, 1.755859375, 1.853515625, 1.951171875, 2.048828125, 2.146484375, 2.244140625, 2.341796875, 2.439453125, 2.537109375, 2.634765625, 2.732421875, 2.830078125, 2.927734375, 3.025390625, 3.123046875, 3.220703125, 3.318359375, 3.416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 17.0, 32.0, 27.0, 60.0, 119.0, 194.0, 377.0, 762.0, 1471.0, 3189.0, 7062.0, 17671.0, 49779.0, 183279.0, 2116916.0, 1564445.0, 170636.0, 48203.0, 17181.0, 6822.0, 2985.0, 1442.0, 733.0, 373.0, 221.0, 95.0, 75.0, 46.0, 14.0, 12.0, 13.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.359375, -13.734375, -13.109375, -12.484375, -11.859375, -11.234375, -10.609375, -9.984375, -9.359375, -8.734375, -8.109375, -7.484375, -6.859375, -6.234375, -5.609375, -4.984375, -4.359375, -3.734375, -3.109375, -2.484375, -1.859375, -1.234375, -0.609375, 0.015625, 0.640625, 1.265625, 1.890625, 2.515625, 3.140625, 3.765625, 4.390625, 5.015625, 5.640625, 6.265625, 6.890625, 7.515625, 8.140625, 8.765625, 9.390625, 10.015625, 10.640625, 11.265625, 11.890625, 12.515625, 13.140625, 13.765625, 14.390625, 15.015625, 15.640625, 16.265625, 16.890625, 17.515625, 18.140625, 18.765625, 19.390625, 20.015625, 20.640625, 21.265625, 21.890625, 22.515625, 23.140625, 23.765625, 24.390625, 25.015625, 25.640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 14.0, 4.0, 17.0, 14.0, 27.0, 38.0, 62.0, 72.0, 117.0, 175.0, 270.0, 455.0, 1224.0, 600.0, 293.0, 185.0, 124.0, 87.0, 63.0, 59.0, 41.0, 20.0, 15.0, 20.0, 14.0, 7.0, 6.0, 9.0, 9.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-8.7421875, -8.4969482421875, -8.251708984375, -8.0064697265625, -7.76123046875, -7.5159912109375, -7.270751953125, -7.0255126953125, -6.7802734375, -6.5350341796875, -6.289794921875, -6.0445556640625, -5.79931640625, -5.5540771484375, -5.308837890625, -5.0635986328125, -4.818359375, -4.5731201171875, -4.327880859375, -4.0826416015625, -3.83740234375, -3.5921630859375, -3.346923828125, -3.1016845703125, -2.8564453125, -2.6112060546875, -2.365966796875, -2.1207275390625, -1.87548828125, -1.6302490234375, -1.385009765625, -1.1397705078125, -0.89453125, -0.6492919921875, -0.404052734375, -0.1588134765625, 0.08642578125, 0.3316650390625, 0.576904296875, 0.8221435546875, 1.0673828125, 1.3126220703125, 1.557861328125, 1.8031005859375, 2.04833984375, 2.2935791015625, 2.538818359375, 2.7840576171875, 3.029296875, 3.2745361328125, 3.519775390625, 3.7650146484375, 4.01025390625, 4.2554931640625, 4.500732421875, 4.7459716796875, 4.9912109375, 5.2364501953125, 5.481689453125, 5.7269287109375, 5.97216796875, 6.2174072265625, 6.462646484375, 6.7078857421875, 6.953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 16.0, 29.0, 52.0, 90.0, 133.0, 161.0, 165.0, 115.0, 98.0, 67.0, 35.0, 13.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.73023986816406, -73.04025268554688, -70.35027313232422, -67.66028594970703, -64.97030639648438, -62.28031921386719, -59.59033203125, -56.90034866333008, -54.210365295410156, -51.520381927490234, -48.83039855957031, -46.140411376953125, -43.4504280090332, -40.76044464111328, -38.070457458496094, -35.38047409057617, -32.69049072265625, -30.000507354736328, -27.310522079467773, -24.62053680419922, -21.930553436279297, -19.240570068359375, -16.55058479309082, -13.860599517822266, -11.170616149902344, -8.480631828308105, -5.790647506713867, -3.100663185119629, -0.4106788635253906, 2.2793054580688477, 4.969289779663086, 7.659275054931641, 10.349266052246094, 13.039250373840332, 15.72923469543457, 18.419219970703125, 21.109203338623047, 23.79918670654297, 26.489171981811523, 29.179157257080078, 31.869140625, 34.55912399291992, 37.249107360839844, 39.93909454345703, 42.62907791137695, 45.319061279296875, 48.00904846191406, 50.699031829833984, 53.389015197753906, 56.07899856567383, 58.76898193359375, 61.45896911621094, 64.14895629882812, 66.83893585205078, 69.52892303466797, 72.21890258789062, 74.90888977050781, 77.598876953125, 80.28885650634766, 82.97884368896484, 85.6688232421875, 88.35881042480469, 91.04879760742188, 93.73878479003906, 96.42876434326172]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 9.0, 10.0, 11.0, 8.0, 10.0, 17.0, 12.0, 13.0, 22.0, 17.0, 16.0, 33.0, 32.0, 31.0, 41.0, 45.0, 49.0, 37.0, 40.0, 35.0, 49.0, 45.0, 34.0, 48.0, 40.0, 35.0, 37.0, 27.0, 26.0, 22.0, 25.0, 20.0, 23.0, 18.0, 11.0, 12.0, 10.0, 1.0, 6.0, 4.0, 9.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.12439727783203, -31.17691993713379, -30.229442596435547, -29.281965255737305, -28.334487915039062, -27.38701057434082, -26.439533233642578, -25.492055892944336, -24.544578552246094, -23.59710121154785, -22.64962387084961, -21.702146530151367, -20.754669189453125, -19.807191848754883, -18.85971450805664, -17.9122371673584, -16.964759826660156, -16.017282485961914, -15.069805145263672, -14.12232780456543, -13.174850463867188, -12.227373123168945, -11.279895782470703, -10.332418441772461, -9.384943008422852, -8.43746566772461, -7.489988327026367, -6.542510986328125, -5.595033645629883, -4.647556781768799, -3.7000794410705566, -2.7526021003723145, -1.805124282836914, -0.8576470017433167, 0.08983027935028076, 1.0373075008392334, 1.9847848415374756, 2.9322619438171387, 3.879739284515381, 4.827216625213623, 5.774693965911865, 6.722171306610107, 7.66964864730835, 8.617125511169434, 9.564602851867676, 10.512080192565918, 11.45955753326416, 12.407034873962402, 13.354512214660645, 14.301989555358887, 15.249466896057129, 16.196943283081055, 17.144420623779297, 18.09189796447754, 19.03937530517578, 19.986852645874023, 20.934329986572266, 21.881807327270508, 22.82928466796875, 23.776762008666992, 24.724239349365234, 25.671716690063477, 26.61919403076172, 27.56667137145996, 28.514148712158203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 9.0, 10.0, 9.0, 16.0, 27.0, 45.0, 66.0, 94.0, 140.0, 210.0, 373.0, 524.0, 960.0, 1614.0, 2728.0, 4881.0, 8943.0, 17660.0, 36470.0, 81228.0, 213430.0, 377425.0, 170431.0, 67331.0, 30738.0, 15020.0, 7851.0, 4216.0, 2451.0, 1405.0, 819.0, 496.0, 302.0, 236.0, 116.0, 84.0, 50.0, 42.0, 38.0, 18.0, 11.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.828125, -16.30859375, -15.7890625, -15.26953125, -14.75, -14.23046875, -13.7109375, -13.19140625, -12.671875, -12.15234375, -11.6328125, -11.11328125, -10.59375, -10.07421875, -9.5546875, -9.03515625, -8.515625, -7.99609375, -7.4765625, -6.95703125, -6.4375, -5.91796875, -5.3984375, -4.87890625, -4.359375, -3.83984375, -3.3203125, -2.80078125, -2.28125, -1.76171875, -1.2421875, -0.72265625, -0.203125, 0.31640625, 0.8359375, 1.35546875, 1.875, 2.39453125, 2.9140625, 3.43359375, 3.953125, 4.47265625, 4.9921875, 5.51171875, 6.03125, 6.55078125, 7.0703125, 7.58984375, 8.109375, 8.62890625, 9.1484375, 9.66796875, 10.1875, 10.70703125, 11.2265625, 11.74609375, 12.265625, 12.78515625, 13.3046875, 13.82421875, 14.34375, 14.86328125, 15.3828125, 15.90234375, 16.421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 7.0, 3.0, 11.0, 25.0, 28.0, 25.0, 24.0, 26.0, 22.0, 33.0, 43.0, 27.0, 42.0, 25.0, 44.0, 43.0, 39.0, 46.0, 44.0, 38.0, 35.0, 36.0, 28.0, 41.0, 24.0, 27.0, 23.0, 27.0, 15.0, 13.0, 18.0, 14.0, 15.0, 9.0, 8.0, 16.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.919921875, -2.831573486328125, -2.74322509765625, -2.654876708984375, -2.5665283203125, -2.478179931640625, -2.38983154296875, -2.301483154296875, -2.213134765625, -2.124786376953125, -2.03643798828125, -1.948089599609375, -1.8597412109375, -1.771392822265625, -1.68304443359375, -1.594696044921875, -1.50634765625, -1.417999267578125, -1.32965087890625, -1.241302490234375, -1.1529541015625, -1.064605712890625, -0.97625732421875, -0.887908935546875, -0.799560546875, -0.711212158203125, -0.62286376953125, -0.534515380859375, -0.4461669921875, -0.357818603515625, -0.26947021484375, -0.181121826171875, -0.0927734375, -0.004425048828125, 0.08392333984375, 0.172271728515625, 0.2606201171875, 0.348968505859375, 0.43731689453125, 0.525665283203125, 0.614013671875, 0.702362060546875, 0.79071044921875, 0.879058837890625, 0.9674072265625, 1.055755615234375, 1.14410400390625, 1.232452392578125, 1.32080078125, 1.409149169921875, 1.49749755859375, 1.585845947265625, 1.6741943359375, 1.762542724609375, 1.85089111328125, 1.939239501953125, 2.027587890625, 2.115936279296875, 2.20428466796875, 2.292633056640625, 2.3809814453125, 2.469329833984375, 2.55767822265625, 2.646026611328125, 2.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 7.0, 14.0, 16.0, 14.0, 28.0, 17.0, 30.0, 52.0, 67.0, 97.0, 161.0, 244.0, 423.0, 749.0, 1401.0, 2973.0, 6376.0, 15391.0, 41125.0, 139531.0, 541202.0, 208781.0, 54695.0, 19530.0, 7951.0, 3698.0, 1738.0, 915.0, 513.0, 265.0, 177.0, 120.0, 66.0, 48.0, 44.0, 25.0, 22.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -17.970703125, -17.26953125, -16.568359375, -15.8671875, -15.166015625, -14.46484375, -13.763671875, -13.0625, -12.361328125, -11.66015625, -10.958984375, -10.2578125, -9.556640625, -8.85546875, -8.154296875, -7.453125, -6.751953125, -6.05078125, -5.349609375, -4.6484375, -3.947265625, -3.24609375, -2.544921875, -1.84375, -1.142578125, -0.44140625, 0.259765625, 0.9609375, 1.662109375, 2.36328125, 3.064453125, 3.765625, 4.466796875, 5.16796875, 5.869140625, 6.5703125, 7.271484375, 7.97265625, 8.673828125, 9.375, 10.076171875, 10.77734375, 11.478515625, 12.1796875, 12.880859375, 13.58203125, 14.283203125, 14.984375, 15.685546875, 16.38671875, 17.087890625, 17.7890625, 18.490234375, 19.19140625, 19.892578125, 20.59375, 21.294921875, 21.99609375, 22.697265625, 23.3984375, 24.099609375, 24.80078125, 25.501953125, 26.203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 7.0, 7.0, 12.0, 15.0, 12.0, 9.0, 26.0, 15.0, 16.0, 31.0, 34.0, 40.0, 50.0, 47.0, 61.0, 42.0, 52.0, 52.0, 42.0, 51.0, 48.0, 42.0, 41.0, 33.0, 38.0, 37.0, 20.0, 27.0, 8.0, 12.0, 14.0, 4.0, 11.0, 6.0, 1.0, 6.0, 7.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.640625, -17.09228515625, -16.5439453125, -15.99560546875, -15.447265625, -14.89892578125, -14.3505859375, -13.80224609375, -13.25390625, -12.70556640625, -12.1572265625, -11.60888671875, -11.060546875, -10.51220703125, -9.9638671875, -9.41552734375, -8.8671875, -8.31884765625, -7.7705078125, -7.22216796875, -6.673828125, -6.12548828125, -5.5771484375, -5.02880859375, -4.48046875, -3.93212890625, -3.3837890625, -2.83544921875, -2.287109375, -1.73876953125, -1.1904296875, -0.64208984375, -0.09375, 0.45458984375, 1.0029296875, 1.55126953125, 2.099609375, 2.64794921875, 3.1962890625, 3.74462890625, 4.29296875, 4.84130859375, 5.3896484375, 5.93798828125, 6.486328125, 7.03466796875, 7.5830078125, 8.13134765625, 8.6796875, 9.22802734375, 9.7763671875, 10.32470703125, 10.873046875, 11.42138671875, 11.9697265625, 12.51806640625, 13.06640625, 13.61474609375, 14.1630859375, 14.71142578125, 15.259765625, 15.80810546875, 16.3564453125, 16.90478515625, 17.453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 11.0, 20.0, 32.0, 62.0, 127.0, 319.0, 803.0, 3049.0, 16371.0, 113289.0, 803203.0, 93412.0, 13870.0, 2674.0, 739.0, 261.0, 134.0, 75.0, 36.0, 23.0, 19.0, 6.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.78125, -31.950439453125, -31.11962890625, -30.288818359375, -29.4580078125, -28.627197265625, -27.79638671875, -26.965576171875, -26.134765625, -25.303955078125, -24.47314453125, -23.642333984375, -22.8115234375, -21.980712890625, -21.14990234375, -20.319091796875, -19.48828125, -18.657470703125, -17.82666015625, -16.995849609375, -16.1650390625, -15.334228515625, -14.50341796875, -13.672607421875, -12.841796875, -12.010986328125, -11.18017578125, -10.349365234375, -9.5185546875, -8.687744140625, -7.85693359375, -7.026123046875, -6.1953125, -5.364501953125, -4.53369140625, -3.702880859375, -2.8720703125, -2.041259765625, -1.21044921875, -0.379638671875, 0.451171875, 1.281982421875, 2.11279296875, 2.943603515625, 3.7744140625, 4.605224609375, 5.43603515625, 6.266845703125, 7.09765625, 7.928466796875, 8.75927734375, 9.590087890625, 10.4208984375, 11.251708984375, 12.08251953125, 12.913330078125, 13.744140625, 14.574951171875, 15.40576171875, 16.236572265625, 17.0673828125, 17.898193359375, 18.72900390625, 19.559814453125, 20.390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 5.0, 2.0, 6.0, 16.0, 8.0, 17.0, 19.0, 21.0, 40.0, 47.0, 98.0, 158.0, 164.0, 130.0, 61.0, 33.0, 33.0, 15.0, 23.0, 15.0, 8.0, 12.0, 9.0, 9.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.003582000732421875, -0.003480374813079834, -0.003378748893737793, -0.003277122974395752, -0.003175497055053711, -0.00307387113571167, -0.002972245216369629, -0.002870619297027588, -0.002768993377685547, -0.002667367458343506, -0.002565741539001465, -0.002464115619659424, -0.002362489700317383, -0.002260863780975342, -0.0021592378616333008, -0.0020576119422912598, -0.0019559860229492188, -0.0018543601036071777, -0.0017527341842651367, -0.0016511082649230957, -0.0015494823455810547, -0.0014478564262390137, -0.0013462305068969727, -0.0012446045875549316, -0.0011429786682128906, -0.0010413527488708496, -0.0009397268295288086, -0.0008381009101867676, -0.0007364749908447266, -0.0006348490715026855, -0.0005332231521606445, -0.0004315972328186035, -0.0003299713134765625, -0.00022834539413452148, -0.00012671947479248047, -2.5093555450439453e-05, 7.653236389160156e-05, 0.00017815828323364258, 0.0002797842025756836, 0.0003814101219177246, 0.0004830360412597656, 0.0005846619606018066, 0.0006862878799438477, 0.0007879137992858887, 0.0008895397186279297, 0.0009911656379699707, 0.0010927915573120117, 0.0011944174766540527, 0.0012960433959960938, 0.0013976693153381348, 0.0014992952346801758, 0.0016009211540222168, 0.0017025470733642578, 0.0018041729927062988, 0.0019057989120483398, 0.002007424831390381, 0.002109050750732422, 0.002210676670074463, 0.002312302589416504, 0.002413928508758545, 0.002515554428100586, 0.002617180347442627, 0.002718806266784668, 0.002820432186126709, 0.00292205810546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 13.0, 9.0, 12.0, 16.0, 29.0, 44.0, 88.0, 117.0, 216.0, 389.0, 708.0, 1784.0, 4917.0, 19016.0, 100055.0, 784166.0, 107904.0, 20364.0, 5169.0, 1756.0, 774.0, 430.0, 227.0, 139.0, 79.0, 41.0, 25.0, 14.0, 10.0, 14.0, 9.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.4375, -22.73828125, -22.0390625, -21.33984375, -20.640625, -19.94140625, -19.2421875, -18.54296875, -17.84375, -17.14453125, -16.4453125, -15.74609375, -15.046875, -14.34765625, -13.6484375, -12.94921875, -12.25, -11.55078125, -10.8515625, -10.15234375, -9.453125, -8.75390625, -8.0546875, -7.35546875, -6.65625, -5.95703125, -5.2578125, -4.55859375, -3.859375, -3.16015625, -2.4609375, -1.76171875, -1.0625, -0.36328125, 0.3359375, 1.03515625, 1.734375, 2.43359375, 3.1328125, 3.83203125, 4.53125, 5.23046875, 5.9296875, 6.62890625, 7.328125, 8.02734375, 8.7265625, 9.42578125, 10.125, 10.82421875, 11.5234375, 12.22265625, 12.921875, 13.62109375, 14.3203125, 15.01953125, 15.71875, 16.41796875, 17.1171875, 17.81640625, 18.515625, 19.21484375, 19.9140625, 20.61328125, 21.3125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 4.0, 9.0, 14.0, 7.0, 17.0, 12.0, 33.0, 40.0, 57.0, 118.0, 191.0, 173.0, 100.0, 57.0, 39.0, 22.0, 18.0, 18.0, 12.0, 8.0, 10.0, 4.0, 4.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.3648681640625, -10.925048828125, -10.4852294921875, -10.04541015625, -9.6055908203125, -9.165771484375, -8.7259521484375, -8.2861328125, -7.8463134765625, -7.406494140625, -6.9666748046875, -6.52685546875, -6.0870361328125, -5.647216796875, -5.2073974609375, -4.767578125, -4.3277587890625, -3.887939453125, -3.4481201171875, -3.00830078125, -2.5684814453125, -2.128662109375, -1.6888427734375, -1.2490234375, -0.8092041015625, -0.369384765625, 0.0704345703125, 0.51025390625, 0.9500732421875, 1.389892578125, 1.8297119140625, 2.26953125, 2.7093505859375, 3.149169921875, 3.5889892578125, 4.02880859375, 4.4686279296875, 4.908447265625, 5.3482666015625, 5.7880859375, 6.2279052734375, 6.667724609375, 7.1075439453125, 7.54736328125, 7.9871826171875, 8.427001953125, 8.8668212890625, 9.306640625, 9.7464599609375, 10.186279296875, 10.6260986328125, 11.06591796875, 11.5057373046875, 11.945556640625, 12.3853759765625, 12.8251953125, 13.2650146484375, 13.704833984375, 14.1446533203125, 14.58447265625, 15.0242919921875, 15.464111328125, 15.9039306640625, 16.34375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 21.0, 45.0, 80.0, 134.0, 218.0, 200.0, 119.0, 86.0, 43.0, 24.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-179.44461059570312, -171.34413146972656, -163.24366760253906, -155.1431884765625, -147.042724609375, -138.94224548339844, -130.84176635742188, -122.74130249023438, -114.64083099365234, -106.54035949707031, -98.43988800048828, -90.33941650390625, -82.23893737792969, -74.13847351074219, -66.03799438476562, -57.937522888183594, -49.83705139160156, -41.73657989501953, -33.6361083984375, -25.535633087158203, -17.435161590576172, -9.33469009399414, -1.2342147827148438, 6.8662567138671875, 14.966728210449219, 23.06719970703125, 31.167673110961914, 39.26814651489258, 47.36861801147461, 55.46908950805664, 63.56956481933594, 71.67003631591797, 79.7705078125, 87.87097930908203, 95.97145080566406, 104.07192993164062, 112.17239379882812, 120.27287292480469, 128.37335205078125, 136.47381591796875, 144.57427978515625, 152.6747589111328, 160.7752227783203, 168.87570190429688, 176.97616577148438, 185.07664489746094, 193.1771240234375, 201.277587890625, 209.37806701660156, 217.47854614257812, 225.57901000976562, 233.6794891357422, 241.7799530029297, 249.88043212890625, 257.98089599609375, 266.08135986328125, 274.1818542480469, 282.2823181152344, 290.3828125, 298.4832763671875, 306.583740234375, 314.6842041015625, 322.7846984863281, 330.8851623535156, 338.9856262207031]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 7.0, 6.0, 9.0, 13.0, 11.0, 28.0, 15.0, 20.0, 20.0, 26.0, 39.0, 24.0, 34.0, 29.0, 28.0, 46.0, 47.0, 52.0, 54.0, 39.0, 44.0, 43.0, 46.0, 37.0, 35.0, 37.0, 29.0, 38.0, 22.0, 19.0, 11.0, 14.0, 18.0, 12.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-92.78024291992188, -89.91456604003906, -87.04888916015625, -84.1832046508789, -81.3175277709961, -78.45185089111328, -75.58616638183594, -72.72048950195312, -69.85481262207031, -66.9891357421875, -64.12345886230469, -61.257774353027344, -58.39209747314453, -55.52642059326172, -52.66073989868164, -49.79505920410156, -46.92938232421875, -44.06370544433594, -41.19802474975586, -38.33234405517578, -35.46666717529297, -32.600990295410156, -29.735309600830078, -26.869630813598633, -24.003952026367188, -21.138273239135742, -18.272594451904297, -15.406915664672852, -12.541236877441406, -9.675558090209961, -6.809879302978516, -3.9442005157470703, -1.078521728515625, 1.7871570587158203, 4.652835845947266, 7.518514633178711, 10.384193420410156, 13.249872207641602, 16.115550994873047, 18.981229782104492, 21.846908569335938, 24.712587356567383, 27.578266143798828, 30.443944931030273, 33.30962371826172, 36.17530059814453, 39.04098129272461, 41.90666198730469, 44.7723388671875, 47.63801574707031, 50.50369644165039, 53.36937713623047, 56.23505401611328, 59.100730895996094, 61.96641159057617, 64.83209228515625, 67.69776916503906, 70.56344604492188, 73.42912292480469, 76.29480743408203, 79.16048431396484, 82.02616119384766, 84.891845703125, 87.75752258300781, 90.62319946289062]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 14.0, 27.0, 45.0, 52.0, 136.0, 216.0, 429.0, 853.0, 1893.0, 4382.0, 12165.0, 39820.0, 217237.0, 3643797.0, 213581.0, 39093.0, 12214.0, 4625.0, 1872.0, 847.0, 456.0, 216.0, 113.0, 68.0, 41.0, 19.0, 15.0, 11.0, 10.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.828125, -30.8779296875, -29.927734375, -28.9775390625, -28.02734375, -27.0771484375, -26.126953125, -25.1767578125, -24.2265625, -23.2763671875, -22.326171875, -21.3759765625, -20.42578125, -19.4755859375, -18.525390625, -17.5751953125, -16.625, -15.6748046875, -14.724609375, -13.7744140625, -12.82421875, -11.8740234375, -10.923828125, -9.9736328125, -9.0234375, -8.0732421875, -7.123046875, -6.1728515625, -5.22265625, -4.2724609375, -3.322265625, -2.3720703125, -1.421875, -0.4716796875, 0.478515625, 1.4287109375, 2.37890625, 3.3291015625, 4.279296875, 5.2294921875, 6.1796875, 7.1298828125, 8.080078125, 9.0302734375, 9.98046875, 10.9306640625, 11.880859375, 12.8310546875, 13.78125, 14.7314453125, 15.681640625, 16.6318359375, 17.58203125, 18.5322265625, 19.482421875, 20.4326171875, 21.3828125, 22.3330078125, 23.283203125, 24.2333984375, 25.18359375, 26.1337890625, 27.083984375, 28.0341796875, 28.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 8.0, 4.0, 9.0, 14.0, 21.0, 23.0, 18.0, 31.0, 30.0, 34.0, 37.0, 50.0, 67.0, 54.0, 56.0, 46.0, 54.0, 46.0, 50.0, 56.0, 34.0, 34.0, 29.0, 32.0, 22.0, 24.0, 14.0, 22.0, 14.0, 15.0, 8.0, 13.0, 6.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.116943359375, -3.98779296875, -3.858642578125, -3.7294921875, -3.600341796875, -3.47119140625, -3.342041015625, -3.212890625, -3.083740234375, -2.95458984375, -2.825439453125, -2.6962890625, -2.567138671875, -2.43798828125, -2.308837890625, -2.1796875, -2.050537109375, -1.92138671875, -1.792236328125, -1.6630859375, -1.533935546875, -1.40478515625, -1.275634765625, -1.146484375, -1.017333984375, -0.88818359375, -0.759033203125, -0.6298828125, -0.500732421875, -0.37158203125, -0.242431640625, -0.11328125, 0.015869140625, 0.14501953125, 0.274169921875, 0.4033203125, 0.532470703125, 0.66162109375, 0.790771484375, 0.919921875, 1.049072265625, 1.17822265625, 1.307373046875, 1.4365234375, 1.565673828125, 1.69482421875, 1.823974609375, 1.953125, 2.082275390625, 2.21142578125, 2.340576171875, 2.4697265625, 2.598876953125, 2.72802734375, 2.857177734375, 2.986328125, 3.115478515625, 3.24462890625, 3.373779296875, 3.5029296875, 3.632080078125, 3.76123046875, 3.890380859375, 4.01953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 9.0, 28.0, 27.0, 35.0, 40.0, 66.0, 99.0, 163.0, 200.0, 305.0, 386.0, 595.0, 997.0, 1527.0, 2770.0, 5114.0, 9919.0, 21197.0, 52553.0, 169172.0, 1506181.0, 2137915.0, 184023.0, 55608.0, 22327.0, 10274.0, 5246.0, 2731.0, 1704.0, 988.0, 667.0, 400.0, 292.0, 194.0, 140.0, 111.0, 71.0, 55.0, 35.0, 40.0, 20.0, 23.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.3125, -18.727783203125, -18.14306640625, -17.558349609375, -16.9736328125, -16.388916015625, -15.80419921875, -15.219482421875, -14.634765625, -14.050048828125, -13.46533203125, -12.880615234375, -12.2958984375, -11.711181640625, -11.12646484375, -10.541748046875, -9.95703125, -9.372314453125, -8.78759765625, -8.202880859375, -7.6181640625, -7.033447265625, -6.44873046875, -5.864013671875, -5.279296875, -4.694580078125, -4.10986328125, -3.525146484375, -2.9404296875, -2.355712890625, -1.77099609375, -1.186279296875, -0.6015625, -0.016845703125, 0.56787109375, 1.152587890625, 1.7373046875, 2.322021484375, 2.90673828125, 3.491455078125, 4.076171875, 4.660888671875, 5.24560546875, 5.830322265625, 6.4150390625, 6.999755859375, 7.58447265625, 8.169189453125, 8.75390625, 9.338623046875, 9.92333984375, 10.508056640625, 11.0927734375, 11.677490234375, 12.26220703125, 12.846923828125, 13.431640625, 14.016357421875, 14.60107421875, 15.185791015625, 15.7705078125, 16.355224609375, 16.93994140625, 17.524658203125, 18.109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 7.0, 14.0, 15.0, 16.0, 27.0, 37.0, 69.0, 96.0, 172.0, 354.0, 1496.0, 999.0, 335.0, 144.0, 95.0, 61.0, 39.0, 23.0, 24.0, 19.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.5382080078125, -9.170166015625, -8.8021240234375, -8.43408203125, -8.0660400390625, -7.697998046875, -7.3299560546875, -6.9619140625, -6.5938720703125, -6.225830078125, -5.8577880859375, -5.48974609375, -5.1217041015625, -4.753662109375, -4.3856201171875, -4.017578125, -3.6495361328125, -3.281494140625, -2.9134521484375, -2.54541015625, -2.1773681640625, -1.809326171875, -1.4412841796875, -1.0732421875, -0.7052001953125, -0.337158203125, 0.0308837890625, 0.39892578125, 0.7669677734375, 1.135009765625, 1.5030517578125, 1.87109375, 2.2391357421875, 2.607177734375, 2.9752197265625, 3.34326171875, 3.7113037109375, 4.079345703125, 4.4473876953125, 4.8154296875, 5.1834716796875, 5.551513671875, 5.9195556640625, 6.28759765625, 6.6556396484375, 7.023681640625, 7.3917236328125, 7.759765625, 8.1278076171875, 8.495849609375, 8.8638916015625, 9.23193359375, 9.5999755859375, 9.968017578125, 10.3360595703125, 10.7041015625, 11.0721435546875, 11.440185546875, 11.8082275390625, 12.17626953125, 12.5443115234375, 12.912353515625, 13.2803955078125, 13.6484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 13.0, 19.0, 37.0, 32.0, 64.0, 66.0, 96.0, 68.0, 83.0, 102.0, 95.0, 89.0, 62.0, 44.0, 45.0, 31.0, 19.0, 6.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-77.00627899169922, -75.25033569335938, -73.49440002441406, -71.73845672607422, -69.98251342773438, -68.22657012939453, -66.47063446044922, -64.71469116210938, -62.95874786376953, -61.20280838012695, -59.44686508178711, -57.69092559814453, -55.93498229980469, -54.17904281616211, -52.423099517822266, -50.66716003417969, -48.911216735839844, -47.155277252197266, -45.39933395385742, -43.643394470214844, -41.887451171875, -40.13151168823242, -38.37556838989258, -36.61962890625, -34.86368942260742, -33.107749938964844, -31.351806640625, -29.59586524963379, -27.839923858642578, -26.083984375, -24.328041076660156, -22.572101593017578, -20.816158294677734, -19.060216903686523, -17.304275512695312, -15.548334121704102, -13.79239273071289, -12.036452293395996, -10.280510902404785, -8.524569511413574, -6.768628120422363, -5.012686729431152, -3.2567455768585205, -1.5008044242858887, 0.25513696670532227, 2.011077880859375, 3.767019271850586, 5.522960662841797, 7.278902053833008, 9.034843444824219, 10.79078483581543, 12.54672622680664, 14.302667617797852, 16.058609008789062, 17.81454849243164, 19.570491790771484, 21.326431274414062, 23.082372665405273, 24.838314056396484, 26.594255447387695, 28.350196838378906, 30.106136322021484, 31.862079620361328, 33.618019104003906, 35.37396240234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 8.0, 10.0, 11.0, 16.0, 17.0, 24.0, 25.0, 27.0, 35.0, 34.0, 34.0, 36.0, 25.0, 29.0, 35.0, 48.0, 43.0, 47.0, 27.0, 38.0, 43.0, 38.0, 34.0, 36.0, 31.0, 34.0, 32.0, 15.0, 22.0, 16.0, 15.0, 14.0, 14.0, 13.0, 9.0, 8.0, 3.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.550039291381836, -27.657567977905273, -26.765094757080078, -25.872623443603516, -24.980152130126953, -24.087678909301758, -23.195207595825195, -22.302734375, -21.410263061523438, -20.517791748046875, -19.62531852722168, -18.732847213745117, -17.840373992919922, -16.94790267944336, -16.055431365966797, -15.162959098815918, -14.270486831665039, -13.37801456451416, -12.485542297363281, -11.593070983886719, -10.70059871673584, -9.808126449584961, -8.915655136108398, -8.02318286895752, -7.130710601806641, -6.238238334655762, -5.345766544342041, -4.45329475402832, -3.5608224868774414, -2.6683502197265625, -1.7758784294128418, -0.8834066390991211, 0.009063720703125, 0.9015357494354248, 1.7940077781677246, 2.6864798069000244, 3.578951835632324, 4.471424102783203, 5.363895893096924, 6.2563676834106445, 7.148839950561523, 8.041312217712402, 8.933784484863281, 9.826255798339844, 10.718728065490723, 11.611200332641602, 12.503671646118164, 13.396143913269043, 14.288616180419922, 15.1810884475708, 16.07356071472168, 16.966032028198242, 17.858505249023438, 18.7509765625, 19.643447875976562, 20.535919189453125, 21.42839241027832, 22.320863723754883, 23.213336944580078, 24.10580825805664, 24.998279571533203, 25.8907527923584, 26.78322410583496, 27.675697326660156, 28.56816864013672]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 10.0, 7.0, 17.0, 29.0, 41.0, 63.0, 86.0, 165.0, 277.0, 462.0, 911.0, 1858.0, 3757.0, 8356.0, 18583.0, 43353.0, 112738.0, 361413.0, 325034.0, 100430.0, 39117.0, 16901.0, 7816.0, 3504.0, 1688.0, 846.0, 465.0, 238.0, 135.0, 84.0, 72.0, 30.0, 17.0, 11.0, 8.0, 7.0, 6.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-21.890625, -21.298095703125, -20.70556640625, -20.113037109375, -19.5205078125, -18.927978515625, -18.33544921875, -17.742919921875, -17.150390625, -16.557861328125, -15.96533203125, -15.372802734375, -14.7802734375, -14.187744140625, -13.59521484375, -13.002685546875, -12.41015625, -11.817626953125, -11.22509765625, -10.632568359375, -10.0400390625, -9.447509765625, -8.85498046875, -8.262451171875, -7.669921875, -7.077392578125, -6.48486328125, -5.892333984375, -5.2998046875, -4.707275390625, -4.11474609375, -3.522216796875, -2.9296875, -2.337158203125, -1.74462890625, -1.152099609375, -0.5595703125, 0.032958984375, 0.62548828125, 1.218017578125, 1.810546875, 2.403076171875, 2.99560546875, 3.588134765625, 4.1806640625, 4.773193359375, 5.36572265625, 5.958251953125, 6.55078125, 7.143310546875, 7.73583984375, 8.328369140625, 8.9208984375, 9.513427734375, 10.10595703125, 10.698486328125, 11.291015625, 11.883544921875, 12.47607421875, 13.068603515625, 13.6611328125, 14.253662109375, 14.84619140625, 15.438720703125, 16.03125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 8.0, 8.0, 15.0, 22.0, 19.0, 25.0, 27.0, 27.0, 30.0, 44.0, 42.0, 47.0, 34.0, 52.0, 43.0, 56.0, 44.0, 59.0, 47.0, 49.0, 34.0, 26.0, 35.0, 32.0, 26.0, 25.0, 24.0, 22.0, 11.0, 11.0, 4.0, 10.0, 10.0, 10.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.80078125, -4.6734619140625, -4.546142578125, -4.4188232421875, -4.29150390625, -4.1641845703125, -4.036865234375, -3.9095458984375, -3.7822265625, -3.6549072265625, -3.527587890625, -3.4002685546875, -3.27294921875, -3.1456298828125, -3.018310546875, -2.8909912109375, -2.763671875, -2.6363525390625, -2.509033203125, -2.3817138671875, -2.25439453125, -2.1270751953125, -1.999755859375, -1.8724365234375, -1.7451171875, -1.6177978515625, -1.490478515625, -1.3631591796875, -1.23583984375, -1.1085205078125, -0.981201171875, -0.8538818359375, -0.7265625, -0.5992431640625, -0.471923828125, -0.3446044921875, -0.21728515625, -0.0899658203125, 0.037353515625, 0.1646728515625, 0.2919921875, 0.4193115234375, 0.546630859375, 0.6739501953125, 0.80126953125, 0.9285888671875, 1.055908203125, 1.1832275390625, 1.310546875, 1.4378662109375, 1.565185546875, 1.6925048828125, 1.81982421875, 1.9471435546875, 2.074462890625, 2.2017822265625, 2.3291015625, 2.4564208984375, 2.583740234375, 2.7110595703125, 2.83837890625, 2.9656982421875, 3.093017578125, 3.2203369140625, 3.34765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 13.0, 18.0, 12.0, 27.0, 38.0, 58.0, 82.0, 175.0, 230.0, 425.0, 798.0, 1539.0, 3027.0, 6741.0, 14731.0, 34909.0, 103319.0, 469351.0, 297018.0, 68603.0, 25707.0, 11330.0, 5167.0, 2429.0, 1236.0, 637.0, 344.0, 194.0, 128.0, 86.0, 47.0, 39.0, 29.0, 15.0, 10.0, 10.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-19.421875, -18.811767578125, -18.20166015625, -17.591552734375, -16.9814453125, -16.371337890625, -15.76123046875, -15.151123046875, -14.541015625, -13.930908203125, -13.32080078125, -12.710693359375, -12.1005859375, -11.490478515625, -10.88037109375, -10.270263671875, -9.66015625, -9.050048828125, -8.43994140625, -7.829833984375, -7.2197265625, -6.609619140625, -5.99951171875, -5.389404296875, -4.779296875, -4.169189453125, -3.55908203125, -2.948974609375, -2.3388671875, -1.728759765625, -1.11865234375, -0.508544921875, 0.1015625, 0.711669921875, 1.32177734375, 1.931884765625, 2.5419921875, 3.152099609375, 3.76220703125, 4.372314453125, 4.982421875, 5.592529296875, 6.20263671875, 6.812744140625, 7.4228515625, 8.032958984375, 8.64306640625, 9.253173828125, 9.86328125, 10.473388671875, 11.08349609375, 11.693603515625, 12.3037109375, 12.913818359375, 13.52392578125, 14.134033203125, 14.744140625, 15.354248046875, 15.96435546875, 16.574462890625, 17.1845703125, 17.794677734375, 18.40478515625, 19.014892578125, 19.625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 14.0, 13.0, 18.0, 21.0, 25.0, 31.0, 39.0, 60.0, 58.0, 84.0, 76.0, 69.0, 63.0, 62.0, 74.0, 52.0, 54.0, 45.0, 31.0, 23.0, 16.0, 17.0, 11.0, 12.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.849853515625, -23.07470703125, -22.299560546875, -21.5244140625, -20.749267578125, -19.97412109375, -19.198974609375, -18.423828125, -17.648681640625, -16.87353515625, -16.098388671875, -15.3232421875, -14.548095703125, -13.77294921875, -12.997802734375, -12.22265625, -11.447509765625, -10.67236328125, -9.897216796875, -9.1220703125, -8.346923828125, -7.57177734375, -6.796630859375, -6.021484375, -5.246337890625, -4.47119140625, -3.696044921875, -2.9208984375, -2.145751953125, -1.37060546875, -0.595458984375, 0.1796875, 0.954833984375, 1.72998046875, 2.505126953125, 3.2802734375, 4.055419921875, 4.83056640625, 5.605712890625, 6.380859375, 7.156005859375, 7.93115234375, 8.706298828125, 9.4814453125, 10.256591796875, 11.03173828125, 11.806884765625, 12.58203125, 13.357177734375, 14.13232421875, 14.907470703125, 15.6826171875, 16.457763671875, 17.23291015625, 18.008056640625, 18.783203125, 19.558349609375, 20.33349609375, 21.108642578125, 21.8837890625, 22.658935546875, 23.43408203125, 24.209228515625, 24.984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 12.0, 13.0, 24.0, 29.0, 68.0, 79.0, 136.0, 242.0, 449.0, 823.0, 1731.0, 3867.0, 8545.0, 19278.0, 46536.0, 178658.0, 584743.0, 132343.0, 39791.0, 16887.0, 7493.0, 3460.0, 1579.0, 760.0, 403.0, 239.0, 122.0, 79.0, 52.0, 27.0, 25.0, 14.0, 12.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.6612548828125, -9.353759765625, -9.0462646484375, -8.73876953125, -8.4312744140625, -8.123779296875, -7.8162841796875, -7.5087890625, -7.2012939453125, -6.893798828125, -6.5863037109375, -6.27880859375, -5.9713134765625, -5.663818359375, -5.3563232421875, -5.048828125, -4.7413330078125, -4.433837890625, -4.1263427734375, -3.81884765625, -3.5113525390625, -3.203857421875, -2.8963623046875, -2.5888671875, -2.2813720703125, -1.973876953125, -1.6663818359375, -1.35888671875, -1.0513916015625, -0.743896484375, -0.4364013671875, -0.12890625, 0.1785888671875, 0.486083984375, 0.7935791015625, 1.10107421875, 1.4085693359375, 1.716064453125, 2.0235595703125, 2.3310546875, 2.6385498046875, 2.946044921875, 3.2535400390625, 3.56103515625, 3.8685302734375, 4.176025390625, 4.4835205078125, 4.791015625, 5.0985107421875, 5.406005859375, 5.7135009765625, 6.02099609375, 6.3284912109375, 6.635986328125, 6.9434814453125, 7.2509765625, 7.5584716796875, 7.865966796875, 8.1734619140625, 8.48095703125, 8.7884521484375, 9.095947265625, 9.4034423828125, 9.7109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 16.0, 12.0, 9.0, 16.0, 20.0, 52.0, 101.0, 281.0, 273.0, 80.0, 34.0, 21.0, 15.0, 12.0, 11.0, 6.0, 6.0, 11.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006015777587890625, -0.0058481693267822266, -0.005680561065673828, -0.00551295280456543, -0.005345344543457031, -0.005177736282348633, -0.005010128021240234, -0.004842519760131836, -0.0046749114990234375, -0.004507303237915039, -0.004339694976806641, -0.004172086715698242, -0.004004478454589844, -0.0038368701934814453, -0.003669261932373047, -0.0035016536712646484, -0.00333404541015625, -0.0031664371490478516, -0.002998828887939453, -0.0028312206268310547, -0.0026636123657226562, -0.002496004104614258, -0.0023283958435058594, -0.002160787582397461, -0.0019931793212890625, -0.001825571060180664, -0.0016579627990722656, -0.0014903545379638672, -0.0013227462768554688, -0.0011551380157470703, -0.0009875297546386719, -0.0008199214935302734, -0.000652313232421875, -0.00048470497131347656, -0.0003170967102050781, -0.0001494884490966797, 1.811981201171875e-05, 0.0001857280731201172, 0.0003533363342285156, 0.0005209445953369141, 0.0006885528564453125, 0.0008561611175537109, 0.0010237693786621094, 0.0011913776397705078, 0.0013589859008789062, 0.0015265941619873047, 0.0016942024230957031, 0.0018618106842041016, 0.0020294189453125, 0.0021970272064208984, 0.002364635467529297, 0.0025322437286376953, 0.0026998519897460938, 0.002867460250854492, 0.0030350685119628906, 0.003202676773071289, 0.0033702850341796875, 0.003537893295288086, 0.0037055015563964844, 0.003873109817504883, 0.004040718078613281, 0.00420832633972168, 0.004375934600830078, 0.0045435428619384766, 0.004711151123046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 16.0, 21.0, 29.0, 40.0, 60.0, 93.0, 136.0, 247.0, 401.0, 779.0, 1461.0, 2849.0, 6095.0, 12785.0, 30155.0, 89384.0, 555803.0, 258130.0, 51613.0, 20315.0, 9180.0, 4336.0, 2053.0, 1060.0, 608.0, 302.0, 200.0, 101.0, 74.0, 50.0, 36.0, 34.0, 23.0, 17.0, 12.0, 13.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5859375, -9.2843017578125, -8.982666015625, -8.6810302734375, -8.37939453125, -8.0777587890625, -7.776123046875, -7.4744873046875, -7.1728515625, -6.8712158203125, -6.569580078125, -6.2679443359375, -5.96630859375, -5.6646728515625, -5.363037109375, -5.0614013671875, -4.759765625, -4.4581298828125, -4.156494140625, -3.8548583984375, -3.55322265625, -3.2515869140625, -2.949951171875, -2.6483154296875, -2.3466796875, -2.0450439453125, -1.743408203125, -1.4417724609375, -1.14013671875, -0.8385009765625, -0.536865234375, -0.2352294921875, 0.06640625, 0.3680419921875, 0.669677734375, 0.9713134765625, 1.27294921875, 1.5745849609375, 1.876220703125, 2.1778564453125, 2.4794921875, 2.7811279296875, 3.082763671875, 3.3843994140625, 3.68603515625, 3.9876708984375, 4.289306640625, 4.5909423828125, 4.892578125, 5.1942138671875, 5.495849609375, 5.7974853515625, 6.09912109375, 6.4007568359375, 6.702392578125, 7.0040283203125, 7.3056640625, 7.6072998046875, 7.908935546875, 8.2105712890625, 8.51220703125, 8.8138427734375, 9.115478515625, 9.4171142578125, 9.71875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 7.0, 6.0, 11.0, 18.0, 18.0, 19.0, 16.0, 37.0, 34.0, 68.0, 96.0, 128.0, 125.0, 114.0, 72.0, 51.0, 37.0, 16.0, 17.0, 12.0, 10.0, 8.0, 7.0, 4.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.50146484375, -7.2451171875, -6.98876953125, -6.732421875, -6.47607421875, -6.2197265625, -5.96337890625, -5.70703125, -5.45068359375, -5.1943359375, -4.93798828125, -4.681640625, -4.42529296875, -4.1689453125, -3.91259765625, -3.65625, -3.39990234375, -3.1435546875, -2.88720703125, -2.630859375, -2.37451171875, -2.1181640625, -1.86181640625, -1.60546875, -1.34912109375, -1.0927734375, -0.83642578125, -0.580078125, -0.32373046875, -0.0673828125, 0.18896484375, 0.4453125, 0.70166015625, 0.9580078125, 1.21435546875, 1.470703125, 1.72705078125, 1.9833984375, 2.23974609375, 2.49609375, 2.75244140625, 3.0087890625, 3.26513671875, 3.521484375, 3.77783203125, 4.0341796875, 4.29052734375, 4.546875, 4.80322265625, 5.0595703125, 5.31591796875, 5.572265625, 5.82861328125, 6.0849609375, 6.34130859375, 6.59765625, 6.85400390625, 7.1103515625, 7.36669921875, 7.623046875, 7.87939453125, 8.1357421875, 8.39208984375, 8.6484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 14.0, 28.0, 36.0, 62.0, 83.0, 100.0, 127.0, 123.0, 114.0, 94.0, 63.0, 58.0, 40.0, 17.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-222.4858856201172, -217.77609252929688, -213.06629943847656, -208.35650634765625, -203.64671325683594, -198.93692016601562, -194.22711181640625, -189.51731872558594, -184.80752563476562, -180.0977325439453, -175.387939453125, -170.6781463623047, -165.96835327148438, -161.258544921875, -156.54876708984375, -151.83895874023438, -147.12918090820312, -142.4193878173828, -137.7095947265625, -132.9998016357422, -128.29000854492188, -123.58020782470703, -118.87041473388672, -114.16061401367188, -109.45082092285156, -104.74102783203125, -100.03123474121094, -95.32144165039062, -90.61164093017578, -85.90184783935547, -81.19205474853516, -76.48225402832031, -71.7724609375, -67.06266784667969, -62.35287094116211, -57.6430778503418, -52.93328094482422, -48.223487854003906, -43.513694763183594, -38.803897857666016, -34.0941047668457, -29.384309768676758, -24.674514770507812, -19.9647216796875, -15.254926681518555, -10.54513168334961, -5.835338592529297, -1.1255416870117188, 3.5842514038085938, 8.294046401977539, 13.003840446472168, 17.713634490966797, 22.423429489135742, 27.133224487304688, 31.843017578125, 36.55281448364258, 41.26260757446289, 45.9724006652832, 50.68219757080078, 55.391990661621094, 60.101783752441406, 64.81158447265625, 69.52137756347656, 74.23117065429688, 78.94096374511719]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 13.0, 5.0, 14.0, 12.0, 18.0, 13.0, 15.0, 18.0, 37.0, 28.0, 30.0, 24.0, 27.0, 29.0, 33.0, 32.0, 53.0, 51.0, 46.0, 33.0, 54.0, 41.0, 39.0, 47.0, 38.0, 34.0, 23.0, 33.0, 31.0, 22.0, 20.0, 11.0, 18.0, 15.0, 11.0, 8.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-74.47787475585938, -72.0730972290039, -69.66831970214844, -67.26354217529297, -64.8587646484375, -62.45398712158203, -60.04920959472656, -57.644432067871094, -55.239654541015625, -52.834877014160156, -50.43009948730469, -48.02532196044922, -45.62054443359375, -43.21576690673828, -40.81098937988281, -38.406211853027344, -36.001434326171875, -33.596656799316406, -31.191879272460938, -28.78710174560547, -26.38232421875, -23.97754669189453, -21.572769165039062, -19.167991638183594, -16.763214111328125, -14.358436584472656, -11.953659057617188, -9.548881530761719, -7.14410400390625, -4.739326477050781, -2.3345489501953125, 0.07022857666015625, 2.4750137329101562, 4.879791259765625, 7.284568786621094, 9.689346313476562, 12.094123840332031, 14.4989013671875, 16.90367889404297, 19.308456420898438, 21.713233947753906, 24.118011474609375, 26.522789001464844, 28.927566528320312, 31.33234405517578, 33.73712158203125, 36.14189910888672, 38.54667663574219, 40.951454162597656, 43.356231689453125, 45.761009216308594, 48.16578674316406, 50.57056427001953, 52.975341796875, 55.38011932373047, 57.78489685058594, 60.189674377441406, 62.594451904296875, 64.99922943115234, 67.40400695800781, 69.80878448486328, 72.21356201171875, 74.61833953857422, 77.02311706542969, 79.42789459228516]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 12.0, 10.0, 13.0, 27.0, 35.0, 53.0, 65.0, 116.0, 161.0, 284.0, 501.0, 869.0, 1795.0, 3793.0, 8460.0, 21523.0, 64528.0, 312642.0, 3450970.0, 239877.0, 54564.0, 18943.0, 7835.0, 3483.0, 1659.0, 866.0, 428.0, 277.0, 171.0, 111.0, 61.0, 47.0, 31.0, 20.0, 20.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.96875, -33.0849609375, -32.201171875, -31.3173828125, -30.43359375, -29.5498046875, -28.666015625, -27.7822265625, -26.8984375, -26.0146484375, -25.130859375, -24.2470703125, -23.36328125, -22.4794921875, -21.595703125, -20.7119140625, -19.828125, -18.9443359375, -18.060546875, -17.1767578125, -16.29296875, -15.4091796875, -14.525390625, -13.6416015625, -12.7578125, -11.8740234375, -10.990234375, -10.1064453125, -9.22265625, -8.3388671875, -7.455078125, -6.5712890625, -5.6875, -4.8037109375, -3.919921875, -3.0361328125, -2.15234375, -1.2685546875, -0.384765625, 0.4990234375, 1.3828125, 2.2666015625, 3.150390625, 4.0341796875, 4.91796875, 5.8017578125, 6.685546875, 7.5693359375, 8.453125, 9.3369140625, 10.220703125, 11.1044921875, 11.98828125, 12.8720703125, 13.755859375, 14.6396484375, 15.5234375, 16.4072265625, 17.291015625, 18.1748046875, 19.05859375, 19.9423828125, 20.826171875, 21.7099609375, 22.59375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 17.0, 18.0, 20.0, 25.0, 15.0, 22.0, 29.0, 37.0, 39.0, 38.0, 39.0, 48.0, 55.0, 42.0, 59.0, 43.0, 43.0, 33.0, 38.0, 38.0, 31.0, 32.0, 38.0, 23.0, 23.0, 21.0, 21.0, 20.0, 13.0, 14.0, 10.0, 12.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.54296875, -4.4156494140625, -4.288330078125, -4.1610107421875, -4.03369140625, -3.9063720703125, -3.779052734375, -3.6517333984375, -3.5244140625, -3.3970947265625, -3.269775390625, -3.1424560546875, -3.01513671875, -2.8878173828125, -2.760498046875, -2.6331787109375, -2.505859375, -2.3785400390625, -2.251220703125, -2.1239013671875, -1.99658203125, -1.8692626953125, -1.741943359375, -1.6146240234375, -1.4873046875, -1.3599853515625, -1.232666015625, -1.1053466796875, -0.97802734375, -0.8507080078125, -0.723388671875, -0.5960693359375, -0.46875, -0.3414306640625, -0.214111328125, -0.0867919921875, 0.04052734375, 0.1678466796875, 0.295166015625, 0.4224853515625, 0.5498046875, 0.6771240234375, 0.804443359375, 0.9317626953125, 1.05908203125, 1.1864013671875, 1.313720703125, 1.4410400390625, 1.568359375, 1.6956787109375, 1.822998046875, 1.9503173828125, 2.07763671875, 2.2049560546875, 2.332275390625, 2.4595947265625, 2.5869140625, 2.7142333984375, 2.841552734375, 2.9688720703125, 3.09619140625, 3.2235107421875, 3.350830078125, 3.4781494140625, 3.60546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 9.0, 7.0, 19.0, 17.0, 30.0, 48.0, 61.0, 91.0, 150.0, 186.0, 295.0, 435.0, 643.0, 912.0, 1473.0, 2350.0, 4248.0, 8230.0, 16518.0, 38378.0, 106181.0, 506481.0, 3095106.0, 278025.0, 75885.0, 29253.0, 13139.0, 6468.0, 3534.0, 2096.0, 1327.0, 857.0, 556.0, 376.0, 284.0, 203.0, 128.0, 86.0, 68.0, 47.0, 24.0, 14.0, 17.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.59375, -24.802490234375, -24.01123046875, -23.219970703125, -22.4287109375, -21.637451171875, -20.84619140625, -20.054931640625, -19.263671875, -18.472412109375, -17.68115234375, -16.889892578125, -16.0986328125, -15.307373046875, -14.51611328125, -13.724853515625, -12.93359375, -12.142333984375, -11.35107421875, -10.559814453125, -9.7685546875, -8.977294921875, -8.18603515625, -7.394775390625, -6.603515625, -5.812255859375, -5.02099609375, -4.229736328125, -3.4384765625, -2.647216796875, -1.85595703125, -1.064697265625, -0.2734375, 0.517822265625, 1.30908203125, 2.100341796875, 2.8916015625, 3.682861328125, 4.47412109375, 5.265380859375, 6.056640625, 6.847900390625, 7.63916015625, 8.430419921875, 9.2216796875, 10.012939453125, 10.80419921875, 11.595458984375, 12.38671875, 13.177978515625, 13.96923828125, 14.760498046875, 15.5517578125, 16.343017578125, 17.13427734375, 17.925537109375, 18.716796875, 19.508056640625, 20.29931640625, 21.090576171875, 21.8818359375, 22.673095703125, 23.46435546875, 24.255615234375, 25.046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 6.0, 7.0, 25.0, 28.0, 40.0, 31.0, 60.0, 99.0, 174.0, 359.0, 1431.0, 974.0, 303.0, 151.0, 90.0, 70.0, 57.0, 31.0, 24.0, 21.0, 18.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7117919921875, -10.314208984375, -9.9166259765625, -9.51904296875, -9.1214599609375, -8.723876953125, -8.3262939453125, -7.9287109375, -7.5311279296875, -7.133544921875, -6.7359619140625, -6.33837890625, -5.9407958984375, -5.543212890625, -5.1456298828125, -4.748046875, -4.3504638671875, -3.952880859375, -3.5552978515625, -3.15771484375, -2.7601318359375, -2.362548828125, -1.9649658203125, -1.5673828125, -1.1697998046875, -0.772216796875, -0.3746337890625, 0.02294921875, 0.4205322265625, 0.818115234375, 1.2156982421875, 1.61328125, 2.0108642578125, 2.408447265625, 2.8060302734375, 3.20361328125, 3.6011962890625, 3.998779296875, 4.3963623046875, 4.7939453125, 5.1915283203125, 5.589111328125, 5.9866943359375, 6.38427734375, 6.7818603515625, 7.179443359375, 7.5770263671875, 7.974609375, 8.3721923828125, 8.769775390625, 9.1673583984375, 9.56494140625, 9.9625244140625, 10.360107421875, 10.7576904296875, 11.1552734375, 11.5528564453125, 11.950439453125, 12.3480224609375, 12.74560546875, 13.1431884765625, 13.540771484375, 13.9383544921875, 14.3359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 22.0, 18.0, 40.0, 57.0, 76.0, 107.0, 104.0, 122.0, 122.0, 100.0, 70.0, 58.0, 34.0, 23.0, 8.0, 6.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-122.13401794433594, -119.43634033203125, -116.73866271972656, -114.04098510742188, -111.34329986572266, -108.64562225341797, -105.94794464111328, -103.2502670288086, -100.55258178710938, -97.85490417480469, -95.1572265625, -92.45954895019531, -89.7618637084961, -87.0641860961914, -84.36650848388672, -81.66883087158203, -78.97115325927734, -76.27347564697266, -73.57579803466797, -70.87811279296875, -68.18043518066406, -65.48275756835938, -62.78507995605469, -60.08740234375, -57.38972091674805, -54.69204330444336, -51.994361877441406, -49.29668426513672, -46.59900665283203, -43.90132522583008, -41.20364761352539, -38.50596618652344, -35.80829620361328, -33.110618591308594, -30.41293716430664, -27.715259552001953, -25.017580032348633, -22.319900512695312, -19.622222900390625, -16.924543380737305, -14.226863861083984, -11.529184341430664, -8.83150577545166, -6.133827209472656, -3.436147689819336, -0.7384681701660156, 1.9592094421386719, 4.656888961791992, 7.3545684814453125, 10.052248001098633, 12.749926567077637, 15.44760513305664, 18.14528465270996, 20.84296417236328, 23.54064178466797, 26.23832130432129, 28.93600082397461, 31.63368034362793, 34.33135986328125, 37.02903747558594, 39.726715087890625, 42.42439651489258, 45.122074127197266, 47.81975555419922, 50.517433166503906]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 3.0, 22.0, 13.0, 15.0, 15.0, 27.0, 21.0, 25.0, 27.0, 31.0, 46.0, 48.0, 45.0, 48.0, 40.0, 55.0, 53.0, 53.0, 52.0, 46.0, 43.0, 37.0, 39.0, 22.0, 25.0, 23.0, 24.0, 19.0, 12.0, 11.0, 13.0, 3.0, 10.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.869972229003906, -46.35736846923828, -44.844764709472656, -43.332157135009766, -41.81955337524414, -40.306949615478516, -38.794342041015625, -37.28173828125, -35.769134521484375, -34.25653076171875, -32.743927001953125, -31.231319427490234, -29.71871566772461, -28.206111907958984, -26.693506240844727, -25.18090057373047, -23.668296813964844, -22.15569305419922, -20.64308738708496, -19.130481719970703, -17.617877960205078, -16.105274200439453, -14.592668533325195, -13.080063819885254, -11.567459106445312, -10.054854393005371, -8.54224967956543, -7.029644966125488, -5.517040252685547, -4.0044355392456055, -2.491830825805664, -0.9792261123657227, 0.5333786010742188, 2.04598331451416, 3.5585880279541016, 5.071192741394043, 6.583797454833984, 8.096402168273926, 9.609006881713867, 11.121611595153809, 12.63421630859375, 14.146821022033691, 15.659425735473633, 17.17203140258789, 18.684635162353516, 20.19723892211914, 21.7098445892334, 23.222450256347656, 24.73505401611328, 26.247657775878906, 27.760263442993164, 29.272869110107422, 30.785472869873047, 32.29807662963867, 33.81068420410156, 35.32328796386719, 36.83589172363281, 38.34849548339844, 39.86109924316406, 41.37370681762695, 42.88631057739258, 44.3989143371582, 45.911521911621094, 47.42412567138672, 48.936729431152344]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 20.0, 24.0, 26.0, 46.0, 53.0, 88.0, 158.0, 237.0, 424.0, 723.0, 1386.0, 2582.0, 4870.0, 9728.0, 19623.0, 38670.0, 75235.0, 150515.0, 281812.0, 230081.0, 114242.0, 57816.0, 29652.0, 14899.0, 7483.0, 3739.0, 1948.0, 1043.0, 524.0, 332.0, 186.0, 105.0, 84.0, 46.0, 38.0, 33.0, 24.0, 22.0, 12.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.171875, -17.63427734375, -17.0966796875, -16.55908203125, -16.021484375, -15.48388671875, -14.9462890625, -14.40869140625, -13.87109375, -13.33349609375, -12.7958984375, -12.25830078125, -11.720703125, -11.18310546875, -10.6455078125, -10.10791015625, -9.5703125, -9.03271484375, -8.4951171875, -7.95751953125, -7.419921875, -6.88232421875, -6.3447265625, -5.80712890625, -5.26953125, -4.73193359375, -4.1943359375, -3.65673828125, -3.119140625, -2.58154296875, -2.0439453125, -1.50634765625, -0.96875, -0.43115234375, 0.1064453125, 0.64404296875, 1.181640625, 1.71923828125, 2.2568359375, 2.79443359375, 3.33203125, 3.86962890625, 4.4072265625, 4.94482421875, 5.482421875, 6.02001953125, 6.5576171875, 7.09521484375, 7.6328125, 8.17041015625, 8.7080078125, 9.24560546875, 9.783203125, 10.32080078125, 10.8583984375, 11.39599609375, 11.93359375, 12.47119140625, 13.0087890625, 13.54638671875, 14.083984375, 14.62158203125, 15.1591796875, 15.69677734375, 16.234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 11.0, 7.0, 12.0, 15.0, 12.0, 15.0, 17.0, 13.0, 25.0, 18.0, 36.0, 24.0, 43.0, 27.0, 37.0, 32.0, 47.0, 43.0, 49.0, 46.0, 43.0, 43.0, 31.0, 46.0, 30.0, 39.0, 34.0, 30.0, 32.0, 25.0, 24.0, 22.0, 13.0, 13.0, 12.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.20330810546875, -4.0589599609375, -3.91461181640625, -3.770263671875, -3.62591552734375, -3.4815673828125, -3.33721923828125, -3.19287109375, -3.04852294921875, -2.9041748046875, -2.75982666015625, -2.615478515625, -2.47113037109375, -2.3267822265625, -2.18243408203125, -2.0380859375, -1.89373779296875, -1.7493896484375, -1.60504150390625, -1.460693359375, -1.31634521484375, -1.1719970703125, -1.02764892578125, -0.88330078125, -0.73895263671875, -0.5946044921875, -0.45025634765625, -0.305908203125, -0.16156005859375, -0.0172119140625, 0.12713623046875, 0.271484375, 0.41583251953125, 0.5601806640625, 0.70452880859375, 0.848876953125, 0.99322509765625, 1.1375732421875, 1.28192138671875, 1.42626953125, 1.57061767578125, 1.7149658203125, 1.85931396484375, 2.003662109375, 2.14801025390625, 2.2923583984375, 2.43670654296875, 2.5810546875, 2.72540283203125, 2.8697509765625, 3.01409912109375, 3.158447265625, 3.30279541015625, 3.4471435546875, 3.59149169921875, 3.73583984375, 3.88018798828125, 4.0245361328125, 4.16888427734375, 4.313232421875, 4.45758056640625, 4.6019287109375, 4.74627685546875, 4.890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 11.0, 22.0, 10.0, 34.0, 43.0, 54.0, 92.0, 152.0, 223.0, 286.0, 536.0, 907.0, 1620.0, 3489.0, 8754.0, 23801.0, 66273.0, 194543.0, 469535.0, 179403.0, 61616.0, 21883.0, 7997.0, 3397.0, 1609.0, 838.0, 502.0, 288.0, 182.0, 140.0, 82.0, 49.0, 50.0, 33.0, 24.0, 14.0, 14.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.539794921875, -22.76708984375, -21.994384765625, -21.2216796875, -20.448974609375, -19.67626953125, -18.903564453125, -18.130859375, -17.358154296875, -16.58544921875, -15.812744140625, -15.0400390625, -14.267333984375, -13.49462890625, -12.721923828125, -11.94921875, -11.176513671875, -10.40380859375, -9.631103515625, -8.8583984375, -8.085693359375, -7.31298828125, -6.540283203125, -5.767578125, -4.994873046875, -4.22216796875, -3.449462890625, -2.6767578125, -1.904052734375, -1.13134765625, -0.358642578125, 0.4140625, 1.186767578125, 1.95947265625, 2.732177734375, 3.5048828125, 4.277587890625, 5.05029296875, 5.822998046875, 6.595703125, 7.368408203125, 8.14111328125, 8.913818359375, 9.6865234375, 10.459228515625, 11.23193359375, 12.004638671875, 12.77734375, 13.550048828125, 14.32275390625, 15.095458984375, 15.8681640625, 16.640869140625, 17.41357421875, 18.186279296875, 18.958984375, 19.731689453125, 20.50439453125, 21.277099609375, 22.0498046875, 22.822509765625, 23.59521484375, 24.367919921875, 25.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 12.0, 3.0, 11.0, 12.0, 15.0, 11.0, 27.0, 22.0, 22.0, 30.0, 29.0, 48.0, 29.0, 44.0, 52.0, 48.0, 60.0, 56.0, 48.0, 43.0, 36.0, 44.0, 40.0, 48.0, 28.0, 28.0, 21.0, 24.0, 23.0, 19.0, 18.0, 6.0, 8.0, 2.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.703125, -27.864990234375, -27.02685546875, -26.188720703125, -25.3505859375, -24.512451171875, -23.67431640625, -22.836181640625, -21.998046875, -21.159912109375, -20.32177734375, -19.483642578125, -18.6455078125, -17.807373046875, -16.96923828125, -16.131103515625, -15.29296875, -14.454833984375, -13.61669921875, -12.778564453125, -11.9404296875, -11.102294921875, -10.26416015625, -9.426025390625, -8.587890625, -7.749755859375, -6.91162109375, -6.073486328125, -5.2353515625, -4.397216796875, -3.55908203125, -2.720947265625, -1.8828125, -1.044677734375, -0.20654296875, 0.631591796875, 1.4697265625, 2.307861328125, 3.14599609375, 3.984130859375, 4.822265625, 5.660400390625, 6.49853515625, 7.336669921875, 8.1748046875, 9.012939453125, 9.85107421875, 10.689208984375, 11.52734375, 12.365478515625, 13.20361328125, 14.041748046875, 14.8798828125, 15.718017578125, 16.55615234375, 17.394287109375, 18.232421875, 19.070556640625, 19.90869140625, 20.746826171875, 21.5849609375, 22.423095703125, 23.26123046875, 24.099365234375, 24.9375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 13.0, 21.0, 30.0, 44.0, 88.0, 142.0, 320.0, 956.0, 3931.0, 40307.0, 921206.0, 74220.0, 5376.0, 1143.0, 374.0, 158.0, 96.0, 47.0, 22.0, 28.0, 8.0, 8.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28125, -47.35498046875, -45.4287109375, -43.50244140625, -41.576171875, -39.64990234375, -37.7236328125, -35.79736328125, -33.87109375, -31.94482421875, -30.0185546875, -28.09228515625, -26.166015625, -24.23974609375, -22.3134765625, -20.38720703125, -18.4609375, -16.53466796875, -14.6083984375, -12.68212890625, -10.755859375, -8.82958984375, -6.9033203125, -4.97705078125, -3.05078125, -1.12451171875, 0.8017578125, 2.72802734375, 4.654296875, 6.58056640625, 8.5068359375, 10.43310546875, 12.359375, 14.28564453125, 16.2119140625, 18.13818359375, 20.064453125, 21.99072265625, 23.9169921875, 25.84326171875, 27.76953125, 29.69580078125, 31.6220703125, 33.54833984375, 35.474609375, 37.40087890625, 39.3271484375, 41.25341796875, 43.1796875, 45.10595703125, 47.0322265625, 48.95849609375, 50.884765625, 52.81103515625, 54.7373046875, 56.66357421875, 58.58984375, 60.51611328125, 62.4423828125, 64.36865234375, 66.294921875, 68.22119140625, 70.1474609375, 72.07373046875, 74.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 10.0, 13.0, 19.0, 31.0, 44.0, 46.0, 61.0, 97.0, 197.0, 183.0, 88.0, 50.0, 44.0, 35.0, 20.0, 17.0, 11.0, 10.0, 5.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003997802734375, -0.0038068294525146484, -0.003615856170654297, -0.0034248828887939453, -0.0032339096069335938, -0.003042936325073242, -0.0028519630432128906, -0.002660989761352539, -0.0024700164794921875, -0.002279043197631836, -0.0020880699157714844, -0.0018970966339111328, -0.0017061233520507812, -0.0015151500701904297, -0.0013241767883300781, -0.0011332035064697266, -0.000942230224609375, -0.0007512569427490234, -0.0005602836608886719, -0.0003693103790283203, -0.00017833709716796875, 1.2636184692382812e-05, 0.00020360946655273438, 0.00039458274841308594, 0.0005855560302734375, 0.0007765293121337891, 0.0009675025939941406, 0.0011584758758544922, 0.0013494491577148438, 0.0015404224395751953, 0.0017313957214355469, 0.0019223690032958984, 0.00211334228515625, 0.0023043155670166016, 0.002495288848876953, 0.0026862621307373047, 0.0028772354125976562, 0.003068208694458008, 0.0032591819763183594, 0.003450155258178711, 0.0036411285400390625, 0.003832101821899414, 0.004023075103759766, 0.004214048385620117, 0.004405021667480469, 0.00459599494934082, 0.004786968231201172, 0.0049779415130615234, 0.005168914794921875, 0.0053598880767822266, 0.005550861358642578, 0.00574183464050293, 0.005932807922363281, 0.006123781204223633, 0.006314754486083984, 0.006505727767944336, 0.0066967010498046875, 0.006887674331665039, 0.007078647613525391, 0.007269620895385742, 0.007460594177246094, 0.007651567459106445, 0.007842540740966797, 0.008033514022827148, 0.0082244873046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 15.0, 18.0, 24.0, 30.0, 62.0, 129.0, 206.0, 396.0, 778.0, 1827.0, 4757.0, 17368.0, 185646.0, 772879.0, 50182.0, 8794.0, 2962.0, 1222.0, 578.0, 321.0, 136.0, 68.0, 66.0, 30.0, 27.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.40625, -55.00537109375, -53.6044921875, -52.20361328125, -50.802734375, -49.40185546875, -48.0009765625, -46.60009765625, -45.19921875, -43.79833984375, -42.3974609375, -40.99658203125, -39.595703125, -38.19482421875, -36.7939453125, -35.39306640625, -33.9921875, -32.59130859375, -31.1904296875, -29.78955078125, -28.388671875, -26.98779296875, -25.5869140625, -24.18603515625, -22.78515625, -21.38427734375, -19.9833984375, -18.58251953125, -17.181640625, -15.78076171875, -14.3798828125, -12.97900390625, -11.578125, -10.17724609375, -8.7763671875, -7.37548828125, -5.974609375, -4.57373046875, -3.1728515625, -1.77197265625, -0.37109375, 1.02978515625, 2.4306640625, 3.83154296875, 5.232421875, 6.63330078125, 8.0341796875, 9.43505859375, 10.8359375, 12.23681640625, 13.6376953125, 15.03857421875, 16.439453125, 17.84033203125, 19.2412109375, 20.64208984375, 22.04296875, 23.44384765625, 24.8447265625, 26.24560546875, 27.646484375, 29.04736328125, 30.4482421875, 31.84912109375, 33.25]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 7.0, 6.0, 11.0, 16.0, 16.0, 23.0, 48.0, 85.0, 116.0, 211.0, 166.0, 88.0, 60.0, 46.0, 20.0, 21.0, 18.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.015625, -27.971923828125, -26.92822265625, -25.884521484375, -24.8408203125, -23.797119140625, -22.75341796875, -21.709716796875, -20.666015625, -19.622314453125, -18.57861328125, -17.534912109375, -16.4912109375, -15.447509765625, -14.40380859375, -13.360107421875, -12.31640625, -11.272705078125, -10.22900390625, -9.185302734375, -8.1416015625, -7.097900390625, -6.05419921875, -5.010498046875, -3.966796875, -2.923095703125, -1.87939453125, -0.835693359375, 0.2080078125, 1.251708984375, 2.29541015625, 3.339111328125, 4.3828125, 5.426513671875, 6.47021484375, 7.513916015625, 8.5576171875, 9.601318359375, 10.64501953125, 11.688720703125, 12.732421875, 13.776123046875, 14.81982421875, 15.863525390625, 16.9072265625, 17.950927734375, 18.99462890625, 20.038330078125, 21.08203125, 22.125732421875, 23.16943359375, 24.213134765625, 25.2568359375, 26.300537109375, 27.34423828125, 28.387939453125, 29.431640625, 30.475341796875, 31.51904296875, 32.562744140625, 33.6064453125, 34.650146484375, 35.69384765625, 36.737548828125, 37.78125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 27.0, 43.0, 84.0, 131.0, 171.0, 168.0, 148.0, 95.0, 49.0, 32.0, 19.0, 7.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-459.84710693359375, -447.7350769042969, -435.6230163574219, -423.510986328125, -411.39892578125, -399.2868957519531, -387.17486572265625, -375.06280517578125, -362.9507751464844, -350.8387451171875, -338.7266845703125, -326.6146545410156, -314.50262451171875, -302.39056396484375, -290.2785339355469, -278.16650390625, -266.054443359375, -253.94239807128906, -241.83035278320312, -229.71832275390625, -217.6062774658203, -205.49423217773438, -193.3822021484375, -181.27015686035156, -169.15811157226562, -157.0460662841797, -144.93402099609375, -132.82199096679688, -120.70994567871094, -108.597900390625, -96.4858627319336, -84.37382507324219, -72.26177978515625, -60.14973831176758, -48.037696838378906, -35.925655364990234, -23.813613891601562, -11.70157241821289, 0.41046905517578125, 12.522506713867188, 24.634552001953125, 36.7465934753418, 48.85863494873047, 60.97067642211914, 73.08271789550781, 85.19476318359375, 97.30680084228516, 109.41883850097656, 121.5308837890625, 133.64292907714844, 145.75497436523438, 157.86700439453125, 169.9790496826172, 182.09109497070312, 194.203125, 206.31517028808594, 218.42721557617188, 230.5392608642578, 242.65130615234375, 254.76333618164062, 266.8753662109375, 278.9874267578125, 291.0994567871094, 303.21148681640625, 315.32354736328125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 12.0, 5.0, 15.0, 10.0, 6.0, 15.0, 16.0, 17.0, 19.0, 21.0, 27.0, 20.0, 32.0, 37.0, 43.0, 44.0, 45.0, 40.0, 37.0, 32.0, 38.0, 41.0, 44.0, 32.0, 45.0, 32.0, 28.0, 33.0, 36.0, 21.0, 20.0, 26.0, 17.0, 16.0, 3.0, 11.0, 16.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-131.43313598632812, -127.40620422363281, -123.3792724609375, -119.35234069824219, -115.32540130615234, -111.29846954345703, -107.27153778076172, -103.2446060180664, -99.21766662597656, -95.19073486328125, -91.16380310058594, -87.13687133789062, -83.10993194580078, -79.08300018310547, -75.05606842041016, -71.02913665771484, -67.00220489501953, -62.97527313232422, -58.94833755493164, -54.92140579223633, -50.89447021484375, -46.86753845214844, -42.840606689453125, -38.81367492675781, -34.786739349365234, -30.75980567932129, -26.732872009277344, -22.70594024658203, -18.679006576538086, -14.65207290649414, -10.625141143798828, -6.598207473754883, -2.5712814331054688, 1.4556517601013184, 5.4825849533081055, 9.509517669677734, 13.53645133972168, 17.563385009765625, 21.590316772460938, 25.617250442504883, 29.644184112548828, 33.67111587524414, 37.69805145263672, 41.72498321533203, 45.751914978027344, 49.77885055541992, 53.805782318115234, 57.83271789550781, 61.859649658203125, 65.88658142089844, 69.91351318359375, 73.94044494628906, 77.9673843383789, 81.99431610107422, 86.02124786376953, 90.04817962646484, 94.07511901855469, 98.10205078125, 102.12898254394531, 106.15591430664062, 110.18285369873047, 114.20978546142578, 118.2367172241211, 122.2636489868164, 126.29058074951172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 10.0, 12.0, 8.0, 24.0, 24.0, 36.0, 71.0, 114.0, 166.0, 230.0, 397.0, 615.0, 966.0, 1622.0, 2922.0, 5249.0, 10225.0, 21007.0, 46718.0, 122851.0, 512927.0, 2974841.0, 327674.0, 93263.0, 37099.0, 16846.0, 8238.0, 4315.0, 2360.0, 1331.0, 771.0, 450.0, 304.0, 193.0, 128.0, 89.0, 54.0, 36.0, 31.0, 16.0, 16.0, 7.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.555908203125, -20.84619140625, -20.136474609375, -19.4267578125, -18.717041015625, -18.00732421875, -17.297607421875, -16.587890625, -15.878173828125, -15.16845703125, -14.458740234375, -13.7490234375, -13.039306640625, -12.32958984375, -11.619873046875, -10.91015625, -10.200439453125, -9.49072265625, -8.781005859375, -8.0712890625, -7.361572265625, -6.65185546875, -5.942138671875, -5.232421875, -4.522705078125, -3.81298828125, -3.103271484375, -2.3935546875, -1.683837890625, -0.97412109375, -0.264404296875, 0.4453125, 1.155029296875, 1.86474609375, 2.574462890625, 3.2841796875, 3.993896484375, 4.70361328125, 5.413330078125, 6.123046875, 6.832763671875, 7.54248046875, 8.252197265625, 8.9619140625, 9.671630859375, 10.38134765625, 11.091064453125, 11.80078125, 12.510498046875, 13.22021484375, 13.929931640625, 14.6396484375, 15.349365234375, 16.05908203125, 16.768798828125, 17.478515625, 18.188232421875, 18.89794921875, 19.607666015625, 20.3173828125, 21.027099609375, 21.73681640625, 22.446533203125, 23.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 5.0, 14.0, 14.0, 24.0, 28.0, 41.0, 39.0, 45.0, 41.0, 47.0, 51.0, 46.0, 53.0, 54.0, 39.0, 41.0, 64.0, 37.0, 43.0, 40.0, 36.0, 25.0, 30.0, 24.0, 21.0, 15.0, 17.0, 10.0, 7.0, 8.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.4144287109375, -5.219482421875, -5.0245361328125, -4.82958984375, -4.6346435546875, -4.439697265625, -4.2447509765625, -4.0498046875, -3.8548583984375, -3.659912109375, -3.4649658203125, -3.27001953125, -3.0750732421875, -2.880126953125, -2.6851806640625, -2.490234375, -2.2952880859375, -2.100341796875, -1.9053955078125, -1.71044921875, -1.5155029296875, -1.320556640625, -1.1256103515625, -0.9306640625, -0.7357177734375, -0.540771484375, -0.3458251953125, -0.15087890625, 0.0440673828125, 0.239013671875, 0.4339599609375, 0.62890625, 0.8238525390625, 1.018798828125, 1.2137451171875, 1.40869140625, 1.6036376953125, 1.798583984375, 1.9935302734375, 2.1884765625, 2.3834228515625, 2.578369140625, 2.7733154296875, 2.96826171875, 3.1632080078125, 3.358154296875, 3.5531005859375, 3.748046875, 3.9429931640625, 4.137939453125, 4.3328857421875, 4.52783203125, 4.7227783203125, 4.917724609375, 5.1126708984375, 5.3076171875, 5.5025634765625, 5.697509765625, 5.8924560546875, 6.08740234375, 6.2823486328125, 6.477294921875, 6.6722412109375, 6.8671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 10.0, 5.0, 11.0, 17.0, 25.0, 48.0, 52.0, 80.0, 117.0, 178.0, 337.0, 516.0, 770.0, 1593.0, 3323.0, 7136.0, 17962.0, 51312.0, 193563.0, 2406181.0, 1282276.0, 156667.0, 43734.0, 15509.0, 6435.0, 2959.0, 1444.0, 757.0, 477.0, 281.0, 176.0, 122.0, 70.0, 42.0, 32.0, 24.0, 18.0, 10.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-43.40625, -42.291259765625, -41.17626953125, -40.061279296875, -38.9462890625, -37.831298828125, -36.71630859375, -35.601318359375, -34.486328125, -33.371337890625, -32.25634765625, -31.141357421875, -30.0263671875, -28.911376953125, -27.79638671875, -26.681396484375, -25.56640625, -24.451416015625, -23.33642578125, -22.221435546875, -21.1064453125, -19.991455078125, -18.87646484375, -17.761474609375, -16.646484375, -15.531494140625, -14.41650390625, -13.301513671875, -12.1865234375, -11.071533203125, -9.95654296875, -8.841552734375, -7.7265625, -6.611572265625, -5.49658203125, -4.381591796875, -3.2666015625, -2.151611328125, -1.03662109375, 0.078369140625, 1.193359375, 2.308349609375, 3.42333984375, 4.538330078125, 5.6533203125, 6.768310546875, 7.88330078125, 8.998291015625, 10.11328125, 11.228271484375, 12.34326171875, 13.458251953125, 14.5732421875, 15.688232421875, 16.80322265625, 17.918212890625, 19.033203125, 20.148193359375, 21.26318359375, 22.378173828125, 23.4931640625, 24.608154296875, 25.72314453125, 26.838134765625, 27.953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 12.0, 19.0, 25.0, 33.0, 42.0, 82.0, 103.0, 168.0, 298.0, 718.0, 1365.0, 477.0, 230.0, 158.0, 84.0, 65.0, 48.0, 39.0, 12.0, 20.0, 14.0, 12.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.802978515625, -13.18408203125, -12.565185546875, -11.9462890625, -11.327392578125, -10.70849609375, -10.089599609375, -9.470703125, -8.851806640625, -8.23291015625, -7.614013671875, -6.9951171875, -6.376220703125, -5.75732421875, -5.138427734375, -4.51953125, -3.900634765625, -3.28173828125, -2.662841796875, -2.0439453125, -1.425048828125, -0.80615234375, -0.187255859375, 0.431640625, 1.050537109375, 1.66943359375, 2.288330078125, 2.9072265625, 3.526123046875, 4.14501953125, 4.763916015625, 5.3828125, 6.001708984375, 6.62060546875, 7.239501953125, 7.8583984375, 8.477294921875, 9.09619140625, 9.715087890625, 10.333984375, 10.952880859375, 11.57177734375, 12.190673828125, 12.8095703125, 13.428466796875, 14.04736328125, 14.666259765625, 15.28515625, 15.904052734375, 16.52294921875, 17.141845703125, 17.7607421875, 18.379638671875, 18.99853515625, 19.617431640625, 20.236328125, 20.855224609375, 21.47412109375, 22.093017578125, 22.7119140625, 23.330810546875, 23.94970703125, 24.568603515625, 25.1875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 38.0, 66.0, 156.0, 218.0, 217.0, 162.0, 73.0, 36.0, 16.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.23800659179688, -110.52970886230469, -101.82141876220703, -93.11312866210938, -84.40483093261719, -75.696533203125, -66.98824310302734, -58.27994918823242, -49.5716552734375, -40.86336135864258, -32.155067443847656, -23.446773529052734, -14.738479614257812, -6.030185699462891, 2.6781082153320312, 11.386402130126953, 20.094696044921875, 28.802989959716797, 37.51128387451172, 46.21957778930664, 54.92787170410156, 63.636165618896484, 72.3444595336914, 81.05274963378906, 89.76104736328125, 98.46934509277344, 107.1776351928711, 115.88592529296875, 124.59422302246094, 133.30252075195312, 142.01080322265625, 150.71910095214844, 159.4273681640625, 168.1356658935547, 176.84396362304688, 185.55224609375, 194.2605438232422, 202.96884155273438, 211.6771240234375, 220.3854217529297, 229.09371948242188, 237.80201721191406, 246.51031494140625, 255.21859741210938, 263.9268798828125, 272.63519287109375, 281.3434753417969, 290.0517883300781, 298.76007080078125, 307.4683532714844, 316.1766662597656, 324.88494873046875, 333.59326171875, 342.3015441894531, 351.00982666015625, 359.7181396484375, 368.4264221191406, 377.13470458984375, 385.843017578125, 394.5513000488281, 403.25958251953125, 411.9678955078125, 420.6761779785156, 429.3844909667969, 438.0927734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 10.0, 13.0, 9.0, 11.0, 26.0, 22.0, 26.0, 25.0, 40.0, 35.0, 31.0, 39.0, 47.0, 51.0, 52.0, 46.0, 45.0, 38.0, 41.0, 34.0, 41.0, 48.0, 32.0, 36.0, 28.0, 29.0, 27.0, 25.0, 16.0, 19.0, 13.0, 7.0, 8.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.80278778076172, -87.22354888916016, -84.6443099975586, -82.06507110595703, -79.48583984375, -76.90660095214844, -74.32736206054688, -71.74812316894531, -69.16888427734375, -66.58964538574219, -64.01040649414062, -61.43117141723633, -58.851932525634766, -56.2726936340332, -53.693458557128906, -51.114219665527344, -48.53498077392578, -45.95574188232422, -43.376502990722656, -40.79726791381836, -38.2180290222168, -35.638790130615234, -33.05955505371094, -30.480316162109375, -27.901077270507812, -25.32183837890625, -22.74260139465332, -20.16336441040039, -17.584125518798828, -15.004887580871582, -12.425649642944336, -9.846412658691406, -7.2671661376953125, -4.687928199768066, -2.1086902618408203, 0.4705476760864258, 3.049785614013672, 5.629023551940918, 8.208261489868164, 10.787498474121094, 13.366737365722656, 15.945975303649902, 18.52521324157715, 21.104450225830078, 23.68368911743164, 26.262928009033203, 28.842164993286133, 31.421401977539062, 34.000640869140625, 36.57987976074219, 39.15911865234375, 41.73835372924805, 44.31759262084961, 46.89683151245117, 49.47606658935547, 52.05530548095703, 54.634544372558594, 57.213783264160156, 59.79302215576172, 62.372257232666016, 64.95149230957031, 67.53073120117188, 70.10997009277344, 72.689208984375, 75.26844787597656]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 12.0, 20.0, 32.0, 30.0, 62.0, 91.0, 121.0, 183.0, 253.0, 401.0, 651.0, 1005.0, 1633.0, 2838.0, 4549.0, 7708.0, 13768.0, 23998.0, 42344.0, 74248.0, 123280.0, 179085.0, 195176.0, 150900.0, 95199.0, 55479.0, 31641.0, 18349.0, 10297.0, 5958.0, 3493.0, 2139.0, 1311.0, 784.0, 476.0, 320.0, 211.0, 154.0, 93.0, 80.0, 38.0, 41.0, 22.0, 18.0, 13.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.640625, -14.1719970703125, -13.703369140625, -13.2347412109375, -12.76611328125, -12.2974853515625, -11.828857421875, -11.3602294921875, -10.8916015625, -10.4229736328125, -9.954345703125, -9.4857177734375, -9.01708984375, -8.5484619140625, -8.079833984375, -7.6112060546875, -7.142578125, -6.6739501953125, -6.205322265625, -5.7366943359375, -5.26806640625, -4.7994384765625, -4.330810546875, -3.8621826171875, -3.3935546875, -2.9249267578125, -2.456298828125, -1.9876708984375, -1.51904296875, -1.0504150390625, -0.581787109375, -0.1131591796875, 0.35546875, 0.8240966796875, 1.292724609375, 1.7613525390625, 2.22998046875, 2.6986083984375, 3.167236328125, 3.6358642578125, 4.1044921875, 4.5731201171875, 5.041748046875, 5.5103759765625, 5.97900390625, 6.4476318359375, 6.916259765625, 7.3848876953125, 7.853515625, 8.3221435546875, 8.790771484375, 9.2593994140625, 9.72802734375, 10.1966552734375, 10.665283203125, 11.1339111328125, 11.6025390625, 12.0711669921875, 12.539794921875, 13.0084228515625, 13.47705078125, 13.9456787109375, 14.414306640625, 14.8829345703125, 15.3515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 9.0, 9.0, 13.0, 10.0, 10.0, 25.0, 18.0, 21.0, 34.0, 29.0, 38.0, 40.0, 44.0, 38.0, 49.0, 41.0, 56.0, 53.0, 49.0, 56.0, 47.0, 43.0, 35.0, 29.0, 35.0, 19.0, 27.0, 14.0, 15.0, 20.0, 14.0, 7.0, 17.0, 4.0, 4.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.138916015625, -6.92236328125, -6.705810546875, -6.4892578125, -6.272705078125, -6.05615234375, -5.839599609375, -5.623046875, -5.406494140625, -5.18994140625, -4.973388671875, -4.7568359375, -4.540283203125, -4.32373046875, -4.107177734375, -3.890625, -3.674072265625, -3.45751953125, -3.240966796875, -3.0244140625, -2.807861328125, -2.59130859375, -2.374755859375, -2.158203125, -1.941650390625, -1.72509765625, -1.508544921875, -1.2919921875, -1.075439453125, -0.85888671875, -0.642333984375, -0.42578125, -0.209228515625, 0.00732421875, 0.223876953125, 0.4404296875, 0.656982421875, 0.87353515625, 1.090087890625, 1.306640625, 1.523193359375, 1.73974609375, 1.956298828125, 2.1728515625, 2.389404296875, 2.60595703125, 2.822509765625, 3.0390625, 3.255615234375, 3.47216796875, 3.688720703125, 3.9052734375, 4.121826171875, 4.33837890625, 4.554931640625, 4.771484375, 4.988037109375, 5.20458984375, 5.421142578125, 5.6376953125, 5.854248046875, 6.07080078125, 6.287353515625, 6.50390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 6.0, 14.0, 14.0, 18.0, 27.0, 55.0, 70.0, 94.0, 158.0, 260.0, 454.0, 868.0, 2179.0, 6189.0, 23650.0, 108780.0, 420036.0, 367884.0, 88981.0, 19578.0, 5364.0, 1926.0, 832.0, 415.0, 236.0, 153.0, 93.0, 53.0, 40.0, 28.0, 23.0, 12.0, 8.0, 14.0, 3.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.6865234375, -34.310546875, -32.9345703125, -31.55859375, -30.1826171875, -28.806640625, -27.4306640625, -26.0546875, -24.6787109375, -23.302734375, -21.9267578125, -20.55078125, -19.1748046875, -17.798828125, -16.4228515625, -15.046875, -13.6708984375, -12.294921875, -10.9189453125, -9.54296875, -8.1669921875, -6.791015625, -5.4150390625, -4.0390625, -2.6630859375, -1.287109375, 0.0888671875, 1.46484375, 2.8408203125, 4.216796875, 5.5927734375, 6.96875, 8.3447265625, 9.720703125, 11.0966796875, 12.47265625, 13.8486328125, 15.224609375, 16.6005859375, 17.9765625, 19.3525390625, 20.728515625, 22.1044921875, 23.48046875, 24.8564453125, 26.232421875, 27.6083984375, 28.984375, 30.3603515625, 31.736328125, 33.1123046875, 34.48828125, 35.8642578125, 37.240234375, 38.6162109375, 39.9921875, 41.3681640625, 42.744140625, 44.1201171875, 45.49609375, 46.8720703125, 48.248046875, 49.6240234375, 51.0]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 7.0, 11.0, 7.0, 12.0, 13.0, 15.0, 24.0, 26.0, 20.0, 31.0, 27.0, 42.0, 39.0, 36.0, 47.0, 33.0, 54.0, 56.0, 44.0, 51.0, 40.0, 50.0, 51.0, 44.0, 28.0, 29.0, 26.0, 22.0, 17.0, 9.0, 16.0, 12.0, 11.0, 5.0, 11.0, 7.0, 8.0, 10.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.8125, -39.46435546875, -38.1162109375, -36.76806640625, -35.419921875, -34.07177734375, -32.7236328125, -31.37548828125, -30.02734375, -28.67919921875, -27.3310546875, -25.98291015625, -24.634765625, -23.28662109375, -21.9384765625, -20.59033203125, -19.2421875, -17.89404296875, -16.5458984375, -15.19775390625, -13.849609375, -12.50146484375, -11.1533203125, -9.80517578125, -8.45703125, -7.10888671875, -5.7607421875, -4.41259765625, -3.064453125, -1.71630859375, -0.3681640625, 0.97998046875, 2.328125, 3.67626953125, 5.0244140625, 6.37255859375, 7.720703125, 9.06884765625, 10.4169921875, 11.76513671875, 13.11328125, 14.46142578125, 15.8095703125, 17.15771484375, 18.505859375, 19.85400390625, 21.2021484375, 22.55029296875, 23.8984375, 25.24658203125, 26.5947265625, 27.94287109375, 29.291015625, 30.63916015625, 31.9873046875, 33.33544921875, 34.68359375, 36.03173828125, 37.3798828125, 38.72802734375, 40.076171875, 41.42431640625, 42.7724609375, 44.12060546875, 45.46875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 11.0, 6.0, 10.0, 9.0, 14.0, 15.0, 17.0, 33.0, 43.0, 38.0, 74.0, 99.0, 257.0, 483.0, 1120.0, 3443.0, 14784.0, 122010.0, 678991.0, 198182.0, 21793.0, 4493.0, 1397.0, 558.0, 247.0, 123.0, 79.0, 47.0, 34.0, 33.0, 20.0, 19.0, 18.0, 10.0, 3.0, 10.0, 8.0, 7.0, 8.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.28125, -36.234130859375, -35.18701171875, -34.139892578125, -33.0927734375, -32.045654296875, -30.99853515625, -29.951416015625, -28.904296875, -27.857177734375, -26.81005859375, -25.762939453125, -24.7158203125, -23.668701171875, -22.62158203125, -21.574462890625, -20.52734375, -19.480224609375, -18.43310546875, -17.385986328125, -16.3388671875, -15.291748046875, -14.24462890625, -13.197509765625, -12.150390625, -11.103271484375, -10.05615234375, -9.009033203125, -7.9619140625, -6.914794921875, -5.86767578125, -4.820556640625, -3.7734375, -2.726318359375, -1.67919921875, -0.632080078125, 0.4150390625, 1.462158203125, 2.50927734375, 3.556396484375, 4.603515625, 5.650634765625, 6.69775390625, 7.744873046875, 8.7919921875, 9.839111328125, 10.88623046875, 11.933349609375, 12.98046875, 14.027587890625, 15.07470703125, 16.121826171875, 17.1689453125, 18.216064453125, 19.26318359375, 20.310302734375, 21.357421875, 22.404541015625, 23.45166015625, 24.498779296875, 25.5458984375, 26.593017578125, 27.64013671875, 28.687255859375, 29.734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 11.0, 13.0, 18.0, 25.0, 44.0, 47.0, 77.0, 102.0, 136.0, 110.0, 126.0, 96.0, 62.0, 38.0, 33.0, 16.0, 23.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0048675537109375, -0.004666566848754883, -0.004465579986572266, -0.0042645931243896484, -0.004063606262207031, -0.003862619400024414, -0.003661632537841797, -0.0034606456756591797, -0.0032596588134765625, -0.0030586719512939453, -0.002857685089111328, -0.002656698226928711, -0.0024557113647460938, -0.0022547245025634766, -0.0020537376403808594, -0.0018527507781982422, -0.001651763916015625, -0.0014507770538330078, -0.0012497901916503906, -0.0010488033294677734, -0.0008478164672851562, -0.0006468296051025391, -0.0004458427429199219, -0.0002448558807373047, -4.38690185546875e-05, 0.0001571178436279297, 0.0003581047058105469, 0.0005590915679931641, 0.0007600784301757812, 0.0009610652923583984, 0.0011620521545410156, 0.0013630390167236328, 0.00156402587890625, 0.0017650127410888672, 0.0019659996032714844, 0.0021669864654541016, 0.0023679733276367188, 0.002568960189819336, 0.002769947052001953, 0.0029709339141845703, 0.0031719207763671875, 0.0033729076385498047, 0.003573894500732422, 0.003774881362915039, 0.003975868225097656, 0.0041768550872802734, 0.004377841949462891, 0.004578828811645508, 0.004779815673828125, 0.004980802536010742, 0.005181789398193359, 0.0053827762603759766, 0.005583763122558594, 0.005784749984741211, 0.005985736846923828, 0.006186723709106445, 0.0063877105712890625, 0.00658869743347168, 0.006789684295654297, 0.006990671157836914, 0.007191658020019531, 0.0073926448822021484, 0.007593631744384766, 0.007794618606567383, 0.00799560546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 14.0, 31.0, 28.0, 51.0, 83.0, 166.0, 326.0, 812.0, 2104.0, 7714.0, 46149.0, 425555.0, 496463.0, 56377.0, 8781.0, 2242.0, 855.0, 358.0, 184.0, 107.0, 54.0, 43.0, 24.0, 13.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.670166015625, -35.65283203125, -34.635498046875, -33.6181640625, -32.600830078125, -31.58349609375, -30.566162109375, -29.548828125, -28.531494140625, -27.51416015625, -26.496826171875, -25.4794921875, -24.462158203125, -23.44482421875, -22.427490234375, -21.41015625, -20.392822265625, -19.37548828125, -18.358154296875, -17.3408203125, -16.323486328125, -15.30615234375, -14.288818359375, -13.271484375, -12.254150390625, -11.23681640625, -10.219482421875, -9.2021484375, -8.184814453125, -7.16748046875, -6.150146484375, -5.1328125, -4.115478515625, -3.09814453125, -2.080810546875, -1.0634765625, -0.046142578125, 0.97119140625, 1.988525390625, 3.005859375, 4.023193359375, 5.04052734375, 6.057861328125, 7.0751953125, 8.092529296875, 9.10986328125, 10.127197265625, 11.14453125, 12.161865234375, 13.17919921875, 14.196533203125, 15.2138671875, 16.231201171875, 17.24853515625, 18.265869140625, 19.283203125, 20.300537109375, 21.31787109375, 22.335205078125, 23.3525390625, 24.369873046875, 25.38720703125, 26.404541015625, 27.421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 12.0, 20.0, 36.0, 40.0, 51.0, 71.0, 96.0, 129.0, 129.0, 99.0, 85.0, 79.0, 31.0, 34.0, 24.0, 17.0, 12.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.808837890625, -32.89892578125, -31.989013671875, -31.0791015625, -30.169189453125, -29.25927734375, -28.349365234375, -27.439453125, -26.529541015625, -25.61962890625, -24.709716796875, -23.7998046875, -22.889892578125, -21.97998046875, -21.070068359375, -20.16015625, -19.250244140625, -18.34033203125, -17.430419921875, -16.5205078125, -15.610595703125, -14.70068359375, -13.790771484375, -12.880859375, -11.970947265625, -11.06103515625, -10.151123046875, -9.2412109375, -8.331298828125, -7.42138671875, -6.511474609375, -5.6015625, -4.691650390625, -3.78173828125, -2.871826171875, -1.9619140625, -1.052001953125, -0.14208984375, 0.767822265625, 1.677734375, 2.587646484375, 3.49755859375, 4.407470703125, 5.3173828125, 6.227294921875, 7.13720703125, 8.047119140625, 8.95703125, 9.866943359375, 10.77685546875, 11.686767578125, 12.5966796875, 13.506591796875, 14.41650390625, 15.326416015625, 16.236328125, 17.146240234375, 18.05615234375, 18.966064453125, 19.8759765625, 20.785888671875, 21.69580078125, 22.605712890625, 23.515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 8.0, 19.0, 60.0, 163.0, 284.0, 243.0, 152.0, 46.0, 26.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5849609375, -113.4738540649414, -90.36274719238281, -67.25163269042969, -44.140525817871094, -21.0294189453125, 2.081695556640625, 25.192794799804688, 48.30390930175781, 71.4150161743164, 94.526123046875, 117.63723754882812, 140.74835205078125, 163.8594512939453, 186.97056579589844, 210.0816650390625, 233.19277954101562, 256.30389404296875, 279.4150085449219, 302.526123046875, 325.63720703125, 348.7483215332031, 371.85943603515625, 394.97052001953125, 418.0816650390625, 441.1927795410156, 464.30389404296875, 487.41497802734375, 510.5260925292969, 533.63720703125, 556.748291015625, 579.8594360351562, 602.9705200195312, 626.0816040039062, 649.1927490234375, 672.3038330078125, 695.4149780273438, 718.5260620117188, 741.63720703125, 764.748291015625, 787.859375, 810.970458984375, 834.0816040039062, 857.1926879882812, 880.3038330078125, 903.4149169921875, 926.5260009765625, 949.6371459960938, 972.748291015625, 995.859375, 1018.9705200195312, 1042.0816650390625, 1065.1927490234375, 1088.3038330078125, 1111.4149169921875, 1134.5260009765625, 1157.6370849609375, 1180.7481689453125, 1203.8592529296875, 1226.970458984375, 1250.08154296875, 1273.192626953125, 1296.3037109375, 1319.414794921875, 1342.5260009765625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 6.0, 9.0, 6.0, 14.0, 13.0, 14.0, 18.0, 18.0, 40.0, 34.0, 37.0, 33.0, 52.0, 39.0, 59.0, 45.0, 51.0, 39.0, 44.0, 32.0, 53.0, 33.0, 47.0, 40.0, 38.0, 37.0, 21.0, 19.0, 20.0, 15.0, 12.0, 10.0, 15.0, 7.0, 8.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.56011962890625, -215.1356658935547, -207.71121215820312, -200.28675842285156, -192.8623046875, -185.43783569335938, -178.01339721679688, -170.58892822265625, -163.1644744873047, -155.74002075195312, -148.31556701660156, -140.89111328125, -133.46665954589844, -126.04219818115234, -118.61774444580078, -111.19328308105469, -103.76883697509766, -96.3443832397461, -88.91992950439453, -81.49546813964844, -74.07101440429688, -66.64656066894531, -59.22210693359375, -51.79764938354492, -44.37319564819336, -36.9487419128418, -29.52428436279297, -22.099830627441406, -14.675374984741211, -7.250919342041016, 0.17353439331054688, 7.597991943359375, 15.022445678710938, 22.446901321411133, 29.871356964111328, 37.29581069946289, 44.72026824951172, 52.14472198486328, 59.569175720214844, 66.99363708496094, 74.4180908203125, 81.84254455566406, 89.26699829101562, 96.69145202636719, 104.11591339111328, 111.54036712646484, 118.9648208618164, 126.3892822265625, 133.813720703125, 141.23817443847656, 148.66262817382812, 156.0870819091797, 163.51153564453125, 170.93600463867188, 178.36044311523438, 185.784912109375, 193.20936584472656, 200.63381958007812, 208.0582733154297, 215.48272705078125, 222.9071807861328, 230.33163452148438, 237.756103515625, 245.18055725097656, 252.60501098632812]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 8.0, 14.0, 19.0, 34.0, 33.0, 65.0, 88.0, 127.0, 217.0, 349.0, 714.0, 1310.0, 2532.0, 5962.0, 17358.0, 105010.0, 3996259.0, 44262.0, 11269.0, 4393.0, 1946.0, 952.0, 527.0, 277.0, 188.0, 85.0, 72.0, 58.0, 38.0, 20.0, 7.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-53.3125, -51.7587890625, -50.205078125, -48.6513671875, -47.09765625, -45.5439453125, -43.990234375, -42.4365234375, -40.8828125, -39.3291015625, -37.775390625, -36.2216796875, -34.66796875, -33.1142578125, -31.560546875, -30.0068359375, -28.453125, -26.8994140625, -25.345703125, -23.7919921875, -22.23828125, -20.6845703125, -19.130859375, -17.5771484375, -16.0234375, -14.4697265625, -12.916015625, -11.3623046875, -9.80859375, -8.2548828125, -6.701171875, -5.1474609375, -3.59375, -2.0400390625, -0.486328125, 1.0673828125, 2.62109375, 4.1748046875, 5.728515625, 7.2822265625, 8.8359375, 10.3896484375, 11.943359375, 13.4970703125, 15.05078125, 16.6044921875, 18.158203125, 19.7119140625, 21.265625, 22.8193359375, 24.373046875, 25.9267578125, 27.48046875, 29.0341796875, 30.587890625, 32.1416015625, 33.6953125, 35.2490234375, 36.802734375, 38.3564453125, 39.91015625, 41.4638671875, 43.017578125, 44.5712890625, 46.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 12.0, 10.0, 14.0, 12.0, 19.0, 20.0, 30.0, 35.0, 40.0, 45.0, 53.0, 45.0, 43.0, 54.0, 48.0, 70.0, 53.0, 62.0, 48.0, 50.0, 38.0, 33.0, 35.0, 28.0, 29.0, 21.0, 11.0, 9.0, 6.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.5546875, -11.232177734375, -10.90966796875, -10.587158203125, -10.2646484375, -9.942138671875, -9.61962890625, -9.297119140625, -8.974609375, -8.652099609375, -8.32958984375, -8.007080078125, -7.6845703125, -7.362060546875, -7.03955078125, -6.717041015625, -6.39453125, -6.072021484375, -5.74951171875, -5.427001953125, -5.1044921875, -4.781982421875, -4.45947265625, -4.136962890625, -3.814453125, -3.491943359375, -3.16943359375, -2.846923828125, -2.5244140625, -2.201904296875, -1.87939453125, -1.556884765625, -1.234375, -0.911865234375, -0.58935546875, -0.266845703125, 0.0556640625, 0.378173828125, 0.70068359375, 1.023193359375, 1.345703125, 1.668212890625, 1.99072265625, 2.313232421875, 2.6357421875, 2.958251953125, 3.28076171875, 3.603271484375, 3.92578125, 4.248291015625, 4.57080078125, 4.893310546875, 5.2158203125, 5.538330078125, 5.86083984375, 6.183349609375, 6.505859375, 6.828369140625, 7.15087890625, 7.473388671875, 7.7958984375, 8.118408203125, 8.44091796875, 8.763427734375, 9.0859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 15.0, 26.0, 40.0, 45.0, 83.0, 93.0, 154.0, 202.0, 336.0, 487.0, 710.0, 1192.0, 2017.0, 3941.0, 9032.0, 31728.0, 3570056.0, 529627.0, 27318.0, 8241.0, 3641.0, 1993.0, 1126.0, 721.0, 456.0, 293.0, 199.0, 135.0, 99.0, 84.0, 55.0, 37.0, 25.0, 17.0, 12.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-65.5625, -63.7392578125, -61.916015625, -60.0927734375, -58.26953125, -56.4462890625, -54.623046875, -52.7998046875, -50.9765625, -49.1533203125, -47.330078125, -45.5068359375, -43.68359375, -41.8603515625, -40.037109375, -38.2138671875, -36.390625, -34.5673828125, -32.744140625, -30.9208984375, -29.09765625, -27.2744140625, -25.451171875, -23.6279296875, -21.8046875, -19.9814453125, -18.158203125, -16.3349609375, -14.51171875, -12.6884765625, -10.865234375, -9.0419921875, -7.21875, -5.3955078125, -3.572265625, -1.7490234375, 0.07421875, 1.8974609375, 3.720703125, 5.5439453125, 7.3671875, 9.1904296875, 11.013671875, 12.8369140625, 14.66015625, 16.4833984375, 18.306640625, 20.1298828125, 21.953125, 23.7763671875, 25.599609375, 27.4228515625, 29.24609375, 31.0693359375, 32.892578125, 34.7158203125, 36.5390625, 38.3623046875, 40.185546875, 42.0087890625, 43.83203125, 45.6552734375, 47.478515625, 49.3017578125, 51.125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 8.0, 11.0, 19.0, 48.0, 58.0, 187.0, 3240.0, 303.0, 76.0, 46.0, 16.0, 7.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9609375, -10.5921630859375, -10.223388671875, -9.8546142578125, -9.48583984375, -9.1170654296875, -8.748291015625, -8.3795166015625, -8.0107421875, -7.6419677734375, -7.273193359375, -6.9044189453125, -6.53564453125, -6.1668701171875, -5.798095703125, -5.4293212890625, -5.060546875, -4.6917724609375, -4.322998046875, -3.9542236328125, -3.58544921875, -3.2166748046875, -2.847900390625, -2.4791259765625, -2.1103515625, -1.7415771484375, -1.372802734375, -1.0040283203125, -0.63525390625, -0.2664794921875, 0.102294921875, 0.4710693359375, 0.83984375, 1.2086181640625, 1.577392578125, 1.9461669921875, 2.31494140625, 2.6837158203125, 3.052490234375, 3.4212646484375, 3.7900390625, 4.1588134765625, 4.527587890625, 4.8963623046875, 5.26513671875, 5.6339111328125, 6.002685546875, 6.3714599609375, 6.740234375, 7.1090087890625, 7.477783203125, 7.8465576171875, 8.21533203125, 8.5841064453125, 8.952880859375, 9.3216552734375, 9.6904296875, 10.0592041015625, 10.427978515625, 10.7967529296875, 11.16552734375, 11.5343017578125, 11.903076171875, 12.2718505859375, 12.640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 12.0, 26.0, 30.0, 51.0, 87.0, 88.0, 117.0, 140.0, 139.0, 99.0, 75.0, 44.0, 37.0, 19.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.23152160644531, -55.60279083251953, -53.974056243896484, -52.3453254699707, -50.716590881347656, -49.087860107421875, -47.459129333496094, -45.83039855957031, -44.201663970947266, -42.572933197021484, -40.94419860839844, -39.315467834472656, -37.686737060546875, -36.05800247192383, -34.42927169799805, -32.800537109375, -31.17180633544922, -29.543073654174805, -27.91434097290039, -26.28561019897461, -24.656877517700195, -23.02814483642578, -21.3994140625, -19.770681381225586, -18.141948699951172, -16.513216018676758, -14.88448429107666, -13.255752563476562, -11.627019882202148, -9.998287200927734, -8.369555473327637, -6.740823745727539, -5.112087249755859, -3.4833550453186035, -1.8546228408813477, -0.2258906364440918, 1.402841567993164, 3.031574249267578, 4.660305976867676, 6.289037704467773, 7.9177703857421875, 9.546503067016602, 11.1752347946167, 12.803966522216797, 14.432699203491211, 16.061431884765625, 17.690162658691406, 19.31889533996582, 20.947628021240234, 22.57636070251465, 24.205093383789062, 25.833824157714844, 27.462556838989258, 29.091289520263672, 30.720020294189453, 32.3487548828125, 33.97748565673828, 35.60621643066406, 37.23495101928711, 38.86368179321289, 40.49241638183594, 42.12114715576172, 43.7498779296875, 45.37860870361328, 47.00734329223633]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 9.0, 9.0, 13.0, 20.0, 9.0, 24.0, 22.0, 29.0, 28.0, 39.0, 35.0, 39.0, 37.0, 40.0, 38.0, 38.0, 40.0, 38.0, 44.0, 40.0, 37.0, 31.0, 25.0, 34.0, 37.0, 30.0, 30.0, 25.0, 20.0, 17.0, 19.0, 14.0, 15.0, 8.0, 10.0, 8.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.760135650634766, -17.093189239501953, -16.426244735717773, -15.759298324584961, -15.092351913452148, -14.425406455993652, -13.758460998535156, -13.091514587402344, -12.424568176269531, -11.757622718811035, -11.090676307678223, -10.423730850219727, -9.756784439086914, -9.089838981628418, -8.422893524169922, -7.755947113037109, -7.089001655578613, -6.422055721282959, -5.755109786987305, -5.088164329528809, -4.421217918395996, -3.754272222518921, -3.0873265266418457, -2.4203805923461914, -1.753434658050537, -1.0864887237548828, -0.41954290866851807, 0.24740290641784668, 0.914348840713501, 1.5812947750091553, 2.2482404708862305, 2.9151864051818848, 3.582132339477539, 4.249078273773193, 4.916024208068848, 5.582969665527344, 6.249916076660156, 6.916861534118652, 7.583807468414307, 8.250753402709961, 8.917699813842773, 9.58464527130127, 10.251591682434082, 10.918537139892578, 11.58548355102539, 12.252429008483887, 12.919374465942383, 13.586320877075195, 14.253266334533691, 14.920211791992188, 15.587158203125, 16.254104614257812, 16.921049118041992, 17.587995529174805, 18.254941940307617, 18.921886444091797, 19.58883285522461, 20.255779266357422, 20.9227237701416, 21.589670181274414, 22.256616592407227, 22.92356300354004, 23.59050750732422, 24.25745391845703, 24.924400329589844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 3.0, 7.0, 6.0, 6.0, 11.0, 15.0, 24.0, 37.0, 55.0, 96.0, 142.0, 294.0, 434.0, 733.0, 1357.0, 2429.0, 4463.0, 8506.0, 16945.0, 33613.0, 65998.0, 126819.0, 215370.0, 238573.0, 159333.0, 84604.0, 43082.0, 21886.0, 11042.0, 5780.0, 2983.0, 1646.0, 928.0, 524.0, 311.0, 185.0, 106.0, 64.0, 47.0, 27.0, 27.0, 13.0, 5.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.1875, -20.549072265625, -19.91064453125, -19.272216796875, -18.6337890625, -17.995361328125, -17.35693359375, -16.718505859375, -16.080078125, -15.441650390625, -14.80322265625, -14.164794921875, -13.5263671875, -12.887939453125, -12.24951171875, -11.611083984375, -10.97265625, -10.334228515625, -9.69580078125, -9.057373046875, -8.4189453125, -7.780517578125, -7.14208984375, -6.503662109375, -5.865234375, -5.226806640625, -4.58837890625, -3.949951171875, -3.3115234375, -2.673095703125, -2.03466796875, -1.396240234375, -0.7578125, -0.119384765625, 0.51904296875, 1.157470703125, 1.7958984375, 2.434326171875, 3.07275390625, 3.711181640625, 4.349609375, 4.988037109375, 5.62646484375, 6.264892578125, 6.9033203125, 7.541748046875, 8.18017578125, 8.818603515625, 9.45703125, 10.095458984375, 10.73388671875, 11.372314453125, 12.0107421875, 12.649169921875, 13.28759765625, 13.926025390625, 14.564453125, 15.202880859375, 15.84130859375, 16.479736328125, 17.1181640625, 17.756591796875, 18.39501953125, 19.033447265625, 19.671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 11.0, 10.0, 20.0, 17.0, 15.0, 26.0, 23.0, 42.0, 40.0, 35.0, 33.0, 47.0, 55.0, 60.0, 66.0, 75.0, 55.0, 53.0, 43.0, 39.0, 35.0, 23.0, 32.0, 30.0, 22.0, 17.0, 18.0, 8.0, 14.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.9765625, -10.6494140625, -10.322265625, -9.9951171875, -9.66796875, -9.3408203125, -9.013671875, -8.6865234375, -8.359375, -8.0322265625, -7.705078125, -7.3779296875, -7.05078125, -6.7236328125, -6.396484375, -6.0693359375, -5.7421875, -5.4150390625, -5.087890625, -4.7607421875, -4.43359375, -4.1064453125, -3.779296875, -3.4521484375, -3.125, -2.7978515625, -2.470703125, -2.1435546875, -1.81640625, -1.4892578125, -1.162109375, -0.8349609375, -0.5078125, -0.1806640625, 0.146484375, 0.4736328125, 0.80078125, 1.1279296875, 1.455078125, 1.7822265625, 2.109375, 2.4365234375, 2.763671875, 3.0908203125, 3.41796875, 3.7451171875, 4.072265625, 4.3994140625, 4.7265625, 5.0537109375, 5.380859375, 5.7080078125, 6.03515625, 6.3623046875, 6.689453125, 7.0166015625, 7.34375, 7.6708984375, 7.998046875, 8.3251953125, 8.65234375, 8.9794921875, 9.306640625, 9.6337890625, 9.9609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 12.0, 24.0, 17.0, 30.0, 41.0, 78.0, 94.0, 161.0, 243.0, 431.0, 986.0, 2761.0, 9771.0, 48528.0, 292871.0, 551306.0, 113073.0, 20141.0, 4776.0, 1630.0, 654.0, 312.0, 179.0, 123.0, 80.0, 47.0, 40.0, 38.0, 16.0, 16.0, 12.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.15625, -49.46435546875, -47.7724609375, -46.08056640625, -44.388671875, -42.69677734375, -41.0048828125, -39.31298828125, -37.62109375, -35.92919921875, -34.2373046875, -32.54541015625, -30.853515625, -29.16162109375, -27.4697265625, -25.77783203125, -24.0859375, -22.39404296875, -20.7021484375, -19.01025390625, -17.318359375, -15.62646484375, -13.9345703125, -12.24267578125, -10.55078125, -8.85888671875, -7.1669921875, -5.47509765625, -3.783203125, -2.09130859375, -0.3994140625, 1.29248046875, 2.984375, 4.67626953125, 6.3681640625, 8.06005859375, 9.751953125, 11.44384765625, 13.1357421875, 14.82763671875, 16.51953125, 18.21142578125, 19.9033203125, 21.59521484375, 23.287109375, 24.97900390625, 26.6708984375, 28.36279296875, 30.0546875, 31.74658203125, 33.4384765625, 35.13037109375, 36.822265625, 38.51416015625, 40.2060546875, 41.89794921875, 43.58984375, 45.28173828125, 46.9736328125, 48.66552734375, 50.357421875, 52.04931640625, 53.7412109375, 55.43310546875, 57.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 6.0, 10.0, 8.0, 8.0, 11.0, 10.0, 14.0, 25.0, 23.0, 23.0, 32.0, 23.0, 55.0, 50.0, 51.0, 55.0, 56.0, 48.0, 66.0, 64.0, 48.0, 56.0, 38.0, 38.0, 33.0, 27.0, 27.0, 21.0, 18.0, 13.0, 11.0, 7.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-71.0, -69.0048828125, -67.009765625, -65.0146484375, -63.01953125, -61.0244140625, -59.029296875, -57.0341796875, -55.0390625, -53.0439453125, -51.048828125, -49.0537109375, -47.05859375, -45.0634765625, -43.068359375, -41.0732421875, -39.078125, -37.0830078125, -35.087890625, -33.0927734375, -31.09765625, -29.1025390625, -27.107421875, -25.1123046875, -23.1171875, -21.1220703125, -19.126953125, -17.1318359375, -15.13671875, -13.1416015625, -11.146484375, -9.1513671875, -7.15625, -5.1611328125, -3.166015625, -1.1708984375, 0.82421875, 2.8193359375, 4.814453125, 6.8095703125, 8.8046875, 10.7998046875, 12.794921875, 14.7900390625, 16.78515625, 18.7802734375, 20.775390625, 22.7705078125, 24.765625, 26.7607421875, 28.755859375, 30.7509765625, 32.74609375, 34.7412109375, 36.736328125, 38.7314453125, 40.7265625, 42.7216796875, 44.716796875, 46.7119140625, 48.70703125, 50.7021484375, 52.697265625, 54.6923828125, 56.6875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 9.0, 19.0, 33.0, 52.0, 71.0, 122.0, 190.0, 307.0, 633.0, 1244.0, 2714.0, 6338.0, 18297.0, 64703.0, 253734.0, 468371.0, 167032.0, 42876.0, 12731.0, 4713.0, 2070.0, 936.0, 577.0, 281.0, 179.0, 107.0, 62.0, 34.0, 24.0, 14.0, 16.0, 12.0, 6.0, 6.0, 2.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.8125, -17.2938232421875, -16.775146484375, -16.2564697265625, -15.73779296875, -15.2191162109375, -14.700439453125, -14.1817626953125, -13.6630859375, -13.1444091796875, -12.625732421875, -12.1070556640625, -11.58837890625, -11.0697021484375, -10.551025390625, -10.0323486328125, -9.513671875, -8.9949951171875, -8.476318359375, -7.9576416015625, -7.43896484375, -6.9202880859375, -6.401611328125, -5.8829345703125, -5.3642578125, -4.8455810546875, -4.326904296875, -3.8082275390625, -3.28955078125, -2.7708740234375, -2.252197265625, -1.7335205078125, -1.21484375, -0.6961669921875, -0.177490234375, 0.3411865234375, 0.85986328125, 1.3785400390625, 1.897216796875, 2.4158935546875, 2.9345703125, 3.4532470703125, 3.971923828125, 4.4906005859375, 5.00927734375, 5.5279541015625, 6.046630859375, 6.5653076171875, 7.083984375, 7.6026611328125, 8.121337890625, 8.6400146484375, 9.15869140625, 9.6773681640625, 10.196044921875, 10.7147216796875, 11.2333984375, 11.7520751953125, 12.270751953125, 12.7894287109375, 13.30810546875, 13.8267822265625, 14.345458984375, 14.8641357421875, 15.3828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 9.0, 4.0, 8.0, 7.0, 13.0, 17.0, 35.0, 33.0, 37.0, 43.0, 51.0, 73.0, 63.0, 72.0, 85.0, 69.0, 71.0, 61.0, 45.0, 52.0, 27.0, 24.0, 18.0, 20.0, 15.0, 11.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034122467041015625, -0.003303736448287964, -0.0031952261924743652, -0.0030867159366607666, -0.002978205680847168, -0.0028696954250335693, -0.0027611851692199707, -0.002652674913406372, -0.0025441646575927734, -0.002435654401779175, -0.002327144145965576, -0.0022186338901519775, -0.002110123634338379, -0.0020016133785247803, -0.0018931031227111816, -0.001784592866897583, -0.0016760826110839844, -0.0015675723552703857, -0.0014590620994567871, -0.0013505518436431885, -0.0012420415878295898, -0.0011335313320159912, -0.0010250210762023926, -0.0009165108203887939, -0.0008080005645751953, -0.0006994903087615967, -0.000590980052947998, -0.0004824697971343994, -0.0003739595413208008, -0.00026544928550720215, -0.00015693902969360352, -4.842877388000488e-05, 6.008148193359375e-05, 0.00016859173774719238, 0.000277101993560791, 0.00038561224937438965, 0.0004941225051879883, 0.0006026327610015869, 0.0007111430168151855, 0.0008196532726287842, 0.0009281635284423828, 0.0010366737842559814, 0.00114518404006958, 0.0012536942958831787, 0.0013622045516967773, 0.001470714807510376, 0.0015792250633239746, 0.0016877353191375732, 0.0017962455749511719, 0.0019047558307647705, 0.002013266086578369, 0.0021217763423919678, 0.0022302865982055664, 0.002338796854019165, 0.0024473071098327637, 0.0025558173656463623, 0.002664327621459961, 0.0027728378772735596, 0.002881348133087158, 0.002989858388900757, 0.0030983686447143555, 0.003206878900527954, 0.0033153891563415527, 0.0034238994121551514, 0.00353240966796875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 18.0, 6.0, 16.0, 21.0, 33.0, 72.0, 82.0, 172.0, 242.0, 418.0, 807.0, 1747.0, 3995.0, 11487.0, 44385.0, 199211.0, 504531.0, 213379.0, 47318.0, 12608.0, 4216.0, 1803.0, 837.0, 465.0, 259.0, 136.0, 104.0, 44.0, 35.0, 30.0, 20.0, 14.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.421875, -17.85546875, -17.2890625, -16.72265625, -16.15625, -15.58984375, -15.0234375, -14.45703125, -13.890625, -13.32421875, -12.7578125, -12.19140625, -11.625, -11.05859375, -10.4921875, -9.92578125, -9.359375, -8.79296875, -8.2265625, -7.66015625, -7.09375, -6.52734375, -5.9609375, -5.39453125, -4.828125, -4.26171875, -3.6953125, -3.12890625, -2.5625, -1.99609375, -1.4296875, -0.86328125, -0.296875, 0.26953125, 0.8359375, 1.40234375, 1.96875, 2.53515625, 3.1015625, 3.66796875, 4.234375, 4.80078125, 5.3671875, 5.93359375, 6.5, 7.06640625, 7.6328125, 8.19921875, 8.765625, 9.33203125, 9.8984375, 10.46484375, 11.03125, 11.59765625, 12.1640625, 12.73046875, 13.296875, 13.86328125, 14.4296875, 14.99609375, 15.5625, 16.12890625, 16.6953125, 17.26171875, 17.828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 11.0, 5.0, 17.0, 27.0, 21.0, 45.0, 49.0, 63.0, 47.0, 60.0, 67.0, 97.0, 77.0, 73.0, 60.0, 65.0, 52.0, 26.0, 25.0, 25.0, 27.0, 8.0, 9.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.921875, -21.310302734375, -20.69873046875, -20.087158203125, -19.4755859375, -18.864013671875, -18.25244140625, -17.640869140625, -17.029296875, -16.417724609375, -15.80615234375, -15.194580078125, -14.5830078125, -13.971435546875, -13.35986328125, -12.748291015625, -12.13671875, -11.525146484375, -10.91357421875, -10.302001953125, -9.6904296875, -9.078857421875, -8.46728515625, -7.855712890625, -7.244140625, -6.632568359375, -6.02099609375, -5.409423828125, -4.7978515625, -4.186279296875, -3.57470703125, -2.963134765625, -2.3515625, -1.739990234375, -1.12841796875, -0.516845703125, 0.0947265625, 0.706298828125, 1.31787109375, 1.929443359375, 2.541015625, 3.152587890625, 3.76416015625, 4.375732421875, 4.9873046875, 5.598876953125, 6.21044921875, 6.822021484375, 7.43359375, 8.045166015625, 8.65673828125, 9.268310546875, 9.8798828125, 10.491455078125, 11.10302734375, 11.714599609375, 12.326171875, 12.937744140625, 13.54931640625, 14.160888671875, 14.7724609375, 15.384033203125, 15.99560546875, 16.607177734375, 17.21875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 9.0, 7.0, 29.0, 45.0, 78.0, 136.0, 173.0, 173.0, 108.0, 112.0, 68.0, 35.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-622.3218994140625, -608.274169921875, -594.2264404296875, -580.1787719726562, -566.1310424804688, -552.0833129882812, -538.0355834960938, -523.9878540039062, -509.9401550292969, -495.8924255371094, -481.8447265625, -467.7969970703125, -453.7492980957031, -439.7015686035156, -425.65386962890625, -411.60614013671875, -397.55841064453125, -383.51068115234375, -369.4629821777344, -355.4152526855469, -341.3675537109375, -327.31982421875, -313.2720947265625, -299.2243957519531, -285.17669677734375, -271.12896728515625, -257.0812683105469, -243.03353881835938, -228.98582458496094, -214.9381103515625, -200.89039611816406, -186.84268188476562, -172.79495239257812, -158.7472381591797, -144.69952392578125, -130.65179443359375, -116.60408020019531, -102.55636596679688, -88.50865173339844, -74.46092987060547, -60.41321563720703, -46.36549758911133, -32.317779541015625, -18.270065307617188, -4.222347259521484, 9.825370788574219, 23.873085021972656, 37.920806884765625, 51.96852111816406, 66.0162353515625, 80.06395721435547, 94.1116714477539, 108.15939331054688, 122.20710754394531, 136.25482177734375, 150.30255126953125, 164.35025024414062, 178.39796447753906, 192.4456787109375, 206.493408203125, 220.54112243652344, 234.58883666992188, 248.6365509033203, 262.68426513671875, 276.73199462890625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 3.0, 6.0, 10.0, 13.0, 8.0, 14.0, 15.0, 19.0, 17.0, 17.0, 26.0, 26.0, 29.0, 32.0, 31.0, 41.0, 39.0, 43.0, 38.0, 46.0, 36.0, 57.0, 39.0, 45.0, 38.0, 29.0, 27.0, 32.0, 35.0, 31.0, 24.0, 17.0, 16.0, 11.0, 12.0, 12.0, 13.0, 8.0, 6.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-229.58389282226562, -222.65179443359375, -215.71969604492188, -208.78759765625, -201.85549926757812, -194.92340087890625, -187.9912872314453, -181.05918884277344, -174.12709045410156, -167.1949920654297, -160.2628936767578, -153.33079528808594, -146.398681640625, -139.46658325195312, -132.53448486328125, -125.60238647460938, -118.6702880859375, -111.73818969726562, -104.80609130859375, -97.87398529052734, -90.94188690185547, -84.0097885131836, -77.07768249511719, -70.14558410644531, -63.21348571777344, -56.28138732910156, -49.34928512573242, -42.41718292236328, -35.485084533691406, -28.55298614501953, -21.62088394165039, -14.68878173828125, -7.7566680908203125, -0.8245677947998047, 6.107532501220703, 13.039632797241211, 19.97173309326172, 26.903831481933594, 33.835933685302734, 40.768035888671875, 47.70013427734375, 54.632232666015625, 61.564334869384766, 68.4964370727539, 75.42853546142578, 82.36063385009766, 89.29273986816406, 96.22483825683594, 103.15693664550781, 110.08903503417969, 117.02113342285156, 123.95323944091797, 130.88534545898438, 137.81744384765625, 144.74954223632812, 151.681640625, 158.61373901367188, 165.54583740234375, 172.47793579101562, 179.4100341796875, 186.34213256835938, 193.27423095703125, 200.2063446044922, 207.13844299316406, 214.07054138183594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 14.0, 15.0, 23.0, 26.0, 21.0, 35.0, 31.0, 62.0, 85.0, 121.0, 157.0, 246.0, 397.0, 681.0, 1306.0, 2544.0, 5885.0, 17354.0, 95306.0, 3991038.0, 55839.0, 13191.0, 4876.0, 2149.0, 1120.0, 594.0, 378.0, 240.0, 145.0, 100.0, 90.0, 48.0, 38.0, 27.0, 25.0, 13.0, 13.0, 8.0, 6.0, 12.0, 8.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-51.21875, -49.72900390625, -48.2392578125, -46.74951171875, -45.259765625, -43.77001953125, -42.2802734375, -40.79052734375, -39.30078125, -37.81103515625, -36.3212890625, -34.83154296875, -33.341796875, -31.85205078125, -30.3623046875, -28.87255859375, -27.3828125, -25.89306640625, -24.4033203125, -22.91357421875, -21.423828125, -19.93408203125, -18.4443359375, -16.95458984375, -15.46484375, -13.97509765625, -12.4853515625, -10.99560546875, -9.505859375, -8.01611328125, -6.5263671875, -5.03662109375, -3.546875, -2.05712890625, -0.5673828125, 0.92236328125, 2.412109375, 3.90185546875, 5.3916015625, 6.88134765625, 8.37109375, 9.86083984375, 11.3505859375, 12.84033203125, 14.330078125, 15.81982421875, 17.3095703125, 18.79931640625, 20.2890625, 21.77880859375, 23.2685546875, 24.75830078125, 26.248046875, 27.73779296875, 29.2275390625, 30.71728515625, 32.20703125, 33.69677734375, 35.1865234375, 36.67626953125, 38.166015625, 39.65576171875, 41.1455078125, 42.63525390625, 44.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 13.0, 12.0, 24.0, 21.0, 20.0, 30.0, 37.0, 57.0, 49.0, 66.0, 43.0, 43.0, 53.0, 48.0, 50.0, 65.0, 45.0, 49.0, 40.0, 36.0, 30.0, 30.0, 20.0, 16.0, 20.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.9453125, -9.62451171875, -9.3037109375, -8.98291015625, -8.662109375, -8.34130859375, -8.0205078125, -7.69970703125, -7.37890625, -7.05810546875, -6.7373046875, -6.41650390625, -6.095703125, -5.77490234375, -5.4541015625, -5.13330078125, -4.8125, -4.49169921875, -4.1708984375, -3.85009765625, -3.529296875, -3.20849609375, -2.8876953125, -2.56689453125, -2.24609375, -1.92529296875, -1.6044921875, -1.28369140625, -0.962890625, -0.64208984375, -0.3212890625, -0.00048828125, 0.3203125, 0.64111328125, 0.9619140625, 1.28271484375, 1.603515625, 1.92431640625, 2.2451171875, 2.56591796875, 2.88671875, 3.20751953125, 3.5283203125, 3.84912109375, 4.169921875, 4.49072265625, 4.8115234375, 5.13232421875, 5.453125, 5.77392578125, 6.0947265625, 6.41552734375, 6.736328125, 7.05712890625, 7.3779296875, 7.69873046875, 8.01953125, 8.34033203125, 8.6611328125, 8.98193359375, 9.302734375, 9.62353515625, 9.9443359375, 10.26513671875, 10.5859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 28.0, 18.0, 28.0, 37.0, 55.0, 71.0, 96.0, 122.0, 167.0, 241.0, 314.0, 451.0, 623.0, 826.0, 1313.0, 1838.0, 2982.0, 4717.0, 8598.0, 17651.0, 45961.0, 256101.0, 3702210.0, 92798.0, 27437.0, 11897.0, 6370.0, 3718.0, 2316.0, 1547.0, 1022.0, 726.0, 516.0, 375.0, 294.0, 200.0, 139.0, 116.0, 81.0, 73.0, 32.0, 30.0, 39.0, 27.0, 10.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-30.84375, -29.85693359375, -28.8701171875, -27.88330078125, -26.896484375, -25.90966796875, -24.9228515625, -23.93603515625, -22.94921875, -21.96240234375, -20.9755859375, -19.98876953125, -19.001953125, -18.01513671875, -17.0283203125, -16.04150390625, -15.0546875, -14.06787109375, -13.0810546875, -12.09423828125, -11.107421875, -10.12060546875, -9.1337890625, -8.14697265625, -7.16015625, -6.17333984375, -5.1865234375, -4.19970703125, -3.212890625, -2.22607421875, -1.2392578125, -0.25244140625, 0.734375, 1.72119140625, 2.7080078125, 3.69482421875, 4.681640625, 5.66845703125, 6.6552734375, 7.64208984375, 8.62890625, 9.61572265625, 10.6025390625, 11.58935546875, 12.576171875, 13.56298828125, 14.5498046875, 15.53662109375, 16.5234375, 17.51025390625, 18.4970703125, 19.48388671875, 20.470703125, 21.45751953125, 22.4443359375, 23.43115234375, 24.41796875, 25.40478515625, 26.3916015625, 27.37841796875, 28.365234375, 29.35205078125, 30.3388671875, 31.32568359375, 32.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 5.0, 8.0, 3.0, 10.0, 12.0, 11.0, 22.0, 35.0, 47.0, 143.0, 402.0, 3015.0, 162.0, 60.0, 40.0, 25.0, 24.0, 11.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.138916015625, -10.77001953125, -10.401123046875, -10.0322265625, -9.663330078125, -9.29443359375, -8.925537109375, -8.556640625, -8.187744140625, -7.81884765625, -7.449951171875, -7.0810546875, -6.712158203125, -6.34326171875, -5.974365234375, -5.60546875, -5.236572265625, -4.86767578125, -4.498779296875, -4.1298828125, -3.760986328125, -3.39208984375, -3.023193359375, -2.654296875, -2.285400390625, -1.91650390625, -1.547607421875, -1.1787109375, -0.809814453125, -0.44091796875, -0.072021484375, 0.296875, 0.665771484375, 1.03466796875, 1.403564453125, 1.7724609375, 2.141357421875, 2.51025390625, 2.879150390625, 3.248046875, 3.616943359375, 3.98583984375, 4.354736328125, 4.7236328125, 5.092529296875, 5.46142578125, 5.830322265625, 6.19921875, 6.568115234375, 6.93701171875, 7.305908203125, 7.6748046875, 8.043701171875, 8.41259765625, 8.781494140625, 9.150390625, 9.519287109375, 9.88818359375, 10.257080078125, 10.6259765625, 10.994873046875, 11.36376953125, 11.732666015625, 12.1015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 6.0, 11.0, 19.0, 29.0, 43.0, 62.0, 72.0, 107.0, 110.0, 117.0, 118.0, 95.0, 63.0, 49.0, 32.0, 9.0, 23.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.309356689453125, -34.74346923828125, -33.177581787109375, -31.611692428588867, -30.045804977416992, -28.479915618896484, -26.91402816772461, -25.348140716552734, -23.78225326538086, -22.216365814208984, -20.650476455688477, -19.0845890045166, -17.518701553344727, -15.952813148498535, -14.386924743652344, -12.821037292480469, -11.255147933959961, -9.68925952911377, -8.123372077941895, -6.557483673095703, -4.99159574508667, -3.4257078170776367, -1.8598194122314453, -0.2939319610595703, 1.271956443786621, 2.8378443717956543, 4.4037322998046875, 5.969620704650879, 7.535508632659912, 9.101396560668945, 10.667284965515137, 12.233172416687012, 13.799060821533203, 15.364949226379395, 16.930837631225586, 18.49672508239746, 20.062612533569336, 21.628501892089844, 23.19438934326172, 24.760276794433594, 26.32616424560547, 27.892051696777344, 29.45794105529785, 31.023828506469727, 32.589717864990234, 34.15560531616211, 35.721492767333984, 37.28738021850586, 38.853271484375, 40.419158935546875, 41.98504638671875, 43.550933837890625, 45.116825103759766, 46.68271255493164, 48.248600006103516, 49.81448745727539, 51.380374908447266, 52.94626235961914, 54.512149810791016, 56.078041076660156, 57.64392852783203, 59.209815979003906, 60.77570343017578, 62.341590881347656, 63.90747833251953]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 7.0, 12.0, 11.0, 14.0, 12.0, 21.0, 19.0, 17.0, 27.0, 32.0, 34.0, 34.0, 44.0, 44.0, 32.0, 27.0, 44.0, 35.0, 49.0, 41.0, 48.0, 35.0, 39.0, 28.0, 39.0, 30.0, 30.0, 29.0, 18.0, 19.0, 20.0, 8.0, 13.0, 8.0, 11.0, 11.0, 5.0, 5.0, 4.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.32943344116211, -23.56981086730957, -22.81018829345703, -22.050565719604492, -21.290943145751953, -20.531320571899414, -19.771697998046875, -19.012075424194336, -18.252452850341797, -17.492830276489258, -16.73320770263672, -15.97358512878418, -15.21396255493164, -14.454339981079102, -13.694717407226562, -12.935094833374023, -12.175472259521484, -11.415849685668945, -10.656227111816406, -9.896604537963867, -9.136981964111328, -8.377359390258789, -7.61773681640625, -6.858114242553711, -6.098491668701172, -5.338869094848633, -4.579246520996094, -3.8196239471435547, -3.0600013732910156, -2.3003787994384766, -1.5407562255859375, -0.7811336517333984, -0.021511077880859375, 0.7381114959716797, 1.4977340698242188, 2.257356643676758, 3.016979217529297, 3.776601791381836, 4.536224365234375, 5.295846939086914, 6.055469512939453, 6.815092086791992, 7.574714660644531, 8.33433723449707, 9.09395980834961, 9.853582382202148, 10.613204956054688, 11.372827529907227, 12.132450103759766, 12.892072677612305, 13.651695251464844, 14.411317825317383, 15.170940399169922, 15.930562973022461, 16.690185546875, 17.44980812072754, 18.209430694580078, 18.969053268432617, 19.728675842285156, 20.488298416137695, 21.247920989990234, 22.007543563842773, 22.767166137695312, 23.52678871154785, 24.28641128540039]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 6.0, 12.0, 12.0, 14.0, 29.0, 47.0, 68.0, 122.0, 232.0, 317.0, 557.0, 945.0, 1656.0, 3059.0, 5459.0, 10270.0, 19096.0, 35877.0, 67991.0, 124539.0, 199140.0, 223959.0, 160088.0, 90668.0, 48488.0, 25755.0, 13597.0, 7350.0, 3949.0, 2257.0, 1230.0, 684.0, 434.0, 243.0, 144.0, 77.0, 64.0, 42.0, 25.0, 18.0, 13.0, 8.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.63916015625, -16.1064453125, -15.57373046875, -15.041015625, -14.50830078125, -13.9755859375, -13.44287109375, -12.91015625, -12.37744140625, -11.8447265625, -11.31201171875, -10.779296875, -10.24658203125, -9.7138671875, -9.18115234375, -8.6484375, -8.11572265625, -7.5830078125, -7.05029296875, -6.517578125, -5.98486328125, -5.4521484375, -4.91943359375, -4.38671875, -3.85400390625, -3.3212890625, -2.78857421875, -2.255859375, -1.72314453125, -1.1904296875, -0.65771484375, -0.125, 0.40771484375, 0.9404296875, 1.47314453125, 2.005859375, 2.53857421875, 3.0712890625, 3.60400390625, 4.13671875, 4.66943359375, 5.2021484375, 5.73486328125, 6.267578125, 6.80029296875, 7.3330078125, 7.86572265625, 8.3984375, 8.93115234375, 9.4638671875, 9.99658203125, 10.529296875, 11.06201171875, 11.5947265625, 12.12744140625, 12.66015625, 13.19287109375, 13.7255859375, 14.25830078125, 14.791015625, 15.32373046875, 15.8564453125, 16.38916015625, 16.921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 15.0, 10.0, 14.0, 14.0, 16.0, 25.0, 25.0, 23.0, 36.0, 31.0, 38.0, 44.0, 52.0, 41.0, 40.0, 56.0, 47.0, 42.0, 49.0, 46.0, 40.0, 25.0, 34.0, 35.0, 24.0, 27.0, 20.0, 20.0, 9.0, 11.0, 12.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0, -8.714599609375, -8.42919921875, -8.143798828125, -7.8583984375, -7.572998046875, -7.28759765625, -7.002197265625, -6.716796875, -6.431396484375, -6.14599609375, -5.860595703125, -5.5751953125, -5.289794921875, -5.00439453125, -4.718994140625, -4.43359375, -4.148193359375, -3.86279296875, -3.577392578125, -3.2919921875, -3.006591796875, -2.72119140625, -2.435791015625, -2.150390625, -1.864990234375, -1.57958984375, -1.294189453125, -1.0087890625, -0.723388671875, -0.43798828125, -0.152587890625, 0.1328125, 0.418212890625, 0.70361328125, 0.989013671875, 1.2744140625, 1.559814453125, 1.84521484375, 2.130615234375, 2.416015625, 2.701416015625, 2.98681640625, 3.272216796875, 3.5576171875, 3.843017578125, 4.12841796875, 4.413818359375, 4.69921875, 4.984619140625, 5.27001953125, 5.555419921875, 5.8408203125, 6.126220703125, 6.41162109375, 6.697021484375, 6.982421875, 7.267822265625, 7.55322265625, 7.838623046875, 8.1240234375, 8.409423828125, 8.69482421875, 8.980224609375, 9.265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 8.0, 9.0, 20.0, 22.0, 41.0, 62.0, 82.0, 159.0, 323.0, 764.0, 2208.0, 10501.0, 105367.0, 748967.0, 161335.0, 14342.0, 2622.0, 869.0, 382.0, 185.0, 85.0, 56.0, 45.0, 27.0, 18.0, 13.0, 8.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.4375, -70.2802734375, -68.123046875, -65.9658203125, -63.80859375, -61.6513671875, -59.494140625, -57.3369140625, -55.1796875, -53.0224609375, -50.865234375, -48.7080078125, -46.55078125, -44.3935546875, -42.236328125, -40.0791015625, -37.921875, -35.7646484375, -33.607421875, -31.4501953125, -29.29296875, -27.1357421875, -24.978515625, -22.8212890625, -20.6640625, -18.5068359375, -16.349609375, -14.1923828125, -12.03515625, -9.8779296875, -7.720703125, -5.5634765625, -3.40625, -1.2490234375, 0.908203125, 3.0654296875, 5.22265625, 7.3798828125, 9.537109375, 11.6943359375, 13.8515625, 16.0087890625, 18.166015625, 20.3232421875, 22.48046875, 24.6376953125, 26.794921875, 28.9521484375, 31.109375, 33.2666015625, 35.423828125, 37.5810546875, 39.73828125, 41.8955078125, 44.052734375, 46.2099609375, 48.3671875, 50.5244140625, 52.681640625, 54.8388671875, 56.99609375, 59.1533203125, 61.310546875, 63.4677734375, 65.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 9.0, 7.0, 11.0, 12.0, 8.0, 17.0, 31.0, 31.0, 24.0, 40.0, 35.0, 36.0, 35.0, 44.0, 59.0, 48.0, 69.0, 45.0, 57.0, 51.0, 46.0, 38.0, 31.0, 32.0, 30.0, 25.0, 24.0, 16.0, 14.0, 14.0, 11.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.0, -63.27294921875, -61.5458984375, -59.81884765625, -58.091796875, -56.36474609375, -54.6376953125, -52.91064453125, -51.18359375, -49.45654296875, -47.7294921875, -46.00244140625, -44.275390625, -42.54833984375, -40.8212890625, -39.09423828125, -37.3671875, -35.64013671875, -33.9130859375, -32.18603515625, -30.458984375, -28.73193359375, -27.0048828125, -25.27783203125, -23.55078125, -21.82373046875, -20.0966796875, -18.36962890625, -16.642578125, -14.91552734375, -13.1884765625, -11.46142578125, -9.734375, -8.00732421875, -6.2802734375, -4.55322265625, -2.826171875, -1.09912109375, 0.6279296875, 2.35498046875, 4.08203125, 5.80908203125, 7.5361328125, 9.26318359375, 10.990234375, 12.71728515625, 14.4443359375, 16.17138671875, 17.8984375, 19.62548828125, 21.3525390625, 23.07958984375, 24.806640625, 26.53369140625, 28.2607421875, 29.98779296875, 31.71484375, 33.44189453125, 35.1689453125, 36.89599609375, 38.623046875, 40.35009765625, 42.0771484375, 43.80419921875, 45.53125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 5.0, 5.0, 6.0, 9.0, 13.0, 13.0, 35.0, 44.0, 65.0, 105.0, 182.0, 397.0, 748.0, 1967.0, 6927.0, 34491.0, 321655.0, 596530.0, 69359.0, 11004.0, 2861.0, 1018.0, 499.0, 261.0, 136.0, 87.0, 45.0, 34.0, 16.0, 9.0, 11.0, 6.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.75, -25.91845703125, -25.0869140625, -24.25537109375, -23.423828125, -22.59228515625, -21.7607421875, -20.92919921875, -20.09765625, -19.26611328125, -18.4345703125, -17.60302734375, -16.771484375, -15.93994140625, -15.1083984375, -14.27685546875, -13.4453125, -12.61376953125, -11.7822265625, -10.95068359375, -10.119140625, -9.28759765625, -8.4560546875, -7.62451171875, -6.79296875, -5.96142578125, -5.1298828125, -4.29833984375, -3.466796875, -2.63525390625, -1.8037109375, -0.97216796875, -0.140625, 0.69091796875, 1.5224609375, 2.35400390625, 3.185546875, 4.01708984375, 4.8486328125, 5.68017578125, 6.51171875, 7.34326171875, 8.1748046875, 9.00634765625, 9.837890625, 10.66943359375, 11.5009765625, 12.33251953125, 13.1640625, 13.99560546875, 14.8271484375, 15.65869140625, 16.490234375, 17.32177734375, 18.1533203125, 18.98486328125, 19.81640625, 20.64794921875, 21.4794921875, 22.31103515625, 23.142578125, 23.97412109375, 24.8056640625, 25.63720703125, 26.46875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 12.0, 14.0, 23.0, 21.0, 31.0, 52.0, 64.0, 67.0, 112.0, 129.0, 109.0, 89.0, 72.0, 56.0, 45.0, 25.0, 18.0, 22.0, 12.0, 12.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00499725341796875, -0.004824697971343994, -0.004652142524719238, -0.004479587078094482, -0.0043070316314697266, -0.004134476184844971, -0.003961920738220215, -0.003789365291595459, -0.003616809844970703, -0.0034442543983459473, -0.0032716989517211914, -0.0030991435050964355, -0.0029265880584716797, -0.002754032611846924, -0.002581477165222168, -0.002408921718597412, -0.0022363662719726562, -0.0020638108253479004, -0.0018912553787231445, -0.0017186999320983887, -0.0015461444854736328, -0.001373589038848877, -0.001201033592224121, -0.0010284781455993652, -0.0008559226989746094, -0.0006833672523498535, -0.0005108118057250977, -0.0003382563591003418, -0.00016570091247558594, 6.854534149169922e-06, 0.00017940998077392578, 0.00035196542739868164, 0.0005245208740234375, 0.0006970763206481934, 0.0008696317672729492, 0.001042187213897705, 0.001214742660522461, 0.0013872981071472168, 0.0015598535537719727, 0.0017324090003967285, 0.0019049644470214844, 0.0020775198936462402, 0.002250075340270996, 0.002422630786895752, 0.002595186233520508, 0.0027677416801452637, 0.0029402971267700195, 0.0031128525733947754, 0.0032854080200195312, 0.003457963466644287, 0.003630518913269043, 0.003803074359893799, 0.003975629806518555, 0.0041481852531433105, 0.004320740699768066, 0.004493296146392822, 0.004665851593017578, 0.004838407039642334, 0.00501096248626709, 0.005183517932891846, 0.0053560733795166016, 0.005528628826141357, 0.005701184272766113, 0.005873739719390869, 0.006046295166015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 14.0, 9.0, 11.0, 29.0, 38.0, 79.0, 125.0, 188.0, 383.0, 862.0, 2285.0, 7655.0, 42870.0, 432204.0, 499263.0, 49716.0, 8476.0, 2448.0, 917.0, 424.0, 243.0, 124.0, 66.0, 36.0, 37.0, 17.0, 13.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.484375, -30.63427734375, -29.7841796875, -28.93408203125, -28.083984375, -27.23388671875, -26.3837890625, -25.53369140625, -24.68359375, -23.83349609375, -22.9833984375, -22.13330078125, -21.283203125, -20.43310546875, -19.5830078125, -18.73291015625, -17.8828125, -17.03271484375, -16.1826171875, -15.33251953125, -14.482421875, -13.63232421875, -12.7822265625, -11.93212890625, -11.08203125, -10.23193359375, -9.3818359375, -8.53173828125, -7.681640625, -6.83154296875, -5.9814453125, -5.13134765625, -4.28125, -3.43115234375, -2.5810546875, -1.73095703125, -0.880859375, -0.03076171875, 0.8193359375, 1.66943359375, 2.51953125, 3.36962890625, 4.2197265625, 5.06982421875, 5.919921875, 6.77001953125, 7.6201171875, 8.47021484375, 9.3203125, 10.17041015625, 11.0205078125, 11.87060546875, 12.720703125, 13.57080078125, 14.4208984375, 15.27099609375, 16.12109375, 16.97119140625, 17.8212890625, 18.67138671875, 19.521484375, 20.37158203125, 21.2216796875, 22.07177734375, 22.921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 15.0, 19.0, 28.0, 55.0, 108.0, 115.0, 157.0, 137.0, 127.0, 85.0, 78.0, 34.0, 19.0, 11.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -55.279052734375, -53.99560546875, -52.712158203125, -51.4287109375, -50.145263671875, -48.86181640625, -47.578369140625, -46.294921875, -45.011474609375, -43.72802734375, -42.444580078125, -41.1611328125, -39.877685546875, -38.59423828125, -37.310791015625, -36.02734375, -34.743896484375, -33.46044921875, -32.177001953125, -30.8935546875, -29.610107421875, -28.32666015625, -27.043212890625, -25.759765625, -24.476318359375, -23.19287109375, -21.909423828125, -20.6259765625, -19.342529296875, -18.05908203125, -16.775634765625, -15.4921875, -14.208740234375, -12.92529296875, -11.641845703125, -10.3583984375, -9.074951171875, -7.79150390625, -6.508056640625, -5.224609375, -3.941162109375, -2.65771484375, -1.374267578125, -0.0908203125, 1.192626953125, 2.47607421875, 3.759521484375, 5.04296875, 6.326416015625, 7.60986328125, 8.893310546875, 10.1767578125, 11.460205078125, 12.74365234375, 14.027099609375, 15.310546875, 16.593994140625, 17.87744140625, 19.160888671875, 20.4443359375, 21.727783203125, 23.01123046875, 24.294677734375, 25.578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 8.0, 9.0, 18.0, 33.0, 48.0, 72.0, 151.0, 145.0, 144.0, 140.0, 107.0, 53.0, 33.0, 19.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.70428466796875, -259.2803955078125, -245.8564910888672, -232.43260192871094, -219.00869750976562, -205.58480834960938, -192.16091918945312, -178.73703002929688, -165.31312561035156, -151.8892364501953, -138.46533203125, -125.04144287109375, -111.61754608154297, -98.19364929199219, -84.76976013183594, -71.34586334228516, -57.921966552734375, -44.498069763183594, -31.074176788330078, -17.650283813476562, -4.226387023925781, 9.197509765625, 22.62139892578125, 36.04529571533203, 49.46919250488281, 62.893089294433594, 76.31698608398438, 89.74087524414062, 103.1647720336914, 116.58866882324219, 130.01255798339844, 143.43646240234375, 156.8603515625, 170.28424072265625, 183.70814514160156, 197.1320343017578, 210.55593872070312, 223.97982788085938, 237.40371704101562, 250.82760620117188, 264.25152587890625, 277.6754150390625, 291.09930419921875, 304.523193359375, 317.9471130371094, 331.3710021972656, 344.7948913574219, 358.2187805175781, 371.6426696777344, 385.0665588378906, 398.4904479980469, 411.91436767578125, 425.3382568359375, 438.76214599609375, 452.18603515625, 465.60992431640625, 479.0338134765625, 492.45770263671875, 505.881591796875, 519.3054809570312, 532.7293701171875, 546.1533203125, 559.5771484375, 573.0010986328125, 586.4249877929688]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 4.0, 10.0, 13.0, 10.0, 20.0, 12.0, 26.0, 27.0, 30.0, 30.0, 40.0, 52.0, 32.0, 40.0, 43.0, 53.0, 51.0, 50.0, 59.0, 36.0, 51.0, 53.0, 35.0, 39.0, 29.0, 13.0, 23.0, 17.0, 19.0, 9.0, 12.0, 13.0, 9.0, 3.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.95574951171875, -244.38369750976562, -236.81163024902344, -229.2395782470703, -221.66751098632812, -214.095458984375, -206.5233917236328, -198.9513397216797, -191.3792724609375, -183.80722045898438, -176.2351531982422, -168.66310119628906, -161.09103393554688, -153.51898193359375, -145.94691467285156, -138.37486267089844, -130.80279541015625, -123.2307357788086, -115.65867614746094, -108.08661651611328, -100.51455688476562, -92.9425048828125, -85.37043762207031, -77.79838562011719, -70.22633361816406, -62.654273986816406, -55.08221435546875, -47.510154724121094, -39.93809509277344, -32.36603927612305, -24.79397964477539, -17.221920013427734, -9.649856567382812, -2.0777974128723145, 5.494261741638184, 13.066320419311523, 20.63838005065918, 28.210437774658203, 35.78249740600586, 43.354557037353516, 50.92661666870117, 58.49867630004883, 66.07073211669922, 73.64279174804688, 81.21485137939453, 88.78691101074219, 96.35897064208984, 103.9310302734375, 111.50308990478516, 119.07514953613281, 126.64720916748047, 134.21926879882812, 141.79132080078125, 149.36338806152344, 156.93544006347656, 164.50750732421875, 172.07955932617188, 179.651611328125, 187.2236785888672, 194.7957305908203, 202.3677978515625, 209.93984985351562, 217.5119171142578, 225.08396911621094, 232.65603637695312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 6.0, 11.0, 17.0, 24.0, 26.0, 41.0, 50.0, 77.0, 123.0, 192.0, 301.0, 581.0, 1064.0, 2219.0, 5477.0, 17363.0, 3944348.0, 198028.0, 14802.0, 5003.0, 2121.0, 1012.0, 471.0, 344.0, 197.0, 114.0, 85.0, 53.0, 38.0, 28.0, 14.0, 10.0, 9.0, 15.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-76.25, -74.2919921875, -72.333984375, -70.3759765625, -68.41796875, -66.4599609375, -64.501953125, -62.5439453125, -60.5859375, -58.6279296875, -56.669921875, -54.7119140625, -52.75390625, -50.7958984375, -48.837890625, -46.8798828125, -44.921875, -42.9638671875, -41.005859375, -39.0478515625, -37.08984375, -35.1318359375, -33.173828125, -31.2158203125, -29.2578125, -27.2998046875, -25.341796875, -23.3837890625, -21.42578125, -19.4677734375, -17.509765625, -15.5517578125, -13.59375, -11.6357421875, -9.677734375, -7.7197265625, -5.76171875, -3.8037109375, -1.845703125, 0.1123046875, 2.0703125, 4.0283203125, 5.986328125, 7.9443359375, 9.90234375, 11.8603515625, 13.818359375, 15.7763671875, 17.734375, 19.6923828125, 21.650390625, 23.6083984375, 25.56640625, 27.5244140625, 29.482421875, 31.4404296875, 33.3984375, 35.3564453125, 37.314453125, 39.2724609375, 41.23046875, 43.1884765625, 45.146484375, 47.1044921875, 49.0625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 14.0, 20.0, 18.0, 21.0, 29.0, 38.0, 59.0, 59.0, 73.0, 71.0, 68.0, 82.0, 60.0, 66.0, 68.0, 48.0, 42.0, 38.0, 34.0, 15.0, 15.0, 14.0, 10.0, 1.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.359375, -19.863525390625, -19.36767578125, -18.871826171875, -18.3759765625, -17.880126953125, -17.38427734375, -16.888427734375, -16.392578125, -15.896728515625, -15.40087890625, -14.905029296875, -14.4091796875, -13.913330078125, -13.41748046875, -12.921630859375, -12.42578125, -11.929931640625, -11.43408203125, -10.938232421875, -10.4423828125, -9.946533203125, -9.45068359375, -8.954833984375, -8.458984375, -7.963134765625, -7.46728515625, -6.971435546875, -6.4755859375, -5.979736328125, -5.48388671875, -4.988037109375, -4.4921875, -3.996337890625, -3.50048828125, -3.004638671875, -2.5087890625, -2.012939453125, -1.51708984375, -1.021240234375, -0.525390625, -0.029541015625, 0.46630859375, 0.962158203125, 1.4580078125, 1.953857421875, 2.44970703125, 2.945556640625, 3.44140625, 3.937255859375, 4.43310546875, 4.928955078125, 5.4248046875, 5.920654296875, 6.41650390625, 6.912353515625, 7.408203125, 7.904052734375, 8.39990234375, 8.895751953125, 9.3916015625, 9.887451171875, 10.38330078125, 10.879150390625, 11.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 23.0, 31.0, 30.0, 51.0, 56.0, 69.0, 120.0, 147.0, 187.0, 304.0, 456.0, 652.0, 1108.0, 1901.0, 3977.0, 11190.0, 54705.0, 4022416.0, 73891.0, 12820.0, 4437.0, 2146.0, 1231.0, 721.0, 436.0, 308.0, 238.0, 168.0, 120.0, 83.0, 66.0, 43.0, 29.0, 29.0, 21.0, 8.0, 14.0, 4.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.3388671875, -46.646484375, -44.9541015625, -43.26171875, -41.5693359375, -39.876953125, -38.1845703125, -36.4921875, -34.7998046875, -33.107421875, -31.4150390625, -29.72265625, -28.0302734375, -26.337890625, -24.6455078125, -22.953125, -21.2607421875, -19.568359375, -17.8759765625, -16.18359375, -14.4912109375, -12.798828125, -11.1064453125, -9.4140625, -7.7216796875, -6.029296875, -4.3369140625, -2.64453125, -0.9521484375, 0.740234375, 2.4326171875, 4.125, 5.8173828125, 7.509765625, 9.2021484375, 10.89453125, 12.5869140625, 14.279296875, 15.9716796875, 17.6640625, 19.3564453125, 21.048828125, 22.7412109375, 24.43359375, 26.1259765625, 27.818359375, 29.5107421875, 31.203125, 32.8955078125, 34.587890625, 36.2802734375, 37.97265625, 39.6650390625, 41.357421875, 43.0498046875, 44.7421875, 46.4345703125, 48.126953125, 49.8193359375, 51.51171875, 53.2041015625, 54.896484375, 56.5888671875, 58.28125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 13.0, 15.0, 41.0, 66.0, 554.0, 3218.0, 80.0, 37.0, 15.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.2119140625, -15.689453125, -15.1669921875, -14.64453125, -14.1220703125, -13.599609375, -13.0771484375, -12.5546875, -12.0322265625, -11.509765625, -10.9873046875, -10.46484375, -9.9423828125, -9.419921875, -8.8974609375, -8.375, -7.8525390625, -7.330078125, -6.8076171875, -6.28515625, -5.7626953125, -5.240234375, -4.7177734375, -4.1953125, -3.6728515625, -3.150390625, -2.6279296875, -2.10546875, -1.5830078125, -1.060546875, -0.5380859375, -0.015625, 0.5068359375, 1.029296875, 1.5517578125, 2.07421875, 2.5966796875, 3.119140625, 3.6416015625, 4.1640625, 4.6865234375, 5.208984375, 5.7314453125, 6.25390625, 6.7763671875, 7.298828125, 7.8212890625, 8.34375, 8.8662109375, 9.388671875, 9.9111328125, 10.43359375, 10.9560546875, 11.478515625, 12.0009765625, 12.5234375, 13.0458984375, 13.568359375, 14.0908203125, 14.61328125, 15.1357421875, 15.658203125, 16.1806640625, 16.703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 15.0, 15.0, 13.0, 26.0, 38.0, 32.0, 55.0, 68.0, 84.0, 93.0, 84.0, 72.0, 89.0, 52.0, 58.0, 28.0, 34.0, 31.0, 19.0, 17.0, 16.0, 9.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.59568786621094, -31.655426025390625, -30.715166091918945, -29.774904251098633, -28.834644317626953, -27.89438247680664, -26.954120635986328, -26.01386070251465, -25.07360076904297, -24.133338928222656, -23.193078994750977, -22.252817153930664, -21.312557220458984, -20.372295379638672, -19.43203353881836, -18.49177360534668, -17.551511764526367, -16.611249923706055, -15.670989990234375, -14.730728149414062, -13.790468215942383, -12.85020637512207, -11.909945487976074, -10.969684600830078, -10.029423713684082, -9.089162826538086, -8.14890193939209, -7.2086405754089355, -6.2683796882629395, -5.328118801116943, -4.387857437133789, -3.447596549987793, -2.5073375701904297, -1.567076563835144, -0.6268155574798584, 0.3134455680847168, 1.253706455230713, 2.193967342376709, 3.1342287063598633, 4.074489593505859, 5.0147504806518555, 5.955011367797852, 6.895272254943848, 7.835533618927002, 8.775794982910156, 9.716054916381836, 10.656316757202148, 11.596577644348145, 12.53683853149414, 13.477099418640137, 14.417360305786133, 15.357622146606445, 16.297882080078125, 17.238143920898438, 18.17840576171875, 19.11866569519043, 20.05892562866211, 20.999187469482422, 21.9394474029541, 22.879709243774414, 23.819969177246094, 24.760231018066406, 25.70049285888672, 26.6407527923584, 27.58101463317871]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 5.0, 18.0, 5.0, 11.0, 10.0, 16.0, 14.0, 19.0, 25.0, 24.0, 30.0, 26.0, 27.0, 32.0, 29.0, 33.0, 41.0, 46.0, 46.0, 34.0, 44.0, 38.0, 47.0, 33.0, 48.0, 32.0, 42.0, 33.0, 34.0, 26.0, 15.0, 13.0, 15.0, 10.0, 16.0, 7.0, 11.0, 10.0, 8.0, 4.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.058170318603516, -21.379589080810547, -20.70100975036621, -20.022430419921875, -19.343849182128906, -18.665267944335938, -17.9866886138916, -17.308109283447266, -16.629528045654297, -15.950947761535645, -15.272367477416992, -14.59378719329834, -13.915206909179688, -13.236626625061035, -12.558046340942383, -11.87946605682373, -11.200885772705078, -10.522305488586426, -9.843725204467773, -9.165144920349121, -8.486564636230469, -7.807984352111816, -7.129404067993164, -6.450823783874512, -5.772243499755859, -5.093663215637207, -4.415082931518555, -3.7365026473999023, -3.05792236328125, -2.3793420791625977, -1.7007617950439453, -1.022181510925293, -0.3436012268066406, 0.3349790573120117, 1.013559341430664, 1.6921396255493164, 2.3707199096679688, 3.049300193786621, 3.7278804779052734, 4.406460762023926, 5.085041046142578, 5.7636213302612305, 6.442201614379883, 7.120781898498535, 7.7993621826171875, 8.47794246673584, 9.156522750854492, 9.835103034973145, 10.513683319091797, 11.19226360321045, 11.870843887329102, 12.549424171447754, 13.228004455566406, 13.906584739685059, 14.585165023803711, 15.263745307922363, 15.942325592041016, 16.620906829833984, 17.29948616027832, 17.978065490722656, 18.656646728515625, 19.335227966308594, 20.01380729675293, 20.692386627197266, 21.370967864990234]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 39.0, 67.0, 127.0, 226.0, 411.0, 965.0, 2225.0, 6468.0, 19107.0, 65871.0, 230055.0, 443187.0, 197632.0, 56225.0, 16695.0, 5529.0, 2042.0, 834.0, 385.0, 198.0, 106.0, 51.0, 32.0, 17.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.765625, -25.753173828125, -24.74072265625, -23.728271484375, -22.7158203125, -21.703369140625, -20.69091796875, -19.678466796875, -18.666015625, -17.653564453125, -16.64111328125, -15.628662109375, -14.6162109375, -13.603759765625, -12.59130859375, -11.578857421875, -10.56640625, -9.553955078125, -8.54150390625, -7.529052734375, -6.5166015625, -5.504150390625, -4.49169921875, -3.479248046875, -2.466796875, -1.454345703125, -0.44189453125, 0.570556640625, 1.5830078125, 2.595458984375, 3.60791015625, 4.620361328125, 5.6328125, 6.645263671875, 7.65771484375, 8.670166015625, 9.6826171875, 10.695068359375, 11.70751953125, 12.719970703125, 13.732421875, 14.744873046875, 15.75732421875, 16.769775390625, 17.7822265625, 18.794677734375, 19.80712890625, 20.819580078125, 21.83203125, 22.844482421875, 23.85693359375, 24.869384765625, 25.8818359375, 26.894287109375, 27.90673828125, 28.919189453125, 29.931640625, 30.944091796875, 31.95654296875, 32.968994140625, 33.9814453125, 34.993896484375, 36.00634765625, 37.018798828125, 38.03125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 14.0, 15.0, 13.0, 25.0, 32.0, 24.0, 38.0, 54.0, 41.0, 53.0, 47.0, 62.0, 65.0, 57.0, 47.0, 66.0, 55.0, 48.0, 38.0, 31.0, 28.0, 29.0, 24.0, 22.0, 9.0, 10.0, 9.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.640625, -15.204345703125, -14.76806640625, -14.331787109375, -13.8955078125, -13.459228515625, -13.02294921875, -12.586669921875, -12.150390625, -11.714111328125, -11.27783203125, -10.841552734375, -10.4052734375, -9.968994140625, -9.53271484375, -9.096435546875, -8.66015625, -8.223876953125, -7.78759765625, -7.351318359375, -6.9150390625, -6.478759765625, -6.04248046875, -5.606201171875, -5.169921875, -4.733642578125, -4.29736328125, -3.861083984375, -3.4248046875, -2.988525390625, -2.55224609375, -2.115966796875, -1.6796875, -1.243408203125, -0.80712890625, -0.370849609375, 0.0654296875, 0.501708984375, 0.93798828125, 1.374267578125, 1.810546875, 2.246826171875, 2.68310546875, 3.119384765625, 3.5556640625, 3.991943359375, 4.42822265625, 4.864501953125, 5.30078125, 5.737060546875, 6.17333984375, 6.609619140625, 7.0458984375, 7.482177734375, 7.91845703125, 8.354736328125, 8.791015625, 9.227294921875, 9.66357421875, 10.099853515625, 10.5361328125, 10.972412109375, 11.40869140625, 11.844970703125, 12.28125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 17.0, 20.0, 30.0, 28.0, 45.0, 84.0, 125.0, 167.0, 287.0, 557.0, 1094.0, 2404.0, 8373.0, 55530.0, 602467.0, 337339.0, 30509.0, 5526.0, 1869.0, 805.0, 476.0, 264.0, 150.0, 101.0, 83.0, 46.0, 33.0, 31.0, 21.0, 15.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-74.875, -72.84375, -70.8125, -68.78125, -66.75, -64.71875, -62.6875, -60.65625, -58.625, -56.59375, -54.5625, -52.53125, -50.5, -48.46875, -46.4375, -44.40625, -42.375, -40.34375, -38.3125, -36.28125, -34.25, -32.21875, -30.1875, -28.15625, -26.125, -24.09375, -22.0625, -20.03125, -18.0, -15.96875, -13.9375, -11.90625, -9.875, -7.84375, -5.8125, -3.78125, -1.75, 0.28125, 2.3125, 4.34375, 6.375, 8.40625, 10.4375, 12.46875, 14.5, 16.53125, 18.5625, 20.59375, 22.625, 24.65625, 26.6875, 28.71875, 30.75, 32.78125, 34.8125, 36.84375, 38.875, 40.90625, 42.9375, 44.96875, 47.0, 49.03125, 51.0625, 53.09375, 55.125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 10.0, 13.0, 21.0, 21.0, 23.0, 30.0, 38.0, 46.0, 53.0, 65.0, 62.0, 79.0, 78.0, 73.0, 70.0, 54.0, 49.0, 39.0, 29.0, 30.0, 27.0, 18.0, 15.0, 8.0, 6.0, 12.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-112.9375, -109.9365234375, -106.935546875, -103.9345703125, -100.93359375, -97.9326171875, -94.931640625, -91.9306640625, -88.9296875, -85.9287109375, -82.927734375, -79.9267578125, -76.92578125, -73.9248046875, -70.923828125, -67.9228515625, -64.921875, -61.9208984375, -58.919921875, -55.9189453125, -52.91796875, -49.9169921875, -46.916015625, -43.9150390625, -40.9140625, -37.9130859375, -34.912109375, -31.9111328125, -28.91015625, -25.9091796875, -22.908203125, -19.9072265625, -16.90625, -13.9052734375, -10.904296875, -7.9033203125, -4.90234375, -1.9013671875, 1.099609375, 4.1005859375, 7.1015625, 10.1025390625, 13.103515625, 16.1044921875, 19.10546875, 22.1064453125, 25.107421875, 28.1083984375, 31.109375, 34.1103515625, 37.111328125, 40.1123046875, 43.11328125, 46.1142578125, 49.115234375, 52.1162109375, 55.1171875, 58.1181640625, 61.119140625, 64.1201171875, 67.12109375, 70.1220703125, 73.123046875, 76.1240234375, 79.125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 13.0, 14.0, 36.0, 32.0, 49.0, 56.0, 90.0, 129.0, 213.0, 350.0, 847.0, 2912.0, 20865.0, 721503.0, 286630.0, 11194.0, 2005.0, 689.0, 287.0, 185.0, 119.0, 74.0, 53.0, 46.0, 28.0, 16.0, 30.0, 20.0, 8.0, 15.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.78125, -59.0869140625, -57.392578125, -55.6982421875, -54.00390625, -52.3095703125, -50.615234375, -48.9208984375, -47.2265625, -45.5322265625, -43.837890625, -42.1435546875, -40.44921875, -38.7548828125, -37.060546875, -35.3662109375, -33.671875, -31.9775390625, -30.283203125, -28.5888671875, -26.89453125, -25.2001953125, -23.505859375, -21.8115234375, -20.1171875, -18.4228515625, -16.728515625, -15.0341796875, -13.33984375, -11.6455078125, -9.951171875, -8.2568359375, -6.5625, -4.8681640625, -3.173828125, -1.4794921875, 0.21484375, 1.9091796875, 3.603515625, 5.2978515625, 6.9921875, 8.6865234375, 10.380859375, 12.0751953125, 13.76953125, 15.4638671875, 17.158203125, 18.8525390625, 20.546875, 22.2412109375, 23.935546875, 25.6298828125, 27.32421875, 29.0185546875, 30.712890625, 32.4072265625, 34.1015625, 35.7958984375, 37.490234375, 39.1845703125, 40.87890625, 42.5732421875, 44.267578125, 45.9619140625, 47.65625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 7.0, 5.0, 8.0, 6.0, 11.0, 11.0, 13.0, 20.0, 24.0, 50.0, 50.0, 74.0, 93.0, 97.0, 108.0, 77.0, 84.0, 66.0, 38.0, 26.0, 29.0, 18.0, 22.0, 11.0, 10.0, 7.0, 10.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005313873291015625, -0.005152761936187744, -0.004991650581359863, -0.004830539226531982, -0.0046694278717041016, -0.004508316516876221, -0.00434720516204834, -0.004186093807220459, -0.004024982452392578, -0.0038638710975646973, -0.0037027597427368164, -0.0035416483879089355, -0.0033805370330810547, -0.003219425678253174, -0.003058314323425293, -0.002897202968597412, -0.0027360916137695312, -0.0025749802589416504, -0.0024138689041137695, -0.0022527575492858887, -0.002091646194458008, -0.001930534839630127, -0.001769423484802246, -0.0016083121299743652, -0.0014472007751464844, -0.0012860894203186035, -0.0011249780654907227, -0.0009638667106628418, -0.0008027553558349609, -0.0006416440010070801, -0.0004805326461791992, -0.00031942129135131836, -0.0001583099365234375, 2.8014183044433594e-06, 0.00016391277313232422, 0.0003250241279602051, 0.00048613548278808594, 0.0006472468376159668, 0.0008083581924438477, 0.0009694695472717285, 0.0011305809020996094, 0.0012916922569274902, 0.001452803611755371, 0.001613914966583252, 0.0017750263214111328, 0.0019361376762390137, 0.0020972490310668945, 0.0022583603858947754, 0.0024194717407226562, 0.002580583095550537, 0.002741694450378418, 0.002902805805206299, 0.0030639171600341797, 0.0032250285148620605, 0.0033861398696899414, 0.0035472512245178223, 0.003708362579345703, 0.003869473934173584, 0.004030585289001465, 0.004191696643829346, 0.0043528079986572266, 0.004513919353485107, 0.004675030708312988, 0.004836142063140869, 0.00499725341796875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 7.0, 9.0, 10.0, 11.0, 20.0, 23.0, 20.0, 27.0, 39.0, 41.0, 57.0, 80.0, 96.0, 176.0, 243.0, 484.0, 878.0, 2207.0, 6549.0, 30474.0, 356646.0, 590710.0, 46062.0, 8574.0, 2670.0, 1045.0, 514.0, 243.0, 161.0, 112.0, 83.0, 68.0, 46.0, 31.0, 29.0, 19.0, 15.0, 20.0, 9.0, 10.0, 6.0, 10.0, 5.0, 2.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.96875, -33.87939453125, -32.7900390625, -31.70068359375, -30.611328125, -29.52197265625, -28.4326171875, -27.34326171875, -26.25390625, -25.16455078125, -24.0751953125, -22.98583984375, -21.896484375, -20.80712890625, -19.7177734375, -18.62841796875, -17.5390625, -16.44970703125, -15.3603515625, -14.27099609375, -13.181640625, -12.09228515625, -11.0029296875, -9.91357421875, -8.82421875, -7.73486328125, -6.6455078125, -5.55615234375, -4.466796875, -3.37744140625, -2.2880859375, -1.19873046875, -0.109375, 0.97998046875, 2.0693359375, 3.15869140625, 4.248046875, 5.33740234375, 6.4267578125, 7.51611328125, 8.60546875, 9.69482421875, 10.7841796875, 11.87353515625, 12.962890625, 14.05224609375, 15.1416015625, 16.23095703125, 17.3203125, 18.40966796875, 19.4990234375, 20.58837890625, 21.677734375, 22.76708984375, 23.8564453125, 24.94580078125, 26.03515625, 27.12451171875, 28.2138671875, 29.30322265625, 30.392578125, 31.48193359375, 32.5712890625, 33.66064453125, 34.75]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 14.0, 13.0, 20.0, 27.0, 57.0, 71.0, 110.0, 136.0, 123.0, 110.0, 73.0, 58.0, 41.0, 32.0, 14.0, 14.0, 4.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.375, -37.1044921875, -35.833984375, -34.5634765625, -33.29296875, -32.0224609375, -30.751953125, -29.4814453125, -28.2109375, -26.9404296875, -25.669921875, -24.3994140625, -23.12890625, -21.8583984375, -20.587890625, -19.3173828125, -18.046875, -16.7763671875, -15.505859375, -14.2353515625, -12.96484375, -11.6943359375, -10.423828125, -9.1533203125, -7.8828125, -6.6123046875, -5.341796875, -4.0712890625, -2.80078125, -1.5302734375, -0.259765625, 1.0107421875, 2.28125, 3.5517578125, 4.822265625, 6.0927734375, 7.36328125, 8.6337890625, 9.904296875, 11.1748046875, 12.4453125, 13.7158203125, 14.986328125, 16.2568359375, 17.52734375, 18.7978515625, 20.068359375, 21.3388671875, 22.609375, 23.8798828125, 25.150390625, 26.4208984375, 27.69140625, 28.9619140625, 30.232421875, 31.5029296875, 32.7734375, 34.0439453125, 35.314453125, 36.5849609375, 37.85546875, 39.1259765625, 40.396484375, 41.6669921875, 42.9375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 26.0, 85.0, 239.0, 338.0, 191.0, 79.0, 22.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1312.932373046875, -1284.653076171875, -1256.3736572265625, -1228.0943603515625, -1199.8150634765625, -1171.53564453125, -1143.25634765625, -1114.97705078125, -1086.69775390625, -1058.41845703125, -1030.1390380859375, -1001.8597412109375, -973.5804443359375, -945.3010864257812, -917.021728515625, -888.742431640625, -860.4630126953125, -832.1836547851562, -803.9043579101562, -775.625, -747.345703125, -719.0663452148438, -690.7869873046875, -662.5076904296875, -634.2283325195312, -605.948974609375, -577.669677734375, -549.3903198242188, -521.1109619140625, -492.8316650390625, -464.55230712890625, -436.2729797363281, -407.9936828613281, -379.71435546875, -351.43499755859375, -323.1556701660156, -294.8763427734375, -266.5970153808594, -238.3176727294922, -210.038330078125, -181.75900268554688, -153.47967529296875, -125.20033264160156, -96.9209976196289, -68.64166259765625, -40.362335205078125, -12.082992553710938, 16.19635009765625, 44.475677490234375, 72.75501251220703, 101.03434753417969, 129.31369018554688, 157.593017578125, 185.87234497070312, 214.1516876220703, 242.4310302734375, 270.7103576660156, 298.98968505859375, 327.26904296875, 355.5483703613281, 383.82769775390625, 412.1070251464844, 440.3863525390625, 468.66571044921875, 496.9450378417969]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 6.0, 10.0, 17.0, 18.0, 14.0, 15.0, 23.0, 30.0, 24.0, 29.0, 33.0, 38.0, 54.0, 54.0, 42.0, 56.0, 43.0, 43.0, 42.0, 41.0, 51.0, 34.0, 32.0, 27.0, 32.0, 28.0, 24.0, 21.0, 16.0, 17.0, 14.0, 8.0, 8.0, 9.0, 7.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-265.7063903808594, -257.3807373046875, -249.05506896972656, -240.72940063476562, -232.40374755859375, -224.07809448242188, -215.75242614746094, -207.4267578125, -199.10110473632812, -190.77545166015625, -182.4497833251953, -174.12411499023438, -165.7984619140625, -157.47280883789062, -149.1471405029297, -140.82147216796875, -132.49581909179688, -124.17015838623047, -115.84449768066406, -107.51883697509766, -99.19317626953125, -90.86751556396484, -82.54185485839844, -74.21619415283203, -65.89053344726562, -57.56487274169922, -49.23921203613281, -40.913551330566406, -32.587890625, -24.262229919433594, -15.936569213867188, -7.610908508300781, 0.7147216796875, 9.040382385253906, 17.366043090820312, 25.69170379638672, 34.017364501953125, 42.34302520751953, 50.66868591308594, 58.994346618652344, 67.32000732421875, 75.64566802978516, 83.97132873535156, 92.29698944091797, 100.62265014648438, 108.94831085205078, 117.27397155761719, 125.5996322631836, 133.92529296875, 142.25094604492188, 150.5766143798828, 158.90228271484375, 167.22793579101562, 175.5535888671875, 183.87925720214844, 192.20492553710938, 200.53057861328125, 208.85623168945312, 217.18190002441406, 225.507568359375, 233.83322143554688, 242.15887451171875, 250.4845428466797, 258.8102111816406, 267.1358642578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 6.0, 9.0, 10.0, 12.0, 15.0, 42.0, 65.0, 95.0, 195.0, 484.0, 1739.0, 17797.0, 4120615.0, 48862.0, 3085.0, 669.0, 256.0, 131.0, 74.0, 38.0, 35.0, 22.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-150.0, -146.5634765625, -143.126953125, -139.6904296875, -136.25390625, -132.8173828125, -129.380859375, -125.9443359375, -122.5078125, -119.0712890625, -115.634765625, -112.1982421875, -108.76171875, -105.3251953125, -101.888671875, -98.4521484375, -95.015625, -91.5791015625, -88.142578125, -84.7060546875, -81.26953125, -77.8330078125, -74.396484375, -70.9599609375, -67.5234375, -64.0869140625, -60.650390625, -57.2138671875, -53.77734375, -50.3408203125, -46.904296875, -43.4677734375, -40.03125, -36.5947265625, -33.158203125, -29.7216796875, -26.28515625, -22.8486328125, -19.412109375, -15.9755859375, -12.5390625, -9.1025390625, -5.666015625, -2.2294921875, 1.20703125, 4.6435546875, 8.080078125, 11.5166015625, 14.953125, 18.3896484375, 21.826171875, 25.2626953125, 28.69921875, 32.1357421875, 35.572265625, 39.0087890625, 42.4453125, 45.8818359375, 49.318359375, 52.7548828125, 56.19140625, 59.6279296875, 63.064453125, 66.5009765625, 69.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 10.0, 11.0, 9.0, 20.0, 23.0, 28.0, 34.0, 44.0, 41.0, 63.0, 66.0, 59.0, 55.0, 66.0, 57.0, 63.0, 57.0, 41.0, 43.0, 36.0, 32.0, 32.0, 12.0, 24.0, 7.0, 16.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5234375, -11.0843505859375, -10.645263671875, -10.2061767578125, -9.76708984375, -9.3280029296875, -8.888916015625, -8.4498291015625, -8.0107421875, -7.5716552734375, -7.132568359375, -6.6934814453125, -6.25439453125, -5.8153076171875, -5.376220703125, -4.9371337890625, -4.498046875, -4.0589599609375, -3.619873046875, -3.1807861328125, -2.74169921875, -2.3026123046875, -1.863525390625, -1.4244384765625, -0.9853515625, -0.5462646484375, -0.107177734375, 0.3319091796875, 0.77099609375, 1.2100830078125, 1.649169921875, 2.0882568359375, 2.52734375, 2.9664306640625, 3.405517578125, 3.8446044921875, 4.28369140625, 4.7227783203125, 5.161865234375, 5.6009521484375, 6.0400390625, 6.4791259765625, 6.918212890625, 7.3572998046875, 7.79638671875, 8.2354736328125, 8.674560546875, 9.1136474609375, 9.552734375, 9.9918212890625, 10.430908203125, 10.8699951171875, 11.30908203125, 11.7481689453125, 12.187255859375, 12.6263427734375, 13.0654296875, 13.5045166015625, 13.943603515625, 14.3826904296875, 14.82177734375, 15.2608642578125, 15.699951171875, 16.1390380859375, 16.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 2.0, 3.0, 8.0, 15.0, 9.0, 14.0, 21.0, 30.0, 41.0, 61.0, 82.0, 113.0, 217.0, 278.0, 443.0, 645.0, 1084.0, 1814.0, 4142.0, 10422.0, 36338.0, 436843.0, 3625341.0, 52674.0, 13229.0, 4936.0, 2182.0, 1213.0, 665.0, 417.0, 305.0, 212.0, 131.0, 78.0, 79.0, 52.0, 40.0, 24.0, 23.0, 13.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-49.125, -47.7646484375, -46.404296875, -45.0439453125, -43.68359375, -42.3232421875, -40.962890625, -39.6025390625, -38.2421875, -36.8818359375, -35.521484375, -34.1611328125, -32.80078125, -31.4404296875, -30.080078125, -28.7197265625, -27.359375, -25.9990234375, -24.638671875, -23.2783203125, -21.91796875, -20.5576171875, -19.197265625, -17.8369140625, -16.4765625, -15.1162109375, -13.755859375, -12.3955078125, -11.03515625, -9.6748046875, -8.314453125, -6.9541015625, -5.59375, -4.2333984375, -2.873046875, -1.5126953125, -0.15234375, 1.2080078125, 2.568359375, 3.9287109375, 5.2890625, 6.6494140625, 8.009765625, 9.3701171875, 10.73046875, 12.0908203125, 13.451171875, 14.8115234375, 16.171875, 17.5322265625, 18.892578125, 20.2529296875, 21.61328125, 22.9736328125, 24.333984375, 25.6943359375, 27.0546875, 28.4150390625, 29.775390625, 31.1357421875, 32.49609375, 33.8564453125, 35.216796875, 36.5771484375, 37.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 11.0, 9.0, 27.0, 41.0, 67.0, 144.0, 2443.0, 975.0, 148.0, 77.0, 30.0, 26.0, 18.0, 10.0, 7.0, 4.0, 10.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.95849609375, -25.2919921875, -24.62548828125, -23.958984375, -23.29248046875, -22.6259765625, -21.95947265625, -21.29296875, -20.62646484375, -19.9599609375, -19.29345703125, -18.626953125, -17.96044921875, -17.2939453125, -16.62744140625, -15.9609375, -15.29443359375, -14.6279296875, -13.96142578125, -13.294921875, -12.62841796875, -11.9619140625, -11.29541015625, -10.62890625, -9.96240234375, -9.2958984375, -8.62939453125, -7.962890625, -7.29638671875, -6.6298828125, -5.96337890625, -5.296875, -4.63037109375, -3.9638671875, -3.29736328125, -2.630859375, -1.96435546875, -1.2978515625, -0.63134765625, 0.03515625, 0.70166015625, 1.3681640625, 2.03466796875, 2.701171875, 3.36767578125, 4.0341796875, 4.70068359375, 5.3671875, 6.03369140625, 6.7001953125, 7.36669921875, 8.033203125, 8.69970703125, 9.3662109375, 10.03271484375, 10.69921875, 11.36572265625, 12.0322265625, 12.69873046875, 13.365234375, 14.03173828125, 14.6982421875, 15.36474609375, 16.03125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 13.0, 11.0, 18.0, 32.0, 35.0, 53.0, 76.0, 84.0, 130.0, 130.0, 123.0, 79.0, 59.0, 52.0, 32.0, 22.0, 14.0, 2.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.0392837524414, -97.57948303222656, -95.11967468261719, -92.65987396240234, -90.2000732421875, -87.74026489257812, -85.28046417236328, -82.82066345214844, -80.36085510253906, -77.90105438232422, -75.44124603271484, -72.9814453125, -70.52163696289062, -68.06183624267578, -65.60203552246094, -63.14223098754883, -60.68242645263672, -58.22262191772461, -55.7628173828125, -53.303016662597656, -50.84321212768555, -48.38340759277344, -45.923606872558594, -43.463802337646484, -41.003997802734375, -38.544193267822266, -36.084388732910156, -33.62458801269531, -31.164783477783203, -28.704978942871094, -26.245176315307617, -23.78537368774414, -21.32556915283203, -18.865764617919922, -16.405961990356445, -13.946158409118652, -11.48635482788086, -9.026551246643066, -6.566747665405273, -4.106945037841797, -1.6471405029296875, 0.8126630783081055, 3.2724666595458984, 5.732270240783691, 8.192073822021484, 10.651877403259277, 13.11168098449707, 15.571483612060547, 18.031288146972656, 20.491092681884766, 22.950895309448242, 25.41069793701172, 27.870502471923828, 30.330307006835938, 32.79010772705078, 35.24991226196289, 37.709716796875, 40.16952133178711, 42.62932586669922, 45.08912658691406, 47.54893112182617, 50.00873565673828, 52.468536376953125, 54.928340911865234, 57.388145446777344]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 13.0, 18.0, 10.0, 11.0, 18.0, 11.0, 20.0, 23.0, 22.0, 25.0, 42.0, 35.0, 44.0, 46.0, 35.0, 57.0, 41.0, 42.0, 55.0, 46.0, 41.0, 33.0, 42.0, 37.0, 28.0, 29.0, 28.0, 25.0, 17.0, 16.0, 22.0, 11.0, 10.0, 10.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.80430603027344, -43.32239532470703, -41.84048843383789, -40.358577728271484, -38.87666702270508, -37.39475631713867, -35.91284942626953, -34.430938720703125, -32.94902801513672, -31.467119216918945, -29.98520851135254, -28.503299713134766, -27.02138900756836, -25.539480209350586, -24.057571411132812, -22.575660705566406, -21.093751907348633, -19.61184310913086, -18.129932403564453, -16.64802360534668, -15.166112899780273, -13.6842041015625, -12.20229434967041, -10.72038459777832, -9.23847484588623, -7.756565093994141, -6.274655342102051, -4.792746067047119, -3.3108363151550293, -1.8289265632629395, -0.3470172882080078, 1.134892463684082, 2.616802215576172, 4.098711967468262, 5.580621719360352, 7.062530994415283, 8.544441223144531, 10.026350021362305, 11.508259773254395, 12.990169525146484, 14.472079277038574, 15.953989028930664, 17.435897827148438, 18.917808532714844, 20.399717330932617, 21.881628036499023, 23.363536834716797, 24.845447540283203, 26.327356338500977, 27.80926513671875, 29.291175842285156, 30.77308464050293, 32.2549934387207, 33.73690414428711, 35.218814849853516, 36.700721740722656, 38.18263244628906, 39.66454315185547, 41.14645004272461, 42.628360748291016, 44.11027145385742, 45.59218215942383, 47.07408905029297, 48.555999755859375, 50.03791046142578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 15.0, 18.0, 37.0, 66.0, 94.0, 228.0, 530.0, 1512.0, 4490.0, 16565.0, 68036.0, 278272.0, 486094.0, 144262.0, 35300.0, 8895.0, 2565.0, 861.0, 344.0, 161.0, 91.0, 38.0, 21.0, 10.0, 11.0, 6.0, 5.0, 9.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.9384765625, -42.533203125, -41.1279296875, -39.72265625, -38.3173828125, -36.912109375, -35.5068359375, -34.1015625, -32.6962890625, -31.291015625, -29.8857421875, -28.48046875, -27.0751953125, -25.669921875, -24.2646484375, -22.859375, -21.4541015625, -20.048828125, -18.6435546875, -17.23828125, -15.8330078125, -14.427734375, -13.0224609375, -11.6171875, -10.2119140625, -8.806640625, -7.4013671875, -5.99609375, -4.5908203125, -3.185546875, -1.7802734375, -0.375, 1.0302734375, 2.435546875, 3.8408203125, 5.24609375, 6.6513671875, 8.056640625, 9.4619140625, 10.8671875, 12.2724609375, 13.677734375, 15.0830078125, 16.48828125, 17.8935546875, 19.298828125, 20.7041015625, 22.109375, 23.5146484375, 24.919921875, 26.3251953125, 27.73046875, 29.1357421875, 30.541015625, 31.9462890625, 33.3515625, 34.7568359375, 36.162109375, 37.5673828125, 38.97265625, 40.3779296875, 41.783203125, 43.1884765625, 44.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 8.0, 12.0, 11.0, 17.0, 16.0, 33.0, 38.0, 36.0, 42.0, 40.0, 47.0, 56.0, 66.0, 61.0, 72.0, 62.0, 50.0, 46.0, 42.0, 47.0, 41.0, 20.0, 26.0, 26.0, 18.0, 15.0, 11.0, 7.0, 7.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.75341796875, -11.2880859375, -10.82275390625, -10.357421875, -9.89208984375, -9.4267578125, -8.96142578125, -8.49609375, -8.03076171875, -7.5654296875, -7.10009765625, -6.634765625, -6.16943359375, -5.7041015625, -5.23876953125, -4.7734375, -4.30810546875, -3.8427734375, -3.37744140625, -2.912109375, -2.44677734375, -1.9814453125, -1.51611328125, -1.05078125, -0.58544921875, -0.1201171875, 0.34521484375, 0.810546875, 1.27587890625, 1.7412109375, 2.20654296875, 2.671875, 3.13720703125, 3.6025390625, 4.06787109375, 4.533203125, 4.99853515625, 5.4638671875, 5.92919921875, 6.39453125, 6.85986328125, 7.3251953125, 7.79052734375, 8.255859375, 8.72119140625, 9.1865234375, 9.65185546875, 10.1171875, 10.58251953125, 11.0478515625, 11.51318359375, 11.978515625, 12.44384765625, 12.9091796875, 13.37451171875, 13.83984375, 14.30517578125, 14.7705078125, 15.23583984375, 15.701171875, 16.16650390625, 16.6318359375, 17.09716796875, 17.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 10.0, 5.0, 11.0, 14.0, 22.0, 30.0, 22.0, 38.0, 67.0, 101.0, 172.0, 267.0, 421.0, 821.0, 1788.0, 4884.0, 23710.0, 295515.0, 657395.0, 50644.0, 7748.0, 2474.0, 1003.0, 567.0, 290.0, 193.0, 109.0, 55.0, 50.0, 28.0, 23.0, 27.0, 24.0, 7.0, 9.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.1875, -73.8193359375, -71.451171875, -69.0830078125, -66.71484375, -64.3466796875, -61.978515625, -59.6103515625, -57.2421875, -54.8740234375, -52.505859375, -50.1376953125, -47.76953125, -45.4013671875, -43.033203125, -40.6650390625, -38.296875, -35.9287109375, -33.560546875, -31.1923828125, -28.82421875, -26.4560546875, -24.087890625, -21.7197265625, -19.3515625, -16.9833984375, -14.615234375, -12.2470703125, -9.87890625, -7.5107421875, -5.142578125, -2.7744140625, -0.40625, 1.9619140625, 4.330078125, 6.6982421875, 9.06640625, 11.4345703125, 13.802734375, 16.1708984375, 18.5390625, 20.9072265625, 23.275390625, 25.6435546875, 28.01171875, 30.3798828125, 32.748046875, 35.1162109375, 37.484375, 39.8525390625, 42.220703125, 44.5888671875, 46.95703125, 49.3251953125, 51.693359375, 54.0615234375, 56.4296875, 58.7978515625, 61.166015625, 63.5341796875, 65.90234375, 68.2705078125, 70.638671875, 73.0068359375, 75.375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 5.0, 13.0, 14.0, 25.0, 25.0, 24.0, 29.0, 29.0, 41.0, 52.0, 51.0, 57.0, 59.0, 63.0, 59.0, 57.0, 40.0, 52.0, 61.0, 32.0, 27.0, 19.0, 29.0, 29.0, 19.0, 11.0, 15.0, 9.0, 8.0, 9.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-78.0, -75.94775390625, -73.8955078125, -71.84326171875, -69.791015625, -67.73876953125, -65.6865234375, -63.63427734375, -61.58203125, -59.52978515625, -57.4775390625, -55.42529296875, -53.373046875, -51.32080078125, -49.2685546875, -47.21630859375, -45.1640625, -43.11181640625, -41.0595703125, -39.00732421875, -36.955078125, -34.90283203125, -32.8505859375, -30.79833984375, -28.74609375, -26.69384765625, -24.6416015625, -22.58935546875, -20.537109375, -18.48486328125, -16.4326171875, -14.38037109375, -12.328125, -10.27587890625, -8.2236328125, -6.17138671875, -4.119140625, -2.06689453125, -0.0146484375, 2.03759765625, 4.08984375, 6.14208984375, 8.1943359375, 10.24658203125, 12.298828125, 14.35107421875, 16.4033203125, 18.45556640625, 20.5078125, 22.56005859375, 24.6123046875, 26.66455078125, 28.716796875, 30.76904296875, 32.8212890625, 34.87353515625, 36.92578125, 38.97802734375, 41.0302734375, 43.08251953125, 45.134765625, 47.18701171875, 49.2392578125, 51.29150390625, 53.34375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 6.0, 11.0, 15.0, 15.0, 17.0, 35.0, 32.0, 38.0, 60.0, 58.0, 115.0, 189.0, 292.0, 397.0, 646.0, 1033.0, 1867.0, 3555.0, 9017.0, 38219.0, 290303.0, 597948.0, 78763.0, 14932.0, 5103.0, 2271.0, 1305.0, 762.0, 513.0, 333.0, 206.0, 129.0, 96.0, 87.0, 57.0, 40.0, 23.0, 18.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.5, -20.810791015625, -20.12158203125, -19.432373046875, -18.7431640625, -18.053955078125, -17.36474609375, -16.675537109375, -15.986328125, -15.297119140625, -14.60791015625, -13.918701171875, -13.2294921875, -12.540283203125, -11.85107421875, -11.161865234375, -10.47265625, -9.783447265625, -9.09423828125, -8.405029296875, -7.7158203125, -7.026611328125, -6.33740234375, -5.648193359375, -4.958984375, -4.269775390625, -3.58056640625, -2.891357421875, -2.2021484375, -1.512939453125, -0.82373046875, -0.134521484375, 0.5546875, 1.243896484375, 1.93310546875, 2.622314453125, 3.3115234375, 4.000732421875, 4.68994140625, 5.379150390625, 6.068359375, 6.757568359375, 7.44677734375, 8.135986328125, 8.8251953125, 9.514404296875, 10.20361328125, 10.892822265625, 11.58203125, 12.271240234375, 12.96044921875, 13.649658203125, 14.3388671875, 15.028076171875, 15.71728515625, 16.406494140625, 17.095703125, 17.784912109375, 18.47412109375, 19.163330078125, 19.8525390625, 20.541748046875, 21.23095703125, 21.920166015625, 22.609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 13.0, 24.0, 37.0, 59.0, 94.0, 196.0, 238.0, 134.0, 81.0, 50.0, 23.0, 22.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01397705078125, -0.013590455055236816, -0.013203859329223633, -0.01281726360321045, -0.012430667877197266, -0.012044072151184082, -0.011657476425170898, -0.011270880699157715, -0.010884284973144531, -0.010497689247131348, -0.010111093521118164, -0.00972449779510498, -0.009337902069091797, -0.008951306343078613, -0.00856471061706543, -0.008178114891052246, -0.0077915191650390625, -0.007404923439025879, -0.007018327713012695, -0.006631731986999512, -0.006245136260986328, -0.0058585405349731445, -0.005471944808959961, -0.005085349082946777, -0.004698753356933594, -0.00431215763092041, -0.0039255619049072266, -0.003538966178894043, -0.0031523704528808594, -0.0027657747268676758, -0.002379179000854492, -0.0019925832748413086, -0.001605987548828125, -0.0012193918228149414, -0.0008327960968017578, -0.0004462003707885742, -5.9604644775390625e-05, 0.00032699108123779297, 0.0007135868072509766, 0.0011001825332641602, 0.0014867782592773438, 0.0018733739852905273, 0.002259969711303711, 0.0026465654373168945, 0.003033161163330078, 0.0034197568893432617, 0.0038063526153564453, 0.004192948341369629, 0.0045795440673828125, 0.004966139793395996, 0.00535273551940918, 0.005739331245422363, 0.006125926971435547, 0.0065125226974487305, 0.006899118423461914, 0.007285714149475098, 0.007672309875488281, 0.008058905601501465, 0.008445501327514648, 0.008832097053527832, 0.009218692779541016, 0.0096052885055542, 0.009991884231567383, 0.010378479957580566, 0.01076507568359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 5.0, 6.0, 3.0, 9.0, 10.0, 11.0, 14.0, 13.0, 25.0, 32.0, 62.0, 71.0, 84.0, 168.0, 264.0, 431.0, 919.0, 2041.0, 5364.0, 22726.0, 233137.0, 695807.0, 70249.0, 10937.0, 3255.0, 1310.0, 646.0, 307.0, 206.0, 120.0, 90.0, 48.0, 39.0, 22.0, 27.0, 18.0, 15.0, 12.0, 10.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.4375, -24.6240234375, -23.810546875, -22.9970703125, -22.18359375, -21.3701171875, -20.556640625, -19.7431640625, -18.9296875, -18.1162109375, -17.302734375, -16.4892578125, -15.67578125, -14.8623046875, -14.048828125, -13.2353515625, -12.421875, -11.6083984375, -10.794921875, -9.9814453125, -9.16796875, -8.3544921875, -7.541015625, -6.7275390625, -5.9140625, -5.1005859375, -4.287109375, -3.4736328125, -2.66015625, -1.8466796875, -1.033203125, -0.2197265625, 0.59375, 1.4072265625, 2.220703125, 3.0341796875, 3.84765625, 4.6611328125, 5.474609375, 6.2880859375, 7.1015625, 7.9150390625, 8.728515625, 9.5419921875, 10.35546875, 11.1689453125, 11.982421875, 12.7958984375, 13.609375, 14.4228515625, 15.236328125, 16.0498046875, 16.86328125, 17.6767578125, 18.490234375, 19.3037109375, 20.1171875, 20.9306640625, 21.744140625, 22.5576171875, 23.37109375, 24.1845703125, 24.998046875, 25.8115234375, 26.625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 7.0, 17.0, 15.0, 22.0, 22.0, 41.0, 50.0, 77.0, 113.0, 101.0, 116.0, 93.0, 68.0, 73.0, 45.0, 30.0, 21.0, 19.0, 10.0, 12.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.131103515625, -22.34033203125, -21.549560546875, -20.7587890625, -19.968017578125, -19.17724609375, -18.386474609375, -17.595703125, -16.804931640625, -16.01416015625, -15.223388671875, -14.4326171875, -13.641845703125, -12.85107421875, -12.060302734375, -11.26953125, -10.478759765625, -9.68798828125, -8.897216796875, -8.1064453125, -7.315673828125, -6.52490234375, -5.734130859375, -4.943359375, -4.152587890625, -3.36181640625, -2.571044921875, -1.7802734375, -0.989501953125, -0.19873046875, 0.592041015625, 1.3828125, 2.173583984375, 2.96435546875, 3.755126953125, 4.5458984375, 5.336669921875, 6.12744140625, 6.918212890625, 7.708984375, 8.499755859375, 9.29052734375, 10.081298828125, 10.8720703125, 11.662841796875, 12.45361328125, 13.244384765625, 14.03515625, 14.825927734375, 15.61669921875, 16.407470703125, 17.1982421875, 17.989013671875, 18.77978515625, 19.570556640625, 20.361328125, 21.152099609375, 21.94287109375, 22.733642578125, 23.5244140625, 24.315185546875, 25.10595703125, 25.896728515625, 26.6875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 28.0, 51.0, 140.0, 256.0, 241.0, 179.0, 66.0, 17.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-515.661376953125, -491.096923828125, -466.5324401855469, -441.9679870605469, -417.40350341796875, -392.83905029296875, -368.27459716796875, -343.71014404296875, -319.1456604003906, -294.5812072753906, -270.0167236328125, -245.4522705078125, -220.88780212402344, -196.32333374023438, -171.75888061523438, -147.1944122314453, -122.62994384765625, -98.06547546386719, -73.50101470947266, -48.936553955078125, -24.372085571289062, 0.1923828125, 24.7568359375, 49.32130432128906, 73.88577270507812, 98.45024108886719, 123.01470184326172, 147.57916259765625, 172.1436309814453, 196.70809936523438, 221.27255249023438, 245.83702087402344, 270.4014892578125, 294.9659423828125, 319.5304260253906, 344.0948791503906, 368.65936279296875, 393.22381591796875, 417.78826904296875, 442.35272216796875, 466.9172058105469, 491.4816589355469, 516.046142578125, 540.610595703125, 565.175048828125, 589.739501953125, 614.303955078125, 638.8684692382812, 663.4329223632812, 687.9973754882812, 712.5618286132812, 737.1263427734375, 761.6907958984375, 786.2552490234375, 810.8197021484375, 835.3841552734375, 859.9486083984375, 884.5130615234375, 909.0775146484375, 933.6419677734375, 958.2064819335938, 982.7709350585938, 1007.3353881835938, 1031.89990234375, 1056.46435546875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 5.0, 5.0, 8.0, 17.0, 20.0, 33.0, 22.0, 21.0, 22.0, 30.0, 50.0, 30.0, 36.0, 48.0, 45.0, 40.0, 40.0, 50.0, 48.0, 45.0, 42.0, 39.0, 34.0, 28.0, 39.0, 31.0, 30.0, 23.0, 18.0, 11.0, 13.0, 10.0, 10.0, 9.0, 11.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.60385131835938, -213.53805541992188, -205.47225952148438, -197.40646362304688, -189.34066772460938, -181.27487182617188, -173.20907592773438, -165.14328002929688, -157.07748413085938, -149.01168823242188, -140.94589233398438, -132.88009643554688, -124.81430053710938, -116.74850463867188, -108.68270874023438, -100.61691284179688, -92.55111694335938, -84.48532104492188, -76.41952514648438, -68.35372924804688, -60.287933349609375, -52.222137451171875, -44.156341552734375, -36.090545654296875, -28.024749755859375, -19.958953857421875, -11.893157958984375, -3.827362060546875, 4.238433837890625, 12.304229736328125, 20.370025634765625, 28.435821533203125, 36.50164794921875, 44.56744384765625, 52.63323974609375, 60.69903564453125, 68.76483154296875, 76.83062744140625, 84.89642333984375, 92.96221923828125, 101.02801513671875, 109.09381103515625, 117.15960693359375, 125.22540283203125, 133.29119873046875, 141.35699462890625, 149.42279052734375, 157.48858642578125, 165.55438232421875, 173.62017822265625, 181.68597412109375, 189.75177001953125, 197.81756591796875, 205.88336181640625, 213.94915771484375, 222.01495361328125, 230.08074951171875, 238.14654541015625, 246.21234130859375, 254.27813720703125, 262.34393310546875, 270.40972900390625, 278.47552490234375, 286.54132080078125, 294.60711669921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 6.0, 7.0, 13.0, 28.0, 41.0, 73.0, 130.0, 310.0, 934.0, 3796.0, 22337.0, 391578.0, 3667322.0, 93952.0, 10779.0, 2105.0, 557.0, 180.0, 69.0, 30.0, 17.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-81.4375, -79.715576171875, -77.99365234375, -76.271728515625, -74.5498046875, -72.827880859375, -71.10595703125, -69.384033203125, -67.662109375, -65.940185546875, -64.21826171875, -62.496337890625, -60.7744140625, -59.052490234375, -57.33056640625, -55.608642578125, -53.88671875, -52.164794921875, -50.44287109375, -48.720947265625, -46.9990234375, -45.277099609375, -43.55517578125, -41.833251953125, -40.111328125, -38.389404296875, -36.66748046875, -34.945556640625, -33.2236328125, -31.501708984375, -29.77978515625, -28.057861328125, -26.3359375, -24.614013671875, -22.89208984375, -21.170166015625, -19.4482421875, -17.726318359375, -16.00439453125, -14.282470703125, -12.560546875, -10.838623046875, -9.11669921875, -7.394775390625, -5.6728515625, -3.950927734375, -2.22900390625, -0.507080078125, 1.21484375, 2.936767578125, 4.65869140625, 6.380615234375, 8.1025390625, 9.824462890625, 11.54638671875, 13.268310546875, 14.990234375, 16.712158203125, 18.43408203125, 20.156005859375, 21.8779296875, 23.599853515625, 25.32177734375, 27.043701171875, 28.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 7.0, 6.0, 12.0, 14.0, 21.0, 13.0, 19.0, 45.0, 49.0, 43.0, 40.0, 53.0, 73.0, 72.0, 66.0, 73.0, 62.0, 50.0, 57.0, 47.0, 32.0, 36.0, 21.0, 23.0, 19.0, 10.0, 11.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.595947265625, -18.09814453125, -17.600341796875, -17.1025390625, -16.604736328125, -16.10693359375, -15.609130859375, -15.111328125, -14.613525390625, -14.11572265625, -13.617919921875, -13.1201171875, -12.622314453125, -12.12451171875, -11.626708984375, -11.12890625, -10.631103515625, -10.13330078125, -9.635498046875, -9.1376953125, -8.639892578125, -8.14208984375, -7.644287109375, -7.146484375, -6.648681640625, -6.15087890625, -5.653076171875, -5.1552734375, -4.657470703125, -4.15966796875, -3.661865234375, -3.1640625, -2.666259765625, -2.16845703125, -1.670654296875, -1.1728515625, -0.675048828125, -0.17724609375, 0.320556640625, 0.818359375, 1.316162109375, 1.81396484375, 2.311767578125, 2.8095703125, 3.307373046875, 3.80517578125, 4.302978515625, 4.80078125, 5.298583984375, 5.79638671875, 6.294189453125, 6.7919921875, 7.289794921875, 7.78759765625, 8.285400390625, 8.783203125, 9.281005859375, 9.77880859375, 10.276611328125, 10.7744140625, 11.272216796875, 11.77001953125, 12.267822265625, 12.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 7.0, 14.0, 17.0, 22.0, 39.0, 67.0, 115.0, 246.0, 725.0, 2549.0, 13152.0, 144688.0, 3818930.0, 193980.0, 15706.0, 2809.0, 711.0, 237.0, 118.0, 63.0, 27.0, 18.0, 13.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.25, -54.130859375, -52.01171875, -49.892578125, -47.7734375, -45.654296875, -43.53515625, -41.416015625, -39.296875, -37.177734375, -35.05859375, -32.939453125, -30.8203125, -28.701171875, -26.58203125, -24.462890625, -22.34375, -20.224609375, -18.10546875, -15.986328125, -13.8671875, -11.748046875, -9.62890625, -7.509765625, -5.390625, -3.271484375, -1.15234375, 0.966796875, 3.0859375, 5.205078125, 7.32421875, 9.443359375, 11.5625, 13.681640625, 15.80078125, 17.919921875, 20.0390625, 22.158203125, 24.27734375, 26.396484375, 28.515625, 30.634765625, 32.75390625, 34.873046875, 36.9921875, 39.111328125, 41.23046875, 43.349609375, 45.46875, 47.587890625, 49.70703125, 51.826171875, 53.9453125, 56.064453125, 58.18359375, 60.302734375, 62.421875, 64.541015625, 66.66015625, 68.779296875, 70.8984375, 73.017578125, 75.13671875, 77.255859375, 79.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 6.0, 12.0, 8.0, 23.0, 27.0, 40.0, 47.0, 74.0, 129.0, 261.0, 508.0, 1054.0, 877.0, 401.0, 208.0, 124.0, 72.0, 44.0, 31.0, 22.0, 25.0, 15.0, 16.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.0, -47.59619140625, -46.1923828125, -44.78857421875, -43.384765625, -41.98095703125, -40.5771484375, -39.17333984375, -37.76953125, -36.36572265625, -34.9619140625, -33.55810546875, -32.154296875, -30.75048828125, -29.3466796875, -27.94287109375, -26.5390625, -25.13525390625, -23.7314453125, -22.32763671875, -20.923828125, -19.52001953125, -18.1162109375, -16.71240234375, -15.30859375, -13.90478515625, -12.5009765625, -11.09716796875, -9.693359375, -8.28955078125, -6.8857421875, -5.48193359375, -4.078125, -2.67431640625, -1.2705078125, 0.13330078125, 1.537109375, 2.94091796875, 4.3447265625, 5.74853515625, 7.15234375, 8.55615234375, 9.9599609375, 11.36376953125, 12.767578125, 14.17138671875, 15.5751953125, 16.97900390625, 18.3828125, 19.78662109375, 21.1904296875, 22.59423828125, 23.998046875, 25.40185546875, 26.8056640625, 28.20947265625, 29.61328125, 31.01708984375, 32.4208984375, 33.82470703125, 35.228515625, 36.63232421875, 38.0361328125, 39.43994140625, 40.84375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 16.0, 42.0, 89.0, 164.0, 234.0, 218.0, 116.0, 58.0, 29.0, 7.0, 10.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-739.2955322265625, -722.4287719726562, -705.56201171875, -688.6952514648438, -671.8284912109375, -654.9617309570312, -638.094970703125, -621.2282104492188, -604.3614501953125, -587.4946899414062, -570.6279296875, -553.7611694335938, -536.8944091796875, -520.0276489257812, -503.160888671875, -486.29412841796875, -469.4273986816406, -452.5606384277344, -435.6938781738281, -418.8271179199219, -401.9603576660156, -385.0935974121094, -368.22686767578125, -351.360107421875, -334.49334716796875, -317.6265869140625, -300.75982666015625, -283.89306640625, -267.02630615234375, -250.1595458984375, -233.2928009033203, -216.42604064941406, -199.55929565429688, -182.69253540039062, -165.82577514648438, -148.95901489257812, -132.09225463867188, -115.22550201416016, -98.35874938964844, -81.49198913574219, -64.62522888183594, -47.75846862792969, -30.891712188720703, -14.024955749511719, 2.8418045043945312, 19.70856475830078, 36.5753173828125, 53.44207763671875, 70.308837890625, 87.17559814453125, 104.0423583984375, 120.90911102294922, 137.77587890625, 154.64263916015625, 171.50938415527344, 188.3761444091797, 205.24290466308594, 222.1096649169922, 238.97642517089844, 255.84317016601562, 272.7099304199219, 289.5766906738281, 306.4434509277344, 323.3102111816406, 340.1769714355469]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 6.0, 7.0, 9.0, 20.0, 16.0, 28.0, 22.0, 27.0, 44.0, 35.0, 46.0, 51.0, 63.0, 46.0, 31.0, 47.0, 55.0, 45.0, 49.0, 43.0, 41.0, 42.0, 31.0, 29.0, 24.0, 27.0, 24.0, 13.0, 14.0, 16.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-211.08856201171875, -204.92901611328125, -198.7694549560547, -192.6099090576172, -186.4503631591797, -180.29080200195312, -174.13125610351562, -167.97171020507812, -161.81216430664062, -155.65261840820312, -149.49305725097656, -143.33351135253906, -137.17396545410156, -131.014404296875, -124.8548583984375, -118.6953125, -112.53575134277344, -106.3761978149414, -100.2166519165039, -94.05709838867188, -87.89755249023438, -81.73799896240234, -75.57844543457031, -69.41889953613281, -63.25934600830078, -57.099796295166016, -50.94024658203125, -44.78069305419922, -38.62114334106445, -32.46159362792969, -26.302040100097656, -20.14249038696289, -13.982925415039062, -7.8233747482299805, -1.6638240814208984, 4.4957275390625, 10.655277252197266, 16.81482696533203, 22.974380493164062, 29.133930206298828, 35.293479919433594, 41.45302963256836, 47.612579345703125, 53.772132873535156, 59.93168258666992, 66.09123229980469, 72.25078582763672, 78.41033935546875, 84.56988525390625, 90.72943878173828, 96.88898468017578, 103.04853820800781, 109.20808410644531, 115.36763763427734, 121.52719116210938, 127.68673706054688, 133.84628295898438, 140.00582885742188, 146.16539001464844, 152.32493591308594, 158.48448181152344, 164.64404296875, 170.8035888671875, 176.963134765625, 183.12269592285156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 0.0, 8.0, 11.0, 6.0, 14.0, 34.0, 50.0, 87.0, 139.0, 262.0, 475.0, 899.0, 1792.0, 4089.0, 9252.0, 23853.0, 66415.0, 210059.0, 435495.0, 194954.0, 61986.0, 22037.0, 8944.0, 3975.0, 1705.0, 962.0, 461.0, 265.0, 129.0, 74.0, 50.0, 31.0, 10.0, 17.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -34.014892578125, -32.96728515625, -31.919677734375, -30.8720703125, -29.824462890625, -28.77685546875, -27.729248046875, -26.681640625, -25.634033203125, -24.58642578125, -23.538818359375, -22.4912109375, -21.443603515625, -20.39599609375, -19.348388671875, -18.30078125, -17.253173828125, -16.20556640625, -15.157958984375, -14.1103515625, -13.062744140625, -12.01513671875, -10.967529296875, -9.919921875, -8.872314453125, -7.82470703125, -6.777099609375, -5.7294921875, -4.681884765625, -3.63427734375, -2.586669921875, -1.5390625, -0.491455078125, 0.55615234375, 1.603759765625, 2.6513671875, 3.698974609375, 4.74658203125, 5.794189453125, 6.841796875, 7.889404296875, 8.93701171875, 9.984619140625, 11.0322265625, 12.079833984375, 13.12744140625, 14.175048828125, 15.22265625, 16.270263671875, 17.31787109375, 18.365478515625, 19.4130859375, 20.460693359375, 21.50830078125, 22.555908203125, 23.603515625, 24.651123046875, 25.69873046875, 26.746337890625, 27.7939453125, 28.841552734375, 29.88916015625, 30.936767578125, 31.984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 8.0, 7.0, 18.0, 13.0, 22.0, 19.0, 22.0, 27.0, 36.0, 36.0, 37.0, 42.0, 40.0, 46.0, 58.0, 46.0, 62.0, 49.0, 37.0, 36.0, 44.0, 35.0, 39.0, 34.0, 22.0, 26.0, 24.0, 16.0, 20.0, 9.0, 10.0, 7.0, 13.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4375, -12.0577392578125, -11.677978515625, -11.2982177734375, -10.91845703125, -10.5386962890625, -10.158935546875, -9.7791748046875, -9.3994140625, -9.0196533203125, -8.639892578125, -8.2601318359375, -7.88037109375, -7.5006103515625, -7.120849609375, -6.7410888671875, -6.361328125, -5.9815673828125, -5.601806640625, -5.2220458984375, -4.84228515625, -4.4625244140625, -4.082763671875, -3.7030029296875, -3.3232421875, -2.9434814453125, -2.563720703125, -2.1839599609375, -1.80419921875, -1.4244384765625, -1.044677734375, -0.6649169921875, -0.28515625, 0.0946044921875, 0.474365234375, 0.8541259765625, 1.23388671875, 1.6136474609375, 1.993408203125, 2.3731689453125, 2.7529296875, 3.1326904296875, 3.512451171875, 3.8922119140625, 4.27197265625, 4.6517333984375, 5.031494140625, 5.4112548828125, 5.791015625, 6.1707763671875, 6.550537109375, 6.9302978515625, 7.31005859375, 7.6898193359375, 8.069580078125, 8.4493408203125, 8.8291015625, 9.2088623046875, 9.588623046875, 9.9683837890625, 10.34814453125, 10.7279052734375, 11.107666015625, 11.4874267578125, 11.8671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 16.0, 20.0, 28.0, 36.0, 59.0, 68.0, 121.0, 164.0, 291.0, 482.0, 909.0, 1703.0, 4428.0, 17443.0, 133714.0, 777264.0, 90996.0, 13398.0, 3782.0, 1653.0, 765.0, 423.0, 268.0, 169.0, 105.0, 66.0, 31.0, 36.0, 29.0, 13.0, 11.0, 15.0, 8.0, 6.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.9375, -68.5263671875, -66.115234375, -63.7041015625, -61.29296875, -58.8818359375, -56.470703125, -54.0595703125, -51.6484375, -49.2373046875, -46.826171875, -44.4150390625, -42.00390625, -39.5927734375, -37.181640625, -34.7705078125, -32.359375, -29.9482421875, -27.537109375, -25.1259765625, -22.71484375, -20.3037109375, -17.892578125, -15.4814453125, -13.0703125, -10.6591796875, -8.248046875, -5.8369140625, -3.42578125, -1.0146484375, 1.396484375, 3.8076171875, 6.21875, 8.6298828125, 11.041015625, 13.4521484375, 15.86328125, 18.2744140625, 20.685546875, 23.0966796875, 25.5078125, 27.9189453125, 30.330078125, 32.7412109375, 35.15234375, 37.5634765625, 39.974609375, 42.3857421875, 44.796875, 47.2080078125, 49.619140625, 52.0302734375, 54.44140625, 56.8525390625, 59.263671875, 61.6748046875, 64.0859375, 66.4970703125, 68.908203125, 71.3193359375, 73.73046875, 76.1416015625, 78.552734375, 80.9638671875, 83.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 14.0, 11.0, 25.0, 26.0, 38.0, 46.0, 57.0, 52.0, 58.0, 55.0, 76.0, 66.0, 69.0, 65.0, 54.0, 38.0, 50.0, 34.0, 32.0, 26.0, 25.0, 10.0, 8.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.8125, -61.259765625, -58.70703125, -56.154296875, -53.6015625, -51.048828125, -48.49609375, -45.943359375, -43.390625, -40.837890625, -38.28515625, -35.732421875, -33.1796875, -30.626953125, -28.07421875, -25.521484375, -22.96875, -20.416015625, -17.86328125, -15.310546875, -12.7578125, -10.205078125, -7.65234375, -5.099609375, -2.546875, 0.005859375, 2.55859375, 5.111328125, 7.6640625, 10.216796875, 12.76953125, 15.322265625, 17.875, 20.427734375, 22.98046875, 25.533203125, 28.0859375, 30.638671875, 33.19140625, 35.744140625, 38.296875, 40.849609375, 43.40234375, 45.955078125, 48.5078125, 51.060546875, 53.61328125, 56.166015625, 58.71875, 61.271484375, 63.82421875, 66.376953125, 68.9296875, 71.482421875, 74.03515625, 76.587890625, 79.140625, 81.693359375, 84.24609375, 86.798828125, 89.3515625, 91.904296875, 94.45703125, 97.009765625, 99.5625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 12.0, 17.0, 21.0, 34.0, 48.0, 49.0, 91.0, 174.0, 302.0, 453.0, 1200.0, 3484.0, 15459.0, 173898.0, 791178.0, 50857.0, 7423.0, 2076.0, 761.0, 364.0, 210.0, 127.0, 87.0, 57.0, 37.0, 29.0, 21.0, 17.0, 13.0, 9.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.42041015625, -36.1845703125, -34.94873046875, -33.712890625, -32.47705078125, -31.2412109375, -30.00537109375, -28.76953125, -27.53369140625, -26.2978515625, -25.06201171875, -23.826171875, -22.59033203125, -21.3544921875, -20.11865234375, -18.8828125, -17.64697265625, -16.4111328125, -15.17529296875, -13.939453125, -12.70361328125, -11.4677734375, -10.23193359375, -8.99609375, -7.76025390625, -6.5244140625, -5.28857421875, -4.052734375, -2.81689453125, -1.5810546875, -0.34521484375, 0.890625, 2.12646484375, 3.3623046875, 4.59814453125, 5.833984375, 7.06982421875, 8.3056640625, 9.54150390625, 10.77734375, 12.01318359375, 13.2490234375, 14.48486328125, 15.720703125, 16.95654296875, 18.1923828125, 19.42822265625, 20.6640625, 21.89990234375, 23.1357421875, 24.37158203125, 25.607421875, 26.84326171875, 28.0791015625, 29.31494140625, 30.55078125, 31.78662109375, 33.0224609375, 34.25830078125, 35.494140625, 36.72998046875, 37.9658203125, 39.20166015625, 40.4375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 20.0, 20.0, 21.0, 40.0, 55.0, 84.0, 120.0, 199.0, 133.0, 95.0, 46.0, 46.0, 28.0, 12.0, 17.0, 21.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01050567626953125, -0.010217547416687012, -0.009929418563842773, -0.009641289710998535, -0.009353160858154297, -0.009065032005310059, -0.00877690315246582, -0.008488774299621582, -0.008200645446777344, -0.007912516593933105, -0.007624387741088867, -0.007336258888244629, -0.007048130035400391, -0.006760001182556152, -0.006471872329711914, -0.006183743476867676, -0.0058956146240234375, -0.005607485771179199, -0.005319356918334961, -0.005031228065490723, -0.004743099212646484, -0.004454970359802246, -0.004166841506958008, -0.0038787126541137695, -0.0035905838012695312, -0.003302454948425293, -0.0030143260955810547, -0.0027261972427368164, -0.002438068389892578, -0.00214993953704834, -0.0018618106842041016, -0.0015736818313598633, -0.001285552978515625, -0.0009974241256713867, -0.0007092952728271484, -0.00042116641998291016, -0.00013303756713867188, 0.0001550912857055664, 0.0004432201385498047, 0.000731348991394043, 0.0010194778442382812, 0.0013076066970825195, 0.0015957355499267578, 0.001883864402770996, 0.0021719932556152344, 0.0024601221084594727, 0.002748250961303711, 0.0030363798141479492, 0.0033245086669921875, 0.0036126375198364258, 0.003900766372680664, 0.004188895225524902, 0.004477024078369141, 0.004765152931213379, 0.005053281784057617, 0.0053414106369018555, 0.005629539489746094, 0.005917668342590332, 0.00620579719543457, 0.006493926048278809, 0.006782054901123047, 0.007070183753967285, 0.0073583126068115234, 0.007646441459655762, 0.0079345703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 10.0, 14.0, 11.0, 27.0, 30.0, 31.0, 57.0, 101.0, 131.0, 222.0, 392.0, 781.0, 1822.0, 4895.0, 20933.0, 203279.0, 741770.0, 58644.0, 9768.0, 3029.0, 1201.0, 583.0, 309.0, 178.0, 106.0, 76.0, 45.0, 35.0, 16.0, 19.0, 9.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-39.5625, -38.500732421875, -37.43896484375, -36.377197265625, -35.3154296875, -34.253662109375, -33.19189453125, -32.130126953125, -31.068359375, -30.006591796875, -28.94482421875, -27.883056640625, -26.8212890625, -25.759521484375, -24.69775390625, -23.635986328125, -22.57421875, -21.512451171875, -20.45068359375, -19.388916015625, -18.3271484375, -17.265380859375, -16.20361328125, -15.141845703125, -14.080078125, -13.018310546875, -11.95654296875, -10.894775390625, -9.8330078125, -8.771240234375, -7.70947265625, -6.647705078125, -5.5859375, -4.524169921875, -3.46240234375, -2.400634765625, -1.3388671875, -0.277099609375, 0.78466796875, 1.846435546875, 2.908203125, 3.969970703125, 5.03173828125, 6.093505859375, 7.1552734375, 8.217041015625, 9.27880859375, 10.340576171875, 11.40234375, 12.464111328125, 13.52587890625, 14.587646484375, 15.6494140625, 16.711181640625, 17.77294921875, 18.834716796875, 19.896484375, 20.958251953125, 22.02001953125, 23.081787109375, 24.1435546875, 25.205322265625, 26.26708984375, 27.328857421875, 28.390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 6.0, 1.0, 4.0, 4.0, 12.0, 9.0, 9.0, 11.0, 22.0, 36.0, 45.0, 55.0, 56.0, 89.0, 115.0, 108.0, 96.0, 85.0, 58.0, 40.0, 24.0, 32.0, 19.0, 14.0, 14.0, 5.0, 12.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -36.147705078125, -35.20166015625, -34.255615234375, -33.3095703125, -32.363525390625, -31.41748046875, -30.471435546875, -29.525390625, -28.579345703125, -27.63330078125, -26.687255859375, -25.7412109375, -24.795166015625, -23.84912109375, -22.903076171875, -21.95703125, -21.010986328125, -20.06494140625, -19.118896484375, -18.1728515625, -17.226806640625, -16.28076171875, -15.334716796875, -14.388671875, -13.442626953125, -12.49658203125, -11.550537109375, -10.6044921875, -9.658447265625, -8.71240234375, -7.766357421875, -6.8203125, -5.874267578125, -4.92822265625, -3.982177734375, -3.0361328125, -2.090087890625, -1.14404296875, -0.197998046875, 0.748046875, 1.694091796875, 2.64013671875, 3.586181640625, 4.5322265625, 5.478271484375, 6.42431640625, 7.370361328125, 8.31640625, 9.262451171875, 10.20849609375, 11.154541015625, 12.1005859375, 13.046630859375, 13.99267578125, 14.938720703125, 15.884765625, 16.830810546875, 17.77685546875, 18.722900390625, 19.6689453125, 20.614990234375, 21.56103515625, 22.507080078125, 23.453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 17.0, 52.0, 149.0, 211.0, 289.0, 162.0, 50.0, 28.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1084.7186279296875, -1061.2403564453125, -1037.7620849609375, -1014.2838745117188, -990.8056640625, -967.327392578125, -943.84912109375, -920.3709106445312, -896.8926391601562, -873.4143676757812, -849.9361572265625, -826.4578857421875, -802.9796752929688, -779.5014038085938, -756.023193359375, -732.544921875, -709.066650390625, -685.58837890625, -662.1101684570312, -638.6318969726562, -615.1536865234375, -591.6754150390625, -568.1971435546875, -544.7189331054688, -521.24072265625, -497.7624816894531, -474.28424072265625, -450.80596923828125, -427.3277282714844, -403.8494873046875, -380.3712463378906, -356.89300537109375, -333.41473388671875, -309.9364929199219, -286.458251953125, -262.97998046875, -239.50173950195312, -216.02349853515625, -192.54525756835938, -169.06700134277344, -145.58876037597656, -122.11051177978516, -98.63226318359375, -75.15402221679688, -51.67577362060547, -28.197525024414062, -4.7192840576171875, 18.75897216796875, 42.237213134765625, 65.71546173095703, 89.19371032714844, 112.67195129394531, 136.15020751953125, 159.62844848632812, 183.106689453125, 206.58494567871094, 230.0631866455078, 253.5414276123047, 277.0196838378906, 300.4979248046875, 323.9761657714844, 347.45440673828125, 370.93267822265625, 394.4109191894531, 417.88916015625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 6.0, 5.0, 10.0, 8.0, 7.0, 14.0, 18.0, 26.0, 30.0, 23.0, 27.0, 27.0, 31.0, 34.0, 38.0, 34.0, 40.0, 55.0, 38.0, 57.0, 41.0, 38.0, 30.0, 45.0, 35.0, 33.0, 37.0, 28.0, 19.0, 28.0, 23.0, 16.0, 23.0, 18.0, 9.0, 12.0, 8.0, 2.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-212.09805297851562, -205.34762573242188, -198.59719848632812, -191.84677124023438, -185.0963592529297, -178.34593200683594, -171.5955047607422, -164.84507751464844, -158.09466552734375, -151.34423828125, -144.59381103515625, -137.8433837890625, -131.0929718017578, -124.34254455566406, -117.59211730957031, -110.84169006347656, -104.09126281738281, -97.34083557128906, -90.59041595458984, -83.8399887084961, -77.08956909179688, -70.33914184570312, -63.588714599609375, -56.83829116821289, -50.087867736816406, -43.33744430541992, -36.58702087402344, -29.836593627929688, -23.086170196533203, -16.33574676513672, -9.585319519042969, -2.8348960876464844, 3.91552734375, 10.6659517288208, 17.4163761138916, 24.16680145263672, 30.917224884033203, 37.66764831542969, 44.41807556152344, 51.16849899291992, 57.918922424316406, 64.66934967041016, 71.41976928710938, 78.17019653320312, 84.92062377929688, 91.6710433959961, 98.42147064208984, 105.17189025878906, 111.92231750488281, 118.67274475097656, 125.42316436767578, 132.173583984375, 138.92401123046875, 145.6744384765625, 152.42486572265625, 159.17529296875, 165.92572021484375, 172.6761474609375, 179.42657470703125, 186.177001953125, 192.9274139404297, 199.67784118652344, 206.4282684326172, 213.17869567871094, 219.92910766601562]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 8.0, 8.0, 13.0, 16.0, 27.0, 52.0, 108.0, 242.0, 688.0, 3584.0, 65027.0, 4069529.0, 50779.0, 3074.0, 650.0, 240.0, 110.0, 52.0, 24.0, 14.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.3125, -100.4794921875, -97.646484375, -94.8134765625, -91.98046875, -89.1474609375, -86.314453125, -83.4814453125, -80.6484375, -77.8154296875, -74.982421875, -72.1494140625, -69.31640625, -66.4833984375, -63.650390625, -60.8173828125, -57.984375, -55.1513671875, -52.318359375, -49.4853515625, -46.65234375, -43.8193359375, -40.986328125, -38.1533203125, -35.3203125, -32.4873046875, -29.654296875, -26.8212890625, -23.98828125, -21.1552734375, -18.322265625, -15.4892578125, -12.65625, -9.8232421875, -6.990234375, -4.1572265625, -1.32421875, 1.5087890625, 4.341796875, 7.1748046875, 10.0078125, 12.8408203125, 15.673828125, 18.5068359375, 21.33984375, 24.1728515625, 27.005859375, 29.8388671875, 32.671875, 35.5048828125, 38.337890625, 41.1708984375, 44.00390625, 46.8369140625, 49.669921875, 52.5029296875, 55.3359375, 58.1689453125, 61.001953125, 63.8349609375, 66.66796875, 69.5009765625, 72.333984375, 75.1669921875, 78.0]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 8.0, 10.0, 20.0, 15.0, 15.0, 26.0, 27.0, 45.0, 36.0, 43.0, 52.0, 67.0, 58.0, 58.0, 62.0, 68.0, 58.0, 41.0, 47.0, 37.0, 36.0, 32.0, 22.0, 19.0, 10.0, 19.0, 9.0, 14.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6484375, -13.207763671875, -12.76708984375, -12.326416015625, -11.8857421875, -11.445068359375, -11.00439453125, -10.563720703125, -10.123046875, -9.682373046875, -9.24169921875, -8.801025390625, -8.3603515625, -7.919677734375, -7.47900390625, -7.038330078125, -6.59765625, -6.156982421875, -5.71630859375, -5.275634765625, -4.8349609375, -4.394287109375, -3.95361328125, -3.512939453125, -3.072265625, -2.631591796875, -2.19091796875, -1.750244140625, -1.3095703125, -0.868896484375, -0.42822265625, 0.012451171875, 0.453125, 0.893798828125, 1.33447265625, 1.775146484375, 2.2158203125, 2.656494140625, 3.09716796875, 3.537841796875, 3.978515625, 4.419189453125, 4.85986328125, 5.300537109375, 5.7412109375, 6.181884765625, 6.62255859375, 7.063232421875, 7.50390625, 7.944580078125, 8.38525390625, 8.825927734375, 9.2666015625, 9.707275390625, 10.14794921875, 10.588623046875, 11.029296875, 11.469970703125, 11.91064453125, 12.351318359375, 12.7919921875, 13.232666015625, 13.67333984375, 14.114013671875, 14.5546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 4.0, 11.0, 16.0, 20.0, 36.0, 42.0, 61.0, 112.0, 179.0, 329.0, 720.0, 1634.0, 4038.0, 12703.0, 59044.0, 861178.0, 3086193.0, 135389.0, 22064.0, 6088.0, 2172.0, 1014.0, 516.0, 215.0, 155.0, 105.0, 63.0, 43.0, 32.0, 25.0, 16.0, 12.0, 13.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.21875, -41.73876953125, -40.2587890625, -38.77880859375, -37.298828125, -35.81884765625, -34.3388671875, -32.85888671875, -31.37890625, -29.89892578125, -28.4189453125, -26.93896484375, -25.458984375, -23.97900390625, -22.4990234375, -21.01904296875, -19.5390625, -18.05908203125, -16.5791015625, -15.09912109375, -13.619140625, -12.13916015625, -10.6591796875, -9.17919921875, -7.69921875, -6.21923828125, -4.7392578125, -3.25927734375, -1.779296875, -0.29931640625, 1.1806640625, 2.66064453125, 4.140625, 5.62060546875, 7.1005859375, 8.58056640625, 10.060546875, 11.54052734375, 13.0205078125, 14.50048828125, 15.98046875, 17.46044921875, 18.9404296875, 20.42041015625, 21.900390625, 23.38037109375, 24.8603515625, 26.34033203125, 27.8203125, 29.30029296875, 30.7802734375, 32.26025390625, 33.740234375, 35.22021484375, 36.7001953125, 38.18017578125, 39.66015625, 41.14013671875, 42.6201171875, 44.10009765625, 45.580078125, 47.06005859375, 48.5400390625, 50.02001953125, 51.5]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 8.0, 23.0, 13.0, 19.0, 29.0, 49.0, 46.0, 77.0, 120.0, 212.0, 341.0, 569.0, 792.0, 669.0, 380.0, 238.0, 141.0, 91.0, 66.0, 38.0, 41.0, 12.0, 24.0, 13.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.80419921875, -30.7333984375, -29.66259765625, -28.591796875, -27.52099609375, -26.4501953125, -25.37939453125, -24.30859375, -23.23779296875, -22.1669921875, -21.09619140625, -20.025390625, -18.95458984375, -17.8837890625, -16.81298828125, -15.7421875, -14.67138671875, -13.6005859375, -12.52978515625, -11.458984375, -10.38818359375, -9.3173828125, -8.24658203125, -7.17578125, -6.10498046875, -5.0341796875, -3.96337890625, -2.892578125, -1.82177734375, -0.7509765625, 0.31982421875, 1.390625, 2.46142578125, 3.5322265625, 4.60302734375, 5.673828125, 6.74462890625, 7.8154296875, 8.88623046875, 9.95703125, 11.02783203125, 12.0986328125, 13.16943359375, 14.240234375, 15.31103515625, 16.3818359375, 17.45263671875, 18.5234375, 19.59423828125, 20.6650390625, 21.73583984375, 22.806640625, 23.87744140625, 24.9482421875, 26.01904296875, 27.08984375, 28.16064453125, 29.2314453125, 30.30224609375, 31.373046875, 32.44384765625, 33.5146484375, 34.58544921875, 35.65625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 12.0, 23.0, 32.0, 58.0, 98.0, 152.0, 200.0, 156.0, 101.0, 61.0, 34.0, 18.0, 15.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-529.5617065429688, -512.80517578125, -496.048583984375, -479.29205322265625, -462.5354919433594, -445.7789306640625, -429.02239990234375, -412.2658386230469, -395.50927734375, -378.7527160644531, -361.99615478515625, -345.2396240234375, -328.4830627441406, -311.72650146484375, -294.969970703125, -278.2134094238281, -261.45684814453125, -244.70028686523438, -227.94374084472656, -211.18719482421875, -194.43063354492188, -177.674072265625, -160.9175262451172, -144.16098022460938, -127.4044189453125, -110.64786529541016, -93.89131164550781, -77.13475799560547, -60.378204345703125, -43.62165069580078, -26.865097045898438, -10.108543395996094, 6.64801025390625, 23.404563903808594, 40.16111755371094, 56.91767120361328, 73.67422485351562, 90.43077850341797, 107.18733215332031, 123.94388580322266, 140.700439453125, 157.45700073242188, 174.2135467529297, 190.9700927734375, 207.72665405273438, 224.48321533203125, 241.23976135253906, 257.9963073730469, 274.75286865234375, 291.5094299316406, 308.2659912109375, 325.02252197265625, 341.7790832519531, 358.53564453125, 375.29217529296875, 392.0487365722656, 408.8052978515625, 425.5618591308594, 442.31842041015625, 459.074951171875, 475.8315124511719, 492.58807373046875, 509.3446044921875, 526.1011962890625, 542.8577270507812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 6.0, 9.0, 15.0, 13.0, 22.0, 28.0, 23.0, 37.0, 38.0, 55.0, 46.0, 60.0, 70.0, 72.0, 66.0, 64.0, 66.0, 47.0, 47.0, 40.0, 35.0, 27.0, 26.0, 12.0, 15.0, 12.0, 17.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.57196044921875, -299.9285888671875, -291.2852478027344, -282.6418762207031, -273.99853515625, -265.35516357421875, -256.7117919921875, -248.0684356689453, -239.42507934570312, -230.78172302246094, -222.13836669921875, -213.4949951171875, -204.8516387939453, -196.20828247070312, -187.56491088867188, -178.9215545654297, -170.2781982421875, -161.6348419189453, -152.99148559570312, -144.34811401367188, -135.7047576904297, -127.0614013671875, -118.41803741455078, -109.77467346191406, -101.13131713867188, -92.48796081542969, -83.84459686279297, -75.20123291015625, -66.55787658691406, -57.91451644897461, -49.271156311035156, -40.6277961730957, -31.984466552734375, -23.341106414794922, -14.697746276855469, -6.054386138916016, 2.5889739990234375, 11.23233413696289, 19.875694274902344, 28.519054412841797, 37.16241455078125, 45.8057746887207, 54.449134826660156, 63.09249496459961, 71.73585510253906, 80.37921142578125, 89.02257537841797, 97.66593933105469, 106.30929565429688, 114.95265197753906, 123.59601593017578, 132.2393798828125, 140.8827362060547, 149.52609252929688, 158.16946411132812, 166.8128204345703, 175.4561767578125, 184.0995330810547, 192.74288940429688, 201.38626098632812, 210.0296173095703, 218.6729736328125, 227.31634521484375, 235.95970153808594, 244.60305786132812]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 12.0, 17.0, 17.0, 35.0, 35.0, 48.0, 77.0, 121.0, 201.0, 293.0, 501.0, 831.0, 1686.0, 3570.0, 8298.0, 21339.0, 68128.0, 284722.0, 479663.0, 121415.0, 34756.0, 12554.0, 5189.0, 2268.0, 1172.0, 628.0, 332.0, 207.0, 123.0, 78.0, 59.0, 35.0, 42.0, 23.0, 13.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.15625, -45.595703125, -44.03515625, -42.474609375, -40.9140625, -39.353515625, -37.79296875, -36.232421875, -34.671875, -33.111328125, -31.55078125, -29.990234375, -28.4296875, -26.869140625, -25.30859375, -23.748046875, -22.1875, -20.626953125, -19.06640625, -17.505859375, -15.9453125, -14.384765625, -12.82421875, -11.263671875, -9.703125, -8.142578125, -6.58203125, -5.021484375, -3.4609375, -1.900390625, -0.33984375, 1.220703125, 2.78125, 4.341796875, 5.90234375, 7.462890625, 9.0234375, 10.583984375, 12.14453125, 13.705078125, 15.265625, 16.826171875, 18.38671875, 19.947265625, 21.5078125, 23.068359375, 24.62890625, 26.189453125, 27.75, 29.310546875, 30.87109375, 32.431640625, 33.9921875, 35.552734375, 37.11328125, 38.673828125, 40.234375, 41.794921875, 43.35546875, 44.916015625, 46.4765625, 48.037109375, 49.59765625, 51.158203125, 52.71875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 9.0, 8.0, 19.0, 21.0, 35.0, 35.0, 55.0, 63.0, 74.0, 96.0, 96.0, 94.0, 84.0, 79.0, 74.0, 50.0, 28.0, 27.0, 14.0, 13.0, 8.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.0625, -28.14892578125, -27.2353515625, -26.32177734375, -25.408203125, -24.49462890625, -23.5810546875, -22.66748046875, -21.75390625, -20.84033203125, -19.9267578125, -19.01318359375, -18.099609375, -17.18603515625, -16.2724609375, -15.35888671875, -14.4453125, -13.53173828125, -12.6181640625, -11.70458984375, -10.791015625, -9.87744140625, -8.9638671875, -8.05029296875, -7.13671875, -6.22314453125, -5.3095703125, -4.39599609375, -3.482421875, -2.56884765625, -1.6552734375, -0.74169921875, 0.171875, 1.08544921875, 1.9990234375, 2.91259765625, 3.826171875, 4.73974609375, 5.6533203125, 6.56689453125, 7.48046875, 8.39404296875, 9.3076171875, 10.22119140625, 11.134765625, 12.04833984375, 12.9619140625, 13.87548828125, 14.7890625, 15.70263671875, 16.6162109375, 17.52978515625, 18.443359375, 19.35693359375, 20.2705078125, 21.18408203125, 22.09765625, 23.01123046875, 23.9248046875, 24.83837890625, 25.751953125, 26.66552734375, 27.5791015625, 28.49267578125, 29.40625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 1.0, 2.0, 5.0, 14.0, 15.0, 17.0, 32.0, 39.0, 70.0, 88.0, 131.0, 253.0, 506.0, 1054.0, 2637.0, 8953.0, 80743.0, 883190.0, 58753.0, 7669.0, 2268.0, 991.0, 472.0, 227.0, 129.0, 87.0, 61.0, 39.0, 23.0, 14.0, 13.0, 12.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-164.5, -159.859375, -155.21875, -150.578125, -145.9375, -141.296875, -136.65625, -132.015625, -127.375, -122.734375, -118.09375, -113.453125, -108.8125, -104.171875, -99.53125, -94.890625, -90.25, -85.609375, -80.96875, -76.328125, -71.6875, -67.046875, -62.40625, -57.765625, -53.125, -48.484375, -43.84375, -39.203125, -34.5625, -29.921875, -25.28125, -20.640625, -16.0, -11.359375, -6.71875, -2.078125, 2.5625, 7.203125, 11.84375, 16.484375, 21.125, 25.765625, 30.40625, 35.046875, 39.6875, 44.328125, 48.96875, 53.609375, 58.25, 62.890625, 67.53125, 72.171875, 76.8125, 81.453125, 86.09375, 90.734375, 95.375, 100.015625, 104.65625, 109.296875, 113.9375, 118.578125, 123.21875, 127.859375, 132.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 8.0, 11.0, 11.0, 14.0, 19.0, 25.0, 40.0, 46.0, 47.0, 62.0, 70.0, 73.0, 75.0, 70.0, 54.0, 57.0, 46.0, 53.0, 44.0, 29.0, 29.0, 17.0, 13.0, 18.0, 9.0, 7.0, 9.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-111.4375, -108.3466796875, -105.255859375, -102.1650390625, -99.07421875, -95.9833984375, -92.892578125, -89.8017578125, -86.7109375, -83.6201171875, -80.529296875, -77.4384765625, -74.34765625, -71.2568359375, -68.166015625, -65.0751953125, -61.984375, -58.8935546875, -55.802734375, -52.7119140625, -49.62109375, -46.5302734375, -43.439453125, -40.3486328125, -37.2578125, -34.1669921875, -31.076171875, -27.9853515625, -24.89453125, -21.8037109375, -18.712890625, -15.6220703125, -12.53125, -9.4404296875, -6.349609375, -3.2587890625, -0.16796875, 2.9228515625, 6.013671875, 9.1044921875, 12.1953125, 15.2861328125, 18.376953125, 21.4677734375, 24.55859375, 27.6494140625, 30.740234375, 33.8310546875, 36.921875, 40.0126953125, 43.103515625, 46.1943359375, 49.28515625, 52.3759765625, 55.466796875, 58.5576171875, 61.6484375, 64.7392578125, 67.830078125, 70.9208984375, 74.01171875, 77.1025390625, 80.193359375, 83.2841796875, 86.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 9.0, 13.0, 13.0, 22.0, 36.0, 70.0, 100.0, 158.0, 271.0, 421.0, 884.0, 1814.0, 4470.0, 18727.0, 921483.0, 86983.0, 7560.0, 2758.0, 1254.0, 601.0, 331.0, 186.0, 123.0, 71.0, 59.0, 39.0, 20.0, 17.0, 14.0, 13.0, 8.0, 0.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.0, -100.501953125, -97.00390625, -93.505859375, -90.0078125, -86.509765625, -83.01171875, -79.513671875, -76.015625, -72.517578125, -69.01953125, -65.521484375, -62.0234375, -58.525390625, -55.02734375, -51.529296875, -48.03125, -44.533203125, -41.03515625, -37.537109375, -34.0390625, -30.541015625, -27.04296875, -23.544921875, -20.046875, -16.548828125, -13.05078125, -9.552734375, -6.0546875, -2.556640625, 0.94140625, 4.439453125, 7.9375, 11.435546875, 14.93359375, 18.431640625, 21.9296875, 25.427734375, 28.92578125, 32.423828125, 35.921875, 39.419921875, 42.91796875, 46.416015625, 49.9140625, 53.412109375, 56.91015625, 60.408203125, 63.90625, 67.404296875, 70.90234375, 74.400390625, 77.8984375, 81.396484375, 84.89453125, 88.392578125, 91.890625, 95.388671875, 98.88671875, 102.384765625, 105.8828125, 109.380859375, 112.87890625, 116.376953125, 119.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 26.0, 84.0, 335.0, 384.0, 87.0, 35.0, 13.0, 10.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03781318664550781, -0.036594390869140625, -0.03537559509277344, -0.03415679931640625, -0.03293800354003906, -0.031719207763671875, -0.030500411987304688, -0.0292816162109375, -0.028062820434570312, -0.026844024658203125, -0.025625228881835938, -0.02440643310546875, -0.023187637329101562, -0.021968841552734375, -0.020750045776367188, -0.01953125, -0.018312454223632812, -0.017093658447265625, -0.015874862670898438, -0.01465606689453125, -0.013437271118164062, -0.012218475341796875, -0.010999679565429688, -0.0097808837890625, -0.008562088012695312, -0.007343292236328125, -0.0061244964599609375, -0.00490570068359375, -0.0036869049072265625, -0.002468109130859375, -0.0012493133544921875, -3.0517578125e-05, 0.0011882781982421875, 0.002407073974609375, 0.0036258697509765625, 0.00484466552734375, 0.0060634613037109375, 0.007282257080078125, 0.008501052856445312, 0.0097198486328125, 0.010938644409179688, 0.012157440185546875, 0.013376235961914062, 0.01459503173828125, 0.015813827514648438, 0.017032623291015625, 0.018251419067382812, 0.01947021484375, 0.020689010620117188, 0.021907806396484375, 0.023126602172851562, 0.02434539794921875, 0.025564193725585938, 0.026782989501953125, 0.028001785278320312, 0.0292205810546875, 0.030439376831054688, 0.031658172607421875, 0.03287696838378906, 0.03409576416015625, 0.03531455993652344, 0.036533355712890625, 0.03775215148925781, 0.038970947265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 20.0, 34.0, 50.0, 75.0, 151.0, 292.0, 625.0, 1588.0, 5565.0, 52461.0, 959017.0, 22672.0, 3768.0, 1163.0, 475.0, 240.0, 128.0, 71.0, 38.0, 22.0, 18.0, 10.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5, -95.416015625, -91.33203125, -87.248046875, -83.1640625, -79.080078125, -74.99609375, -70.912109375, -66.828125, -62.744140625, -58.66015625, -54.576171875, -50.4921875, -46.408203125, -42.32421875, -38.240234375, -34.15625, -30.072265625, -25.98828125, -21.904296875, -17.8203125, -13.736328125, -9.65234375, -5.568359375, -1.484375, 2.599609375, 6.68359375, 10.767578125, 14.8515625, 18.935546875, 23.01953125, 27.103515625, 31.1875, 35.271484375, 39.35546875, 43.439453125, 47.5234375, 51.607421875, 55.69140625, 59.775390625, 63.859375, 67.943359375, 72.02734375, 76.111328125, 80.1953125, 84.279296875, 88.36328125, 92.447265625, 96.53125, 100.615234375, 104.69921875, 108.783203125, 112.8671875, 116.951171875, 121.03515625, 125.119140625, 129.203125, 133.287109375, 137.37109375, 141.455078125, 145.5390625, 149.623046875, 153.70703125, 157.791015625, 161.875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 5.0, 10.0, 32.0, 32.0, 84.0, 197.0, 284.0, 169.0, 74.0, 39.0, 21.0, 9.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.59765625, -64.9453125, -62.29296875, -59.640625, -56.98828125, -54.3359375, -51.68359375, -49.03125, -46.37890625, -43.7265625, -41.07421875, -38.421875, -35.76953125, -33.1171875, -30.46484375, -27.8125, -25.16015625, -22.5078125, -19.85546875, -17.203125, -14.55078125, -11.8984375, -9.24609375, -6.59375, -3.94140625, -1.2890625, 1.36328125, 4.015625, 6.66796875, 9.3203125, 11.97265625, 14.625, 17.27734375, 19.9296875, 22.58203125, 25.234375, 27.88671875, 30.5390625, 33.19140625, 35.84375, 38.49609375, 41.1484375, 43.80078125, 46.453125, 49.10546875, 51.7578125, 54.41015625, 57.0625, 59.71484375, 62.3671875, 65.01953125, 67.671875, 70.32421875, 72.9765625, 75.62890625, 78.28125, 80.93359375, 83.5859375, 86.23828125, 88.890625, 91.54296875, 94.1953125, 96.84765625, 99.5]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 11.0, 16.0, 41.0, 193.0, 453.0, 203.0, 56.0, 20.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2727.38623046875, -2661.7666015625, -2596.14697265625, -2530.527099609375, -2464.907470703125, -2399.287841796875, -2333.668212890625, -2268.04833984375, -2202.4287109375, -2136.80908203125, -2071.189453125, -2005.5697021484375, -1939.949951171875, -1874.330322265625, -1808.710693359375, -1743.0909423828125, -1677.4713134765625, -1611.8516845703125, -1546.23193359375, -1480.6123046875, -1414.9925537109375, -1349.3729248046875, -1283.753173828125, -1218.133544921875, -1152.513916015625, -1086.894287109375, -1021.2745361328125, -955.6549072265625, -890.03515625, -824.41552734375, -758.7958374023438, -693.1761474609375, -627.5562744140625, -561.9365844726562, -496.31689453125, -430.6972351074219, -365.0775451660156, -299.4578552246094, -233.83819580078125, -168.218505859375, -102.59881591796875, -36.97913360595703, 28.640548706054688, 94.26022338867188, 159.87991333007812, 225.49960327148438, 291.1192626953125, 356.73895263671875, 422.358642578125, 487.97833251953125, 553.5980224609375, 619.2176513671875, 684.83740234375, 750.45703125, 816.0767211914062, 881.6964111328125, 947.3161010742188, 1012.935791015625, 1078.555419921875, 1144.1751708984375, 1209.7947998046875, 1275.41455078125, 1341.0341796875, 1406.65380859375, 1472.2735595703125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 11.0, 6.0, 2.0, 7.0, 17.0, 19.0, 23.0, 24.0, 23.0, 34.0, 42.0, 48.0, 32.0, 45.0, 75.0, 94.0, 82.0, 63.0, 47.0, 48.0, 45.0, 37.0, 35.0, 20.0, 28.0, 17.0, 15.0, 20.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-403.5238952636719, -387.91912841796875, -372.3143615722656, -356.7095947265625, -341.1048278808594, -325.50006103515625, -309.895263671875, -294.29052734375, -278.68572998046875, -263.0809631347656, -247.4761962890625, -231.87142944335938, -216.26666259765625, -200.66189575195312, -185.05711364746094, -169.4523468017578, -153.84759521484375, -138.24282836914062, -122.6380615234375, -107.03328704833984, -91.42852020263672, -75.8237533569336, -60.21897888183594, -44.61421203613281, -29.009445190429688, -13.40467643737793, 2.200092315673828, 17.80486297607422, 33.409629821777344, 49.01439666748047, 64.61917114257812, 80.22393798828125, 95.82867431640625, 111.43344116210938, 127.0382080078125, 142.64297485351562, 158.24774169921875, 173.85250854492188, 189.45729064941406, 205.0620574951172, 220.6668243408203, 236.27159118652344, 251.87635803222656, 267.48114013671875, 283.0859069824219, 298.690673828125, 314.2954406738281, 329.90020751953125, 345.5049743652344, 361.1097412109375, 376.7145080566406, 392.31927490234375, 407.9240417480469, 423.52880859375, 439.13360595703125, 454.73834228515625, 470.3431396484375, 485.9479064941406, 501.55267333984375, 517.157470703125, 532.76220703125, 548.3670043945312, 563.9717407226562, 579.5765380859375, 595.1812744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 10.0, 11.0, 12.0, 25.0, 22.0, 32.0, 40.0, 63.0, 95.0, 146.0, 238.0, 277.0, 514.0, 894.0, 1818.0, 4080.0, 12683.0, 62945.0, 1120385.0, 2825849.0, 131242.0, 21673.0, 6218.0, 2330.0, 1071.0, 588.0, 322.0, 220.0, 121.0, 115.0, 67.0, 48.0, 24.0, 29.0, 12.0, 14.0, 8.0, 5.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.09375, -49.4541015625, -47.814453125, -46.1748046875, -44.53515625, -42.8955078125, -41.255859375, -39.6162109375, -37.9765625, -36.3369140625, -34.697265625, -33.0576171875, -31.41796875, -29.7783203125, -28.138671875, -26.4990234375, -24.859375, -23.2197265625, -21.580078125, -19.9404296875, -18.30078125, -16.6611328125, -15.021484375, -13.3818359375, -11.7421875, -10.1025390625, -8.462890625, -6.8232421875, -5.18359375, -3.5439453125, -1.904296875, -0.2646484375, 1.375, 3.0146484375, 4.654296875, 6.2939453125, 7.93359375, 9.5732421875, 11.212890625, 12.8525390625, 14.4921875, 16.1318359375, 17.771484375, 19.4111328125, 21.05078125, 22.6904296875, 24.330078125, 25.9697265625, 27.609375, 29.2490234375, 30.888671875, 32.5283203125, 34.16796875, 35.8076171875, 37.447265625, 39.0869140625, 40.7265625, 42.3662109375, 44.005859375, 45.6455078125, 47.28515625, 48.9248046875, 50.564453125, 52.2041015625, 53.84375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 20.0, 29.0, 31.0, 37.0, 49.0, 51.0, 58.0, 63.0, 68.0, 73.0, 86.0, 67.0, 72.0, 55.0, 50.0, 33.0, 21.0, 20.0, 21.0, 14.0, 9.0, 9.0, 3.0, 4.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.406005859375, -22.70263671875, -21.999267578125, -21.2958984375, -20.592529296875, -19.88916015625, -19.185791015625, -18.482421875, -17.779052734375, -17.07568359375, -16.372314453125, -15.6689453125, -14.965576171875, -14.26220703125, -13.558837890625, -12.85546875, -12.152099609375, -11.44873046875, -10.745361328125, -10.0419921875, -9.338623046875, -8.63525390625, -7.931884765625, -7.228515625, -6.525146484375, -5.82177734375, -5.118408203125, -4.4150390625, -3.711669921875, -3.00830078125, -2.304931640625, -1.6015625, -0.898193359375, -0.19482421875, 0.508544921875, 1.2119140625, 1.915283203125, 2.61865234375, 3.322021484375, 4.025390625, 4.728759765625, 5.43212890625, 6.135498046875, 6.8388671875, 7.542236328125, 8.24560546875, 8.948974609375, 9.65234375, 10.355712890625, 11.05908203125, 11.762451171875, 12.4658203125, 13.169189453125, 13.87255859375, 14.575927734375, 15.279296875, 15.982666015625, 16.68603515625, 17.389404296875, 18.0927734375, 18.796142578125, 19.49951171875, 20.202880859375, 20.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 15.0, 11.0, 30.0, 41.0, 40.0, 104.0, 247.0, 6294.0, 4184951.0, 1994.0, 190.0, 98.0, 86.0, 59.0, 36.0, 36.0, 21.0, 15.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.0, -374.625, -356.25, -337.875, -319.5, -301.125, -282.75, -264.375, -246.0, -227.625, -209.25, -190.875, -172.5, -154.125, -135.75, -117.375, -99.0, -80.625, -62.25, -43.875, -25.5, -7.125, 11.25, 29.625, 48.0, 66.375, 84.75, 103.125, 121.5, 139.875, 158.25, 176.625, 195.0, 213.375, 231.75, 250.125, 268.5, 286.875, 305.25, 323.625, 342.0, 360.375, 378.75, 397.125, 415.5, 433.875, 452.25, 470.625, 489.0, 507.375, 525.75, 544.125, 562.5, 580.875, 599.25, 617.625, 636.0, 654.375, 672.75, 691.125, 709.5, 727.875, 746.25, 764.625, 783.0]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 20.0, 105.0, 736.0, 2712.0, 393.0, 79.0, 21.0, 9.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.375, -143.998046875, -134.62109375, -125.244140625, -115.8671875, -106.490234375, -97.11328125, -87.736328125, -78.359375, -68.982421875, -59.60546875, -50.228515625, -40.8515625, -31.474609375, -22.09765625, -12.720703125, -3.34375, 6.033203125, 15.41015625, 24.787109375, 34.1640625, 43.541015625, 52.91796875, 62.294921875, 71.671875, 81.048828125, 90.42578125, 99.802734375, 109.1796875, 118.556640625, 127.93359375, 137.310546875, 146.6875, 156.064453125, 165.44140625, 174.818359375, 184.1953125, 193.572265625, 202.94921875, 212.326171875, 221.703125, 231.080078125, 240.45703125, 249.833984375, 259.2109375, 268.587890625, 277.96484375, 287.341796875, 296.71875, 306.095703125, 315.47265625, 324.849609375, 334.2265625, 343.603515625, 352.98046875, 362.357421875, 371.734375, 381.111328125, 390.48828125, 399.865234375, 409.2421875, 418.619140625, 427.99609375, 437.373046875, 446.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 12.0, 15.0, 20.0, 56.0, 92.0, 207.0, 254.0, 158.0, 64.0, 31.0, 26.0, 13.0, 15.0, 12.0, 5.0, 10.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1908.9403076171875, -1856.1849365234375, -1803.429443359375, -1750.674072265625, -1697.9185791015625, -1645.1632080078125, -1592.40771484375, -1539.65234375, -1486.89697265625, -1434.1416015625, -1381.3861083984375, -1328.6307373046875, -1275.875244140625, -1223.119873046875, -1170.364501953125, -1117.6090087890625, -1064.853515625, -1012.0980834960938, -959.3426513671875, -906.5872802734375, -853.831787109375, -801.076416015625, -748.3209838867188, -695.5655517578125, -642.8101196289062, -590.0546875, -537.2992553710938, -484.5438537597656, -431.7884216308594, -379.0329895019531, -326.277587890625, -273.52215576171875, -220.7667236328125, -168.01129150390625, -115.25587463378906, -62.500457763671875, -9.745025634765625, 43.010406494140625, 95.76580810546875, 148.521240234375, 201.27667236328125, 254.0321044921875, 306.78753662109375, 359.5429382324219, 412.2983703613281, 465.0538024902344, 517.8092041015625, 570.5646362304688, 623.320068359375, 676.0755004882812, 728.8309326171875, 781.5863037109375, 834.341796875, 887.09716796875, 939.8526000976562, 992.6080322265625, 1045.363525390625, 1098.118896484375, 1150.8743896484375, 1203.6297607421875, 1256.38525390625, 1309.140625, 1361.89599609375, 1414.6514892578125, 1467.4068603515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 13.0, 17.0, 20.0, 26.0, 27.0, 36.0, 27.0, 33.0, 45.0, 39.0, 46.0, 44.0, 54.0, 50.0, 49.0, 39.0, 54.0, 28.0, 39.0, 37.0, 32.0, 29.0, 20.0, 21.0, 29.0, 13.0, 14.0, 20.0, 9.0, 9.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-631.1177978515625, -611.6443481445312, -592.1708374023438, -572.6973876953125, -553.223876953125, -533.7504272460938, -514.2769775390625, -494.803466796875, -475.33001708984375, -455.8565368652344, -436.383056640625, -416.90960693359375, -397.4361267089844, -377.962646484375, -358.4891662597656, -339.01568603515625, -319.5422058105469, -300.0687255859375, -280.5952453613281, -261.12176513671875, -241.6483154296875, -222.17483520507812, -202.70135498046875, -183.22789001464844, -163.75440979003906, -144.2809295654297, -124.80746459960938, -105.333984375, -85.86051177978516, -66.38703918457031, -46.91355895996094, -27.440093994140625, -7.96661376953125, 11.506860733032227, 30.980335235595703, 50.45381164550781, 69.92728424072266, 89.4007568359375, 108.87423706054688, 128.3477020263672, 147.82118225097656, 167.29466247558594, 186.76812744140625, 206.24160766601562, 225.715087890625, 245.1885528564453, 264.66204833984375, 284.135498046875, 303.6089782714844, 323.08245849609375, 342.5559387207031, 362.0294189453125, 381.50286865234375, 400.9763488769531, 420.4498291015625, 439.92327880859375, 459.39678955078125, 478.8702697753906, 498.34375, 517.8171997070312, 537.2907104492188, 556.76416015625, 576.2376708984375, 595.7111206054688, 615.1845703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 14.0, 21.0, 29.0, 35.0, 59.0, 90.0, 123.0, 205.0, 328.0, 550.0, 950.0, 1755.0, 3705.0, 8205.0, 22202.0, 77930.0, 394728.0, 416063.0, 81762.0, 23064.0, 8632.0, 3754.0, 1861.0, 1003.0, 557.0, 329.0, 211.0, 116.0, 87.0, 54.0, 32.0, 23.0, 16.0, 15.0, 9.0, 5.0, 3.0, 7.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5, -76.4443359375, -73.388671875, -70.3330078125, -67.27734375, -64.2216796875, -61.166015625, -58.1103515625, -55.0546875, -51.9990234375, -48.943359375, -45.8876953125, -42.83203125, -39.7763671875, -36.720703125, -33.6650390625, -30.609375, -27.5537109375, -24.498046875, -21.4423828125, -18.38671875, -15.3310546875, -12.275390625, -9.2197265625, -6.1640625, -3.1083984375, -0.052734375, 3.0029296875, 6.05859375, 9.1142578125, 12.169921875, 15.2255859375, 18.28125, 21.3369140625, 24.392578125, 27.4482421875, 30.50390625, 33.5595703125, 36.615234375, 39.6708984375, 42.7265625, 45.7822265625, 48.837890625, 51.8935546875, 54.94921875, 58.0048828125, 61.060546875, 64.1162109375, 67.171875, 70.2275390625, 73.283203125, 76.3388671875, 79.39453125, 82.4501953125, 85.505859375, 88.5615234375, 91.6171875, 94.6728515625, 97.728515625, 100.7841796875, 103.83984375, 106.8955078125, 109.951171875, 113.0068359375, 116.0625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 7.0, 4.0, 6.0, 13.0, 11.0, 9.0, 11.0, 19.0, 21.0, 31.0, 38.0, 33.0, 49.0, 56.0, 44.0, 38.0, 46.0, 62.0, 52.0, 61.0, 62.0, 61.0, 47.0, 34.0, 29.0, 22.0, 21.0, 15.0, 10.0, 18.0, 16.0, 8.0, 9.0, 10.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.947998046875, -25.97412109375, -25.000244140625, -24.0263671875, -23.052490234375, -22.07861328125, -21.104736328125, -20.130859375, -19.156982421875, -18.18310546875, -17.209228515625, -16.2353515625, -15.261474609375, -14.28759765625, -13.313720703125, -12.33984375, -11.365966796875, -10.39208984375, -9.418212890625, -8.4443359375, -7.470458984375, -6.49658203125, -5.522705078125, -4.548828125, -3.574951171875, -2.60107421875, -1.627197265625, -0.6533203125, 0.320556640625, 1.29443359375, 2.268310546875, 3.2421875, 4.216064453125, 5.18994140625, 6.163818359375, 7.1376953125, 8.111572265625, 9.08544921875, 10.059326171875, 11.033203125, 12.007080078125, 12.98095703125, 13.954833984375, 14.9287109375, 15.902587890625, 16.87646484375, 17.850341796875, 18.82421875, 19.798095703125, 20.77197265625, 21.745849609375, 22.7197265625, 23.693603515625, 24.66748046875, 25.641357421875, 26.615234375, 27.589111328125, 28.56298828125, 29.536865234375, 30.5107421875, 31.484619140625, 32.45849609375, 33.432373046875, 34.40625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 9.0, 16.0, 18.0, 33.0, 44.0, 73.0, 172.0, 364.0, 894.0, 3561.0, 48695.0, 975898.0, 15374.0, 2143.0, 627.0, 264.0, 141.0, 67.0, 41.0, 37.0, 14.0, 12.0, 12.0, 8.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-530.5, -514.09375, -497.6875, -481.28125, -464.875, -448.46875, -432.0625, -415.65625, -399.25, -382.84375, -366.4375, -350.03125, -333.625, -317.21875, -300.8125, -284.40625, -268.0, -251.59375, -235.1875, -218.78125, -202.375, -185.96875, -169.5625, -153.15625, -136.75, -120.34375, -103.9375, -87.53125, -71.125, -54.71875, -38.3125, -21.90625, -5.5, 10.90625, 27.3125, 43.71875, 60.125, 76.53125, 92.9375, 109.34375, 125.75, 142.15625, 158.5625, 174.96875, 191.375, 207.78125, 224.1875, 240.59375, 257.0, 273.40625, 289.8125, 306.21875, 322.625, 339.03125, 355.4375, 371.84375, 388.25, 404.65625, 421.0625, 437.46875, 453.875, 470.28125, 486.6875, 503.09375, 519.5]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 0.0, 2.0, 5.0, 5.0, 7.0, 18.0, 15.0, 28.0, 33.0, 41.0, 59.0, 75.0, 68.0, 90.0, 74.0, 86.0, 69.0, 69.0, 54.0, 46.0, 34.0, 30.0, 17.0, 19.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-246.125, -238.81640625, -231.5078125, -224.19921875, -216.890625, -209.58203125, -202.2734375, -194.96484375, -187.65625, -180.34765625, -173.0390625, -165.73046875, -158.421875, -151.11328125, -143.8046875, -136.49609375, -129.1875, -121.87890625, -114.5703125, -107.26171875, -99.953125, -92.64453125, -85.3359375, -78.02734375, -70.71875, -63.41015625, -56.1015625, -48.79296875, -41.484375, -34.17578125, -26.8671875, -19.55859375, -12.25, -4.94140625, 2.3671875, 9.67578125, 16.984375, 24.29296875, 31.6015625, 38.91015625, 46.21875, 53.52734375, 60.8359375, 68.14453125, 75.453125, 82.76171875, 90.0703125, 97.37890625, 104.6875, 111.99609375, 119.3046875, 126.61328125, 133.921875, 141.23046875, 148.5390625, 155.84765625, 163.15625, 170.46484375, 177.7734375, 185.08203125, 192.390625, 199.69921875, 207.0078125, 214.31640625, 221.625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 12.0, 7.0, 13.0, 24.0, 30.0, 43.0, 63.0, 69.0, 125.0, 223.0, 388.0, 671.0, 1242.0, 2907.0, 7721.0, 34378.0, 834559.0, 142439.0, 14878.0, 4641.0, 1940.0, 935.0, 493.0, 263.0, 148.0, 76.0, 58.0, 50.0, 36.0, 19.0, 30.0, 11.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-130.125, -126.380859375, -122.63671875, -118.892578125, -115.1484375, -111.404296875, -107.66015625, -103.916015625, -100.171875, -96.427734375, -92.68359375, -88.939453125, -85.1953125, -81.451171875, -77.70703125, -73.962890625, -70.21875, -66.474609375, -62.73046875, -58.986328125, -55.2421875, -51.498046875, -47.75390625, -44.009765625, -40.265625, -36.521484375, -32.77734375, -29.033203125, -25.2890625, -21.544921875, -17.80078125, -14.056640625, -10.3125, -6.568359375, -2.82421875, 0.919921875, 4.6640625, 8.408203125, 12.15234375, 15.896484375, 19.640625, 23.384765625, 27.12890625, 30.873046875, 34.6171875, 38.361328125, 42.10546875, 45.849609375, 49.59375, 53.337890625, 57.08203125, 60.826171875, 64.5703125, 68.314453125, 72.05859375, 75.802734375, 79.546875, 83.291015625, 87.03515625, 90.779296875, 94.5234375, 98.267578125, 102.01171875, 105.755859375, 109.5]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 12.0, 19.0, 29.0, 46.0, 106.0, 205.0, 270.0, 130.0, 60.0, 38.0, 23.0, 12.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0435791015625, -0.04226350784301758, -0.040947914123535156, -0.039632320404052734, -0.03831672668457031, -0.03700113296508789, -0.03568553924560547, -0.03436994552612305, -0.033054351806640625, -0.0317387580871582, -0.03042316436767578, -0.02910757064819336, -0.027791976928710938, -0.026476383209228516, -0.025160789489746094, -0.023845195770263672, -0.02252960205078125, -0.021214008331298828, -0.019898414611816406, -0.018582820892333984, -0.017267227172851562, -0.01595163345336914, -0.014636039733886719, -0.013320446014404297, -0.012004852294921875, -0.010689258575439453, -0.009373664855957031, -0.00805807113647461, -0.0067424774169921875, -0.005426883697509766, -0.004111289978027344, -0.002795696258544922, -0.0014801025390625, -0.00016450881958007812, 0.0011510848999023438, 0.0024666786193847656, 0.0037822723388671875, 0.005097866058349609, 0.006413459777832031, 0.007729053497314453, 0.009044647216796875, 0.010360240936279297, 0.011675834655761719, 0.01299142837524414, 0.014307022094726562, 0.015622615814208984, 0.016938209533691406, 0.018253803253173828, 0.01956939697265625, 0.020884990692138672, 0.022200584411621094, 0.023516178131103516, 0.024831771850585938, 0.02614736557006836, 0.02746295928955078, 0.028778553009033203, 0.030094146728515625, 0.03140974044799805, 0.03272533416748047, 0.03404092788696289, 0.03535652160644531, 0.036672115325927734, 0.037987709045410156, 0.03930330276489258, 0.040618896484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 6.0, 12.0, 20.0, 19.0, 33.0, 54.0, 72.0, 95.0, 183.0, 314.0, 745.0, 2083.0, 8802.0, 88998.0, 914640.0, 25498.0, 4472.0, 1342.0, 478.0, 244.0, 136.0, 98.0, 57.0, 36.0, 25.0, 20.0, 18.0, 14.0, 14.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-181.375, -176.234375, -171.09375, -165.953125, -160.8125, -155.671875, -150.53125, -145.390625, -140.25, -135.109375, -129.96875, -124.828125, -119.6875, -114.546875, -109.40625, -104.265625, -99.125, -93.984375, -88.84375, -83.703125, -78.5625, -73.421875, -68.28125, -63.140625, -58.0, -52.859375, -47.71875, -42.578125, -37.4375, -32.296875, -27.15625, -22.015625, -16.875, -11.734375, -6.59375, -1.453125, 3.6875, 8.828125, 13.96875, 19.109375, 24.25, 29.390625, 34.53125, 39.671875, 44.8125, 49.953125, 55.09375, 60.234375, 65.375, 70.515625, 75.65625, 80.796875, 85.9375, 91.078125, 96.21875, 101.359375, 106.5, 111.640625, 116.78125, 121.921875, 127.0625, 132.203125, 137.34375, 142.484375, 147.625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 14.0, 8.0, 18.0, 24.0, 38.0, 46.0, 66.0, 97.0, 108.0, 165.0, 117.0, 86.0, 52.0, 35.0, 19.0, 19.0, 19.0, 13.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -61.8935546875, -59.537109375, -57.1806640625, -54.82421875, -52.4677734375, -50.111328125, -47.7548828125, -45.3984375, -43.0419921875, -40.685546875, -38.3291015625, -35.97265625, -33.6162109375, -31.259765625, -28.9033203125, -26.546875, -24.1904296875, -21.833984375, -19.4775390625, -17.12109375, -14.7646484375, -12.408203125, -10.0517578125, -7.6953125, -5.3388671875, -2.982421875, -0.6259765625, 1.73046875, 4.0869140625, 6.443359375, 8.7998046875, 11.15625, 13.5126953125, 15.869140625, 18.2255859375, 20.58203125, 22.9384765625, 25.294921875, 27.6513671875, 30.0078125, 32.3642578125, 34.720703125, 37.0771484375, 39.43359375, 41.7900390625, 44.146484375, 46.5029296875, 48.859375, 51.2158203125, 53.572265625, 55.9287109375, 58.28515625, 60.6416015625, 62.998046875, 65.3544921875, 67.7109375, 70.0673828125, 72.423828125, 74.7802734375, 77.13671875, 79.4931640625, 81.849609375, 84.2060546875, 86.5625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 12.0, 16.0, 29.0, 70.0, 146.0, 319.0, 181.0, 103.0, 49.0, 26.0, 7.0, 17.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1589.79541015625, -1532.422119140625, -1475.048828125, -1417.6756591796875, -1360.3023681640625, -1302.9290771484375, -1245.5557861328125, -1188.1826171875, -1130.809326171875, -1073.43603515625, -1016.0628051757812, -958.6895141601562, -901.3162841796875, -843.9429931640625, -786.5697021484375, -729.1964721679688, -671.8231811523438, -614.4498901367188, -557.07666015625, -499.703369140625, -442.33013916015625, -384.95684814453125, -327.5835876464844, -270.2103271484375, -212.83706665039062, -155.46380615234375, -98.09053802490234, -40.71726989746094, 16.655990600585938, 74.02926635742188, 131.40252685546875, 188.77578735351562, 246.1490478515625, 303.5223083496094, 360.89556884765625, 418.26885986328125, 475.64208984375, 533.015380859375, 590.388671875, 647.7619018554688, 705.1351318359375, 762.5084228515625, 819.8816528320312, 877.2549438476562, 934.628173828125, 992.00146484375, 1049.374755859375, 1106.748046875, 1164.121337890625, 1221.49462890625, 1278.867919921875, 1336.2410888671875, 1393.6143798828125, 1450.9876708984375, 1508.3609619140625, 1565.734130859375, 1623.107421875, 1680.480712890625, 1737.85400390625, 1795.2271728515625, 1852.6004638671875, 1909.9737548828125, 1967.3470458984375, 2024.72021484375, 2082.093505859375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 18.0, 5.0, 16.0, 21.0, 14.0, 21.0, 25.0, 32.0, 30.0, 33.0, 44.0, 40.0, 56.0, 84.0, 79.0, 67.0, 50.0, 47.0, 42.0, 35.0, 32.0, 31.0, 23.0, 19.0, 15.0, 13.0, 15.0, 10.0, 15.0, 5.0, 9.0, 7.0, 3.0, 7.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-904.7769775390625, -875.1094970703125, -845.4420166015625, -815.7745361328125, -786.1071166992188, -756.4396362304688, -726.7721557617188, -697.1046752929688, -667.437255859375, -637.769775390625, -608.102294921875, -578.434814453125, -548.7673950195312, -519.0999145507812, -489.43243408203125, -459.76495361328125, -430.09747314453125, -400.42999267578125, -370.7625427246094, -341.0950622558594, -311.4276123046875, -281.7601318359375, -252.0926513671875, -222.42518615722656, -192.75772094726562, -163.0902557373047, -133.42279052734375, -103.75531005859375, -74.08784484863281, -44.420379638671875, -14.752899169921875, 14.914566040039062, 44.58209228515625, 74.24955749511719, 103.91703033447266, 133.58450317382812, 163.25196838378906, 192.91943359375, 222.5869140625, 252.25437927246094, 281.9218444824219, 311.5893249511719, 341.25677490234375, 370.92425537109375, 400.59173583984375, 430.2591857910156, 459.9266662597656, 489.5941162109375, 519.2615966796875, 548.9290771484375, 578.5965576171875, 608.2640380859375, 637.9314575195312, 667.5989379882812, 697.2664184570312, 726.9338989257812, 756.601318359375, 786.268798828125, 815.936279296875, 845.603759765625, 875.2711791992188, 904.9386596679688, 934.6061401367188, 964.2736206054688, 993.9411010742188]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 17.0, 24.0, 42.0, 67.0, 104.0, 204.0, 324.0, 696.0, 1449.0, 3857.0, 15467.0, 287532.0, 3770021.0, 99857.0, 9872.0, 2538.0, 1041.0, 485.0, 237.0, 155.0, 84.0, 66.0, 36.0, 26.0, 27.0, 10.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -78.6318359375, -74.951171875, -71.2705078125, -67.58984375, -63.9091796875, -60.228515625, -56.5478515625, -52.8671875, -49.1865234375, -45.505859375, -41.8251953125, -38.14453125, -34.4638671875, -30.783203125, -27.1025390625, -23.421875, -19.7412109375, -16.060546875, -12.3798828125, -8.69921875, -5.0185546875, -1.337890625, 2.3427734375, 6.0234375, 9.7041015625, 13.384765625, 17.0654296875, 20.74609375, 24.4267578125, 28.107421875, 31.7880859375, 35.46875, 39.1494140625, 42.830078125, 46.5107421875, 50.19140625, 53.8720703125, 57.552734375, 61.2333984375, 64.9140625, 68.5947265625, 72.275390625, 75.9560546875, 79.63671875, 83.3173828125, 86.998046875, 90.6787109375, 94.359375, 98.0400390625, 101.720703125, 105.4013671875, 109.08203125, 112.7626953125, 116.443359375, 120.1240234375, 123.8046875, 127.4853515625, 131.166015625, 134.8466796875, 138.52734375, 142.2080078125, 145.888671875, 149.5693359375, 153.25]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 12.0, 14.0, 16.0, 23.0, 35.0, 49.0, 53.0, 67.0, 80.0, 89.0, 96.0, 99.0, 89.0, 52.0, 59.0, 43.0, 33.0, 24.0, 20.0, 9.0, 8.0, 10.0, 9.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -64.068359375, -62.44921875, -60.830078125, -59.2109375, -57.591796875, -55.97265625, -54.353515625, -52.734375, -51.115234375, -49.49609375, -47.876953125, -46.2578125, -44.638671875, -43.01953125, -41.400390625, -39.78125, -38.162109375, -36.54296875, -34.923828125, -33.3046875, -31.685546875, -30.06640625, -28.447265625, -26.828125, -25.208984375, -23.58984375, -21.970703125, -20.3515625, -18.732421875, -17.11328125, -15.494140625, -13.875, -12.255859375, -10.63671875, -9.017578125, -7.3984375, -5.779296875, -4.16015625, -2.541015625, -0.921875, 0.697265625, 2.31640625, 3.935546875, 5.5546875, 7.173828125, 8.79296875, 10.412109375, 12.03125, 13.650390625, 15.26953125, 16.888671875, 18.5078125, 20.126953125, 21.74609375, 23.365234375, 24.984375, 26.603515625, 28.22265625, 29.841796875, 31.4609375, 33.080078125, 34.69921875, 36.318359375, 37.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 12.0, 28.0, 28.0, 56.0, 72.0, 111.0, 190.0, 250.0, 853.0, 26642.0, 4161580.0, 3585.0, 339.0, 162.0, 113.0, 83.0, 56.0, 37.0, 26.0, 15.0, 11.0, 6.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-658.0, -638.2421875, -618.484375, -598.7265625, -578.96875, -559.2109375, -539.453125, -519.6953125, -499.9375, -480.1796875, -460.421875, -440.6640625, -420.90625, -401.1484375, -381.390625, -361.6328125, -341.875, -322.1171875, -302.359375, -282.6015625, -262.84375, -243.0859375, -223.328125, -203.5703125, -183.8125, -164.0546875, -144.296875, -124.5390625, -104.78125, -85.0234375, -65.265625, -45.5078125, -25.75, -5.9921875, 13.765625, 33.5234375, 53.28125, 73.0390625, 92.796875, 112.5546875, 132.3125, 152.0703125, 171.828125, 191.5859375, 211.34375, 231.1015625, 250.859375, 270.6171875, 290.375, 310.1328125, 329.890625, 349.6484375, 369.40625, 389.1640625, 408.921875, 428.6796875, 448.4375, 468.1953125, 487.953125, 507.7109375, 527.46875, 547.2265625, 566.984375, 586.7421875, 606.5]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 40.0, 149.0, 1479.0, 2139.0, 192.0, 36.0, 24.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.75, -492.8046875, -479.859375, -466.9140625, -453.96875, -441.0234375, -428.078125, -415.1328125, -402.1875, -389.2421875, -376.296875, -363.3515625, -350.40625, -337.4609375, -324.515625, -311.5703125, -298.625, -285.6796875, -272.734375, -259.7890625, -246.84375, -233.8984375, -220.953125, -208.0078125, -195.0625, -182.1171875, -169.171875, -156.2265625, -143.28125, -130.3359375, -117.390625, -104.4453125, -91.5, -78.5546875, -65.609375, -52.6640625, -39.71875, -26.7734375, -13.828125, -0.8828125, 12.0625, 25.0078125, 37.953125, 50.8984375, 63.84375, 76.7890625, 89.734375, 102.6796875, 115.625, 128.5703125, 141.515625, 154.4609375, 167.40625, 180.3515625, 193.296875, 206.2421875, 219.1875, 232.1328125, 245.078125, 258.0234375, 270.96875, 283.9140625, 296.859375, 309.8046875, 322.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 16.0, 22.0, 48.0, 123.0, 351.0, 265.0, 88.0, 49.0, 13.0, 12.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2425.044921875, -2338.379150390625, -2251.713134765625, -2165.04736328125, -2078.38134765625, -1991.715576171875, -1905.0496826171875, -1818.3837890625, -1731.7178955078125, -1645.052001953125, -1558.3861083984375, -1471.72021484375, -1385.054443359375, -1298.388427734375, -1211.72265625, -1125.0567626953125, -1038.390869140625, -951.7249755859375, -865.05908203125, -778.3932495117188, -691.7273559570312, -605.0614624023438, -518.3956298828125, -431.729736328125, -345.0638427734375, -258.39794921875, -171.73208618164062, -85.06622314453125, 1.59967041015625, 88.26556396484375, 174.931396484375, 261.5972900390625, 348.263427734375, 434.9293212890625, 521.59521484375, 608.2610473632812, 694.9269409179688, 781.5928344726562, 868.2586669921875, 954.924560546875, 1041.5904541015625, 1128.25634765625, 1214.9222412109375, 1301.588134765625, 1388.25390625, 1474.919921875, 1561.585693359375, 1648.2515869140625, 1734.91748046875, 1821.5833740234375, 1908.249267578125, 1994.9150390625, 2081.5810546875, 2168.246826171875, 2254.91259765625, 2341.57861328125, 2428.24462890625, 2514.910400390625, 2601.576416015625, 2688.2421875, 2774.908203125, 2861.573974609375, 2948.23974609375, 3034.90576171875, 3121.571533203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 12.0, 9.0, 14.0, 16.0, 14.0, 18.0, 26.0, 44.0, 43.0, 54.0, 54.0, 70.0, 72.0, 50.0, 59.0, 66.0, 60.0, 55.0, 54.0, 30.0, 52.0, 38.0, 19.0, 16.0, 13.0, 15.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.1383972167969, -485.39404296875, -465.649658203125, -445.9053039550781, -426.16094970703125, -406.41656494140625, -386.6722106933594, -366.9278564453125, -347.1834716796875, -327.4391174316406, -307.6947326660156, -287.95037841796875, -268.20599365234375, -248.46163940429688, -228.71728515625, -208.97291564941406, -189.22854614257812, -169.4841766357422, -149.73980712890625, -129.99545288085938, -110.25108337402344, -90.5067138671875, -70.7623519897461, -51.01799011230469, -31.27362060546875, -11.529254913330078, 8.215110778808594, 27.959476470947266, 47.70384216308594, 67.44821166992188, 87.19257354736328, 106.93693542480469, 126.68133544921875, 146.4257049560547, 166.17007446289062, 185.9144287109375, 205.65879821777344, 225.40316772460938, 245.14752197265625, 264.89190673828125, 284.6362609863281, 304.380615234375, 324.125, 343.8693542480469, 363.61370849609375, 383.35809326171875, 403.1024475097656, 422.8468017578125, 442.5911865234375, 462.3355407714844, 482.0799255371094, 501.82427978515625, 521.5686645507812, 541.31298828125, 561.057373046875, 580.8017578125, 600.546142578125, 620.29052734375, 640.0348510742188, 659.7792358398438, 679.5236206054688, 699.2679443359375, 719.0123291015625, 738.7567138671875, 758.5010375976562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 7.0, 15.0, 16.0, 21.0, 41.0, 54.0, 93.0, 126.0, 189.0, 359.0, 650.0, 1167.0, 2321.0, 4949.0, 11900.0, 34633.0, 162593.0, 653819.0, 126264.0, 29901.0, 10456.0, 4378.0, 2077.0, 1017.0, 610.0, 328.0, 170.0, 125.0, 71.0, 51.0, 38.0, 29.0, 18.0, 16.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-166.25, -161.421875, -156.59375, -151.765625, -146.9375, -142.109375, -137.28125, -132.453125, -127.625, -122.796875, -117.96875, -113.140625, -108.3125, -103.484375, -98.65625, -93.828125, -89.0, -84.171875, -79.34375, -74.515625, -69.6875, -64.859375, -60.03125, -55.203125, -50.375, -45.546875, -40.71875, -35.890625, -31.0625, -26.234375, -21.40625, -16.578125, -11.75, -6.921875, -2.09375, 2.734375, 7.5625, 12.390625, 17.21875, 22.046875, 26.875, 31.703125, 36.53125, 41.359375, 46.1875, 51.015625, 55.84375, 60.671875, 65.5, 70.328125, 75.15625, 79.984375, 84.8125, 89.640625, 94.46875, 99.296875, 104.125, 108.953125, 113.78125, 118.609375, 123.4375, 128.265625, 133.09375, 137.921875, 142.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 13.0, 23.0, 36.0, 30.0, 43.0, 68.0, 67.0, 65.0, 96.0, 93.0, 89.0, 82.0, 49.0, 51.0, 36.0, 29.0, 26.0, 29.0, 14.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-78.6875, -76.83056640625, -74.9736328125, -73.11669921875, -71.259765625, -69.40283203125, -67.5458984375, -65.68896484375, -63.83203125, -61.97509765625, -60.1181640625, -58.26123046875, -56.404296875, -54.54736328125, -52.6904296875, -50.83349609375, -48.9765625, -47.11962890625, -45.2626953125, -43.40576171875, -41.548828125, -39.69189453125, -37.8349609375, -35.97802734375, -34.12109375, -32.26416015625, -30.4072265625, -28.55029296875, -26.693359375, -24.83642578125, -22.9794921875, -21.12255859375, -19.265625, -17.40869140625, -15.5517578125, -13.69482421875, -11.837890625, -9.98095703125, -8.1240234375, -6.26708984375, -4.41015625, -2.55322265625, -0.6962890625, 1.16064453125, 3.017578125, 4.87451171875, 6.7314453125, 8.58837890625, 10.4453125, 12.30224609375, 14.1591796875, 16.01611328125, 17.873046875, 19.72998046875, 21.5869140625, 23.44384765625, 25.30078125, 27.15771484375, 29.0146484375, 30.87158203125, 32.728515625, 34.58544921875, 36.4423828125, 38.29931640625, 40.15625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 7.0, 18.0, 16.0, 21.0, 29.0, 30.0, 37.0, 74.0, 115.0, 174.0, 271.0, 602.0, 1420.0, 4129.0, 20276.0, 648498.0, 349110.0, 17424.0, 3638.0, 1270.0, 562.0, 312.0, 161.0, 110.0, 70.0, 42.0, 25.0, 33.0, 15.0, 17.0, 9.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-310.5, -298.5390625, -286.578125, -274.6171875, -262.65625, -250.6953125, -238.734375, -226.7734375, -214.8125, -202.8515625, -190.890625, -178.9296875, -166.96875, -155.0078125, -143.046875, -131.0859375, -119.125, -107.1640625, -95.203125, -83.2421875, -71.28125, -59.3203125, -47.359375, -35.3984375, -23.4375, -11.4765625, 0.484375, 12.4453125, 24.40625, 36.3671875, 48.328125, 60.2890625, 72.25, 84.2109375, 96.171875, 108.1328125, 120.09375, 132.0546875, 144.015625, 155.9765625, 167.9375, 179.8984375, 191.859375, 203.8203125, 215.78125, 227.7421875, 239.703125, 251.6640625, 263.625, 275.5859375, 287.546875, 299.5078125, 311.46875, 323.4296875, 335.390625, 347.3515625, 359.3125, 371.2734375, 383.234375, 395.1953125, 407.15625, 419.1171875, 431.078125, 443.0390625, 455.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 6.0, 6.0, 10.0, 11.0, 15.0, 19.0, 22.0, 29.0, 33.0, 49.0, 42.0, 47.0, 39.0, 48.0, 44.0, 53.0, 47.0, 41.0, 51.0, 50.0, 54.0, 35.0, 29.0, 36.0, 28.0, 24.0, 18.0, 19.0, 13.0, 11.0, 9.0, 5.0, 7.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-186.0, -180.703125, -175.40625, -170.109375, -164.8125, -159.515625, -154.21875, -148.921875, -143.625, -138.328125, -133.03125, -127.734375, -122.4375, -117.140625, -111.84375, -106.546875, -101.25, -95.953125, -90.65625, -85.359375, -80.0625, -74.765625, -69.46875, -64.171875, -58.875, -53.578125, -48.28125, -42.984375, -37.6875, -32.390625, -27.09375, -21.796875, -16.5, -11.203125, -5.90625, -0.609375, 4.6875, 9.984375, 15.28125, 20.578125, 25.875, 31.171875, 36.46875, 41.765625, 47.0625, 52.359375, 57.65625, 62.953125, 68.25, 73.546875, 78.84375, 84.140625, 89.4375, 94.734375, 100.03125, 105.328125, 110.625, 115.921875, 121.21875, 126.515625, 131.8125, 137.109375, 142.40625, 147.703125, 153.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 11.0, 13.0, 18.0, 30.0, 29.0, 57.0, 81.0, 108.0, 211.0, 292.0, 508.0, 914.0, 1816.0, 3947.0, 9879.0, 31135.0, 162880.0, 727409.0, 76838.0, 19313.0, 6807.0, 2965.0, 1398.0, 737.0, 463.0, 249.0, 130.0, 92.0, 55.0, 58.0, 32.0, 20.0, 11.0, 9.0, 15.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.1533203125, -63.431640625, -60.7099609375, -57.98828125, -55.2666015625, -52.544921875, -49.8232421875, -47.1015625, -44.3798828125, -41.658203125, -38.9365234375, -36.21484375, -33.4931640625, -30.771484375, -28.0498046875, -25.328125, -22.6064453125, -19.884765625, -17.1630859375, -14.44140625, -11.7197265625, -8.998046875, -6.2763671875, -3.5546875, -0.8330078125, 1.888671875, 4.6103515625, 7.33203125, 10.0537109375, 12.775390625, 15.4970703125, 18.21875, 20.9404296875, 23.662109375, 26.3837890625, 29.10546875, 31.8271484375, 34.548828125, 37.2705078125, 39.9921875, 42.7138671875, 45.435546875, 48.1572265625, 50.87890625, 53.6005859375, 56.322265625, 59.0439453125, 61.765625, 64.4873046875, 67.208984375, 69.9306640625, 72.65234375, 75.3740234375, 78.095703125, 80.8173828125, 83.5390625, 86.2607421875, 88.982421875, 91.7041015625, 94.42578125, 97.1474609375, 99.869140625, 102.5908203125, 105.3125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 9.0, 3.0, 7.0, 7.0, 10.0, 15.0, 21.0, 34.0, 41.0, 68.0, 142.0, 236.0, 154.0, 79.0, 46.0, 31.0, 14.0, 23.0, 9.0, 16.0, 4.0, 0.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02935791015625, -0.028165817260742188, -0.026973724365234375, -0.025781631469726562, -0.02458953857421875, -0.023397445678710938, -0.022205352783203125, -0.021013259887695312, -0.0198211669921875, -0.018629074096679688, -0.017436981201171875, -0.016244888305664062, -0.01505279541015625, -0.013860702514648438, -0.012668609619140625, -0.011476516723632812, -0.010284423828125, -0.009092330932617188, -0.007900238037109375, -0.0067081451416015625, -0.00551605224609375, -0.0043239593505859375, -0.003131866455078125, -0.0019397735595703125, -0.0007476806640625, 0.0004444122314453125, 0.001636505126953125, 0.0028285980224609375, 0.00402069091796875, 0.0052127838134765625, 0.006404876708984375, 0.0075969696044921875, 0.0087890625, 0.009981155395507812, 0.011173248291015625, 0.012365341186523438, 0.01355743408203125, 0.014749526977539062, 0.015941619873046875, 0.017133712768554688, 0.0183258056640625, 0.019517898559570312, 0.020709991455078125, 0.021902084350585938, 0.02309417724609375, 0.024286270141601562, 0.025478363037109375, 0.026670455932617188, 0.027862548828125, 0.029054641723632812, 0.030246734619140625, 0.03143882751464844, 0.03263092041015625, 0.03382301330566406, 0.035015106201171875, 0.03620719909667969, 0.0373992919921875, 0.03859138488769531, 0.039783477783203125, 0.04097557067871094, 0.04216766357421875, 0.04335975646972656, 0.044551849365234375, 0.04574394226074219, 0.04693603515625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 7.0, 17.0, 10.0, 28.0, 40.0, 49.0, 69.0, 121.0, 191.0, 367.0, 785.0, 1758.0, 5080.0, 24750.0, 300825.0, 669411.0, 34652.0, 6455.0, 1967.0, 833.0, 421.0, 245.0, 174.0, 93.0, 60.0, 40.0, 26.0, 23.0, 12.0, 10.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-140.625, -136.9326171875, -133.240234375, -129.5478515625, -125.85546875, -122.1630859375, -118.470703125, -114.7783203125, -111.0859375, -107.3935546875, -103.701171875, -100.0087890625, -96.31640625, -92.6240234375, -88.931640625, -85.2392578125, -81.546875, -77.8544921875, -74.162109375, -70.4697265625, -66.77734375, -63.0849609375, -59.392578125, -55.7001953125, -52.0078125, -48.3154296875, -44.623046875, -40.9306640625, -37.23828125, -33.5458984375, -29.853515625, -26.1611328125, -22.46875, -18.7763671875, -15.083984375, -11.3916015625, -7.69921875, -4.0068359375, -0.314453125, 3.3779296875, 7.0703125, 10.7626953125, 14.455078125, 18.1474609375, 21.83984375, 25.5322265625, 29.224609375, 32.9169921875, 36.609375, 40.3017578125, 43.994140625, 47.6865234375, 51.37890625, 55.0712890625, 58.763671875, 62.4560546875, 66.1484375, 69.8408203125, 73.533203125, 77.2255859375, 80.91796875, 84.6103515625, 88.302734375, 91.9951171875, 95.6875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 14.0, 11.0, 8.0, 8.0, 20.0, 30.0, 27.0, 31.0, 39.0, 64.0, 90.0, 93.0, 89.0, 77.0, 65.0, 59.0, 46.0, 38.0, 22.0, 31.0, 19.0, 15.0, 14.0, 15.0, 9.0, 10.0, 6.0, 4.0, 1.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28125, -48.51123046875, -46.7412109375, -44.97119140625, -43.201171875, -41.43115234375, -39.6611328125, -37.89111328125, -36.12109375, -34.35107421875, -32.5810546875, -30.81103515625, -29.041015625, -27.27099609375, -25.5009765625, -23.73095703125, -21.9609375, -20.19091796875, -18.4208984375, -16.65087890625, -14.880859375, -13.11083984375, -11.3408203125, -9.57080078125, -7.80078125, -6.03076171875, -4.2607421875, -2.49072265625, -0.720703125, 1.04931640625, 2.8193359375, 4.58935546875, 6.359375, 8.12939453125, 9.8994140625, 11.66943359375, 13.439453125, 15.20947265625, 16.9794921875, 18.74951171875, 20.51953125, 22.28955078125, 24.0595703125, 25.82958984375, 27.599609375, 29.36962890625, 31.1396484375, 32.90966796875, 34.6796875, 36.44970703125, 38.2197265625, 39.98974609375, 41.759765625, 43.52978515625, 45.2998046875, 47.06982421875, 48.83984375, 50.60986328125, 52.3798828125, 54.14990234375, 55.919921875, 57.68994140625, 59.4599609375, 61.22998046875, 63.0]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 13.0, 24.0, 74.0, 187.0, 348.0, 192.0, 102.0, 28.0, 11.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2627.65576171875, -2544.605712890625, -2461.555908203125, -2378.505859375, -2295.4560546875, -2212.406005859375, -2129.356201171875, -2046.30615234375, -1963.25634765625, -1880.2064208984375, -1797.156494140625, -1714.1065673828125, -1631.056640625, -1548.0067138671875, -1464.956787109375, -1381.90673828125, -1298.8568115234375, -1215.806884765625, -1132.7569580078125, -1049.70703125, -966.6571044921875, -883.607177734375, -800.5571899414062, -717.5072631835938, -634.4573364257812, -551.4074096679688, -468.35748291015625, -385.3075256347656, -302.2575988769531, -219.20767211914062, -136.15771484375, -53.1077880859375, 29.942138671875, 112.99207305908203, 196.04200744628906, 279.0919494628906, 362.1418762207031, 445.1918029785156, 528.2417602539062, 611.2916870117188, 694.3416137695312, 777.3915405273438, 860.4414672851562, 943.491455078125, 1026.5413818359375, 1109.59130859375, 1192.6412353515625, 1275.691162109375, 1358.7410888671875, 1441.791015625, 1524.8409423828125, 1607.890869140625, 1690.9407958984375, 1773.99072265625, 1857.040771484375, 1940.090576171875, 2023.140625, 2106.190673828125, 2189.240478515625, 2272.29052734375, 2355.34033203125, 2438.390380859375, 2521.440185546875, 2604.490234375, 2687.5400390625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 10.0, 6.0, 10.0, 6.0, 13.0, 12.0, 20.0, 18.0, 22.0, 26.0, 34.0, 33.0, 45.0, 29.0, 60.0, 62.0, 88.0, 69.0, 72.0, 58.0, 41.0, 39.0, 28.0, 39.0, 22.0, 23.0, 20.0, 16.0, 17.0, 17.0, 6.0, 12.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-700.0050048828125, -673.2182006835938, -646.431396484375, -619.6445922851562, -592.8577880859375, -566.0709228515625, -539.2841796875, -512.497314453125, -485.71051025390625, -458.9237060546875, -432.13690185546875, -405.35009765625, -378.5632629394531, -351.7764587402344, -324.9896545410156, -298.20281982421875, -271.4160461425781, -244.62924194335938, -217.84242248535156, -191.0556182861328, -164.268798828125, -137.48199462890625, -110.6951904296875, -83.90837097167969, -57.12156677246094, -30.33475685119629, -3.5479469299316406, 23.238861083984375, 50.025672912597656, 76.81248474121094, 103.59928894042969, 130.3861083984375, 157.17291259765625, 183.959716796875, 210.7465362548828, 237.53334045410156, 264.3201599121094, 291.1069641113281, 317.8937683105469, 344.68060302734375, 371.4674072265625, 398.25421142578125, 425.041015625, 451.82781982421875, 478.6146545410156, 505.4014587402344, 532.188232421875, 558.97509765625, 585.7618408203125, 612.5486450195312, 639.33544921875, 666.1222534179688, 692.9090576171875, 719.6959228515625, 746.482666015625, 773.26953125, 800.0563354492188, 826.8431396484375, 853.6299438476562, 880.416748046875, 907.2035522460938, 933.9903564453125, 960.7772216796875, 987.5640258789062, 1014.350830078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 14.0, 12.0, 12.0, 26.0, 42.0, 76.0, 111.0, 223.0, 308.0, 503.0, 880.0, 1695.0, 3968.0, 12777.0, 90189.0, 3363310.0, 672575.0, 34947.0, 7204.0, 2595.0, 1189.0, 636.0, 358.0, 224.0, 121.0, 88.0, 62.0, 31.0, 35.0, 17.0, 14.0, 9.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.4375, -110.5947265625, -106.751953125, -102.9091796875, -99.06640625, -95.2236328125, -91.380859375, -87.5380859375, -83.6953125, -79.8525390625, -76.009765625, -72.1669921875, -68.32421875, -64.4814453125, -60.638671875, -56.7958984375, -52.953125, -49.1103515625, -45.267578125, -41.4248046875, -37.58203125, -33.7392578125, -29.896484375, -26.0537109375, -22.2109375, -18.3681640625, -14.525390625, -10.6826171875, -6.83984375, -2.9970703125, 0.845703125, 4.6884765625, 8.53125, 12.3740234375, 16.216796875, 20.0595703125, 23.90234375, 27.7451171875, 31.587890625, 35.4306640625, 39.2734375, 43.1162109375, 46.958984375, 50.8017578125, 54.64453125, 58.4873046875, 62.330078125, 66.1728515625, 70.015625, 73.8583984375, 77.701171875, 81.5439453125, 85.38671875, 89.2294921875, 93.072265625, 96.9150390625, 100.7578125, 104.6005859375, 108.443359375, 112.2861328125, 116.12890625, 119.9716796875, 123.814453125, 127.6572265625, 131.5]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 7.0, 9.0, 10.0, 11.0, 15.0, 16.0, 27.0, 37.0, 33.0, 40.0, 37.0, 60.0, 54.0, 64.0, 101.0, 73.0, 72.0, 47.0, 48.0, 40.0, 36.0, 32.0, 24.0, 21.0, 14.0, 12.0, 4.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.21875, -48.76171875, -47.3046875, -45.84765625, -44.390625, -42.93359375, -41.4765625, -40.01953125, -38.5625, -37.10546875, -35.6484375, -34.19140625, -32.734375, -31.27734375, -29.8203125, -28.36328125, -26.90625, -25.44921875, -23.9921875, -22.53515625, -21.078125, -19.62109375, -18.1640625, -16.70703125, -15.25, -13.79296875, -12.3359375, -10.87890625, -9.421875, -7.96484375, -6.5078125, -5.05078125, -3.59375, -2.13671875, -0.6796875, 0.77734375, 2.234375, 3.69140625, 5.1484375, 6.60546875, 8.0625, 9.51953125, 10.9765625, 12.43359375, 13.890625, 15.34765625, 16.8046875, 18.26171875, 19.71875, 21.17578125, 22.6328125, 24.08984375, 25.546875, 27.00390625, 28.4609375, 29.91796875, 31.375, 32.83203125, 34.2890625, 35.74609375, 37.203125, 38.66015625, 40.1171875, 41.57421875, 43.03125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 10.0, 10.0, 31.0, 37.0, 86.0, 171.0, 361.0, 775.0, 3883.0, 4171266.0, 15896.0, 922.0, 363.0, 178.0, 106.0, 54.0, 26.0, 36.0, 23.0, 17.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-894.0, -857.765625, -821.53125, -785.296875, -749.0625, -712.828125, -676.59375, -640.359375, -604.125, -567.890625, -531.65625, -495.421875, -459.1875, -422.953125, -386.71875, -350.484375, -314.25, -278.015625, -241.78125, -205.546875, -169.3125, -133.078125, -96.84375, -60.609375, -24.375, 11.859375, 48.09375, 84.328125, 120.5625, 156.796875, 193.03125, 229.265625, 265.5, 301.734375, 337.96875, 374.203125, 410.4375, 446.671875, 482.90625, 519.140625, 555.375, 591.609375, 627.84375, 664.078125, 700.3125, 736.546875, 772.78125, 809.015625, 845.25, 881.484375, 917.71875, 953.953125, 990.1875, 1026.421875, 1062.65625, 1098.890625, 1135.125, 1171.359375, 1207.59375, 1243.828125, 1280.0625, 1316.296875, 1352.53125, 1388.765625, 1425.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 8.0, 21.0, 105.0, 2801.0, 1030.0, 78.0, 17.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-646.0, -622.8125, -599.625, -576.4375, -553.25, -530.0625, -506.875, -483.6875, -460.5, -437.3125, -414.125, -390.9375, -367.75, -344.5625, -321.375, -298.1875, -275.0, -251.8125, -228.625, -205.4375, -182.25, -159.0625, -135.875, -112.6875, -89.5, -66.3125, -43.125, -19.9375, 3.25, 26.4375, 49.625, 72.8125, 96.0, 119.1875, 142.375, 165.5625, 188.75, 211.9375, 235.125, 258.3125, 281.5, 304.6875, 327.875, 351.0625, 374.25, 397.4375, 420.625, 443.8125, 467.0, 490.1875, 513.375, 536.5625, 559.75, 582.9375, 606.125, 629.3125, 652.5, 675.6875, 698.875, 722.0625, 745.25, 768.4375, 791.625, 814.8125, 838.0]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 15.0, 34.0, 119.0, 427.0, 285.0, 76.0, 21.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4234.72314453125, -4082.369384765625, -3930.015869140625, -3777.662109375, -3625.30859375, -3472.954833984375, -3320.60107421875, -3168.24755859375, -3015.893798828125, -2863.5400390625, -2711.1865234375, -2558.832763671875, -2406.47900390625, -2254.12548828125, -2101.771728515625, -1949.4180908203125, -1797.064453125, -1644.7108154296875, -1492.357177734375, -1340.00341796875, -1187.6497802734375, -1035.296142578125, -882.9424438476562, -730.5887451171875, -578.235107421875, -425.8814392089844, -273.52777099609375, -121.17410278320312, 31.1795654296875, 183.533203125, 335.88690185546875, 488.2406005859375, 640.59375, 792.9473876953125, 945.3010864257812, 1097.65478515625, 1250.0084228515625, 1402.362060546875, 1554.7158203125, 1707.0694580078125, 1859.423095703125, 2011.7767333984375, 2164.13037109375, 2316.484130859375, 2468.837890625, 2621.19140625, 2773.545166015625, 2925.89892578125, 3078.25244140625, 3230.606201171875, 3382.959716796875, 3535.3134765625, 3687.6669921875, 3840.020751953125, 3992.37451171875, 4144.72802734375, 4297.08203125, 4449.435546875, 4601.78955078125, 4754.14306640625, 4906.49658203125, 5058.8505859375, 5211.2041015625, 5363.5576171875, 5515.9111328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 14.0, 8.0, 18.0, 22.0, 39.0, 48.0, 39.0, 62.0, 73.0, 95.0, 76.0, 91.0, 84.0, 72.0, 70.0, 50.0, 42.0, 51.0, 17.0, 9.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1225.6424560546875, -1176.6087646484375, -1127.5750732421875, -1078.5413818359375, -1029.507568359375, -980.4739379882812, -931.440185546875, -882.406494140625, -833.372802734375, -784.339111328125, -735.305419921875, -686.2716674804688, -637.2379760742188, -588.2042846679688, -539.1705322265625, -490.1368408203125, -441.1031494140625, -392.0694580078125, -343.0357360839844, -294.00201416015625, -244.96832275390625, -195.9346160888672, -146.90090942382812, -97.8671875, -48.83349609375, 0.2002105712890625, 49.233917236328125, 98.26762390136719, 147.30133056640625, 196.3350372314453, 245.36874389648438, 294.4024658203125, 343.43603515625, 392.4697265625, 441.5034484863281, 490.53717041015625, 539.5708618164062, 588.6045532226562, 637.6383056640625, 686.6719970703125, 735.7056884765625, 784.7393798828125, 833.7730712890625, 882.8068237304688, 931.8405151367188, 980.8742065429688, 1029.907958984375, 1078.941650390625, 1127.975341796875, 1177.009033203125, 1226.042724609375, 1275.076416015625, 1324.110107421875, 1373.1439208984375, 1422.1776123046875, 1471.2113037109375, 1520.2449951171875, 1569.2786865234375, 1618.3123779296875, 1667.3460693359375, 1716.3798828125, 1765.41357421875, 1814.447265625, 1863.48095703125, 1912.5146484375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 4.0, 8.0, 13.0, 12.0, 24.0, 45.0, 40.0, 72.0, 96.0, 175.0, 300.0, 485.0, 848.0, 1442.0, 2655.0, 5099.0, 10301.0, 22205.0, 54089.0, 159791.0, 423953.0, 235967.0, 75104.0, 28995.0, 12844.0, 6366.0, 3218.0, 1826.0, 1020.0, 601.0, 341.0, 226.0, 145.0, 78.0, 50.0, 45.0, 24.0, 15.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.373046875, -65.80859375, -63.244140625, -60.6796875, -58.115234375, -55.55078125, -52.986328125, -50.421875, -47.857421875, -45.29296875, -42.728515625, -40.1640625, -37.599609375, -35.03515625, -32.470703125, -29.90625, -27.341796875, -24.77734375, -22.212890625, -19.6484375, -17.083984375, -14.51953125, -11.955078125, -9.390625, -6.826171875, -4.26171875, -1.697265625, 0.8671875, 3.431640625, 5.99609375, 8.560546875, 11.125, 13.689453125, 16.25390625, 18.818359375, 21.3828125, 23.947265625, 26.51171875, 29.076171875, 31.640625, 34.205078125, 36.76953125, 39.333984375, 41.8984375, 44.462890625, 47.02734375, 49.591796875, 52.15625, 54.720703125, 57.28515625, 59.849609375, 62.4140625, 64.978515625, 67.54296875, 70.107421875, 72.671875, 75.236328125, 77.80078125, 80.365234375, 82.9296875, 85.494140625, 88.05859375, 90.623046875, 93.1875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 11.0, 21.0, 21.0, 31.0, 37.0, 32.0, 45.0, 47.0, 58.0, 52.0, 65.0, 54.0, 68.0, 71.0, 57.0, 39.0, 45.0, 46.0, 31.0, 26.0, 22.0, 15.0, 17.0, 14.0, 9.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.28515625, -50.0703125, -47.85546875, -45.640625, -43.42578125, -41.2109375, -38.99609375, -36.78125, -34.56640625, -32.3515625, -30.13671875, -27.921875, -25.70703125, -23.4921875, -21.27734375, -19.0625, -16.84765625, -14.6328125, -12.41796875, -10.203125, -7.98828125, -5.7734375, -3.55859375, -1.34375, 0.87109375, 3.0859375, 5.30078125, 7.515625, 9.73046875, 11.9453125, 14.16015625, 16.375, 18.58984375, 20.8046875, 23.01953125, 25.234375, 27.44921875, 29.6640625, 31.87890625, 34.09375, 36.30859375, 38.5234375, 40.73828125, 42.953125, 45.16796875, 47.3828125, 49.59765625, 51.8125, 54.02734375, 56.2421875, 58.45703125, 60.671875, 62.88671875, 65.1015625, 67.31640625, 69.53125, 71.74609375, 73.9609375, 76.17578125, 78.390625, 80.60546875, 82.8203125, 85.03515625, 87.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 4.0, 5.0, 14.0, 8.0, 15.0, 23.0, 34.0, 42.0, 75.0, 119.0, 227.0, 452.0, 982.0, 2687.0, 8390.0, 37452.0, 331683.0, 603399.0, 47891.0, 9937.0, 2858.0, 1131.0, 485.0, 235.0, 143.0, 84.0, 51.0, 34.0, 34.0, 12.0, 18.0, 8.0, 4.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-222.875, -216.134765625, -209.39453125, -202.654296875, -195.9140625, -189.173828125, -182.43359375, -175.693359375, -168.953125, -162.212890625, -155.47265625, -148.732421875, -141.9921875, -135.251953125, -128.51171875, -121.771484375, -115.03125, -108.291015625, -101.55078125, -94.810546875, -88.0703125, -81.330078125, -74.58984375, -67.849609375, -61.109375, -54.369140625, -47.62890625, -40.888671875, -34.1484375, -27.408203125, -20.66796875, -13.927734375, -7.1875, -0.447265625, 6.29296875, 13.033203125, 19.7734375, 26.513671875, 33.25390625, 39.994140625, 46.734375, 53.474609375, 60.21484375, 66.955078125, 73.6953125, 80.435546875, 87.17578125, 93.916015625, 100.65625, 107.396484375, 114.13671875, 120.876953125, 127.6171875, 134.357421875, 141.09765625, 147.837890625, 154.578125, 161.318359375, 168.05859375, 174.798828125, 181.5390625, 188.279296875, 195.01953125, 201.759765625, 208.5]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 11.0, 15.0, 20.0, 24.0, 26.0, 28.0, 23.0, 35.0, 39.0, 49.0, 49.0, 39.0, 45.0, 53.0, 47.0, 47.0, 57.0, 45.0, 39.0, 48.0, 37.0, 19.0, 31.0, 29.0, 17.0, 15.0, 16.0, 16.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-280.25, -271.91796875, -263.5859375, -255.25390625, -246.921875, -238.58984375, -230.2578125, -221.92578125, -213.59375, -205.26171875, -196.9296875, -188.59765625, -180.265625, -171.93359375, -163.6015625, -155.26953125, -146.9375, -138.60546875, -130.2734375, -121.94140625, -113.609375, -105.27734375, -96.9453125, -88.61328125, -80.28125, -71.94921875, -63.6171875, -55.28515625, -46.953125, -38.62109375, -30.2890625, -21.95703125, -13.625, -5.29296875, 3.0390625, 11.37109375, 19.703125, 28.03515625, 36.3671875, 44.69921875, 53.03125, 61.36328125, 69.6953125, 78.02734375, 86.359375, 94.69140625, 103.0234375, 111.35546875, 119.6875, 128.01953125, 136.3515625, 144.68359375, 153.015625, 161.34765625, 169.6796875, 178.01171875, 186.34375, 194.67578125, 203.0078125, 211.33984375, 219.671875, 228.00390625, 236.3359375, 244.66796875, 253.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 6.0, 12.0, 16.0, 20.0, 27.0, 35.0, 58.0, 67.0, 132.0, 207.0, 277.0, 433.0, 731.0, 1372.0, 2771.0, 8268.0, 47118.0, 775685.0, 184103.0, 18104.0, 4553.0, 1863.0, 978.0, 612.0, 353.0, 212.0, 172.0, 104.0, 62.0, 48.0, 43.0, 30.0, 16.0, 12.0, 12.0, 2.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.3125, -98.2197265625, -95.126953125, -92.0341796875, -88.94140625, -85.8486328125, -82.755859375, -79.6630859375, -76.5703125, -73.4775390625, -70.384765625, -67.2919921875, -64.19921875, -61.1064453125, -58.013671875, -54.9208984375, -51.828125, -48.7353515625, -45.642578125, -42.5498046875, -39.45703125, -36.3642578125, -33.271484375, -30.1787109375, -27.0859375, -23.9931640625, -20.900390625, -17.8076171875, -14.71484375, -11.6220703125, -8.529296875, -5.4365234375, -2.34375, 0.7490234375, 3.841796875, 6.9345703125, 10.02734375, 13.1201171875, 16.212890625, 19.3056640625, 22.3984375, 25.4912109375, 28.583984375, 31.6767578125, 34.76953125, 37.8623046875, 40.955078125, 44.0478515625, 47.140625, 50.2333984375, 53.326171875, 56.4189453125, 59.51171875, 62.6044921875, 65.697265625, 68.7900390625, 71.8828125, 74.9755859375, 78.068359375, 81.1611328125, 84.25390625, 87.3466796875, 90.439453125, 93.5322265625, 96.625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 27.0, 62.0, 228.0, 425.0, 148.0, 57.0, 17.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1083984375, -0.10601091384887695, -0.1036233901977539, -0.10123586654663086, -0.09884834289550781, -0.09646081924438477, -0.09407329559326172, -0.09168577194213867, -0.08929824829101562, -0.08691072463989258, -0.08452320098876953, -0.08213567733764648, -0.07974815368652344, -0.07736063003540039, -0.07497310638427734, -0.0725855827331543, -0.07019805908203125, -0.0678105354309082, -0.06542301177978516, -0.06303548812866211, -0.06064796447753906, -0.058260440826416016, -0.05587291717529297, -0.05348539352416992, -0.051097869873046875, -0.04871034622192383, -0.04632282257080078, -0.043935298919677734, -0.04154777526855469, -0.03916025161743164, -0.036772727966308594, -0.03438520431518555, -0.0319976806640625, -0.029610157012939453, -0.027222633361816406, -0.02483510971069336, -0.022447586059570312, -0.020060062408447266, -0.01767253875732422, -0.015285015106201172, -0.012897491455078125, -0.010509967803955078, -0.008122444152832031, -0.005734920501708984, -0.0033473968505859375, -0.0009598731994628906, 0.0014276504516601562, 0.003815174102783203, 0.00620269775390625, 0.008590221405029297, 0.010977745056152344, 0.01336526870727539, 0.015752792358398438, 0.018140316009521484, 0.02052783966064453, 0.022915363311767578, 0.025302886962890625, 0.027690410614013672, 0.03007793426513672, 0.032465457916259766, 0.03485298156738281, 0.03724050521850586, 0.039628028869628906, 0.04201555252075195, 0.044403076171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 13.0, 8.0, 14.0, 24.0, 36.0, 60.0, 114.0, 205.0, 394.0, 833.0, 1999.0, 5467.0, 23425.0, 277060.0, 689811.0, 37213.0, 7334.0, 2478.0, 1062.0, 470.0, 246.0, 114.0, 56.0, 44.0, 26.0, 18.0, 9.0, 6.0, 7.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.5625, -111.390625, -108.21875, -105.046875, -101.875, -98.703125, -95.53125, -92.359375, -89.1875, -86.015625, -82.84375, -79.671875, -76.5, -73.328125, -70.15625, -66.984375, -63.8125, -60.640625, -57.46875, -54.296875, -51.125, -47.953125, -44.78125, -41.609375, -38.4375, -35.265625, -32.09375, -28.921875, -25.75, -22.578125, -19.40625, -16.234375, -13.0625, -9.890625, -6.71875, -3.546875, -0.375, 2.796875, 5.96875, 9.140625, 12.3125, 15.484375, 18.65625, 21.828125, 25.0, 28.171875, 31.34375, 34.515625, 37.6875, 40.859375, 44.03125, 47.203125, 50.375, 53.546875, 56.71875, 59.890625, 63.0625, 66.234375, 69.40625, 72.578125, 75.75, 78.921875, 82.09375, 85.265625, 88.4375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 13.0, 8.0, 13.0, 17.0, 34.0, 54.0, 74.0, 109.0, 144.0, 148.0, 126.0, 83.0, 55.0, 42.0, 29.0, 17.0, 7.0, 3.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.1875, -112.1796875, -109.171875, -106.1640625, -103.15625, -100.1484375, -97.140625, -94.1328125, -91.125, -88.1171875, -85.109375, -82.1015625, -79.09375, -76.0859375, -73.078125, -70.0703125, -67.0625, -64.0546875, -61.046875, -58.0390625, -55.03125, -52.0234375, -49.015625, -46.0078125, -43.0, -39.9921875, -36.984375, -33.9765625, -30.96875, -27.9609375, -24.953125, -21.9453125, -18.9375, -15.9296875, -12.921875, -9.9140625, -6.90625, -3.8984375, -0.890625, 2.1171875, 5.125, 8.1328125, 11.140625, 14.1484375, 17.15625, 20.1640625, 23.171875, 26.1796875, 29.1875, 32.1953125, 35.203125, 38.2109375, 41.21875, 44.2265625, 47.234375, 50.2421875, 53.25, 56.2578125, 59.265625, 62.2734375, 65.28125, 68.2890625, 71.296875, 74.3046875, 77.3125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 17.0, 30.0, 98.0, 228.0, 386.0, 147.0, 45.0, 24.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2199.96875, -2113.217041015625, -2026.465087890625, -1939.71337890625, -1852.9615478515625, -1766.209716796875, -1679.4580078125, -1592.7061767578125, -1505.954345703125, -1419.2025146484375, -1332.45068359375, -1245.698974609375, -1158.9471435546875, -1072.1953125, -985.4435424804688, -898.6917724609375, -811.93994140625, -725.1881103515625, -638.4363403320312, -551.6845703125, -464.9327392578125, -378.1809387207031, -291.42913818359375, -204.6773681640625, -117.925537109375, -31.173736572265625, 55.57806396484375, 142.32986450195312, 229.0816650390625, 315.8334655761719, 402.58526611328125, 489.3370361328125, 576.0888671875, 662.8406982421875, 749.5924682617188, 836.34423828125, 923.0960693359375, 1009.847900390625, 1096.599609375, 1183.3514404296875, 1270.103271484375, 1356.8551025390625, 1443.60693359375, 1530.358642578125, 1617.1104736328125, 1703.8623046875, 1790.614013671875, 1877.3658447265625, 1964.11767578125, 2050.869384765625, 2137.621337890625, 2224.373046875, 2311.125, 2397.876708984375, 2484.62841796875, 2571.38037109375, 2658.132080078125, 2744.8837890625, 2831.6357421875, 2918.387451171875, 3005.13916015625, 3091.89111328125, 3178.642822265625, 3265.39453125, 3352.146484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 5.0, 6.0, 8.0, 8.0, 12.0, 13.0, 17.0, 18.0, 14.0, 17.0, 24.0, 18.0, 22.0, 28.0, 34.0, 30.0, 44.0, 44.0, 52.0, 61.0, 53.0, 50.0, 52.0, 40.0, 26.0, 28.0, 27.0, 32.0, 17.0, 15.0, 31.0, 22.0, 16.0, 15.0, 14.0, 10.0, 11.0, 5.0, 9.0, 9.0, 6.0, 1.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-1008.56005859375, -977.6911010742188, -946.8220825195312, -915.953125, -885.0841674804688, -854.2152099609375, -823.34619140625, -792.4772338867188, -761.6082763671875, -730.7393188476562, -699.8703002929688, -669.0013427734375, -638.1323852539062, -607.263427734375, -576.3944091796875, -545.5254516601562, -514.656494140625, -483.7875061035156, -452.9185485839844, -422.049560546875, -391.18060302734375, -360.3116149902344, -329.442626953125, -298.57366943359375, -267.70465087890625, -236.83567810058594, -205.96670532226562, -175.09771728515625, -144.228759765625, -113.35977172851562, -82.49079895019531, -51.621826171875, -20.75286865234375, 10.116106033325195, 40.98508071899414, 71.85405731201172, 102.72303009033203, 133.59201049804688, 164.4609832763672, 195.3299560546875, 226.1989288330078, 257.0679016113281, 287.9368896484375, 318.80584716796875, 349.6748352050781, 380.5438232421875, 411.41278076171875, 442.28173828125, 473.1507263183594, 504.01971435546875, 534.888671875, 565.7576293945312, 596.6266479492188, 627.49560546875, 658.3645629882812, 689.2335205078125, 720.1025390625, 750.9714965820312, 781.8405151367188, 812.70947265625, 843.5784301757812, 874.4473876953125, 905.31640625, 936.1853637695312, 967.0543212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 13.0, 17.0, 14.0, 17.0, 34.0, 43.0, 61.0, 94.0, 130.0, 184.0, 302.0, 492.0, 780.0, 1453.0, 3249.0, 8845.0, 42744.0, 409964.0, 3339297.0, 331546.0, 40078.0, 8410.0, 2989.0, 1429.0, 777.0, 430.0, 307.0, 172.0, 120.0, 82.0, 64.0, 31.0, 28.0, 21.0, 14.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-98.5, -95.2666015625, -92.033203125, -88.7998046875, -85.56640625, -82.3330078125, -79.099609375, -75.8662109375, -72.6328125, -69.3994140625, -66.166015625, -62.9326171875, -59.69921875, -56.4658203125, -53.232421875, -49.9990234375, -46.765625, -43.5322265625, -40.298828125, -37.0654296875, -33.83203125, -30.5986328125, -27.365234375, -24.1318359375, -20.8984375, -17.6650390625, -14.431640625, -11.1982421875, -7.96484375, -4.7314453125, -1.498046875, 1.7353515625, 4.96875, 8.2021484375, 11.435546875, 14.6689453125, 17.90234375, 21.1357421875, 24.369140625, 27.6025390625, 30.8359375, 34.0693359375, 37.302734375, 40.5361328125, 43.76953125, 47.0029296875, 50.236328125, 53.4697265625, 56.703125, 59.9365234375, 63.169921875, 66.4033203125, 69.63671875, 72.8701171875, 76.103515625, 79.3369140625, 82.5703125, 85.8037109375, 89.037109375, 92.2705078125, 95.50390625, 98.7373046875, 101.970703125, 105.2041015625, 108.4375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 1.0, 9.0, 5.0, 11.0, 13.0, 24.0, 25.0, 38.0, 28.0, 43.0, 45.0, 40.0, 62.0, 52.0, 71.0, 70.0, 71.0, 63.0, 48.0, 47.0, 41.0, 45.0, 29.0, 21.0, 25.0, 16.0, 12.0, 15.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75, -69.376953125, -67.00390625, -64.630859375, -62.2578125, -59.884765625, -57.51171875, -55.138671875, -52.765625, -50.392578125, -48.01953125, -45.646484375, -43.2734375, -40.900390625, -38.52734375, -36.154296875, -33.78125, -31.408203125, -29.03515625, -26.662109375, -24.2890625, -21.916015625, -19.54296875, -17.169921875, -14.796875, -12.423828125, -10.05078125, -7.677734375, -5.3046875, -2.931640625, -0.55859375, 1.814453125, 4.1875, 6.560546875, 8.93359375, 11.306640625, 13.6796875, 16.052734375, 18.42578125, 20.798828125, 23.171875, 25.544921875, 27.91796875, 30.291015625, 32.6640625, 35.037109375, 37.41015625, 39.783203125, 42.15625, 44.529296875, 46.90234375, 49.275390625, 51.6484375, 54.021484375, 56.39453125, 58.767578125, 61.140625, 63.513671875, 65.88671875, 68.259765625, 70.6328125, 73.005859375, 75.37890625, 77.751953125, 80.125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 19.0, 39.0, 112.0, 267.0, 1405.0, 2400377.0, 1790205.0, 1375.0, 292.0, 111.0, 42.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1317.0, -1284.875, -1252.75, -1220.625, -1188.5, -1156.375, -1124.25, -1092.125, -1060.0, -1027.875, -995.75, -963.625, -931.5, -899.375, -867.25, -835.125, -803.0, -770.875, -738.75, -706.625, -674.5, -642.375, -610.25, -578.125, -546.0, -513.875, -481.75, -449.625, -417.5, -385.375, -353.25, -321.125, -289.0, -256.875, -224.75, -192.625, -160.5, -128.375, -96.25, -64.125, -32.0, 0.125, 32.25, 64.375, 96.5, 128.625, 160.75, 192.875, 225.0, 257.125, 289.25, 321.375, 353.5, 385.625, 417.75, 449.875, 482.0, 514.125, 546.25, 578.375, 610.5, 642.625, 674.75, 706.875, 739.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 3.0, 6.0, 12.0, 27.0, 42.0, 136.0, 740.0, 2208.0, 671.0, 120.0, 48.0, 23.0, 13.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.5, -192.1171875, -181.734375, -171.3515625, -160.96875, -150.5859375, -140.203125, -129.8203125, -119.4375, -109.0546875, -98.671875, -88.2890625, -77.90625, -67.5234375, -57.140625, -46.7578125, -36.375, -25.9921875, -15.609375, -5.2265625, 5.15625, 15.5390625, 25.921875, 36.3046875, 46.6875, 57.0703125, 67.453125, 77.8359375, 88.21875, 98.6015625, 108.984375, 119.3671875, 129.75, 140.1328125, 150.515625, 160.8984375, 171.28125, 181.6640625, 192.046875, 202.4296875, 212.8125, 223.1953125, 233.578125, 243.9609375, 254.34375, 264.7265625, 275.109375, 285.4921875, 295.875, 306.2578125, 316.640625, 327.0234375, 337.40625, 347.7890625, 358.171875, 368.5546875, 378.9375, 389.3203125, 399.703125, 410.0859375, 420.46875, 430.8515625, 441.234375, 451.6171875, 462.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 13.0, 21.0, 38.0, 54.0, 100.0, 123.0, 163.0, 148.0, 122.0, 95.0, 44.0, 30.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-743.2432861328125, -709.4435424804688, -675.643798828125, -641.8440551757812, -608.0443115234375, -574.2445678710938, -540.44482421875, -506.64508056640625, -472.8453369140625, -439.04559326171875, -405.245849609375, -371.44610595703125, -337.6463623046875, -303.84661865234375, -270.046875, -236.24713134765625, -202.4473876953125, -168.64764404296875, -134.847900390625, -101.04815673828125, -67.2484130859375, -33.44866943359375, 0.35107421875, 34.15081787109375, 67.9505615234375, 101.75030517578125, 135.550048828125, 169.34979248046875, 203.1495361328125, 236.94927978515625, 270.7490234375, 304.54876708984375, 338.3485107421875, 372.14825439453125, 405.947998046875, 439.74774169921875, 473.5474853515625, 507.34722900390625, 541.14697265625, 574.9467163085938, 608.7464599609375, 642.5462036132812, 676.345947265625, 710.1456909179688, 743.9454345703125, 777.7451782226562, 811.544921875, 845.3446655273438, 879.1444091796875, 912.9441528320312, 946.743896484375, 980.5436401367188, 1014.3433837890625, 1048.14306640625, 1081.94287109375, 1115.74267578125, 1149.5423583984375, 1183.342041015625, 1217.141845703125, 1250.941650390625, 1284.7413330078125, 1318.541015625, 1352.3408203125, 1386.140625, 1419.9403076171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 7.0, 7.0, 10.0, 11.0, 20.0, 20.0, 31.0, 36.0, 37.0, 31.0, 36.0, 42.0, 41.0, 40.0, 53.0, 41.0, 46.0, 41.0, 59.0, 40.0, 39.0, 30.0, 42.0, 25.0, 28.0, 22.0, 22.0, 26.0, 10.0, 21.0, 15.0, 12.0, 15.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-597.777099609375, -580.9933471679688, -564.2095336914062, -547.42578125, -530.6420288085938, -513.8582763671875, -497.074462890625, -480.29071044921875, -463.5069274902344, -446.72314453125, -429.93939208984375, -413.1556091308594, -396.371826171875, -379.58807373046875, -362.8042907714844, -346.0205078125, -329.23675537109375, -312.4529724121094, -295.6692199707031, -278.88543701171875, -262.1016845703125, -245.31790161132812, -228.53411865234375, -211.75035095214844, -194.96658325195312, -178.1828155517578, -161.3990478515625, -144.61526489257812, -127.83149719238281, -111.0477294921875, -94.26395416259766, -77.48017883300781, -60.6964111328125, -43.91263961791992, -27.128868103027344, -10.345096588134766, 6.4386749267578125, 23.222442626953125, 40.00621795654297, 56.78999328613281, 73.57376098632812, 90.35752868652344, 107.14130401611328, 123.92507934570312, 140.70884704589844, 157.49261474609375, 174.27639770507812, 191.06016540527344, 207.84393310546875, 224.62770080566406, 241.41146850585938, 258.19525146484375, 274.97900390625, 291.7627868652344, 308.54656982421875, 325.330322265625, 342.1141052246094, 358.89788818359375, 375.681640625, 392.4654235839844, 409.24920654296875, 426.032958984375, 442.8167419433594, 459.60052490234375, 476.38427734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 10.0, 14.0, 16.0, 35.0, 28.0, 52.0, 60.0, 131.0, 148.0, 210.0, 327.0, 490.0, 849.0, 1412.0, 2487.0, 4649.0, 9146.0, 19505.0, 48301.0, 147832.0, 441753.0, 245101.0, 72519.0, 27493.0, 12181.0, 5924.0, 3255.0, 1727.0, 1006.0, 649.0, 405.0, 245.0, 175.0, 126.0, 76.0, 61.0, 50.0, 28.0, 19.0, 10.0, 13.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.5, -73.923828125, -71.34765625, -68.771484375, -66.1953125, -63.619140625, -61.04296875, -58.466796875, -55.890625, -53.314453125, -50.73828125, -48.162109375, -45.5859375, -43.009765625, -40.43359375, -37.857421875, -35.28125, -32.705078125, -30.12890625, -27.552734375, -24.9765625, -22.400390625, -19.82421875, -17.248046875, -14.671875, -12.095703125, -9.51953125, -6.943359375, -4.3671875, -1.791015625, 0.78515625, 3.361328125, 5.9375, 8.513671875, 11.08984375, 13.666015625, 16.2421875, 18.818359375, 21.39453125, 23.970703125, 26.546875, 29.123046875, 31.69921875, 34.275390625, 36.8515625, 39.427734375, 42.00390625, 44.580078125, 47.15625, 49.732421875, 52.30859375, 54.884765625, 57.4609375, 60.037109375, 62.61328125, 65.189453125, 67.765625, 70.341796875, 72.91796875, 75.494140625, 78.0703125, 80.646484375, 83.22265625, 85.798828125, 88.375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 1.0, 6.0, 9.0, 15.0, 5.0, 19.0, 25.0, 30.0, 24.0, 47.0, 37.0, 51.0, 46.0, 56.0, 61.0, 71.0, 59.0, 57.0, 61.0, 50.0, 37.0, 41.0, 38.0, 21.0, 25.0, 13.0, 21.0, 19.0, 12.0, 11.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -80.0263671875, -77.740234375, -75.4541015625, -73.16796875, -70.8818359375, -68.595703125, -66.3095703125, -64.0234375, -61.7373046875, -59.451171875, -57.1650390625, -54.87890625, -52.5927734375, -50.306640625, -48.0205078125, -45.734375, -43.4482421875, -41.162109375, -38.8759765625, -36.58984375, -34.3037109375, -32.017578125, -29.7314453125, -27.4453125, -25.1591796875, -22.873046875, -20.5869140625, -18.30078125, -16.0146484375, -13.728515625, -11.4423828125, -9.15625, -6.8701171875, -4.583984375, -2.2978515625, -0.01171875, 2.2744140625, 4.560546875, 6.8466796875, 9.1328125, 11.4189453125, 13.705078125, 15.9912109375, 18.27734375, 20.5634765625, 22.849609375, 25.1357421875, 27.421875, 29.7080078125, 31.994140625, 34.2802734375, 36.56640625, 38.8525390625, 41.138671875, 43.4248046875, 45.7109375, 47.9970703125, 50.283203125, 52.5693359375, 54.85546875, 57.1416015625, 59.427734375, 61.7138671875, 64.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 11.0, 14.0, 18.0, 28.0, 44.0, 87.0, 140.0, 349.0, 1174.0, 5924.0, 80644.0, 921521.0, 33639.0, 3556.0, 798.0, 310.0, 116.0, 52.0, 37.0, 20.0, 18.0, 9.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.5, -328.3203125, -317.140625, -305.9609375, -294.78125, -283.6015625, -272.421875, -261.2421875, -250.0625, -238.8828125, -227.703125, -216.5234375, -205.34375, -194.1640625, -182.984375, -171.8046875, -160.625, -149.4453125, -138.265625, -127.0859375, -115.90625, -104.7265625, -93.546875, -82.3671875, -71.1875, -60.0078125, -48.828125, -37.6484375, -26.46875, -15.2890625, -4.109375, 7.0703125, 18.25, 29.4296875, 40.609375, 51.7890625, 62.96875, 74.1484375, 85.328125, 96.5078125, 107.6875, 118.8671875, 130.046875, 141.2265625, 152.40625, 163.5859375, 174.765625, 185.9453125, 197.125, 208.3046875, 219.484375, 230.6640625, 241.84375, 253.0234375, 264.203125, 275.3828125, 286.5625, 297.7421875, 308.921875, 320.1015625, 331.28125, 342.4609375, 353.640625, 364.8203125, 376.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 4.0, 8.0, 13.0, 10.0, 20.0, 17.0, 22.0, 26.0, 33.0, 28.0, 35.0, 42.0, 52.0, 48.0, 70.0, 43.0, 54.0, 60.0, 50.0, 51.0, 56.0, 41.0, 41.0, 28.0, 25.0, 19.0, 19.0, 17.0, 15.0, 12.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-278.0, -269.3671875, -260.734375, -252.1015625, -243.46875, -234.8359375, -226.203125, -217.5703125, -208.9375, -200.3046875, -191.671875, -183.0390625, -174.40625, -165.7734375, -157.140625, -148.5078125, -139.875, -131.2421875, -122.609375, -113.9765625, -105.34375, -96.7109375, -88.078125, -79.4453125, -70.8125, -62.1796875, -53.546875, -44.9140625, -36.28125, -27.6484375, -19.015625, -10.3828125, -1.75, 6.8828125, 15.515625, 24.1484375, 32.78125, 41.4140625, 50.046875, 58.6796875, 67.3125, 75.9453125, 84.578125, 93.2109375, 101.84375, 110.4765625, 119.109375, 127.7421875, 136.375, 145.0078125, 153.640625, 162.2734375, 170.90625, 179.5390625, 188.171875, 196.8046875, 205.4375, 214.0703125, 222.703125, 231.3359375, 239.96875, 248.6015625, 257.234375, 265.8671875, 274.5]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 15.0, 19.0, 33.0, 46.0, 58.0, 95.0, 153.0, 266.0, 577.0, 1336.0, 3641.0, 15277.0, 123745.0, 825730.0, 62832.0, 9900.0, 2664.0, 1060.0, 437.0, 222.0, 126.0, 91.0, 63.0, 45.0, 29.0, 24.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.125, -75.7109375, -73.296875, -70.8828125, -68.46875, -66.0546875, -63.640625, -61.2265625, -58.8125, -56.3984375, -53.984375, -51.5703125, -49.15625, -46.7421875, -44.328125, -41.9140625, -39.5, -37.0859375, -34.671875, -32.2578125, -29.84375, -27.4296875, -25.015625, -22.6015625, -20.1875, -17.7734375, -15.359375, -12.9453125, -10.53125, -8.1171875, -5.703125, -3.2890625, -0.875, 1.5390625, 3.953125, 6.3671875, 8.78125, 11.1953125, 13.609375, 16.0234375, 18.4375, 20.8515625, 23.265625, 25.6796875, 28.09375, 30.5078125, 32.921875, 35.3359375, 37.75, 40.1640625, 42.578125, 44.9921875, 47.40625, 49.8203125, 52.234375, 54.6484375, 57.0625, 59.4765625, 61.890625, 64.3046875, 66.71875, 69.1328125, 71.546875, 73.9609375, 76.375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 5.0, 14.0, 22.0, 36.0, 52.0, 141.0, 249.0, 231.0, 110.0, 61.0, 30.0, 19.0, 15.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04450798034667969, -0.043392181396484375, -0.04227638244628906, -0.04116058349609375, -0.04004478454589844, -0.038928985595703125, -0.03781318664550781, -0.0366973876953125, -0.03558158874511719, -0.034465789794921875, -0.03334999084472656, -0.03223419189453125, -0.031118392944335938, -0.030002593994140625, -0.028886795043945312, -0.02777099609375, -0.026655197143554688, -0.025539398193359375, -0.024423599243164062, -0.02330780029296875, -0.022192001342773438, -0.021076202392578125, -0.019960403442382812, -0.0188446044921875, -0.017728805541992188, -0.016613006591796875, -0.015497207641601562, -0.01438140869140625, -0.013265609741210938, -0.012149810791015625, -0.011034011840820312, -0.009918212890625, -0.008802413940429688, -0.007686614990234375, -0.0065708160400390625, -0.00545501708984375, -0.0043392181396484375, -0.003223419189453125, -0.0021076202392578125, -0.0009918212890625, 0.0001239776611328125, 0.001239776611328125, 0.0023555755615234375, 0.00347137451171875, 0.0045871734619140625, 0.005702972412109375, 0.0068187713623046875, 0.0079345703125, 0.009050369262695312, 0.010166168212890625, 0.011281967163085938, 0.01239776611328125, 0.013513565063476562, 0.014629364013671875, 0.015745162963867188, 0.0168609619140625, 0.017976760864257812, 0.019092559814453125, 0.020208358764648438, 0.02132415771484375, 0.022439956665039062, 0.023555755615234375, 0.024671554565429688, 0.025787353515625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 3.0, 12.0, 8.0, 11.0, 18.0, 27.0, 26.0, 40.0, 54.0, 101.0, 151.0, 257.0, 417.0, 831.0, 1700.0, 4210.0, 12978.0, 67894.0, 799835.0, 129945.0, 19866.0, 5674.0, 2139.0, 1061.0, 507.0, 298.0, 158.0, 104.0, 61.0, 45.0, 30.0, 14.0, 12.0, 19.0, 8.0, 11.0, 4.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.125, -72.7509765625, -70.376953125, -68.0029296875, -65.62890625, -63.2548828125, -60.880859375, -58.5068359375, -56.1328125, -53.7587890625, -51.384765625, -49.0107421875, -46.63671875, -44.2626953125, -41.888671875, -39.5146484375, -37.140625, -34.7666015625, -32.392578125, -30.0185546875, -27.64453125, -25.2705078125, -22.896484375, -20.5224609375, -18.1484375, -15.7744140625, -13.400390625, -11.0263671875, -8.65234375, -6.2783203125, -3.904296875, -1.5302734375, 0.84375, 3.2177734375, 5.591796875, 7.9658203125, 10.33984375, 12.7138671875, 15.087890625, 17.4619140625, 19.8359375, 22.2099609375, 24.583984375, 26.9580078125, 29.33203125, 31.7060546875, 34.080078125, 36.4541015625, 38.828125, 41.2021484375, 43.576171875, 45.9501953125, 48.32421875, 50.6982421875, 53.072265625, 55.4462890625, 57.8203125, 60.1943359375, 62.568359375, 64.9423828125, 67.31640625, 69.6904296875, 72.064453125, 74.4384765625, 76.8125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 11.0, 8.0, 6.0, 16.0, 26.0, 25.0, 50.0, 68.0, 68.0, 101.0, 131.0, 136.0, 94.0, 69.0, 39.0, 26.0, 21.0, 19.0, 11.0, 6.0, 8.0, 8.0, 12.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.34375, -59.529296875, -57.71484375, -55.900390625, -54.0859375, -52.271484375, -50.45703125, -48.642578125, -46.828125, -45.013671875, -43.19921875, -41.384765625, -39.5703125, -37.755859375, -35.94140625, -34.126953125, -32.3125, -30.498046875, -28.68359375, -26.869140625, -25.0546875, -23.240234375, -21.42578125, -19.611328125, -17.796875, -15.982421875, -14.16796875, -12.353515625, -10.5390625, -8.724609375, -6.91015625, -5.095703125, -3.28125, -1.466796875, 0.34765625, 2.162109375, 3.9765625, 5.791015625, 7.60546875, 9.419921875, 11.234375, 13.048828125, 14.86328125, 16.677734375, 18.4921875, 20.306640625, 22.12109375, 23.935546875, 25.75, 27.564453125, 29.37890625, 31.193359375, 33.0078125, 34.822265625, 36.63671875, 38.451171875, 40.265625, 42.080078125, 43.89453125, 45.708984375, 47.5234375, 49.337890625, 51.15234375, 52.966796875, 54.78125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 9.0, 25.0, 110.0, 533.0, 269.0, 38.0, 15.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-933.4581909179688, -812.8829956054688, -692.3077392578125, -571.7325439453125, -451.1573486328125, -330.5821533203125, -210.00689697265625, -89.43170166015625, 31.14349365234375, 151.7187042236328, 272.2939147949219, 392.869140625, 513.4443359375, 634.01953125, 754.5947875976562, 875.1699829101562, 995.7451782226562, 1116.3204345703125, 1236.8956298828125, 1357.4708251953125, 1478.0460205078125, 1598.6212158203125, 1719.196533203125, 1839.771728515625, 1960.346923828125, 2080.922119140625, 2201.497314453125, 2322.072509765625, 2442.647705078125, 2563.222900390625, 2683.79833984375, 2804.37353515625, 2924.94873046875, 3045.52392578125, 3166.09912109375, 3286.67431640625, 3407.24951171875, 3527.82470703125, 3648.39990234375, 3768.97509765625, 3889.55029296875, 4010.12548828125, 4130.70068359375, 4251.27587890625, 4371.85107421875, 4492.42626953125, 4613.00146484375, 4733.57666015625, 4854.15234375, 4974.7275390625, 5095.302734375, 5215.8779296875, 5336.453125, 5457.0283203125, 5577.603515625, 5698.1787109375, 5818.75390625, 5939.3291015625, 6059.904296875, 6180.4794921875, 6301.0546875, 6421.6298828125, 6542.205078125, 6662.7802734375, 6783.35546875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 10.0, 6.0, 10.0, 6.0, 12.0, 13.0, 19.0, 23.0, 12.0, 24.0, 36.0, 34.0, 32.0, 29.0, 53.0, 63.0, 92.0, 104.0, 76.0, 37.0, 39.0, 26.0, 31.0, 19.0, 25.0, 26.0, 21.0, 17.0, 13.0, 13.0, 12.0, 14.0, 10.0, 7.0, 4.0, 1.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1055.872802734375, -1024.9217529296875, -993.9706420898438, -963.01953125, -932.0684204101562, -901.1173706054688, -870.166259765625, -839.2152099609375, -808.2640991210938, -777.31298828125, -746.3619384765625, -715.4108276367188, -684.459716796875, -653.5086669921875, -622.5575561523438, -591.6064453125, -560.6553955078125, -529.7042846679688, -498.7532043457031, -467.8021240234375, -436.8510437011719, -405.89996337890625, -374.9488525390625, -343.9977722167969, -313.046630859375, -282.0955505371094, -251.1444549560547, -220.193359375, -189.24227905273438, -158.2911834716797, -127.340087890625, -96.38900756835938, -65.43792724609375, -34.486839294433594, -3.535747528076172, 27.41534423828125, 58.366432189941406, 89.31752014160156, 120.26861572265625, 151.21969604492188, 182.17079162597656, 213.12188720703125, 244.07296752929688, 275.0240478515625, 305.97515869140625, 336.9262390136719, 367.8773193359375, 398.82843017578125, 429.7795104980469, 460.7305908203125, 491.68170166015625, 522.6328125, 553.5838623046875, 584.5349731445312, 615.486083984375, 646.4371337890625, 677.3882446289062, 708.33935546875, 739.2904052734375, 770.2415161132812, 801.192626953125, 832.1436767578125, 863.0947875976562, 894.0458984375, 924.9969482421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 12.0, 6.0, 9.0, 8.0, 4.0, 12.0, 21.0, 18.0, 32.0, 29.0, 63.0, 90.0, 124.0, 229.0, 509.0, 1177.0, 4040.0, 28972.0, 3040370.0, 1096719.0, 16536.0, 3125.0, 1036.0, 466.0, 233.0, 129.0, 91.0, 53.0, 40.0, 30.0, 18.0, 9.0, 12.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-182.625, -175.294921875, -167.96484375, -160.634765625, -153.3046875, -145.974609375, -138.64453125, -131.314453125, -123.984375, -116.654296875, -109.32421875, -101.994140625, -94.6640625, -87.333984375, -80.00390625, -72.673828125, -65.34375, -58.013671875, -50.68359375, -43.353515625, -36.0234375, -28.693359375, -21.36328125, -14.033203125, -6.703125, 0.626953125, 7.95703125, 15.287109375, 22.6171875, 29.947265625, 37.27734375, 44.607421875, 51.9375, 59.267578125, 66.59765625, 73.927734375, 81.2578125, 88.587890625, 95.91796875, 103.248046875, 110.578125, 117.908203125, 125.23828125, 132.568359375, 139.8984375, 147.228515625, 154.55859375, 161.888671875, 169.21875, 176.548828125, 183.87890625, 191.208984375, 198.5390625, 205.869140625, 213.19921875, 220.529296875, 227.859375, 235.189453125, 242.51953125, 249.849609375, 257.1796875, 264.509765625, 271.83984375, 279.169921875, 286.5]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 15.0, 19.0, 24.0, 32.0, 42.0, 37.0, 49.0, 32.0, 40.0, 45.0, 41.0, 56.0, 56.0, 50.0, 65.0, 35.0, 48.0, 53.0, 26.0, 38.0, 21.0, 17.0, 13.0, 12.0, 16.0, 10.0, 15.0, 7.0, 15.0, 2.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.375, -56.4384765625, -54.501953125, -52.5654296875, -50.62890625, -48.6923828125, -46.755859375, -44.8193359375, -42.8828125, -40.9462890625, -39.009765625, -37.0732421875, -35.13671875, -33.2001953125, -31.263671875, -29.3271484375, -27.390625, -25.4541015625, -23.517578125, -21.5810546875, -19.64453125, -17.7080078125, -15.771484375, -13.8349609375, -11.8984375, -9.9619140625, -8.025390625, -6.0888671875, -4.15234375, -2.2158203125, -0.279296875, 1.6572265625, 3.59375, 5.5302734375, 7.466796875, 9.4033203125, 11.33984375, 13.2763671875, 15.212890625, 17.1494140625, 19.0859375, 21.0224609375, 22.958984375, 24.8955078125, 26.83203125, 28.7685546875, 30.705078125, 32.6416015625, 34.578125, 36.5146484375, 38.451171875, 40.3876953125, 42.32421875, 44.2607421875, 46.197265625, 48.1337890625, 50.0703125, 52.0068359375, 53.943359375, 55.8798828125, 57.81640625, 59.7529296875, 61.689453125, 63.6259765625, 65.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 12.0, 11.0, 23.0, 23.0, 55.0, 83.0, 184.0, 468.0, 2894.0, 64541.0, 4115822.0, 8744.0, 970.0, 216.0, 88.0, 59.0, 34.0, 28.0, 10.0, 11.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-869.5, -844.828125, -820.15625, -795.484375, -770.8125, -746.140625, -721.46875, -696.796875, -672.125, -647.453125, -622.78125, -598.109375, -573.4375, -548.765625, -524.09375, -499.421875, -474.75, -450.078125, -425.40625, -400.734375, -376.0625, -351.390625, -326.71875, -302.046875, -277.375, -252.703125, -228.03125, -203.359375, -178.6875, -154.015625, -129.34375, -104.671875, -80.0, -55.328125, -30.65625, -5.984375, 18.6875, 43.359375, 68.03125, 92.703125, 117.375, 142.046875, 166.71875, 191.390625, 216.0625, 240.734375, 265.40625, 290.078125, 314.75, 339.421875, 364.09375, 388.765625, 413.4375, 438.109375, 462.78125, 487.453125, 512.125, 536.796875, 561.46875, 586.140625, 610.8125, 635.484375, 660.15625, 684.828125, 709.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 15.0, 22.0, 48.0, 119.0, 587.0, 2089.0, 840.0, 200.0, 52.0, 29.0, 15.0, 16.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-516.0, -504.935546875, -493.87109375, -482.806640625, -471.7421875, -460.677734375, -449.61328125, -438.548828125, -427.484375, -416.419921875, -405.35546875, -394.291015625, -383.2265625, -372.162109375, -361.09765625, -350.033203125, -338.96875, -327.904296875, -316.83984375, -305.775390625, -294.7109375, -283.646484375, -272.58203125, -261.517578125, -250.453125, -239.388671875, -228.32421875, -217.259765625, -206.1953125, -195.130859375, -184.06640625, -173.001953125, -161.9375, -150.873046875, -139.80859375, -128.744140625, -117.6796875, -106.615234375, -95.55078125, -84.486328125, -73.421875, -62.357421875, -51.29296875, -40.228515625, -29.1640625, -18.099609375, -7.03515625, 4.029296875, 15.09375, 26.158203125, 37.22265625, 48.287109375, 59.3515625, 70.416015625, 81.48046875, 92.544921875, 103.609375, 114.673828125, 125.73828125, 136.802734375, 147.8671875, 158.931640625, 169.99609375, 181.060546875, 192.125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 12.0, 16.0, 32.0, 100.0, 240.0, 381.0, 155.0, 41.0, 9.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5116.96142578125, -5004.3525390625, -4891.744140625, -4779.13525390625, -4666.5263671875, -4553.91748046875, -4441.30908203125, -4328.7001953125, -4216.09130859375, -4103.482421875, -3990.873779296875, -3878.26513671875, -3765.65625, -3653.047607421875, -3540.43896484375, -3427.830078125, -3315.221435546875, -3202.61279296875, -3090.00390625, -2977.395263671875, -2864.786376953125, -2752.177734375, -2639.56884765625, -2526.960205078125, -2414.3515625, -2301.742919921875, -2189.134033203125, -2076.525390625, -1963.91650390625, -1851.307861328125, -1738.6990966796875, -1626.09033203125, -1513.481201171875, -1400.8724365234375, -1288.263671875, -1175.655029296875, -1063.046142578125, -950.4374389648438, -837.8287353515625, -725.219970703125, -612.6112060546875, -500.00244140625, -387.3937072753906, -274.78497314453125, -162.17620849609375, -49.56744384765625, 63.041259765625, 175.6500244140625, 288.2587890625, 400.8675537109375, 513.476318359375, 626.0850219726562, 738.6937866210938, 851.3025512695312, 963.9112548828125, 1076.52001953125, 1189.1287841796875, 1301.737548828125, 1414.3463134765625, 1526.955078125, 1639.563720703125, 1752.172607421875, 1864.78125, 1977.3900146484375, 2089.998779296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 17.0, 17.0, 18.0, 23.0, 27.0, 31.0, 33.0, 42.0, 45.0, 44.0, 56.0, 63.0, 49.0, 56.0, 63.0, 46.0, 40.0, 41.0, 39.0, 41.0, 28.0, 32.0, 19.0, 30.0, 17.0, 13.0, 10.0, 11.0, 8.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-882.3338623046875, -852.0466918945312, -821.7595825195312, -791.472412109375, -761.185302734375, -730.8981323242188, -700.6109619140625, -670.3238525390625, -640.0367431640625, -609.7495727539062, -579.4624633789062, -549.17529296875, -518.88818359375, -488.60101318359375, -458.3138732910156, -428.0267333984375, -397.73956298828125, -367.4524230957031, -337.165283203125, -306.87811279296875, -276.59100341796875, -246.30384826660156, -216.01669311523438, -185.72955322265625, -155.44241333007812, -125.1552734375, -94.86812591552734, -64.58097839355469, -34.29383850097656, -4.0066986083984375, 26.28045654296875, 56.567596435546875, 86.854736328125, 117.14187622070312, 147.42901611328125, 177.71617126464844, 208.00331115722656, 238.2904510498047, 268.5776062011719, 298.86474609375, 329.1518859863281, 359.43902587890625, 389.7261657714844, 420.0133056640625, 450.30047607421875, 480.58758544921875, 510.874755859375, 541.161865234375, 571.4490356445312, 601.7362060546875, 632.0233154296875, 662.3104858398438, 692.5975952148438, 722.884765625, 753.171875, 783.4590454101562, 813.7462158203125, 844.0333862304688, 874.3204956054688, 904.607666015625, 934.894775390625, 965.1819458007812, 995.4691162109375, 1025.7562255859375, 1056.0433349609375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 17.0, 27.0, 44.0, 39.0, 82.0, 132.0, 179.0, 304.0, 489.0, 911.0, 1417.0, 2708.0, 5255.0, 10956.0, 25346.0, 69658.0, 246843.0, 464908.0, 140031.0, 44652.0, 17583.0, 7918.0, 4038.0, 2136.0, 1144.0, 661.0, 373.0, 202.0, 155.0, 110.0, 69.0, 53.0, 32.0, 22.0, 15.0, 10.0, 5.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-114.4375, -110.8935546875, -107.349609375, -103.8056640625, -100.26171875, -96.7177734375, -93.173828125, -89.6298828125, -86.0859375, -82.5419921875, -78.998046875, -75.4541015625, -71.91015625, -68.3662109375, -64.822265625, -61.2783203125, -57.734375, -54.1904296875, -50.646484375, -47.1025390625, -43.55859375, -40.0146484375, -36.470703125, -32.9267578125, -29.3828125, -25.8388671875, -22.294921875, -18.7509765625, -15.20703125, -11.6630859375, -8.119140625, -4.5751953125, -1.03125, 2.5126953125, 6.056640625, 9.6005859375, 13.14453125, 16.6884765625, 20.232421875, 23.7763671875, 27.3203125, 30.8642578125, 34.408203125, 37.9521484375, 41.49609375, 45.0400390625, 48.583984375, 52.1279296875, 55.671875, 59.2158203125, 62.759765625, 66.3037109375, 69.84765625, 73.3916015625, 76.935546875, 80.4794921875, 84.0234375, 87.5673828125, 91.111328125, 94.6552734375, 98.19921875, 101.7431640625, 105.287109375, 108.8310546875, 112.375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 8.0, 10.0, 11.0, 16.0, 21.0, 22.0, 37.0, 28.0, 34.0, 41.0, 54.0, 58.0, 44.0, 58.0, 53.0, 59.0, 66.0, 53.0, 44.0, 51.0, 28.0, 38.0, 24.0, 25.0, 15.0, 11.0, 8.0, 11.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-90.0625, -87.583984375, -85.10546875, -82.626953125, -80.1484375, -77.669921875, -75.19140625, -72.712890625, -70.234375, -67.755859375, -65.27734375, -62.798828125, -60.3203125, -57.841796875, -55.36328125, -52.884765625, -50.40625, -47.927734375, -45.44921875, -42.970703125, -40.4921875, -38.013671875, -35.53515625, -33.056640625, -30.578125, -28.099609375, -25.62109375, -23.142578125, -20.6640625, -18.185546875, -15.70703125, -13.228515625, -10.75, -8.271484375, -5.79296875, -3.314453125, -0.8359375, 1.642578125, 4.12109375, 6.599609375, 9.078125, 11.556640625, 14.03515625, 16.513671875, 18.9921875, 21.470703125, 23.94921875, 26.427734375, 28.90625, 31.384765625, 33.86328125, 36.341796875, 38.8203125, 41.298828125, 43.77734375, 46.255859375, 48.734375, 51.212890625, 53.69140625, 56.169921875, 58.6484375, 61.126953125, 63.60546875, 66.083984375, 68.5625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 11.0, 6.0, 14.0, 23.0, 21.0, 31.0, 36.0, 55.0, 73.0, 132.0, 242.0, 484.0, 1211.0, 3980.0, 20772.0, 389626.0, 603566.0, 21705.0, 4122.0, 1271.0, 495.0, 250.0, 134.0, 78.0, 65.0, 36.0, 24.0, 20.0, 12.0, 7.0, 10.0, 13.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-336.5, -325.98828125, -315.4765625, -304.96484375, -294.453125, -283.94140625, -273.4296875, -262.91796875, -252.40625, -241.89453125, -231.3828125, -220.87109375, -210.359375, -199.84765625, -189.3359375, -178.82421875, -168.3125, -157.80078125, -147.2890625, -136.77734375, -126.265625, -115.75390625, -105.2421875, -94.73046875, -84.21875, -73.70703125, -63.1953125, -52.68359375, -42.171875, -31.66015625, -21.1484375, -10.63671875, -0.125, 10.38671875, 20.8984375, 31.41015625, 41.921875, 52.43359375, 62.9453125, 73.45703125, 83.96875, 94.48046875, 104.9921875, 115.50390625, 126.015625, 136.52734375, 147.0390625, 157.55078125, 168.0625, 178.57421875, 189.0859375, 199.59765625, 210.109375, 220.62109375, 231.1328125, 241.64453125, 252.15625, 262.66796875, 273.1796875, 283.69140625, 294.203125, 304.71484375, 315.2265625, 325.73828125, 336.25]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 5.0, 4.0, 6.0, 7.0, 14.0, 12.0, 10.0, 20.0, 16.0, 23.0, 33.0, 30.0, 37.0, 37.0, 35.0, 46.0, 72.0, 71.0, 58.0, 62.0, 62.0, 52.0, 40.0, 47.0, 29.0, 25.0, 22.0, 13.0, 24.0, 14.0, 14.0, 13.0, 11.0, 6.0, 6.0, 6.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.0, -297.73046875, -287.4609375, -277.19140625, -266.921875, -256.65234375, -246.3828125, -236.11328125, -225.84375, -215.57421875, -205.3046875, -195.03515625, -184.765625, -174.49609375, -164.2265625, -153.95703125, -143.6875, -133.41796875, -123.1484375, -112.87890625, -102.609375, -92.33984375, -82.0703125, -71.80078125, -61.53125, -51.26171875, -40.9921875, -30.72265625, -20.453125, -10.18359375, 0.0859375, 10.35546875, 20.625, 30.89453125, 41.1640625, 51.43359375, 61.703125, 71.97265625, 82.2421875, 92.51171875, 102.78125, 113.05078125, 123.3203125, 133.58984375, 143.859375, 154.12890625, 164.3984375, 174.66796875, 184.9375, 195.20703125, 205.4765625, 215.74609375, 226.015625, 236.28515625, 246.5546875, 256.82421875, 267.09375, 277.36328125, 287.6328125, 297.90234375, 308.171875, 318.44140625, 328.7109375, 338.98046875, 349.25]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 16.0, 33.0, 87.0, 164.0, 345.0, 925.0, 2863.0, 13063.0, 178240.0, 823304.0, 23095.0, 4235.0, 1300.0, 455.0, 187.0, 93.0, 39.0, 26.0, 15.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.125, -125.80859375, -121.4921875, -117.17578125, -112.859375, -108.54296875, -104.2265625, -99.91015625, -95.59375, -91.27734375, -86.9609375, -82.64453125, -78.328125, -74.01171875, -69.6953125, -65.37890625, -61.0625, -56.74609375, -52.4296875, -48.11328125, -43.796875, -39.48046875, -35.1640625, -30.84765625, -26.53125, -22.21484375, -17.8984375, -13.58203125, -9.265625, -4.94921875, -0.6328125, 3.68359375, 8.0, 12.31640625, 16.6328125, 20.94921875, 25.265625, 29.58203125, 33.8984375, 38.21484375, 42.53125, 46.84765625, 51.1640625, 55.48046875, 59.796875, 64.11328125, 68.4296875, 72.74609375, 77.0625, 81.37890625, 85.6953125, 90.01171875, 94.328125, 98.64453125, 102.9609375, 107.27734375, 111.59375, 115.91015625, 120.2265625, 124.54296875, 128.859375, 133.17578125, 137.4921875, 141.80859375, 146.125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 7.0, 20.0, 31.0, 58.0, 162.0, 355.0, 158.0, 75.0, 35.0, 23.0, 6.0, 4.0, 5.0, 8.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0389404296875, -0.03747272491455078, -0.03600502014160156, -0.034537315368652344, -0.033069610595703125, -0.031601905822753906, -0.030134201049804688, -0.02866649627685547, -0.02719879150390625, -0.02573108673095703, -0.024263381958007812, -0.022795677185058594, -0.021327972412109375, -0.019860267639160156, -0.018392562866210938, -0.01692485809326172, -0.0154571533203125, -0.013989448547363281, -0.012521743774414062, -0.011054039001464844, -0.009586334228515625, -0.008118629455566406, -0.0066509246826171875, -0.005183219909667969, -0.00371551513671875, -0.0022478103637695312, -0.0007801055908203125, 0.0006875991821289062, 0.002155303955078125, 0.0036230087280273438, 0.0050907135009765625, 0.006558418273925781, 0.008026123046875, 0.009493827819824219, 0.010961532592773438, 0.012429237365722656, 0.013896942138671875, 0.015364646911621094, 0.016832351684570312, 0.01830005645751953, 0.01976776123046875, 0.02123546600341797, 0.022703170776367188, 0.024170875549316406, 0.025638580322265625, 0.027106285095214844, 0.028573989868164062, 0.03004169464111328, 0.0315093994140625, 0.03297710418701172, 0.03444480895996094, 0.035912513732910156, 0.037380218505859375, 0.038847923278808594, 0.04031562805175781, 0.04178333282470703, 0.04325103759765625, 0.04471874237060547, 0.04618644714355469, 0.047654151916503906, 0.049121856689453125, 0.050589561462402344, 0.05205726623535156, 0.05352497100830078, 0.05499267578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 12.0, 10.0, 18.0, 22.0, 31.0, 57.0, 85.0, 174.0, 346.0, 821.0, 2596.0, 12511.0, 139825.0, 848771.0, 35556.0, 5222.0, 1432.0, 533.0, 231.0, 113.0, 71.0, 36.0, 19.0, 16.0, 14.0, 10.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.1875, -114.2802734375, -110.373046875, -106.4658203125, -102.55859375, -98.6513671875, -94.744140625, -90.8369140625, -86.9296875, -83.0224609375, -79.115234375, -75.2080078125, -71.30078125, -67.3935546875, -63.486328125, -59.5791015625, -55.671875, -51.7646484375, -47.857421875, -43.9501953125, -40.04296875, -36.1357421875, -32.228515625, -28.3212890625, -24.4140625, -20.5068359375, -16.599609375, -12.6923828125, -8.78515625, -4.8779296875, -0.970703125, 2.9365234375, 6.84375, 10.7509765625, 14.658203125, 18.5654296875, 22.47265625, 26.3798828125, 30.287109375, 34.1943359375, 38.1015625, 42.0087890625, 45.916015625, 49.8232421875, 53.73046875, 57.6376953125, 61.544921875, 65.4521484375, 69.359375, 73.2666015625, 77.173828125, 81.0810546875, 84.98828125, 88.8955078125, 92.802734375, 96.7099609375, 100.6171875, 104.5244140625, 108.431640625, 112.3388671875, 116.24609375, 120.1533203125, 124.060546875, 127.9677734375, 131.875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 16.0, 23.0, 19.0, 33.0, 49.0, 58.0, 102.0, 164.0, 159.0, 101.0, 75.0, 49.0, 33.0, 26.0, 13.0, 17.0, 7.0, 9.0, 3.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.439453125, -81.19140625, -77.943359375, -74.6953125, -71.447265625, -68.19921875, -64.951171875, -61.703125, -58.455078125, -55.20703125, -51.958984375, -48.7109375, -45.462890625, -42.21484375, -38.966796875, -35.71875, -32.470703125, -29.22265625, -25.974609375, -22.7265625, -19.478515625, -16.23046875, -12.982421875, -9.734375, -6.486328125, -3.23828125, 0.009765625, 3.2578125, 6.505859375, 9.75390625, 13.001953125, 16.25, 19.498046875, 22.74609375, 25.994140625, 29.2421875, 32.490234375, 35.73828125, 38.986328125, 42.234375, 45.482421875, 48.73046875, 51.978515625, 55.2265625, 58.474609375, 61.72265625, 64.970703125, 68.21875, 71.466796875, 74.71484375, 77.962890625, 81.2109375, 84.458984375, 87.70703125, 90.955078125, 94.203125, 97.451171875, 100.69921875, 103.947265625, 107.1953125, 110.443359375, 113.69140625, 116.939453125, 120.1875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 14.0, 47.0, 288.0, 495.0, 111.0, 36.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5085.96435546875, -4927.49853515625, -4769.03271484375, -4610.56689453125, -4452.10107421875, -4293.63525390625, -4135.16943359375, -3976.70361328125, -3818.23779296875, -3659.77197265625, -3501.30615234375, -3342.84033203125, -3184.37451171875, -3025.90869140625, -2867.44287109375, -2708.97705078125, -2550.510986328125, -2392.045166015625, -2233.579345703125, -2075.113525390625, -1916.647705078125, -1758.181884765625, -1599.7159423828125, -1441.2501220703125, -1282.7843017578125, -1124.3184814453125, -965.8526611328125, -807.3867797851562, -648.9209594726562, -490.45513916015625, -331.9892578125, -173.5234375, -15.0576171875, 143.40821838378906, 301.8740539550781, 460.33990478515625, 618.8057250976562, 777.2715454101562, 935.7374267578125, 1094.2032470703125, 1252.6690673828125, 1411.1348876953125, 1569.6007080078125, 1728.066650390625, 1886.532470703125, 2044.998291015625, 2203.464111328125, 2361.929931640625, 2520.395751953125, 2678.861572265625, 2837.327392578125, 2995.793212890625, 3154.259033203125, 3312.724853515625, 3471.19091796875, 3629.65673828125, 3788.12255859375, 3946.58837890625, 4105.05419921875, 4263.52001953125, 4421.98583984375, 4580.45166015625, 4738.91748046875, 4897.38330078125, 5055.84912109375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 10.0, 11.0, 11.0, 14.0, 12.0, 10.0, 17.0, 28.0, 32.0, 20.0, 33.0, 32.0, 33.0, 46.0, 97.0, 158.0, 108.0, 44.0, 33.0, 29.0, 37.0, 19.0, 23.0, 22.0, 10.0, 12.0, 16.0, 15.0, 6.0, 14.0, 4.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1466.438720703125, -1422.586181640625, -1378.7337646484375, -1334.8812255859375, -1291.02880859375, -1247.17626953125, -1203.3238525390625, -1159.4713134765625, -1115.618896484375, -1071.766357421875, -1027.9139404296875, -984.0614624023438, -940.208984375, -896.3565063476562, -852.5040283203125, -808.6514892578125, -764.7990112304688, -720.946533203125, -677.0940551757812, -633.2415771484375, -589.3890991210938, -545.53662109375, -501.6841125488281, -457.8316345214844, -413.9791564941406, -370.1266784667969, -326.2742004394531, -282.42169189453125, -238.56922912597656, -194.7167510986328, -150.8642578125, -107.01177978515625, -63.1593017578125, -19.306819915771484, 24.54566192626953, 68.39814758300781, 112.25062561035156, 156.1031036376953, 199.95559692382812, 243.80807495117188, 287.6605529785156, 331.5130310058594, 375.3655090332031, 419.218017578125, 463.07049560546875, 506.9229736328125, 550.7754516601562, 594.6279296875, 638.4804077148438, 682.3328857421875, 726.1853637695312, 770.037841796875, 813.8903198242188, 857.7427978515625, 901.5953369140625, 945.44775390625, 989.30029296875, 1033.15283203125, 1077.0052490234375, 1120.8577880859375, 1164.710205078125, 1208.562744140625, 1252.4151611328125, 1296.2677001953125, 1340.1201171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 8.0, 11.0, 28.0, 40.0, 44.0, 86.0, 162.0, 175.0, 338.0, 546.0, 1040.0, 1861.0, 3656.0, 8443.0, 24108.0, 141294.0, 2369234.0, 1504594.0, 104159.0, 20241.0, 7294.0, 3208.0, 1516.0, 853.0, 487.0, 329.0, 161.0, 105.0, 66.0, 40.0, 43.0, 24.0, 20.0, 21.0, 7.0, 6.0, 10.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.125, -190.75, -184.375, -178.0, -171.625, -165.25, -158.875, -152.5, -146.125, -139.75, -133.375, -127.0, -120.625, -114.25, -107.875, -101.5, -95.125, -88.75, -82.375, -76.0, -69.625, -63.25, -56.875, -50.5, -44.125, -37.75, -31.375, -25.0, -18.625, -12.25, -5.875, 0.5, 6.875, 13.25, 19.625, 26.0, 32.375, 38.75, 45.125, 51.5, 57.875, 64.25, 70.625, 77.0, 83.375, 89.75, 96.125, 102.5, 108.875, 115.25, 121.625, 128.0, 134.375, 140.75, 147.125, 153.5, 159.875, 166.25, 172.625, 179.0, 185.375, 191.75, 198.125, 204.5, 210.875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 0.0, 4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 10.0, 9.0, 23.0, 22.0, 29.0, 35.0, 32.0, 45.0, 43.0, 53.0, 44.0, 54.0, 72.0, 48.0, 49.0, 59.0, 49.0, 45.0, 34.0, 39.0, 24.0, 29.0, 20.0, 20.0, 21.0, 12.0, 13.0, 12.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-79.125, -76.7275390625, -74.330078125, -71.9326171875, -69.53515625, -67.1376953125, -64.740234375, -62.3427734375, -59.9453125, -57.5478515625, -55.150390625, -52.7529296875, -50.35546875, -47.9580078125, -45.560546875, -43.1630859375, -40.765625, -38.3681640625, -35.970703125, -33.5732421875, -31.17578125, -28.7783203125, -26.380859375, -23.9833984375, -21.5859375, -19.1884765625, -16.791015625, -14.3935546875, -11.99609375, -9.5986328125, -7.201171875, -4.8037109375, -2.40625, -0.0087890625, 2.388671875, 4.7861328125, 7.18359375, 9.5810546875, 11.978515625, 14.3759765625, 16.7734375, 19.1708984375, 21.568359375, 23.9658203125, 26.36328125, 28.7607421875, 31.158203125, 33.5556640625, 35.953125, 38.3505859375, 40.748046875, 43.1455078125, 45.54296875, 47.9404296875, 50.337890625, 52.7353515625, 55.1328125, 57.5302734375, 59.927734375, 62.3251953125, 64.72265625, 67.1201171875, 69.517578125, 71.9150390625, 74.3125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 16.0, 18.0, 27.0, 55.0, 163.0, 408.0, 1756.0, 269248.0, 3919076.0, 2679.0, 500.0, 196.0, 72.0, 32.0, 21.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1460.0, -1404.0, -1348.0, -1292.0, -1236.0, -1180.0, -1124.0, -1068.0, -1012.0, -956.0, -900.0, -844.0, -788.0, -732.0, -676.0, -620.0, -564.0, -508.0, -452.0, -396.0, -340.0, -284.0, -228.0, -172.0, -116.0, -60.0, -4.0, 52.0, 108.0, 164.0, 220.0, 276.0, 332.0, 388.0, 444.0, 500.0, 556.0, 612.0, 668.0, 724.0, 780.0, 836.0, 892.0, 948.0, 1004.0, 1060.0, 1116.0, 1172.0, 1228.0, 1284.0, 1340.0, 1396.0, 1452.0, 1508.0, 1564.0, 1620.0, 1676.0, 1732.0, 1788.0, 1844.0, 1900.0, 1956.0, 2012.0, 2068.0, 2124.0]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 15.0, 32.0, 63.0, 178.0, 616.0, 2125.0, 694.0, 189.0, 77.0, 46.0, 14.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.5, -270.1484375, -246.796875, -223.4453125, -200.09375, -176.7421875, -153.390625, -130.0390625, -106.6875, -83.3359375, -59.984375, -36.6328125, -13.28125, 10.0703125, 33.421875, 56.7734375, 80.125, 103.4765625, 126.828125, 150.1796875, 173.53125, 196.8828125, 220.234375, 243.5859375, 266.9375, 290.2890625, 313.640625, 336.9921875, 360.34375, 383.6953125, 407.046875, 430.3984375, 453.75, 477.1015625, 500.453125, 523.8046875, 547.15625, 570.5078125, 593.859375, 617.2109375, 640.5625, 663.9140625, 687.265625, 710.6171875, 733.96875, 757.3203125, 780.671875, 804.0234375, 827.375, 850.7265625, 874.078125, 897.4296875, 920.78125, 944.1328125, 967.484375, 990.8359375, 1014.1875, 1037.5390625, 1060.890625, 1084.2421875, 1107.59375, 1130.9453125, 1154.296875, 1177.6484375, 1201.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 9.0, 10.0, 17.0, 35.0, 55.0, 94.0, 181.0, 189.0, 149.0, 94.0, 54.0, 23.0, 31.0, 7.0, 7.0, 7.0, 1.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2762.39892578125, -2664.6455078125, -2566.89208984375, -2469.138427734375, -2371.385009765625, -2273.631591796875, -2175.878173828125, -2078.12451171875, -1980.37109375, -1882.61767578125, -1784.8641357421875, -1687.1107177734375, -1589.357177734375, -1491.603759765625, -1393.850341796875, -1296.0968017578125, -1198.3433837890625, -1100.5899658203125, -1002.83642578125, -905.0830078125, -807.3294677734375, -709.5760498046875, -611.8225708007812, -514.069091796875, -416.31561279296875, -318.5621337890625, -220.8086700439453, -123.05520629882812, -25.301727294921875, 72.45175170898438, 170.2052001953125, 267.95867919921875, 365.712158203125, 463.46563720703125, 561.2191162109375, 658.9725341796875, 756.72607421875, 854.4794921875, 952.2329711914062, 1049.9864501953125, 1147.739990234375, 1245.493408203125, 1343.2469482421875, 1441.0003662109375, 1538.75390625, 1636.50732421875, 1734.2607421875, 1832.0142822265625, 1929.7677001953125, 2027.5211181640625, 2125.274658203125, 2223.028076171875, 2320.781494140625, 2418.53515625, 2516.28857421875, 2614.0419921875, 2711.79541015625, 2809.548828125, 2907.30224609375, 3005.055908203125, 3102.809326171875, 3200.562744140625, 3298.316162109375, 3396.06982421875, 3493.8232421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 18.0, 20.0, 27.0, 37.0, 48.0, 45.0, 52.0, 63.0, 77.0, 90.0, 87.0, 86.0, 51.0, 63.0, 53.0, 39.0, 26.0, 27.0, 21.0, 10.0, 13.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2712.68212890625, -2650.98193359375, -2589.28173828125, -2527.58154296875, -2465.88134765625, -2404.18115234375, -2342.48095703125, -2280.78076171875, -2219.08056640625, -2157.38037109375, -2095.68017578125, -2033.97998046875, -1972.27978515625, -1910.57958984375, -1848.87939453125, -1787.17919921875, -1725.4788818359375, -1663.7786865234375, -1602.0784912109375, -1540.3782958984375, -1478.6781005859375, -1416.9779052734375, -1355.277587890625, -1293.577392578125, -1231.877197265625, -1170.177001953125, -1108.476806640625, -1046.776611328125, -985.076416015625, -923.376220703125, -861.6759643554688, -799.9757690429688, -738.2755126953125, -676.5753173828125, -614.8751220703125, -553.1749267578125, -491.4747009277344, -429.7745056152344, -368.07427978515625, -306.37408447265625, -244.67388916015625, -182.97369384765625, -121.27348327636719, -59.573272705078125, 2.126922607421875, 63.827117919921875, 125.52734375, 187.2275390625, 248.927734375, 310.6279296875, 372.328125, 434.0283508300781, 495.7285461425781, 557.4287109375, 619.1289672851562, 680.8291625976562, 742.5293579101562, 804.2295532226562, 865.9297485351562, 927.6300048828125, 989.3302001953125, 1051.0303955078125, 1112.7305908203125, 1174.4307861328125, 1236.1309814453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 15.0, 20.0, 30.0, 61.0, 75.0, 135.0, 218.0, 357.0, 601.0, 1108.0, 2349.0, 5156.0, 12746.0, 37726.0, 164055.0, 635657.0, 134812.0, 32657.0, 11283.0, 4711.0, 2259.0, 1052.0, 572.0, 346.0, 183.0, 118.0, 88.0, 46.0, 30.0, 26.0, 14.0, 11.0, 7.0, 1.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.125, -163.380859375, -157.63671875, -151.892578125, -146.1484375, -140.404296875, -134.66015625, -128.916015625, -123.171875, -117.427734375, -111.68359375, -105.939453125, -100.1953125, -94.451171875, -88.70703125, -82.962890625, -77.21875, -71.474609375, -65.73046875, -59.986328125, -54.2421875, -48.498046875, -42.75390625, -37.009765625, -31.265625, -25.521484375, -19.77734375, -14.033203125, -8.2890625, -2.544921875, 3.19921875, 8.943359375, 14.6875, 20.431640625, 26.17578125, 31.919921875, 37.6640625, 43.408203125, 49.15234375, 54.896484375, 60.640625, 66.384765625, 72.12890625, 77.873046875, 83.6171875, 89.361328125, 95.10546875, 100.849609375, 106.59375, 112.337890625, 118.08203125, 123.826171875, 129.5703125, 135.314453125, 141.05859375, 146.802734375, 152.546875, 158.291015625, 164.03515625, 169.779296875, 175.5234375, 181.267578125, 187.01171875, 192.755859375, 198.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 11.0, 5.0, 8.0, 15.0, 16.0, 23.0, 27.0, 33.0, 37.0, 52.0, 67.0, 63.0, 77.0, 66.0, 72.0, 68.0, 57.0, 59.0, 36.0, 45.0, 32.0, 29.0, 32.0, 12.0, 9.0, 9.0, 9.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.6875, -115.6728515625, -111.658203125, -107.6435546875, -103.62890625, -99.6142578125, -95.599609375, -91.5849609375, -87.5703125, -83.5556640625, -79.541015625, -75.5263671875, -71.51171875, -67.4970703125, -63.482421875, -59.4677734375, -55.453125, -51.4384765625, -47.423828125, -43.4091796875, -39.39453125, -35.3798828125, -31.365234375, -27.3505859375, -23.3359375, -19.3212890625, -15.306640625, -11.2919921875, -7.27734375, -3.2626953125, 0.751953125, 4.7666015625, 8.78125, 12.7958984375, 16.810546875, 20.8251953125, 24.83984375, 28.8544921875, 32.869140625, 36.8837890625, 40.8984375, 44.9130859375, 48.927734375, 52.9423828125, 56.95703125, 60.9716796875, 64.986328125, 69.0009765625, 73.015625, 77.0302734375, 81.044921875, 85.0595703125, 89.07421875, 93.0888671875, 97.103515625, 101.1181640625, 105.1328125, 109.1474609375, 113.162109375, 117.1767578125, 121.19140625, 125.2060546875, 129.220703125, 133.2353515625, 137.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 11.0, 14.0, 28.0, 35.0, 73.0, 122.0, 221.0, 599.0, 1762.0, 7755.0, 103768.0, 907241.0, 21744.0, 3377.0, 937.0, 372.0, 185.0, 96.0, 61.0, 41.0, 16.0, 16.0, 12.0, 16.0, 5.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-344.25, -332.86328125, -321.4765625, -310.08984375, -298.703125, -287.31640625, -275.9296875, -264.54296875, -253.15625, -241.76953125, -230.3828125, -218.99609375, -207.609375, -196.22265625, -184.8359375, -173.44921875, -162.0625, -150.67578125, -139.2890625, -127.90234375, -116.515625, -105.12890625, -93.7421875, -82.35546875, -70.96875, -59.58203125, -48.1953125, -36.80859375, -25.421875, -14.03515625, -2.6484375, 8.73828125, 20.125, 31.51171875, 42.8984375, 54.28515625, 65.671875, 77.05859375, 88.4453125, 99.83203125, 111.21875, 122.60546875, 133.9921875, 145.37890625, 156.765625, 168.15234375, 179.5390625, 190.92578125, 202.3125, 213.69921875, 225.0859375, 236.47265625, 247.859375, 259.24609375, 270.6328125, 282.01953125, 293.40625, 304.79296875, 316.1796875, 327.56640625, 338.953125, 350.33984375, 361.7265625, 373.11328125, 384.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 7.0, 18.0, 28.0, 33.0, 45.0, 57.0, 69.0, 95.0, 106.0, 118.0, 85.0, 77.0, 55.0, 35.0, 26.0, 23.0, 24.0, 14.0, 17.0, 10.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-562.0, -543.1328125, -524.265625, -505.3984375, -486.53125, -467.6640625, -448.796875, -429.9296875, -411.0625, -392.1953125, -373.328125, -354.4609375, -335.59375, -316.7265625, -297.859375, -278.9921875, -260.125, -241.2578125, -222.390625, -203.5234375, -184.65625, -165.7890625, -146.921875, -128.0546875, -109.1875, -90.3203125, -71.453125, -52.5859375, -33.71875, -14.8515625, 4.015625, 22.8828125, 41.75, 60.6171875, 79.484375, 98.3515625, 117.21875, 136.0859375, 154.953125, 173.8203125, 192.6875, 211.5546875, 230.421875, 249.2890625, 268.15625, 287.0234375, 305.890625, 324.7578125, 343.625, 362.4921875, 381.359375, 400.2265625, 419.09375, 437.9609375, 456.828125, 475.6953125, 494.5625, 513.4296875, 532.296875, 551.1640625, 570.03125, 588.8984375, 607.765625, 626.6328125, 645.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 2.0, 3.0, 8.0, 1.0, 8.0, 6.0, 9.0, 5.0, 14.0, 18.0, 24.0, 28.0, 35.0, 42.0, 40.0, 64.0, 88.0, 150.0, 230.0, 376.0, 560.0, 1153.0, 2390.0, 6038.0, 22219.0, 295903.0, 684150.0, 23211.0, 6295.0, 2501.0, 1211.0, 631.0, 380.0, 232.0, 138.0, 92.0, 66.0, 48.0, 29.0, 34.0, 22.0, 26.0, 17.0, 16.0, 10.0, 12.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-87.375, -84.728515625, -82.08203125, -79.435546875, -76.7890625, -74.142578125, -71.49609375, -68.849609375, -66.203125, -63.556640625, -60.91015625, -58.263671875, -55.6171875, -52.970703125, -50.32421875, -47.677734375, -45.03125, -42.384765625, -39.73828125, -37.091796875, -34.4453125, -31.798828125, -29.15234375, -26.505859375, -23.859375, -21.212890625, -18.56640625, -15.919921875, -13.2734375, -10.626953125, -7.98046875, -5.333984375, -2.6875, -0.041015625, 2.60546875, 5.251953125, 7.8984375, 10.544921875, 13.19140625, 15.837890625, 18.484375, 21.130859375, 23.77734375, 26.423828125, 29.0703125, 31.716796875, 34.36328125, 37.009765625, 39.65625, 42.302734375, 44.94921875, 47.595703125, 50.2421875, 52.888671875, 55.53515625, 58.181640625, 60.828125, 63.474609375, 66.12109375, 68.767578125, 71.4140625, 74.060546875, 76.70703125, 79.353515625, 82.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 8.0, 14.0, 24.0, 79.0, 374.0, 332.0, 87.0, 31.0, 14.0, 5.0, 6.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07928466796875, -0.07654857635498047, -0.07381248474121094, -0.0710763931274414, -0.06834030151367188, -0.06560420989990234, -0.06286811828613281, -0.06013202667236328, -0.05739593505859375, -0.05465984344482422, -0.05192375183105469, -0.049187660217285156, -0.046451568603515625, -0.043715476989746094, -0.04097938537597656, -0.03824329376220703, -0.0355072021484375, -0.03277111053466797, -0.030035018920898438, -0.027298927307128906, -0.024562835693359375, -0.021826744079589844, -0.019090652465820312, -0.01635456085205078, -0.01361846923828125, -0.010882377624511719, -0.008146286010742188, -0.005410194396972656, -0.002674102783203125, 6.198883056640625e-05, 0.0027980804443359375, 0.005534172058105469, 0.008270263671875, 0.011006355285644531, 0.013742446899414062, 0.016478538513183594, 0.019214630126953125, 0.021950721740722656, 0.024686813354492188, 0.02742290496826172, 0.03015899658203125, 0.03289508819580078, 0.03563117980957031, 0.038367271423339844, 0.041103363037109375, 0.043839454650878906, 0.04657554626464844, 0.04931163787841797, 0.0520477294921875, 0.05478382110595703, 0.05751991271972656, 0.060256004333496094, 0.06299209594726562, 0.06572818756103516, 0.06846427917480469, 0.07120037078857422, 0.07393646240234375, 0.07667255401611328, 0.07940864562988281, 0.08214473724365234, 0.08488082885742188, 0.0876169204711914, 0.09035301208496094, 0.09308910369873047, 0.0958251953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 17.0, 17.0, 46.0, 69.0, 112.0, 168.0, 296.0, 668.0, 1489.0, 4207.0, 17133.0, 784495.0, 219667.0, 13861.0, 3604.0, 1277.0, 618.0, 297.0, 162.0, 115.0, 54.0, 48.0, 37.0, 21.0, 18.0, 9.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -85.154296875, -81.87109375, -78.587890625, -75.3046875, -72.021484375, -68.73828125, -65.455078125, -62.171875, -58.888671875, -55.60546875, -52.322265625, -49.0390625, -45.755859375, -42.47265625, -39.189453125, -35.90625, -32.623046875, -29.33984375, -26.056640625, -22.7734375, -19.490234375, -16.20703125, -12.923828125, -9.640625, -6.357421875, -3.07421875, 0.208984375, 3.4921875, 6.775390625, 10.05859375, 13.341796875, 16.625, 19.908203125, 23.19140625, 26.474609375, 29.7578125, 33.041015625, 36.32421875, 39.607421875, 42.890625, 46.173828125, 49.45703125, 52.740234375, 56.0234375, 59.306640625, 62.58984375, 65.873046875, 69.15625, 72.439453125, 75.72265625, 79.005859375, 82.2890625, 85.572265625, 88.85546875, 92.138671875, 95.421875, 98.705078125, 101.98828125, 105.271484375, 108.5546875, 111.837890625, 115.12109375, 118.404296875, 121.6875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 7.0, 16.0, 20.0, 19.0, 14.0, 33.0, 31.0, 50.0, 79.0, 96.0, 117.0, 126.0, 82.0, 63.0, 56.0, 32.0, 22.0, 19.0, 18.0, 7.0, 15.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.9375, -62.671875, -60.40625, -58.140625, -55.875, -53.609375, -51.34375, -49.078125, -46.8125, -44.546875, -42.28125, -40.015625, -37.75, -35.484375, -33.21875, -30.953125, -28.6875, -26.421875, -24.15625, -21.890625, -19.625, -17.359375, -15.09375, -12.828125, -10.5625, -8.296875, -6.03125, -3.765625, -1.5, 0.765625, 3.03125, 5.296875, 7.5625, 9.828125, 12.09375, 14.359375, 16.625, 18.890625, 21.15625, 23.421875, 25.6875, 27.953125, 30.21875, 32.484375, 34.75, 37.015625, 39.28125, 41.546875, 43.8125, 46.078125, 48.34375, 50.609375, 52.875, 55.140625, 57.40625, 59.671875, 61.9375, 64.203125, 66.46875, 68.734375, 71.0, 73.265625, 75.53125, 77.796875, 80.0625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 21.0, 47.0, 269.0, 502.0, 91.0, 30.0, 16.0, 11.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1244.56787109375, -1107.2962646484375, -970.0245361328125, -832.7529296875, -695.4812622070312, -558.2095947265625, -420.93798828125, -283.66632080078125, -146.3946533203125, -9.123001098632812, 128.14865112304688, 265.4202880859375, 402.69195556640625, 539.963623046875, 677.2352294921875, 814.5068969726562, 951.778564453125, 1089.0501708984375, 1226.3218994140625, 1363.593505859375, 1500.865234375, 1638.1368408203125, 1775.408447265625, 1912.68017578125, 2049.95166015625, 2187.223388671875, 2324.494873046875, 2461.7666015625, 2599.038330078125, 2736.31005859375, 2873.58154296875, 3010.853271484375, 3148.125, 3285.396728515625, 3422.668212890625, 3559.93994140625, 3697.211669921875, 3834.4833984375, 3971.7548828125, 4109.0263671875, 4246.29833984375, 4383.56982421875, 4520.841796875, 4658.11328125, 4795.384765625, 4932.65673828125, 5069.92822265625, 5207.19970703125, 5344.4716796875, 5481.7431640625, 5619.01513671875, 5756.28662109375, 5893.55810546875, 6030.830078125, 6168.1015625, 6305.373046875, 6442.64453125, 6579.916015625, 6717.18798828125, 6854.45947265625, 6991.73095703125, 7129.0029296875, 7266.2744140625, 7403.5458984375, 7540.81787109375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 9.0, 11.0, 15.0, 24.0, 21.0, 29.0, 35.0, 31.0, 37.0, 215.0, 255.0, 58.0, 37.0, 33.0, 26.0, 28.0, 18.0, 17.0, 14.0, 13.0, 13.0, 11.0, 4.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1884.7779541015625, -1826.2215576171875, -1767.6651611328125, -1709.1087646484375, -1650.5523681640625, -1591.995849609375, -1533.439453125, -1474.883056640625, -1416.32666015625, -1357.770263671875, -1299.2138671875, -1240.657470703125, -1182.10107421875, -1123.544677734375, -1064.98828125, -1006.4317626953125, -947.8754272460938, -889.3190307617188, -830.7626342773438, -772.2061767578125, -713.6497802734375, -655.0933837890625, -596.5369873046875, -537.9805908203125, -479.4241638183594, -420.8677673339844, -362.31134033203125, -303.75494384765625, -245.1985321044922, -186.64212036132812, -128.08572387695312, -69.529296875, -10.972900390625, 47.5835075378418, 106.1399154663086, 164.69631958007812, 223.2527313232422, 281.80914306640625, 340.36553955078125, 398.9219665527344, 457.4783630371094, 516.0347900390625, 574.5911865234375, 633.1475830078125, 691.7039794921875, 750.2603759765625, 808.8167724609375, 867.3732299804688, 925.9296264648438, 984.4860229492188, 1043.04248046875, 1101.598876953125, 1160.1552734375, 1218.711669921875, 1277.26806640625, 1335.824462890625, 1394.380859375, 1452.937255859375, 1511.49365234375, 1570.050048828125, 1628.6064453125, 1687.162841796875, 1745.71923828125, 1804.2757568359375, 1862.8321533203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 7.0, 5.0, 13.0, 9.0, 12.0, 11.0, 12.0, 13.0, 26.0, 28.0, 34.0, 45.0, 48.0, 131.0, 211.0, 100.0, 51.0, 33.0, 34.0, 25.0, 19.0, 22.0, 15.0, 15.0, 11.0, 11.0, 6.0, 8.0, 7.0, 5.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-117.3125, -113.888671875, -110.46484375, -107.041015625, -103.6171875, -100.193359375, -96.76953125, -93.345703125, -89.921875, -86.498046875, -83.07421875, -79.650390625, -76.2265625, -72.802734375, -69.37890625, -65.955078125, -62.53125, -59.107421875, -55.68359375, -52.259765625, -48.8359375, -45.412109375, -41.98828125, -38.564453125, -35.140625, -31.716796875, -28.29296875, -24.869140625, -21.4453125, -18.021484375, -14.59765625, -11.173828125, -7.75, -4.326171875, -0.90234375, 2.521484375, 5.9453125, 9.369140625, 12.79296875, 16.216796875, 19.640625, 23.064453125, 26.48828125, 29.912109375, 33.3359375, 36.759765625, 40.18359375, 43.607421875, 47.03125, 50.455078125, 53.87890625, 57.302734375, 60.7265625, 64.150390625, 67.57421875, 70.998046875, 74.421875, 77.845703125, 81.26953125, 84.693359375, 88.1171875, 91.541015625, 94.96484375, 98.388671875, 101.8125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 16.0, 18.0, 21.0, 40.0, 69.0, 212.0, 755.0, 5946.0, 8367471.0, 12405.0, 1124.0, 227.0, 122.0, 49.0, 20.0, 16.0, 19.0, 6.0, 2.0, 1.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1390.2318115234375, -1335.9791259765625, -1281.726318359375, -1227.4736328125, -1173.220947265625, -1118.96826171875, -1064.715576171875, -1010.4627685546875, -956.2100830078125, -901.9573974609375, -847.7046508789062, -793.451904296875, -739.19921875, -684.946533203125, -630.6937866210938, -576.4410400390625, -522.1883544921875, -467.9356384277344, -413.68292236328125, -359.4302062988281, -305.177490234375, -250.92477416992188, -196.67205810546875, -142.41934204101562, -88.1666259765625, -33.913909912109375, 20.33880615234375, 74.59152221679688, 128.84423828125, 183.09695434570312, 237.34967041015625, 291.6023864746094, 345.855224609375, 400.1079406738281, 454.36065673828125, 508.6133728027344, 562.8660888671875, 617.1187744140625, 671.3715209960938, 725.624267578125, 779.876953125, 834.129638671875, 888.3823852539062, 942.6351318359375, 996.8878173828125, 1051.1405029296875, 1105.393310546875, 1159.64599609375, 1213.898681640625, 1268.1513671875, 1322.404052734375, 1376.6568603515625, 1430.9095458984375, 1485.1622314453125, 1539.4150390625, 1593.667724609375, 1647.92041015625, 1702.173095703125, 1756.42578125, 1810.6785888671875, 1864.9312744140625, 1919.1839599609375, 1973.436767578125, 2027.689453125, 2081.942138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1213.4683837890625, -1177.4456787109375, -1141.423095703125, -1105.400390625, -1069.377685546875, -1033.35498046875, -997.3323364257812, -961.3096923828125, -925.2869873046875, -889.2642822265625, -853.2416381835938, -817.218994140625, -781.1962890625, -745.173583984375, -709.1509399414062, -673.1282958984375, -637.1055908203125, -601.0828857421875, -565.0602416992188, -529.03759765625, -493.014892578125, -456.9922180175781, -420.96954345703125, -384.9468688964844, -348.9241943359375, -312.9015197753906, -276.87884521484375, -240.85617065429688, -204.83349609375, -168.81082153320312, -132.78814697265625, -96.76547241210938, -60.74267578125, -24.720001220703125, 11.30267333984375, 47.325347900390625, 83.3480224609375, 119.37069702148438, 155.39337158203125, 191.41604614257812, 227.438720703125, 263.4613952636719, 299.48406982421875, 335.5067443847656, 371.5294189453125, 407.5520935058594, 443.57476806640625, 479.5974426269531, 515.6201171875, 551.642822265625, 587.6654663085938, 623.6881103515625, 659.7108154296875, 695.7335205078125, 731.7561645507812, 767.77880859375, 803.801513671875, 839.82421875, 875.8468627929688, 911.8695068359375, 947.8922119140625, 983.9149169921875, 1019.9375610351562, 1055.960205078125, 1091.98291015625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 14.0, 16.0, 32.0, 48.0, 49.0, 79.0, 90.0, 100.0, 94.0, 94.0, 71.0, 92.0, 54.0, 53.0, 32.0, 27.0, 18.0, 14.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-102.8125, -100.34814453125, -97.8837890625, -95.41943359375, -92.955078125, -90.49072265625, -88.0263671875, -85.56201171875, -83.09765625, -80.63330078125, -78.1689453125, -75.70458984375, -73.240234375, -70.77587890625, -68.3115234375, -65.84716796875, -63.3828125, -60.91845703125, -58.4541015625, -55.98974609375, -53.525390625, -51.06103515625, -48.5966796875, -46.13232421875, -43.66796875, -41.20361328125, -38.7392578125, -36.27490234375, -33.810546875, -31.34619140625, -28.8818359375, -26.41748046875, -23.953125, -21.48876953125, -19.0244140625, -16.56005859375, -14.095703125, -11.63134765625, -9.1669921875, -6.70263671875, -4.23828125, -1.77392578125, 0.6904296875, 3.15478515625, 5.619140625, 8.08349609375, 10.5478515625, 13.01220703125, 15.4765625, 17.94091796875, 20.4052734375, 22.86962890625, 25.333984375, 27.79833984375, 30.2626953125, 32.72705078125, 35.19140625, 37.65576171875, 40.1201171875, 42.58447265625, 45.048828125, 47.51318359375, 49.9775390625, 52.44189453125, 54.90625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 13.0, 11.0, 15.0, 24.0, 31.0, 42.0, 78.0, 105.0, 163.0, 250.0, 459.0, 807.0, 1591.0, 3365.0, 8117.0, 24160.0, 97692.0, 261570.0, 89405.0, 22870.0, 7225.0, 3026.0, 1359.0, 734.0, 415.0, 256.0, 154.0, 118.0, 69.0, 49.0, 32.0, 19.0, 13.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-684.0, -656.046875, -628.09375, -600.140625, -572.1875, -544.234375, -516.28125, -488.328125, -460.375, -432.421875, -404.46875, -376.515625, -348.5625, -320.609375, -292.65625, -264.703125, -236.75, -208.796875, -180.84375, -152.890625, -124.9375, -96.984375, -69.03125, -41.078125, -13.125, 14.828125, 42.78125, 70.734375, 98.6875, 126.640625, 154.59375, 182.546875, 210.5, 238.453125, 266.40625, 294.359375, 322.3125, 350.265625, 378.21875, 406.171875, 434.125, 462.078125, 490.03125, 517.984375, 545.9375, 573.890625, 601.84375, 629.796875, 657.75, 685.703125, 713.65625, 741.609375, 769.5625, 797.515625, 825.46875, 853.421875, 881.375, 909.328125, 937.28125, 965.234375, 993.1875, 1021.140625, 1049.09375, 1077.046875, 1105.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 7.0, 7.0, 13.0, 14.0, 16.0, 22.0, 19.0, 25.0, 37.0, 41.0, 45.0, 54.0, 54.0, 72.0, 73.0, 70.0, 54.0, 59.0, 59.0, 49.0, 29.0, 40.0, 29.0, 17.0, 13.0, 22.0, 12.0, 13.0, 3.0, 4.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.6875, -91.1787109375, -87.669921875, -84.1611328125, -80.65234375, -77.1435546875, -73.634765625, -70.1259765625, -66.6171875, -63.1083984375, -59.599609375, -56.0908203125, -52.58203125, -49.0732421875, -45.564453125, -42.0556640625, -38.546875, -35.0380859375, -31.529296875, -28.0205078125, -24.51171875, -21.0029296875, -17.494140625, -13.9853515625, -10.4765625, -6.9677734375, -3.458984375, 0.0498046875, 3.55859375, 7.0673828125, 10.576171875, 14.0849609375, 17.59375, 21.1025390625, 24.611328125, 28.1201171875, 31.62890625, 35.1376953125, 38.646484375, 42.1552734375, 45.6640625, 49.1728515625, 52.681640625, 56.1904296875, 59.69921875, 63.2080078125, 66.716796875, 70.2255859375, 73.734375, 77.2431640625, 80.751953125, 84.2607421875, 87.76953125, 91.2783203125, 94.787109375, 98.2958984375, 101.8046875, 105.3134765625, 108.822265625, 112.3310546875, 115.83984375, 119.3486328125, 122.857421875, 126.3662109375, 129.875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 24.0, 30.0, 62.0, 79.0, 89.0, 52.0, 37.0, 28.0, 27.0, 10.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-871.1535034179688, -844.0928344726562, -817.0321655273438, -789.971435546875, -762.9107666015625, -735.85009765625, -708.7894287109375, -681.728759765625, -654.6680908203125, -627.607421875, -600.5467529296875, -573.486083984375, -546.4253540039062, -519.3646850585938, -492.30401611328125, -465.24334716796875, -438.1826171875, -411.1219482421875, -384.0612487792969, -357.0005798339844, -329.93988037109375, -302.87921142578125, -275.81854248046875, -248.7578582763672, -221.69717407226562, -194.63648986816406, -167.5758056640625, -140.51513671875, -113.45445251464844, -86.39376831054688, -59.333099365234375, -32.27241516113281, -5.2117919921875, 21.848888397216797, 48.909568786621094, 75.97024536132812, 103.03092956542969, 130.09161376953125, 157.15228271484375, 184.2129669189453, 211.27365112304688, 238.33433532714844, 265.39501953125, 292.4556884765625, 319.516357421875, 346.5770568847656, 373.6377258300781, 400.69842529296875, 427.75909423828125, 454.81976318359375, 481.8804626464844, 508.9411315917969, 536.0018310546875, 563.0625, 590.1231689453125, 617.183837890625, 644.2445068359375, 671.30517578125, 698.3658447265625, 725.426513671875, 752.4872436523438, 779.5479125976562, 806.6085815429688, 833.6692504882812, 860.72998046875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 11.0, 20.0, 37.0, 91.0, 82.0, 76.0, 46.0, 23.0, 17.0, 4.0, 9.0, 7.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-685.730712890625, -663.8141479492188, -641.8975830078125, -619.98095703125, -598.0643920898438, -576.1478271484375, -554.231201171875, -532.3146362304688, -510.3980712890625, -488.48150634765625, -466.5649108886719, -444.6483154296875, -422.73175048828125, -400.815185546875, -378.8985900878906, -356.98199462890625, -335.0654296875, -313.14886474609375, -291.2322692871094, -269.315673828125, -247.39910888671875, -225.48252868652344, -203.56594848632812, -181.6493682861328, -159.7327880859375, -137.8162078857422, -115.89962768554688, -93.98304748535156, -72.06646728515625, -50.14988708496094, -28.233306884765625, -6.3167266845703125, 15.599853515625, 37.51643371582031, 59.433013916015625, 81.34959411621094, 103.26617431640625, 125.18275451660156, 147.09933471679688, 169.0159149169922, 190.9324951171875, 212.8490753173828, 234.76565551757812, 256.6822509765625, 278.59881591796875, 300.515380859375, 322.4319763183594, 344.34857177734375, 366.26513671875, 388.18170166015625, 410.0982971191406, 432.014892578125, 453.93145751953125, 475.8480224609375, 497.7646179199219, 519.6812133789062, 541.5977783203125, 563.5143432617188, 585.430908203125, 607.3475341796875, 629.2640991210938, 651.1806640625, 673.0972900390625, 695.0138549804688, 716.930419921875]}, "eval/loss": 2.1931169033050537, "eval/wer": 0.34303847679492266, "eval/runtime": 642.668, "eval/samples_per_second": 4.111, "eval/steps_per_second": 0.515} \ No newline at end of file