{"train/loss": 0.0371, "train/learning_rate": 1.164e-05, "train/epoch": 0.87, "train/global_step": 194, "_runtime": 4382, "_timestamp": 1648414854, "_step": 193, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 12.0, 37.0, 75.0, 153.0, 273.0, 233.0, 115.0, 47.0, 26.0, 19.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.415894508361816, -4.075726509094238, -3.7355589866638184, -3.3953909873962402, -3.055223226547241, -2.715055465698242, -2.374887466430664, -2.034719705581665, -1.694551944732666, -1.354384183883667, -1.0142163038253784, -0.6740484237670898, -0.3338806629180908, 0.006287097930908203, 0.34645509719848633, 0.6866228580474854, 1.0267906188964844, 1.3669583797454834, 1.707126259803772, 2.0472941398620605, 2.3874619007110596, 2.7276296615600586, 3.0677976608276367, 3.4079654216766357, 3.7481331825256348, 4.088301181793213, 4.428468704223633, 4.768636703491211, 5.108804702758789, 5.448972225189209, 5.789140224456787, 6.129307746887207, 6.469474792480469, 6.809642791748047, 7.149810314178467, 7.489978313446045, 7.830145835876465, 8.170313835144043, 8.510481834411621, 8.8506498336792, 9.190816879272461, 9.530984878540039, 9.871152877807617, 10.211320877075195, 10.551487922668457, 10.891655921936035, 11.231823921203613, 11.571991920471191, 11.91215991973877, 12.252327919006348, 12.592495918273926, 12.932662963867188, 13.272830963134766, 13.612998962402344, 13.953166961669922, 14.2933349609375, 14.633502960205078, 14.973670959472656, 15.313838958740234, 15.654006958007812, 15.994174003601074, 16.33434295654297, 16.674510955810547, 17.014677047729492, 17.35484504699707]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 11.0, 10.0, 15.0, 8.0, 17.0, 17.0, 27.0, 24.0, 29.0, 38.0, 29.0, 37.0, 34.0, 29.0, 42.0, 34.0, 39.0, 30.0, 53.0, 47.0, 30.0, 41.0, 30.0, 39.0, 35.0, 34.0, 22.0, 24.0, 22.0, 15.0, 13.0, 18.0, 13.0, 15.0, 11.0, 6.0, 6.0, 13.0, 9.0, 5.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.907078742980957, -3.7852444648742676, -3.6634104251861572, -3.5415761470794678, -3.4197421073913574, -3.297907829284668, -3.1760735511779785, -3.054239511489868, -2.932405471801758, -2.8105711936950684, -2.688737154006958, -2.5669028759002686, -2.445068836212158, -2.3232345581054688, -2.2014002799987793, -2.079566240310669, -1.9577319622039795, -1.8358978033065796, -1.7140636444091797, -1.5922293663024902, -1.4703953266143799, -1.3485610485076904, -1.2267268896102905, -1.1048927307128906, -0.9830585718154907, -0.8612244129180908, -0.7393902540206909, -0.6175560355186462, -0.49572187662124634, -0.37388771772384644, -0.25205349922180176, -0.13021934032440186, -0.008385419845581055, 0.11344875395298004, 0.23528292775154114, 0.3571171164512634, 0.47895127534866333, 0.6007854342460632, 0.7226196527481079, 0.8444538116455078, 0.9662879705429077, 1.0881221294403076, 1.2099562883377075, 1.3317904472351074, 1.4536247253417969, 1.5754587650299072, 1.6972930431365967, 1.8191272020339966, 1.9409613609313965, 2.062795639038086, 2.1846296787261963, 2.3064639568328857, 2.428297996520996, 2.5501322746276855, 2.671966552734375, 2.7938005924224854, 2.9156346321105957, 3.037468910217285, 3.1593029499053955, 3.281137228012085, 3.4029712677001953, 3.5248055458068848, 3.646639823913574, 3.7684738636016846, 3.890308141708374]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 15.0, 17.0, 21.0, 23.0, 55.0, 60.0, 76.0, 124.0, 169.0, 224.0, 386.0, 569.0, 914.0, 1486.0, 2985.0, 6784.0, 24148.0, 119710.0, 662048.0, 2676039.0, 574168.0, 93050.0, 18568.0, 5714.0, 2645.0, 1505.0, 883.0, 610.0, 377.0, 244.0, 198.0, 120.0, 91.0, 69.0, 51.0, 27.0, 26.0, 26.0, 11.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.267578125, -7.99609375, -7.724609375, -7.453125, -7.181640625, -6.91015625, -6.638671875, -6.3671875, -6.095703125, -5.82421875, -5.552734375, -5.28125, -5.009765625, -4.73828125, -4.466796875, -4.1953125, -3.923828125, -3.65234375, -3.380859375, -3.109375, -2.837890625, -2.56640625, -2.294921875, -2.0234375, -1.751953125, -1.48046875, -1.208984375, -0.9375, -0.666015625, -0.39453125, -0.123046875, 0.1484375, 0.419921875, 0.69140625, 0.962890625, 1.234375, 1.505859375, 1.77734375, 2.048828125, 2.3203125, 2.591796875, 2.86328125, 3.134765625, 3.40625, 3.677734375, 3.94921875, 4.220703125, 4.4921875, 4.763671875, 5.03515625, 5.306640625, 5.578125, 5.849609375, 6.12109375, 6.392578125, 6.6640625, 6.935546875, 7.20703125, 7.478515625, 7.75, 8.021484375, 8.29296875, 8.564453125, 8.8359375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 17.0, 13.0, 28.0, 12.0, 21.0, 26.0, 20.0, 26.0, 28.0, 31.0, 29.0, 39.0, 39.0, 31.0, 42.0, 44.0, 37.0, 40.0, 51.0, 24.0, 47.0, 42.0, 29.0, 26.0, 21.0, 22.0, 23.0, 22.0, 18.0, 10.0, 21.0, 4.0, 13.0, 6.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.1640625, -4.99896240234375, -4.8338623046875, -4.66876220703125, -4.503662109375, -4.33856201171875, -4.1734619140625, -4.00836181640625, -3.84326171875, -3.67816162109375, -3.5130615234375, -3.34796142578125, -3.182861328125, -3.01776123046875, -2.8526611328125, -2.68756103515625, -2.5224609375, -2.35736083984375, -2.1922607421875, -2.02716064453125, -1.862060546875, -1.69696044921875, -1.5318603515625, -1.36676025390625, -1.20166015625, -1.03656005859375, -0.8714599609375, -0.70635986328125, -0.541259765625, -0.37615966796875, -0.2110595703125, -0.04595947265625, 0.119140625, 0.28424072265625, 0.4493408203125, 0.61444091796875, 0.779541015625, 0.94464111328125, 1.1097412109375, 1.27484130859375, 1.43994140625, 1.60504150390625, 1.7701416015625, 1.93524169921875, 2.100341796875, 2.26544189453125, 2.4305419921875, 2.59564208984375, 2.7607421875, 2.92584228515625, 3.0909423828125, 3.25604248046875, 3.421142578125, 3.58624267578125, 3.7513427734375, 3.91644287109375, 4.08154296875, 4.24664306640625, 4.4117431640625, 4.57684326171875, 4.741943359375, 4.90704345703125, 5.0721435546875, 5.23724365234375, 5.40234375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 20.0, 100.0, 1338.0, 4192291.0, 444.0, 71.0, 14.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.375, -158.509765625, -145.64453125, -132.779296875, -119.9140625, -107.048828125, -94.18359375, -81.318359375, -68.453125, -55.587890625, -42.72265625, -29.857421875, -16.9921875, -4.126953125, 8.73828125, 21.603515625, 34.46875, 47.333984375, 60.19921875, 73.064453125, 85.9296875, 98.794921875, 111.66015625, 124.525390625, 137.390625, 150.255859375, 163.12109375, 175.986328125, 188.8515625, 201.716796875, 214.58203125, 227.447265625, 240.3125, 253.177734375, 266.04296875, 278.908203125, 291.7734375, 304.638671875, 317.50390625, 330.369140625, 343.234375, 356.099609375, 368.96484375, 381.830078125, 394.6953125, 407.560546875, 420.42578125, 433.291015625, 446.15625, 459.021484375, 471.88671875, 484.751953125, 497.6171875, 510.482421875, 523.34765625, 536.212890625, 549.078125, 561.943359375, 574.80859375, 587.673828125, 600.5390625, 613.404296875, 626.26953125, 639.134765625, 652.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 59.0, 437.0, 3279.0, 232.0, 43.0, 8.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.6455078125, -4.197265625, -3.7490234375, -3.30078125, -2.8525390625, -2.404296875, -1.9560546875, -1.5078125, -1.0595703125, -0.611328125, -0.1630859375, 0.28515625, 0.7333984375, 1.181640625, 1.6298828125, 2.078125, 2.5263671875, 2.974609375, 3.4228515625, 3.87109375, 4.3193359375, 4.767578125, 5.2158203125, 5.6640625, 6.1123046875, 6.560546875, 7.0087890625, 7.45703125, 7.9052734375, 8.353515625, 8.8017578125, 9.25, 9.6982421875, 10.146484375, 10.5947265625, 11.04296875, 11.4912109375, 11.939453125, 12.3876953125, 12.8359375, 13.2841796875, 13.732421875, 14.1806640625, 14.62890625, 15.0771484375, 15.525390625, 15.9736328125, 16.421875, 16.8701171875, 17.318359375, 17.7666015625, 18.21484375, 18.6630859375, 19.111328125, 19.5595703125, 20.0078125, 20.4560546875, 20.904296875, 21.3525390625, 21.80078125, 22.2490234375, 22.697265625, 23.1455078125, 23.59375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 12.0, 7.0, 12.0, 29.0, 36.0, 43.0, 50.0, 67.0, 81.0, 102.0, 108.0, 103.0, 93.0, 68.0, 54.0, 34.0, 28.0, 18.0, 19.0, 9.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.912460327148438, -8.668784141540527, -8.4251070022583, -8.18143081665039, -7.937754154205322, -7.694077491760254, -7.450401306152344, -7.206724643707275, -6.963047981262207, -6.719371318817139, -6.47569465637207, -6.23201847076416, -5.988341808319092, -5.744665145874023, -5.500988960266113, -5.257312297821045, -5.013635635375977, -4.769958972930908, -4.52628231048584, -4.28260612487793, -4.038929462432861, -3.795252799987793, -3.5515763759613037, -3.3078999519348145, -3.064223289489746, -2.8205466270446777, -2.5768702030181885, -2.333193778991699, -2.089517116546631, -1.845840573310852, -1.6021640300750732, -1.3584874868392944, -1.1148109436035156, -0.8711344003677368, -0.627457857131958, -0.3837813138961792, -0.1401047706604004, 0.10357177257537842, 0.3472483158111572, 0.590924859046936, 0.8346014022827148, 1.0782779455184937, 1.3219544887542725, 1.5656310319900513, 1.80930757522583, 2.0529842376708984, 2.2966606616973877, 2.540337085723877, 2.7840137481689453, 3.0276904106140137, 3.271366834640503, 3.515043258666992, 3.7587199211120605, 4.002396583557129, 4.246072769165039, 4.489749431610107, 4.733426094055176, 4.977102756500244, 5.2207794189453125, 5.464455604553223, 5.708132266998291, 5.951808929443359, 6.1954851150512695, 6.439161777496338, 6.682838439941406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 14.0, 9.0, 15.0, 17.0, 24.0, 24.0, 28.0, 32.0, 37.0, 45.0, 36.0, 45.0, 51.0, 45.0, 44.0, 42.0, 57.0, 54.0, 42.0, 54.0, 43.0, 38.0, 29.0, 27.0, 18.0, 26.0, 16.0, 18.0, 10.0, 13.0, 12.0, 7.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.056798458099365, -4.897091865539551, -4.737384796142578, -4.577678203582764, -4.417971134185791, -4.258264541625977, -4.098557472229004, -3.9388508796691895, -3.779144048690796, -3.6194372177124023, -3.459730386734009, -3.3000235557556152, -3.140316963195801, -2.980609893798828, -2.8209033012390137, -2.66119647026062, -2.5014896392822266, -2.341782808303833, -2.1820759773254395, -2.022369146347046, -1.862662434577942, -1.7029556035995483, -1.5432488918304443, -1.3835420608520508, -1.2238352298736572, -1.0641283988952637, -0.9044216275215149, -0.7447148561477661, -0.5850080251693726, -0.425301194190979, -0.2655944228172302, -0.10588765144348145, 0.05381965637207031, 0.21352645754814148, 0.37323325872421265, 0.5329400300979614, 0.692646861076355, 0.8523536920547485, 1.0120604038238525, 1.171767234802246, 1.3314740657806396, 1.4911808967590332, 1.6508877277374268, 1.8105944395065308, 1.9703012704849243, 2.1300082206726074, 2.289714813232422, 2.4494216442108154, 2.609128475189209, 2.7688353061676025, 2.928542137145996, 3.0882489681243896, 3.247955799102783, 3.4076623916625977, 3.567369222640991, 3.7270760536193848, 3.8867828845977783, 4.046489715576172, 4.206196308135986, 4.365903377532959, 4.525609970092773, 4.685317039489746, 4.8450236320495605, 5.004730224609375, 5.164437294006348]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 12.0, 11.0, 15.0, 26.0, 45.0, 77.0, 111.0, 181.0, 289.0, 462.0, 862.0, 1536.0, 2787.0, 5700.0, 11956.0, 25354.0, 60565.0, 150793.0, 332888.0, 264786.0, 108074.0, 44013.0, 19373.0, 8928.0, 4507.0, 2381.0, 1217.0, 681.0, 337.0, 219.0, 136.0, 86.0, 43.0, 27.0, 18.0, 18.0, 8.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.092742919921875, -2.01751708984375, -1.942291259765625, -1.8670654296875, -1.791839599609375, -1.71661376953125, -1.641387939453125, -1.566162109375, -1.490936279296875, -1.41571044921875, -1.340484619140625, -1.2652587890625, -1.190032958984375, -1.11480712890625, -1.039581298828125, -0.96435546875, -0.889129638671875, -0.81390380859375, -0.738677978515625, -0.6634521484375, -0.588226318359375, -0.51300048828125, -0.437774658203125, -0.362548828125, -0.287322998046875, -0.21209716796875, -0.136871337890625, -0.0616455078125, 0.013580322265625, 0.08880615234375, 0.164031982421875, 0.2392578125, 0.314483642578125, 0.38970947265625, 0.464935302734375, 0.5401611328125, 0.615386962890625, 0.69061279296875, 0.765838623046875, 0.841064453125, 0.916290283203125, 0.99151611328125, 1.066741943359375, 1.1419677734375, 1.217193603515625, 1.29241943359375, 1.367645263671875, 1.44287109375, 1.518096923828125, 1.59332275390625, 1.668548583984375, 1.7437744140625, 1.819000244140625, 1.89422607421875, 1.969451904296875, 2.044677734375, 2.119903564453125, 2.19512939453125, 2.270355224609375, 2.3455810546875, 2.420806884765625, 2.49603271484375, 2.571258544921875, 2.646484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 11.0, 12.0, 17.0, 22.0, 22.0, 29.0, 30.0, 30.0, 41.0, 47.0, 36.0, 53.0, 52.0, 41.0, 48.0, 56.0, 47.0, 41.0, 46.0, 46.0, 41.0, 38.0, 27.0, 25.0, 23.0, 18.0, 11.0, 12.0, 5.0, 11.0, 9.0, 9.0, 7.0, 9.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.42578125, -3.323883056640625, -3.22198486328125, -3.120086669921875, -3.0181884765625, -2.916290283203125, -2.81439208984375, -2.712493896484375, -2.610595703125, -2.508697509765625, -2.40679931640625, -2.304901123046875, -2.2030029296875, -2.101104736328125, -1.99920654296875, -1.897308349609375, -1.79541015625, -1.693511962890625, -1.59161376953125, -1.489715576171875, -1.3878173828125, -1.285919189453125, -1.18402099609375, -1.082122802734375, -0.980224609375, -0.878326416015625, -0.77642822265625, -0.674530029296875, -0.5726318359375, -0.470733642578125, -0.36883544921875, -0.266937255859375, -0.1650390625, -0.063140869140625, 0.03875732421875, 0.140655517578125, 0.2425537109375, 0.344451904296875, 0.44635009765625, 0.548248291015625, 0.650146484375, 0.752044677734375, 0.85394287109375, 0.955841064453125, 1.0577392578125, 1.159637451171875, 1.26153564453125, 1.363433837890625, 1.46533203125, 1.567230224609375, 1.66912841796875, 1.771026611328125, 1.8729248046875, 1.974822998046875, 2.07672119140625, 2.178619384765625, 2.280517578125, 2.382415771484375, 2.48431396484375, 2.586212158203125, 2.6881103515625, 2.790008544921875, 2.89190673828125, 2.993804931640625, 3.095703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 13.0, 24.0, 28.0, 47.0, 79.0, 114.0, 186.0, 322.0, 598.0, 1173.0, 2216.0, 5248.0, 13295.0, 42194.0, 174911.0, 523880.0, 209338.0, 48942.0, 14864.0, 5709.0, 2533.0, 1228.0, 664.0, 340.0, 235.0, 109.0, 79.0, 46.0, 35.0, 22.0, 15.0, 18.0, 8.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.416015625, -3.3199462890625, -3.223876953125, -3.1278076171875, -3.03173828125, -2.9356689453125, -2.839599609375, -2.7435302734375, -2.6474609375, -2.5513916015625, -2.455322265625, -2.3592529296875, -2.26318359375, -2.1671142578125, -2.071044921875, -1.9749755859375, -1.87890625, -1.7828369140625, -1.686767578125, -1.5906982421875, -1.49462890625, -1.3985595703125, -1.302490234375, -1.2064208984375, -1.1103515625, -1.0142822265625, -0.918212890625, -0.8221435546875, -0.72607421875, -0.6300048828125, -0.533935546875, -0.4378662109375, -0.341796875, -0.2457275390625, -0.149658203125, -0.0535888671875, 0.04248046875, 0.1385498046875, 0.234619140625, 0.3306884765625, 0.4267578125, 0.5228271484375, 0.618896484375, 0.7149658203125, 0.81103515625, 0.9071044921875, 1.003173828125, 1.0992431640625, 1.1953125, 1.2913818359375, 1.387451171875, 1.4835205078125, 1.57958984375, 1.6756591796875, 1.771728515625, 1.8677978515625, 1.9638671875, 2.0599365234375, 2.156005859375, 2.2520751953125, 2.34814453125, 2.4442138671875, 2.540283203125, 2.6363525390625, 2.732421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 10.0, 12.0, 9.0, 14.0, 18.0, 19.0, 32.0, 31.0, 37.0, 37.0, 36.0, 29.0, 45.0, 47.0, 57.0, 56.0, 47.0, 39.0, 54.0, 40.0, 43.0, 45.0, 37.0, 39.0, 28.0, 23.0, 18.0, 20.0, 12.0, 11.0, 4.0, 10.0, 5.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.7890625, -6.5811767578125, -6.373291015625, -6.1654052734375, -5.95751953125, -5.7496337890625, -5.541748046875, -5.3338623046875, -5.1259765625, -4.9180908203125, -4.710205078125, -4.5023193359375, -4.29443359375, -4.0865478515625, -3.878662109375, -3.6707763671875, -3.462890625, -3.2550048828125, -3.047119140625, -2.8392333984375, -2.63134765625, -2.4234619140625, -2.215576171875, -2.0076904296875, -1.7998046875, -1.5919189453125, -1.384033203125, -1.1761474609375, -0.96826171875, -0.7603759765625, -0.552490234375, -0.3446044921875, -0.13671875, 0.0711669921875, 0.279052734375, 0.4869384765625, 0.69482421875, 0.9027099609375, 1.110595703125, 1.3184814453125, 1.5263671875, 1.7342529296875, 1.942138671875, 2.1500244140625, 2.35791015625, 2.5657958984375, 2.773681640625, 2.9815673828125, 3.189453125, 3.3973388671875, 3.605224609375, 3.8131103515625, 4.02099609375, 4.2288818359375, 4.436767578125, 4.6446533203125, 4.8525390625, 5.0604248046875, 5.268310546875, 5.4761962890625, 5.68408203125, 5.8919677734375, 6.099853515625, 6.3077392578125, 6.515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 10.0, 6.0, 9.0, 14.0, 19.0, 21.0, 30.0, 40.0, 61.0, 99.0, 154.0, 197.0, 298.0, 445.0, 697.0, 1131.0, 1809.0, 2838.0, 5001.0, 9121.0, 17941.0, 45081.0, 161429.0, 549937.0, 165485.0, 45693.0, 18712.0, 9235.0, 5022.0, 2931.0, 1847.0, 1131.0, 677.0, 461.0, 301.0, 210.0, 146.0, 100.0, 62.0, 42.0, 37.0, 19.0, 26.0, 9.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.62890625, -0.610137939453125, -0.59136962890625, -0.572601318359375, -0.5538330078125, -0.535064697265625, -0.51629638671875, -0.497528076171875, -0.478759765625, -0.459991455078125, -0.44122314453125, -0.422454833984375, -0.4036865234375, -0.384918212890625, -0.36614990234375, -0.347381591796875, -0.32861328125, -0.309844970703125, -0.29107666015625, -0.272308349609375, -0.2535400390625, -0.234771728515625, -0.21600341796875, -0.197235107421875, -0.178466796875, -0.159698486328125, -0.14093017578125, -0.122161865234375, -0.1033935546875, -0.084625244140625, -0.06585693359375, -0.047088623046875, -0.0283203125, -0.009552001953125, 0.00921630859375, 0.027984619140625, 0.0467529296875, 0.065521240234375, 0.08428955078125, 0.103057861328125, 0.121826171875, 0.140594482421875, 0.15936279296875, 0.178131103515625, 0.1968994140625, 0.215667724609375, 0.23443603515625, 0.253204345703125, 0.27197265625, 0.290740966796875, 0.30950927734375, 0.328277587890625, 0.3470458984375, 0.365814208984375, 0.38458251953125, 0.403350830078125, 0.422119140625, 0.440887451171875, 0.45965576171875, 0.478424072265625, 0.4971923828125, 0.515960693359375, 0.53472900390625, 0.553497314453125, 0.572265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 12.0, 12.0, 25.0, 44.0, 80.0, 186.0, 260.0, 152.0, 78.0, 38.0, 23.0, 18.0, 11.0, 7.0, 3.0, 8.0, 1.0, 8.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001071929931640625, -0.0010399669408798218, -0.0010080039501190186, -0.0009760409593582153, -0.0009440779685974121, -0.0009121149778366089, -0.0008801519870758057, -0.0008481889963150024, -0.0008162260055541992, -0.000784263014793396, -0.0007523000240325928, -0.0007203370332717896, -0.0006883740425109863, -0.0006564110517501831, -0.0006244480609893799, -0.0005924850702285767, -0.0005605220794677734, -0.0005285590887069702, -0.000496596097946167, -0.00046463310718536377, -0.00043267011642456055, -0.0004007071256637573, -0.0003687441349029541, -0.0003367811441421509, -0.00030481815338134766, -0.00027285516262054443, -0.0002408921718597412, -0.000208929181098938, -0.00017696619033813477, -0.00014500319957733154, -0.00011304020881652832, -8.10772180557251e-05, -4.9114227294921875e-05, -1.7151236534118652e-05, 1.481175422668457e-05, 4.677474498748779e-05, 7.873773574829102e-05, 0.00011070072650909424, 0.00014266371726989746, 0.00017462670803070068, 0.0002065896987915039, 0.00023855268955230713, 0.00027051568031311035, 0.0003024786710739136, 0.0003344416618347168, 0.00036640465259552, 0.00039836764335632324, 0.00043033063411712646, 0.0004622936248779297, 0.0004942566156387329, 0.0005262196063995361, 0.0005581825971603394, 0.0005901455879211426, 0.0006221085786819458, 0.000654071569442749, 0.0006860345602035522, 0.0007179975509643555, 0.0007499605417251587, 0.0007819235324859619, 0.0008138865232467651, 0.0008458495140075684, 0.0008778125047683716, 0.0009097754955291748, 0.000941738486289978, 0.0009737014770507812]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 16.0, 7.0, 18.0, 39.0, 59.0, 97.0, 178.0, 440.0, 1020.0, 2638.0, 8355.0, 43727.0, 673615.0, 284936.0, 24317.0, 5645.0, 1880.0, 802.0, 370.0, 167.0, 87.0, 52.0, 25.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0123291015625, -0.968017578125, -0.9237060546875, -0.87939453125, -0.8350830078125, -0.790771484375, -0.7464599609375, -0.7021484375, -0.6578369140625, -0.613525390625, -0.5692138671875, -0.52490234375, -0.4805908203125, -0.436279296875, -0.3919677734375, -0.34765625, -0.3033447265625, -0.259033203125, -0.2147216796875, -0.17041015625, -0.1260986328125, -0.081787109375, -0.0374755859375, 0.0068359375, 0.0511474609375, 0.095458984375, 0.1397705078125, 0.18408203125, 0.2283935546875, 0.272705078125, 0.3170166015625, 0.361328125, 0.4056396484375, 0.449951171875, 0.4942626953125, 0.53857421875, 0.5828857421875, 0.627197265625, 0.6715087890625, 0.7158203125, 0.7601318359375, 0.804443359375, 0.8487548828125, 0.89306640625, 0.9373779296875, 0.981689453125, 1.0260009765625, 1.0703125, 1.1146240234375, 1.158935546875, 1.2032470703125, 1.24755859375, 1.2918701171875, 1.336181640625, 1.3804931640625, 1.4248046875, 1.4691162109375, 1.513427734375, 1.5577392578125, 1.60205078125, 1.6463623046875, 1.690673828125, 1.7349853515625, 1.779296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 2.0, 2.0, 10.0, 11.0, 13.0, 11.0, 16.0, 31.0, 45.0, 59.0, 96.0, 102.0, 105.0, 101.0, 74.0, 76.0, 48.0, 36.0, 38.0, 27.0, 11.0, 16.0, 10.0, 4.0, 4.0, 10.0, 8.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.206787109375, -0.1997966766357422, -0.19280624389648438, -0.18581581115722656, -0.17882537841796875, -0.17183494567871094, -0.16484451293945312, -0.1578540802001953, -0.1508636474609375, -0.1438732147216797, -0.13688278198242188, -0.12989234924316406, -0.12290191650390625, -0.11591148376464844, -0.10892105102539062, -0.10193061828613281, -0.094940185546875, -0.08794975280761719, -0.08095932006835938, -0.07396888732910156, -0.06697845458984375, -0.05998802185058594, -0.052997589111328125, -0.04600715637207031, -0.0390167236328125, -0.03202629089355469, -0.025035858154296875, -0.018045425415039062, -0.01105499267578125, -0.0040645599365234375, 0.002925872802734375, 0.009916305541992188, 0.01690673828125, 0.023897171020507812, 0.030887603759765625, 0.03787803649902344, 0.04486846923828125, 0.05185890197753906, 0.058849334716796875, 0.06583976745605469, 0.0728302001953125, 0.07982063293457031, 0.08681106567382812, 0.09380149841308594, 0.10079193115234375, 0.10778236389160156, 0.11477279663085938, 0.12176322937011719, 0.128753662109375, 0.1357440948486328, 0.14273452758789062, 0.14972496032714844, 0.15671539306640625, 0.16370582580566406, 0.17069625854492188, 0.1776866912841797, 0.1846771240234375, 0.1916675567626953, 0.19865798950195312, 0.20564842224121094, 0.21263885498046875, 0.21962928771972656, 0.22661972045898438, 0.2336101531982422, 0.2406005859375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 4.0, 14.0, 19.0, 20.0, 50.0, 61.0, 117.0, 141.0, 159.0, 126.0, 108.0, 70.0, 46.0, 31.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.518216133117676, -8.301972389221191, -8.085728645324707, -7.869484901428223, -7.6532416343688965, -7.436997890472412, -7.220754146575928, -7.004510402679443, -6.788267135620117, -6.572023391723633, -6.355779647827148, -6.139535903930664, -5.923292636871338, -5.7070488929748535, -5.490805149078369, -5.274561405181885, -5.0583176612854, -4.842073917388916, -4.625830173492432, -4.4095869064331055, -4.193343162536621, -3.9770994186401367, -3.7608556747436523, -3.544611930847168, -3.3283684253692627, -3.1121246814727783, -2.895881175994873, -2.6796374320983887, -2.4633936882019043, -2.247150182723999, -2.0309064388275146, -1.8146628141403198, -1.5984187126159668, -1.382175087928772, -1.1659314632415771, -0.9496877193450928, -0.733444094657898, -0.5172004699707031, -0.30095672607421875, -0.08471310138702393, 0.1315305233001709, 0.3477741777896881, 0.5640178322792053, 0.7802615165710449, 0.9965051412582397, 1.2127487659454346, 1.428992509841919, 1.6452361345291138, 1.8614797592163086, 2.077723503112793, 2.2939670085906982, 2.5102107524871826, 2.726454257965088, 2.9426980018615723, 3.1589417457580566, 3.375185489654541, 3.5914289951324463, 3.8076727390289307, 4.023916244506836, 4.24015998840332, 4.456403732299805, 4.672647476196289, 4.888891220092773, 5.1051344871521, 5.321378231048584]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 9.0, 13.0, 12.0, 16.0, 27.0, 30.0, 18.0, 28.0, 37.0, 39.0, 40.0, 48.0, 45.0, 50.0, 43.0, 43.0, 45.0, 53.0, 42.0, 36.0, 49.0, 43.0, 40.0, 24.0, 25.0, 16.0, 24.0, 15.0, 13.0, 13.0, 8.0, 11.0, 9.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.203831195831299, -3.1082069873809814, -3.012582778930664, -2.916958808898926, -2.8213346004486084, -2.725710391998291, -2.6300861835479736, -2.5344619750976562, -2.438838005065918, -2.3432137966156006, -2.247589588165283, -2.151965618133545, -2.0563414096832275, -1.9607172012329102, -1.8650929927825928, -1.7694687843322754, -1.673844575881958, -1.5782203674316406, -1.4825962781906128, -1.3869720697402954, -1.2913479804992676, -1.1957237720489502, -1.1000995635986328, -1.0044753551483154, -0.9088512659072876, -0.813227117061615, -0.7176029682159424, -0.621978759765625, -0.5263546109199524, -0.4307304620742798, -0.3351062536239624, -0.2394821047782898, -0.14385771751403809, -0.048233553767204285, 0.04739060997962952, 0.1430147886276245, 0.23863893747329712, 0.3342630863189697, 0.4298872947692871, 0.5255114436149597, 0.6211355924606323, 0.7167597413063049, 0.8123838901519775, 0.9080080986022949, 1.0036323070526123, 1.0992563962936401, 1.1948806047439575, 1.2905046939849854, 1.3861289024353027, 1.4817531108856201, 1.577377200126648, 1.6730014085769653, 1.7686254978179932, 1.8642497062683105, 1.959873914718628, 2.0554981231689453, 2.1511220932006836, 2.246746301651001, 2.3423705101013184, 2.4379944801330566, 2.533618688583374, 2.6292428970336914, 2.724867105484009, 2.820491313934326, 2.9161155223846436]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 12.0, 14.0, 14.0, 12.0, 17.0, 23.0, 46.0, 60.0, 76.0, 131.0, 195.0, 273.0, 390.0, 654.0, 1033.0, 1868.0, 3525.0, 6819.0, 14052.0, 31087.0, 70716.0, 155622.0, 288111.0, 248166.0, 123348.0, 54379.0, 24311.0, 11214.0, 5393.0, 2814.0, 1559.0, 915.0, 515.0, 345.0, 237.0, 159.0, 128.0, 77.0, 68.0, 44.0, 35.0, 16.0, 23.0, 14.0, 13.0, 10.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.720703125, -0.7000198364257812, -0.6793365478515625, -0.6586532592773438, -0.637969970703125, -0.6172866821289062, -0.5966033935546875, -0.5759201049804688, -0.55523681640625, -0.5345535278320312, -0.5138702392578125, -0.49318695068359375, -0.472503662109375, -0.45182037353515625, -0.4311370849609375, -0.41045379638671875, -0.3897705078125, -0.36908721923828125, -0.3484039306640625, -0.32772064208984375, -0.307037353515625, -0.28635406494140625, -0.2656707763671875, -0.24498748779296875, -0.22430419921875, -0.20362091064453125, -0.1829376220703125, -0.16225433349609375, -0.141571044921875, -0.12088775634765625, -0.1002044677734375, -0.07952117919921875, -0.058837890625, -0.03815460205078125, -0.0174713134765625, 0.00321197509765625, 0.023895263671875, 0.04457855224609375, 0.0652618408203125, 0.08594512939453125, 0.10662841796875, 0.12731170654296875, 0.1479949951171875, 0.16867828369140625, 0.189361572265625, 0.21004486083984375, 0.2307281494140625, 0.25141143798828125, 0.2720947265625, 0.29277801513671875, 0.3134613037109375, 0.33414459228515625, 0.354827880859375, 0.37551116943359375, 0.3961944580078125, 0.41687774658203125, 0.43756103515625, 0.45824432373046875, 0.4789276123046875, 0.49961090087890625, 0.520294189453125, 0.5409774780273438, 0.5616607666015625, 0.5823440551757812, 0.60302734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 12.0, 12.0, 9.0, 15.0, 17.0, 21.0, 28.0, 24.0, 22.0, 22.0, 20.0, 31.0, 33.0, 27.0, 33.0, 43.0, 46.0, 51.0, 47.0, 36.0, 33.0, 30.0, 33.0, 45.0, 29.0, 29.0, 37.0, 30.0, 32.0, 18.0, 19.0, 18.0, 17.0, 16.0, 12.0, 7.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.37109375, -5.20196533203125, -5.0328369140625, -4.86370849609375, -4.694580078125, -4.52545166015625, -4.3563232421875, -4.18719482421875, -4.01806640625, -3.84893798828125, -3.6798095703125, -3.51068115234375, -3.341552734375, -3.17242431640625, -3.0032958984375, -2.83416748046875, -2.6650390625, -2.49591064453125, -2.3267822265625, -2.15765380859375, -1.988525390625, -1.81939697265625, -1.6502685546875, -1.48114013671875, -1.31201171875, -1.14288330078125, -0.9737548828125, -0.80462646484375, -0.635498046875, -0.46636962890625, -0.2972412109375, -0.12811279296875, 0.041015625, 0.21014404296875, 0.3792724609375, 0.54840087890625, 0.717529296875, 0.88665771484375, 1.0557861328125, 1.22491455078125, 1.39404296875, 1.56317138671875, 1.7322998046875, 1.90142822265625, 2.070556640625, 2.23968505859375, 2.4088134765625, 2.57794189453125, 2.7470703125, 2.91619873046875, 3.0853271484375, 3.25445556640625, 3.423583984375, 3.59271240234375, 3.7618408203125, 3.93096923828125, 4.10009765625, 4.26922607421875, 4.4383544921875, 4.60748291015625, 4.776611328125, 4.94573974609375, 5.1148681640625, 5.28399658203125, 5.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 8.0, 5.0, 15.0, 14.0, 14.0, 36.0, 29.0, 43.0, 47.0, 61.0, 76.0, 124.0, 167.0, 283.0, 684.0, 2369.0, 47370.0, 953977.0, 39368.0, 2205.0, 665.0, 293.0, 205.0, 103.0, 80.0, 66.0, 50.0, 36.0, 26.0, 23.0, 18.0, 10.0, 14.0, 8.0, 6.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.849609375, -3.727325439453125, -3.60504150390625, -3.482757568359375, -3.3604736328125, -3.238189697265625, -3.11590576171875, -2.993621826171875, -2.871337890625, -2.749053955078125, -2.62677001953125, -2.504486083984375, -2.3822021484375, -2.259918212890625, -2.13763427734375, -2.015350341796875, -1.89306640625, -1.770782470703125, -1.64849853515625, -1.526214599609375, -1.4039306640625, -1.281646728515625, -1.15936279296875, -1.037078857421875, -0.914794921875, -0.792510986328125, -0.67022705078125, -0.547943115234375, -0.4256591796875, -0.303375244140625, -0.18109130859375, -0.058807373046875, 0.0634765625, 0.185760498046875, 0.30804443359375, 0.430328369140625, 0.5526123046875, 0.674896240234375, 0.79718017578125, 0.919464111328125, 1.041748046875, 1.164031982421875, 1.28631591796875, 1.408599853515625, 1.5308837890625, 1.653167724609375, 1.77545166015625, 1.897735595703125, 2.02001953125, 2.142303466796875, 2.26458740234375, 2.386871337890625, 2.5091552734375, 2.631439208984375, 2.75372314453125, 2.876007080078125, 2.998291015625, 3.120574951171875, 3.24285888671875, 3.365142822265625, 3.4874267578125, 3.609710693359375, 3.73199462890625, 3.854278564453125, 3.9765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 7.0, 4.0, 16.0, 11.0, 17.0, 26.0, 24.0, 25.0, 25.0, 29.0, 34.0, 41.0, 42.0, 38.0, 48.0, 41.0, 50.0, 46.0, 40.0, 45.0, 33.0, 47.0, 34.0, 29.0, 36.0, 33.0, 29.0, 19.0, 16.0, 17.0, 15.0, 10.0, 9.0, 8.0, 6.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.88671875, -5.6973876953125, -5.508056640625, -5.3187255859375, -5.12939453125, -4.9400634765625, -4.750732421875, -4.5614013671875, -4.3720703125, -4.1827392578125, -3.993408203125, -3.8040771484375, -3.61474609375, -3.4254150390625, -3.236083984375, -3.0467529296875, -2.857421875, -2.6680908203125, -2.478759765625, -2.2894287109375, -2.10009765625, -1.9107666015625, -1.721435546875, -1.5321044921875, -1.3427734375, -1.1534423828125, -0.964111328125, -0.7747802734375, -0.58544921875, -0.3961181640625, -0.206787109375, -0.0174560546875, 0.171875, 0.3612060546875, 0.550537109375, 0.7398681640625, 0.92919921875, 1.1185302734375, 1.307861328125, 1.4971923828125, 1.6865234375, 1.8758544921875, 2.065185546875, 2.2545166015625, 2.44384765625, 2.6331787109375, 2.822509765625, 3.0118408203125, 3.201171875, 3.3905029296875, 3.579833984375, 3.7691650390625, 3.95849609375, 4.1478271484375, 4.337158203125, 4.5264892578125, 4.7158203125, 4.9051513671875, 5.094482421875, 5.2838134765625, 5.47314453125, 5.6624755859375, 5.851806640625, 6.0411376953125, 6.23046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 5.0, 19.0, 17.0, 24.0, 33.0, 53.0, 77.0, 142.0, 260.0, 473.0, 1071.0, 2500.0, 7322.0, 27914.0, 243746.0, 702239.0, 45775.0, 10687.0, 3449.0, 1353.0, 612.0, 302.0, 160.0, 101.0, 63.0, 56.0, 27.0, 13.0, 11.0, 15.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.439453125, -0.4276237487792969, -0.41579437255859375, -0.4039649963378906, -0.3921356201171875, -0.3803062438964844, -0.36847686767578125, -0.3566474914550781, -0.344818115234375, -0.3329887390136719, -0.32115936279296875, -0.3093299865722656, -0.2975006103515625, -0.2856712341308594, -0.27384185791015625, -0.2620124816894531, -0.25018310546875, -0.23835372924804688, -0.22652435302734375, -0.21469497680664062, -0.2028656005859375, -0.19103622436523438, -0.17920684814453125, -0.16737747192382812, -0.155548095703125, -0.14371871948242188, -0.13188934326171875, -0.12005996704101562, -0.1082305908203125, -0.09640121459960938, -0.08457183837890625, -0.07274246215820312, -0.0609130859375, -0.049083709716796875, -0.03725433349609375, -0.025424957275390625, -0.0135955810546875, -0.001766204833984375, 0.01006317138671875, 0.021892547607421875, 0.033721923828125, 0.045551300048828125, 0.05738067626953125, 0.06921005249023438, 0.0810394287109375, 0.09286880493164062, 0.10469818115234375, 0.11652755737304688, 0.12835693359375, 0.14018630981445312, 0.15201568603515625, 0.16384506225585938, 0.1756744384765625, 0.18750381469726562, 0.19933319091796875, 0.21116256713867188, 0.222991943359375, 0.23482131958007812, 0.24665069580078125, 0.2584800720214844, 0.2703094482421875, 0.2821388244628906, 0.29396820068359375, 0.3057975769042969, 0.317626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 11.0, 9.0, 9.0, 9.0, 14.0, 14.0, 35.0, 52.0, 79.0, 156.0, 231.0, 165.0, 76.0, 51.0, 23.0, 20.0, 9.0, 8.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.894899368286133e-05, -5.724374204874039e-05, -5.5538490414619446e-05, -5.3833238780498505e-05, -5.2127987146377563e-05, -5.042273551225662e-05, -4.871748387813568e-05, -4.701223224401474e-05, -4.53069806098938e-05, -4.360172897577286e-05, -4.1896477341651917e-05, -4.0191225707530975e-05, -3.8485974073410034e-05, -3.678072243928909e-05, -3.507547080516815e-05, -3.337021917104721e-05, -3.166496753692627e-05, -2.995971590280533e-05, -2.8254464268684387e-05, -2.6549212634563446e-05, -2.4843961000442505e-05, -2.3138709366321564e-05, -2.1433457732200623e-05, -1.972820609807968e-05, -1.802295446395874e-05, -1.63177028298378e-05, -1.4612451195716858e-05, -1.2907199561595917e-05, -1.1201947927474976e-05, -9.496696293354034e-06, -7.791444659233093e-06, -6.086193025112152e-06, -4.380941390991211e-06, -2.6756897568702698e-06, -9.704381227493286e-07, 7.348135113716125e-07, 2.4400651454925537e-06, 4.145316779613495e-06, 5.850568413734436e-06, 7.555820047855377e-06, 9.261071681976318e-06, 1.096632331609726e-05, 1.26715749502182e-05, 1.4376826584339142e-05, 1.6082078218460083e-05, 1.7787329852581024e-05, 1.9492581486701965e-05, 2.1197833120822906e-05, 2.2903084754943848e-05, 2.460833638906479e-05, 2.631358802318573e-05, 2.801883965730667e-05, 2.9724091291427612e-05, 3.1429342925548553e-05, 3.3134594559669495e-05, 3.4839846193790436e-05, 3.654509782791138e-05, 3.825034946203232e-05, 3.995560109615326e-05, 4.16608527302742e-05, 4.336610436439514e-05, 4.507135599851608e-05, 4.6776607632637024e-05, 4.8481859266757965e-05, 5.0187110900878906e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 12.0, 6.0, 5.0, 13.0, 19.0, 23.0, 26.0, 40.0, 89.0, 164.0, 306.0, 916.0, 2750.0, 10223.0, 69900.0, 883792.0, 66059.0, 9970.0, 2671.0, 888.0, 331.0, 131.0, 70.0, 44.0, 36.0, 22.0, 10.0, 8.0, 9.0, 4.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5361328125, -0.5205879211425781, -0.5050430297851562, -0.4894981384277344, -0.4739532470703125, -0.4584083557128906, -0.44286346435546875, -0.4273185729980469, -0.411773681640625, -0.3962287902832031, -0.38068389892578125, -0.3651390075683594, -0.3495941162109375, -0.3340492248535156, -0.31850433349609375, -0.3029594421386719, -0.28741455078125, -0.2718696594238281, -0.25632476806640625, -0.24077987670898438, -0.2252349853515625, -0.20969009399414062, -0.19414520263671875, -0.17860031127929688, -0.163055419921875, -0.14751052856445312, -0.13196563720703125, -0.11642074584960938, -0.1008758544921875, -0.08533096313476562, -0.06978607177734375, -0.054241180419921875, -0.0386962890625, -0.023151397705078125, -0.00760650634765625, 0.007938385009765625, 0.0234832763671875, 0.039028167724609375, 0.05457305908203125, 0.07011795043945312, 0.085662841796875, 0.10120773315429688, 0.11675262451171875, 0.13229751586914062, 0.1478424072265625, 0.16338729858398438, 0.17893218994140625, 0.19447708129882812, 0.21002197265625, 0.22556686401367188, 0.24111175537109375, 0.2566566467285156, 0.2722015380859375, 0.2877464294433594, 0.30329132080078125, 0.3188362121582031, 0.334381103515625, 0.3499259948730469, 0.36547088623046875, 0.3810157775878906, 0.3965606689453125, 0.4121055603027344, 0.42765045166015625, 0.4431953430175781, 0.458740234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 4.0, 6.0, 9.0, 8.0, 18.0, 23.0, 43.0, 53.0, 60.0, 118.0, 216.0, 160.0, 84.0, 50.0, 39.0, 28.0, 13.0, 10.0, 9.0, 6.0, 6.0, 3.0, 7.0, 7.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17469120025634766, -0.1701831817626953, -0.16567516326904297, -0.16116714477539062, -0.15665912628173828, -0.15215110778808594, -0.1476430892944336, -0.14313507080078125, -0.1386270523071289, -0.13411903381347656, -0.12961101531982422, -0.12510299682617188, -0.12059497833251953, -0.11608695983886719, -0.11157894134521484, -0.1070709228515625, -0.10256290435791016, -0.09805488586425781, -0.09354686737060547, -0.08903884887695312, -0.08453083038330078, -0.08002281188964844, -0.0755147933959961, -0.07100677490234375, -0.0664987564086914, -0.06199073791503906, -0.05748271942138672, -0.052974700927734375, -0.04846668243408203, -0.04395866394042969, -0.039450645446777344, -0.034942626953125, -0.030434608459472656, -0.025926589965820312, -0.02141857147216797, -0.016910552978515625, -0.012402534484863281, -0.007894515991210938, -0.0033864974975585938, 0.00112152099609375, 0.005629539489746094, 0.010137557983398438, 0.014645576477050781, 0.019153594970703125, 0.02366161346435547, 0.028169631958007812, 0.032677650451660156, 0.0371856689453125, 0.041693687438964844, 0.04620170593261719, 0.05070972442626953, 0.055217742919921875, 0.05972576141357422, 0.06423377990722656, 0.0687417984008789, 0.07324981689453125, 0.0777578353881836, 0.08226585388183594, 0.08677387237548828, 0.09128189086914062, 0.09578990936279297, 0.10029792785644531, 0.10480594635009766, 0.10931396484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 6.0, 22.0, 40.0, 77.0, 173.0, 243.0, 209.0, 119.0, 67.0, 31.0, 13.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24908971786499, -4.707395553588867, -4.165701389312744, -3.6240074634552, -3.082313299179077, -2.540619134902954, -1.9989252090454102, -1.457231044769287, -0.9155368804931641, -0.3738427758216858, 0.16785132884979248, 0.709545373916626, 1.251239538192749, 1.792933702468872, 2.334627628326416, 2.876321792602539, 3.418015956878662, 3.959710121154785, 4.501404285430908, 5.043098449707031, 5.584792137145996, 6.126486778259277, 6.668180465698242, 7.209874629974365, 7.751568794250488, 8.293262481689453, 8.834957122802734, 9.3766508102417, 9.91834545135498, 10.460039138793945, 11.001733779907227, 11.543427467346191, 12.085121154785156, 12.626814842224121, 13.168509483337402, 13.710203170776367, 14.251897811889648, 14.793591499328613, 15.335285186767578, 15.87697982788086, 16.41867446899414, 16.960369110107422, 17.50206184387207, 18.04375648498535, 18.585451126098633, 19.127145767211914, 19.668838500976562, 20.210533142089844, 20.752227783203125, 21.293922424316406, 21.835615158081055, 22.377309799194336, 22.919004440307617, 23.4606990814209, 24.002391815185547, 24.544086456298828, 25.085779190063477, 25.627473831176758, 26.169166564941406, 26.710861206054688, 27.25255584716797, 27.79425048828125, 28.3359432220459, 28.87763786315918, 29.41933250427246]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 14.0, 6.0, 9.0, 13.0, 13.0, 13.0, 12.0, 20.0, 28.0, 18.0, 22.0, 31.0, 32.0, 31.0, 37.0, 34.0, 41.0, 49.0, 40.0, 30.0, 34.0, 36.0, 31.0, 38.0, 36.0, 37.0, 31.0, 36.0, 22.0, 31.0, 23.0, 22.0, 18.0, 11.0, 11.0, 14.0, 7.0, 5.0, 12.0, 5.0, 8.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-9.38237190246582, -9.125243186950684, -8.868115425109863, -8.610986709594727, -8.353858947753906, -8.09673023223877, -7.839601516723633, -7.582473278045654, -7.325345039367676, -7.068216800689697, -6.811088562011719, -6.553959846496582, -6.2968316078186035, -6.039703369140625, -5.782574653625488, -5.52544641494751, -5.268318176269531, -5.011189937591553, -4.754061698913574, -4.4969329833984375, -4.239804744720459, -3.9826765060424805, -3.725548028945923, -3.4684195518493652, -3.2112913131713867, -2.954163074493408, -2.6970345973968506, -2.439906120300293, -2.1827778816223145, -1.9256495237350464, -1.6685211658477783, -1.4113928079605103, -1.1542644500732422, -0.8971360921859741, -0.640007734298706, -0.382879376411438, -0.12575101852416992, 0.13137733936309814, 0.3885056972503662, 0.6456340551376343, 0.9027624130249023, 1.1598907709121704, 1.4170191287994385, 1.6741474866867065, 1.9312758445739746, 2.188404083251953, 2.4455325603485107, 2.7026610374450684, 2.959789276123047, 3.2169175148010254, 3.474045991897583, 3.7311744689941406, 3.988302707672119, 4.245430946350098, 4.502559661865234, 4.759687900543213, 5.016816139221191, 5.27394437789917, 5.531072616577148, 5.788201332092285, 6.045329570770264, 6.302457809448242, 6.559586524963379, 6.816714763641357, 7.073843002319336]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 6.0, 5.0, 12.0, 10.0, 15.0, 22.0, 44.0, 62.0, 70.0, 114.0, 197.0, 337.0, 571.0, 1048.0, 2252.0, 5097.0, 14808.0, 93707.0, 1253384.0, 2571984.0, 211332.0, 25728.0, 7512.0, 2878.0, 1348.0, 710.0, 393.0, 213.0, 147.0, 99.0, 50.0, 52.0, 26.0, 18.0, 11.0, 11.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.11822509765625, -7.9161376953125, -7.71405029296875, -7.511962890625, -7.30987548828125, -7.1077880859375, -6.90570068359375, -6.70361328125, -6.50152587890625, -6.2994384765625, -6.09735107421875, -5.895263671875, -5.69317626953125, -5.4910888671875, -5.28900146484375, -5.0869140625, -4.88482666015625, -4.6827392578125, -4.48065185546875, -4.278564453125, -4.07647705078125, -3.8743896484375, -3.67230224609375, -3.47021484375, -3.26812744140625, -3.0660400390625, -2.86395263671875, -2.661865234375, -2.45977783203125, -2.2576904296875, -2.05560302734375, -1.853515625, -1.65142822265625, -1.4493408203125, -1.24725341796875, -1.045166015625, -0.84307861328125, -0.6409912109375, -0.43890380859375, -0.23681640625, -0.03472900390625, 0.1673583984375, 0.36944580078125, 0.571533203125, 0.77362060546875, 0.9757080078125, 1.17779541015625, 1.3798828125, 1.58197021484375, 1.7840576171875, 1.98614501953125, 2.188232421875, 2.39031982421875, 2.5924072265625, 2.79449462890625, 2.99658203125, 3.19866943359375, 3.4007568359375, 3.60284423828125, 3.804931640625, 4.00701904296875, 4.2091064453125, 4.41119384765625, 4.61328125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 8.0, 13.0, 21.0, 14.0, 19.0, 34.0, 35.0, 32.0, 39.0, 59.0, 49.0, 49.0, 42.0, 58.0, 55.0, 54.0, 41.0, 61.0, 36.0, 40.0, 39.0, 29.0, 30.0, 25.0, 12.0, 17.0, 18.0, 8.0, 10.0, 7.0, 8.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.4296875, -3.3228759765625, -3.216064453125, -3.1092529296875, -3.00244140625, -2.8956298828125, -2.788818359375, -2.6820068359375, -2.5751953125, -2.4683837890625, -2.361572265625, -2.2547607421875, -2.14794921875, -2.0411376953125, -1.934326171875, -1.8275146484375, -1.720703125, -1.6138916015625, -1.507080078125, -1.4002685546875, -1.29345703125, -1.1866455078125, -1.079833984375, -0.9730224609375, -0.8662109375, -0.7593994140625, -0.652587890625, -0.5457763671875, -0.43896484375, -0.3321533203125, -0.225341796875, -0.1185302734375, -0.01171875, 0.0950927734375, 0.201904296875, 0.3087158203125, 0.41552734375, 0.5223388671875, 0.629150390625, 0.7359619140625, 0.8427734375, 0.9495849609375, 1.056396484375, 1.1632080078125, 1.27001953125, 1.3768310546875, 1.483642578125, 1.5904541015625, 1.697265625, 1.8040771484375, 1.910888671875, 2.0177001953125, 2.12451171875, 2.2313232421875, 2.338134765625, 2.4449462890625, 2.5517578125, 2.6585693359375, 2.765380859375, 2.8721923828125, 2.97900390625, 3.0858154296875, 3.192626953125, 3.2994384765625, 3.40625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 10.0, 13.0, 21.0, 25.0, 35.0, 99.0, 294.0, 1910.0, 208830.0, 3978848.0, 3547.0, 405.0, 116.0, 46.0, 28.0, 14.0, 9.0, 7.0, 3.0, 1.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-43.3125, -42.23291015625, -41.1533203125, -40.07373046875, -38.994140625, -37.91455078125, -36.8349609375, -35.75537109375, -34.67578125, -33.59619140625, -32.5166015625, -31.43701171875, -30.357421875, -29.27783203125, -28.1982421875, -27.11865234375, -26.0390625, -24.95947265625, -23.8798828125, -22.80029296875, -21.720703125, -20.64111328125, -19.5615234375, -18.48193359375, -17.40234375, -16.32275390625, -15.2431640625, -14.16357421875, -13.083984375, -12.00439453125, -10.9248046875, -9.84521484375, -8.765625, -7.68603515625, -6.6064453125, -5.52685546875, -4.447265625, -3.36767578125, -2.2880859375, -1.20849609375, -0.12890625, 0.95068359375, 2.0302734375, 3.10986328125, 4.189453125, 5.26904296875, 6.3486328125, 7.42822265625, 8.5078125, 9.58740234375, 10.6669921875, 11.74658203125, 12.826171875, 13.90576171875, 14.9853515625, 16.06494140625, 17.14453125, 18.22412109375, 19.3037109375, 20.38330078125, 21.462890625, 22.54248046875, 23.6220703125, 24.70166015625, 25.78125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 6.0, 16.0, 28.0, 35.0, 48.0, 89.0, 169.0, 400.0, 879.0, 1229.0, 598.0, 260.0, 120.0, 63.0, 37.0, 26.0, 26.0, 6.0, 6.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.728515625, -2.64892578125, -2.5693359375, -2.48974609375, -2.41015625, -2.33056640625, -2.2509765625, -2.17138671875, -2.091796875, -2.01220703125, -1.9326171875, -1.85302734375, -1.7734375, -1.69384765625, -1.6142578125, -1.53466796875, -1.455078125, -1.37548828125, -1.2958984375, -1.21630859375, -1.13671875, -1.05712890625, -0.9775390625, -0.89794921875, -0.818359375, -0.73876953125, -0.6591796875, -0.57958984375, -0.5, -0.42041015625, -0.3408203125, -0.26123046875, -0.181640625, -0.10205078125, -0.0224609375, 0.05712890625, 0.13671875, 0.21630859375, 0.2958984375, 0.37548828125, 0.455078125, 0.53466796875, 0.6142578125, 0.69384765625, 0.7734375, 0.85302734375, 0.9326171875, 1.01220703125, 1.091796875, 1.17138671875, 1.2509765625, 1.33056640625, 1.41015625, 1.48974609375, 1.5693359375, 1.64892578125, 1.728515625, 1.80810546875, 1.8876953125, 1.96728515625, 2.046875, 2.12646484375, 2.2060546875, 2.28564453125, 2.365234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 7.0, 15.0, 14.0, 21.0, 17.0, 29.0, 57.0, 61.0, 64.0, 76.0, 94.0, 94.0, 94.0, 70.0, 58.0, 41.0, 36.0, 40.0, 25.0, 20.0, 17.0, 15.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.958065986633301, -4.793521404266357, -4.628976821899414, -4.464432239532471, -4.299887657165527, -4.135343074798584, -3.9707984924316406, -3.8062539100646973, -3.641709327697754, -3.4771647453308105, -3.312620162963867, -3.148075580596924, -2.9835309982299805, -2.818986415863037, -2.6544418334960938, -2.4898972511291504, -2.325352668762207, -2.1608080863952637, -1.9962635040283203, -1.831718921661377, -1.6671743392944336, -1.5026297569274902, -1.3380851745605469, -1.1735405921936035, -1.0089960098266602, -0.8444514274597168, -0.6799068450927734, -0.5153622627258301, -0.3508176803588867, -0.18627309799194336, -0.021728515625, 0.14281606674194336, 0.3073611259460449, 0.4719057083129883, 0.6364502906799316, 0.800994873046875, 0.9655394554138184, 1.1300840377807617, 1.294628620147705, 1.4591732025146484, 1.6237177848815918, 1.7882623672485352, 1.9528069496154785, 2.117351531982422, 2.2818961143493652, 2.4464406967163086, 2.610985279083252, 2.7755298614501953, 2.9400744438171387, 3.104619026184082, 3.2691636085510254, 3.4337081909179688, 3.598252773284912, 3.7627973556518555, 3.927341938018799, 4.091886520385742, 4.2564311027526855, 4.420975685119629, 4.585520267486572, 4.750064849853516, 4.914609432220459, 5.079154014587402, 5.243698596954346, 5.408243179321289, 5.572787761688232]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 1.0, 8.0, 12.0, 10.0, 13.0, 11.0, 19.0, 12.0, 22.0, 13.0, 22.0, 17.0, 29.0, 33.0, 38.0, 31.0, 36.0, 40.0, 37.0, 29.0, 41.0, 41.0, 33.0, 27.0, 36.0, 30.0, 29.0, 36.0, 31.0, 33.0, 19.0, 32.0, 24.0, 20.0, 26.0, 26.0, 12.0, 5.0, 7.0, 9.0, 9.0, 8.0, 5.0, 7.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.525717258453369, -2.4362633228302, -2.346809148788452, -2.257355213165283, -2.167901039123535, -2.078447103500366, -1.9889931678771973, -1.8995391130447388, -1.8100850582122803, -1.7206310033798218, -1.6311769485473633, -1.5417230129241943, -1.4522689580917358, -1.3628149032592773, -1.2733609676361084, -1.18390691280365, -1.0944528579711914, -1.004998803138733, -0.9155448079109192, -0.8260908126831055, -0.736636757850647, -0.6471827030181885, -0.5577287077903748, -0.46827471256256104, -0.37882065773010254, -0.28936663269996643, -0.19991260766983032, -0.11045858263969421, -0.021004557609558105, 0.068449467420578, 0.1579034924507141, 0.24735748767852783, 0.3368113040924072, 0.42626532912254333, 0.5157193541526794, 0.6051733493804932, 0.6946274042129517, 0.7840814590454102, 0.8735354542732239, 0.9629894495010376, 1.052443504333496, 1.1418975591659546, 1.231351613998413, 1.320805549621582, 1.4102596044540405, 1.499713659286499, 1.589167594909668, 1.6786216497421265, 1.768075704574585, 1.8575297594070435, 1.946983814239502, 2.036437749862671, 2.12589168548584, 2.215345859527588, 2.304799795150757, 2.394253730773926, 2.483707904815674, 2.5731618404388428, 2.662616014480591, 2.7520699501037598, 2.841524124145508, 2.9309780597686768, 3.0204319953918457, 3.1098861694335938, 3.1993401050567627]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 20.0, 28.0, 29.0, 43.0, 63.0, 104.0, 178.0, 212.0, 322.0, 612.0, 877.0, 1487.0, 2222.0, 3644.0, 6023.0, 10063.0, 17715.0, 31976.0, 59479.0, 113291.0, 219697.0, 260009.0, 149272.0, 76242.0, 40625.0, 22364.0, 12615.0, 7464.0, 4465.0, 2670.0, 1737.0, 1104.0, 657.0, 436.0, 274.0, 164.0, 126.0, 91.0, 39.0, 33.0, 26.0, 14.0, 9.0, 3.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.2578125, -1.2199249267578125, -1.182037353515625, -1.1441497802734375, -1.10626220703125, -1.0683746337890625, -1.030487060546875, -0.9925994873046875, -0.9547119140625, -0.9168243408203125, -0.878936767578125, -0.8410491943359375, -0.80316162109375, -0.7652740478515625, -0.727386474609375, -0.6894989013671875, -0.651611328125, -0.6137237548828125, -0.575836181640625, -0.5379486083984375, -0.50006103515625, -0.4621734619140625, -0.424285888671875, -0.3863983154296875, -0.3485107421875, -0.3106231689453125, -0.272735595703125, -0.2348480224609375, -0.19696044921875, -0.1590728759765625, -0.121185302734375, -0.0832977294921875, -0.04541015625, -0.0075225830078125, 0.030364990234375, 0.0682525634765625, 0.10614013671875, 0.1440277099609375, 0.181915283203125, 0.2198028564453125, 0.2576904296875, 0.2955780029296875, 0.333465576171875, 0.3713531494140625, 0.40924072265625, 0.4471282958984375, 0.485015869140625, 0.5229034423828125, 0.560791015625, 0.5986785888671875, 0.636566162109375, 0.6744537353515625, 0.71234130859375, 0.7502288818359375, 0.788116455078125, 0.8260040283203125, 0.8638916015625, 0.9017791748046875, 0.939666748046875, 0.9775543212890625, 1.01544189453125, 1.0533294677734375, 1.091217041015625, 1.1291046142578125, 1.1669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 2.0, 8.0, 18.0, 12.0, 14.0, 12.0, 25.0, 28.0, 18.0, 21.0, 28.0, 42.0, 48.0, 45.0, 32.0, 46.0, 58.0, 50.0, 37.0, 45.0, 47.0, 39.0, 45.0, 31.0, 45.0, 45.0, 22.0, 24.0, 23.0, 21.0, 16.0, 3.0, 9.0, 16.0, 7.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.048095703125, -1.96923828125, -1.890380859375, -1.8115234375, -1.732666015625, -1.65380859375, -1.574951171875, -1.49609375, -1.417236328125, -1.33837890625, -1.259521484375, -1.1806640625, -1.101806640625, -1.02294921875, -0.944091796875, -0.865234375, -0.786376953125, -0.70751953125, -0.628662109375, -0.5498046875, -0.470947265625, -0.39208984375, -0.313232421875, -0.234375, -0.155517578125, -0.07666015625, 0.002197265625, 0.0810546875, 0.159912109375, 0.23876953125, 0.317626953125, 0.396484375, 0.475341796875, 0.55419921875, 0.633056640625, 0.7119140625, 0.790771484375, 0.86962890625, 0.948486328125, 1.02734375, 1.106201171875, 1.18505859375, 1.263916015625, 1.3427734375, 1.421630859375, 1.50048828125, 1.579345703125, 1.658203125, 1.737060546875, 1.81591796875, 1.894775390625, 1.9736328125, 2.052490234375, 2.13134765625, 2.210205078125, 2.2890625, 2.367919921875, 2.44677734375, 2.525634765625, 2.6044921875, 2.683349609375, 2.76220703125, 2.841064453125, 2.919921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 15.0, 10.0, 23.0, 40.0, 60.0, 96.0, 144.0, 275.0, 539.0, 1083.0, 2355.0, 5741.0, 16119.0, 59230.0, 287660.0, 508718.0, 121806.0, 28695.0, 9051.0, 3611.0, 1578.0, 758.0, 398.0, 224.0, 109.0, 52.0, 37.0, 28.0, 28.0, 18.0, 3.0, 4.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33349609375, -2.2587890625, -2.18408203125, -2.109375, -2.03466796875, -1.9599609375, -1.88525390625, -1.810546875, -1.73583984375, -1.6611328125, -1.58642578125, -1.51171875, -1.43701171875, -1.3623046875, -1.28759765625, -1.212890625, -1.13818359375, -1.0634765625, -0.98876953125, -0.9140625, -0.83935546875, -0.7646484375, -0.68994140625, -0.615234375, -0.54052734375, -0.4658203125, -0.39111328125, -0.31640625, -0.24169921875, -0.1669921875, -0.09228515625, -0.017578125, 0.05712890625, 0.1318359375, 0.20654296875, 0.28125, 0.35595703125, 0.4306640625, 0.50537109375, 0.580078125, 0.65478515625, 0.7294921875, 0.80419921875, 0.87890625, 0.95361328125, 1.0283203125, 1.10302734375, 1.177734375, 1.25244140625, 1.3271484375, 1.40185546875, 1.4765625, 1.55126953125, 1.6259765625, 1.70068359375, 1.775390625, 1.85009765625, 1.9248046875, 1.99951171875, 2.07421875, 2.14892578125, 2.2236328125, 2.29833984375, 2.373046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 12.0, 13.0, 17.0, 24.0, 20.0, 24.0, 31.0, 32.0, 37.0, 49.0, 45.0, 55.0, 63.0, 47.0, 69.0, 48.0, 53.0, 52.0, 53.0, 42.0, 33.0, 37.0, 26.0, 30.0, 11.0, 15.0, 18.0, 3.0, 5.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.49542236328125, -5.3228759765625, -5.15032958984375, -4.977783203125, -4.80523681640625, -4.6326904296875, -4.46014404296875, -4.28759765625, -4.11505126953125, -3.9425048828125, -3.76995849609375, -3.597412109375, -3.42486572265625, -3.2523193359375, -3.07977294921875, -2.9072265625, -2.73468017578125, -2.5621337890625, -2.38958740234375, -2.217041015625, -2.04449462890625, -1.8719482421875, -1.69940185546875, -1.52685546875, -1.35430908203125, -1.1817626953125, -1.00921630859375, -0.836669921875, -0.66412353515625, -0.4915771484375, -0.31903076171875, -0.146484375, 0.02606201171875, 0.1986083984375, 0.37115478515625, 0.543701171875, 0.71624755859375, 0.8887939453125, 1.06134033203125, 1.23388671875, 1.40643310546875, 1.5789794921875, 1.75152587890625, 1.924072265625, 2.09661865234375, 2.2691650390625, 2.44171142578125, 2.6142578125, 2.78680419921875, 2.9593505859375, 3.13189697265625, 3.304443359375, 3.47698974609375, 3.6495361328125, 3.82208251953125, 3.99462890625, 4.16717529296875, 4.3397216796875, 4.51226806640625, 4.684814453125, 4.85736083984375, 5.0299072265625, 5.20245361328125, 5.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 18.0, 35.0, 50.0, 86.0, 95.0, 147.0, 252.0, 417.0, 729.0, 1290.0, 2392.0, 4451.0, 10018.0, 24834.0, 76102.0, 401228.0, 404994.0, 76594.0, 24767.0, 9906.0, 4641.0, 2260.0, 1318.0, 724.0, 422.0, 262.0, 161.0, 116.0, 65.0, 41.0, 25.0, 18.0, 17.0, 20.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3232612609863281, -0.31082916259765625, -0.2983970642089844, -0.2859649658203125, -0.2735328674316406, -0.26110076904296875, -0.24866867065429688, -0.236236572265625, -0.22380447387695312, -0.21137237548828125, -0.19894027709960938, -0.1865081787109375, -0.17407608032226562, -0.16164398193359375, -0.14921188354492188, -0.13677978515625, -0.12434768676757812, -0.11191558837890625, -0.09948348999023438, -0.0870513916015625, -0.07461929321289062, -0.06218719482421875, -0.049755096435546875, -0.037322998046875, -0.024890899658203125, -0.01245880126953125, -2.6702880859375e-05, 0.0124053955078125, 0.024837493896484375, 0.03726959228515625, 0.049701690673828125, 0.0621337890625, 0.07456588745117188, 0.08699798583984375, 0.09943008422851562, 0.1118621826171875, 0.12429428100585938, 0.13672637939453125, 0.14915847778320312, 0.161590576171875, 0.17402267456054688, 0.18645477294921875, 0.19888687133789062, 0.2113189697265625, 0.22375106811523438, 0.23618316650390625, 0.24861526489257812, 0.26104736328125, 0.2734794616699219, 0.28591156005859375, 0.2983436584472656, 0.3107757568359375, 0.3232078552246094, 0.33563995361328125, 0.3480720520019531, 0.360504150390625, 0.3729362487792969, 0.38536834716796875, 0.3978004455566406, 0.4102325439453125, 0.4226646423339844, 0.43509674072265625, 0.4475288391113281, 0.4599609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 7.0, 12.0, 24.0, 27.0, 43.0, 56.0, 109.0, 182.0, 200.0, 117.0, 72.0, 46.0, 35.0, 12.0, 11.0, 14.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005350112915039062, -0.0005205832421779633, -0.0005061551928520203, -0.0004917271435260773, -0.0004772990942001343, -0.0004628710448741913, -0.0004484429955482483, -0.0004340149462223053, -0.0004195868968963623, -0.0004051588475704193, -0.0003907307982444763, -0.0003763027489185333, -0.00036187469959259033, -0.00034744665026664734, -0.00033301860094070435, -0.00031859055161476135, -0.00030416250228881836, -0.00028973445296287537, -0.0002753064036369324, -0.0002608783543109894, -0.0002464503049850464, -0.0002320222556591034, -0.0002175942063331604, -0.0002031661570072174, -0.00018873810768127441, -0.00017431005835533142, -0.00015988200902938843, -0.00014545395970344543, -0.00013102591037750244, -0.00011659786105155945, -0.00010216981172561646, -8.774176239967346e-05, -7.331371307373047e-05, -5.8885663747787476e-05, -4.445761442184448e-05, -3.002956509590149e-05, -1.5601515769958496e-05, -1.173466444015503e-06, 1.325458288192749e-05, 2.7682632207870483e-05, 4.2110681533813477e-05, 5.653873085975647e-05, 7.096678018569946e-05, 8.539482951164246e-05, 9.982287883758545e-05, 0.00011425092816352844, 0.00012867897748947144, 0.00014310702681541443, 0.00015753507614135742, 0.00017196312546730042, 0.0001863911747932434, 0.0002008192241191864, 0.0002152472734451294, 0.0002296753227710724, 0.00024410337209701538, 0.0002585314214229584, 0.00027295947074890137, 0.00028738752007484436, 0.00030181556940078735, 0.00031624361872673035, 0.00033067166805267334, 0.00034509971737861633, 0.0003595277667045593, 0.0003739558160305023, 0.0003883838653564453]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 14.0, 16.0, 42.0, 53.0, 115.0, 226.0, 527.0, 1244.0, 3164.0, 9862.0, 36573.0, 226529.0, 650539.0, 90626.0, 19665.0, 5798.0, 1966.0, 863.0, 353.0, 159.0, 89.0, 44.0, 28.0, 15.0, 10.0, 7.0, 6.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484375, -0.46724700927734375, -0.4501190185546875, -0.43299102783203125, -0.415863037109375, -0.39873504638671875, -0.3816070556640625, -0.36447906494140625, -0.34735107421875, -0.33022308349609375, -0.3130950927734375, -0.29596710205078125, -0.278839111328125, -0.26171112060546875, -0.2445831298828125, -0.22745513916015625, -0.2103271484375, -0.19319915771484375, -0.1760711669921875, -0.15894317626953125, -0.141815185546875, -0.12468719482421875, -0.1075592041015625, -0.09043121337890625, -0.07330322265625, -0.05617523193359375, -0.0390472412109375, -0.02191925048828125, -0.004791259765625, 0.01233673095703125, 0.0294647216796875, 0.04659271240234375, 0.063720703125, 0.08084869384765625, 0.0979766845703125, 0.11510467529296875, 0.132232666015625, 0.14936065673828125, 0.1664886474609375, 0.18361663818359375, 0.20074462890625, 0.21787261962890625, 0.2350006103515625, 0.25212860107421875, 0.269256591796875, 0.28638458251953125, 0.3035125732421875, 0.32064056396484375, 0.3377685546875, 0.35489654541015625, 0.3720245361328125, 0.38915252685546875, 0.406280517578125, 0.42340850830078125, 0.4405364990234375, 0.45766448974609375, 0.47479248046875, 0.49192047119140625, 0.5090484619140625, 0.5261764526367188, 0.543304443359375, 0.5604324340820312, 0.5775604248046875, 0.5946884155273438, 0.61181640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 8.0, 10.0, 15.0, 11.0, 11.0, 16.0, 23.0, 30.0, 34.0, 54.0, 58.0, 67.0, 75.0, 89.0, 87.0, 81.0, 56.0, 48.0, 40.0, 22.0, 39.0, 15.0, 17.0, 17.0, 8.0, 10.0, 11.0, 4.0, 6.0, 3.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.09832763671875, -0.09531688690185547, -0.09230613708496094, -0.0892953872680664, -0.08628463745117188, -0.08327388763427734, -0.08026313781738281, -0.07725238800048828, -0.07424163818359375, -0.07123088836669922, -0.06822013854980469, -0.06520938873291016, -0.062198638916015625, -0.059187889099121094, -0.05617713928222656, -0.05316638946533203, -0.0501556396484375, -0.04714488983154297, -0.04413414001464844, -0.041123390197753906, -0.038112640380859375, -0.035101890563964844, -0.03209114074707031, -0.02908039093017578, -0.02606964111328125, -0.02305889129638672, -0.020048141479492188, -0.017037391662597656, -0.014026641845703125, -0.011015892028808594, -0.008005142211914062, -0.004994392395019531, -0.001983642578125, 0.0010271072387695312, 0.0040378570556640625, 0.007048606872558594, 0.010059356689453125, 0.013070106506347656, 0.016080856323242188, 0.01909160614013672, 0.02210235595703125, 0.02511310577392578, 0.028123855590820312, 0.031134605407714844, 0.034145355224609375, 0.037156105041503906, 0.04016685485839844, 0.04317760467529297, 0.0461883544921875, 0.04919910430908203, 0.05220985412597656, 0.055220603942871094, 0.058231353759765625, 0.061242103576660156, 0.06425285339355469, 0.06726360321044922, 0.07027435302734375, 0.07328510284423828, 0.07629585266113281, 0.07930660247802734, 0.08231735229492188, 0.0853281021118164, 0.08833885192871094, 0.09134960174560547, 0.0943603515625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 10.0, 16.0, 21.0, 19.0, 37.0, 54.0, 85.0, 101.0, 163.0, 149.0, 89.0, 72.0, 58.0, 43.0, 31.0, 13.0, 15.0, 13.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.007998943328857, -3.869391918182373, -3.7307846546173096, -3.592177629470825, -3.4535703659057617, -3.3149633407592773, -3.176356315612793, -3.0377492904663086, -2.899142026901245, -2.7605350017547607, -2.6219277381896973, -2.483320713043213, -2.3447136878967285, -2.206106424331665, -2.0674993991851807, -1.9288922548294067, -1.7902851104736328, -1.6516779661178589, -1.513070821762085, -1.3744637966156006, -1.2358566522598267, -1.0972495079040527, -0.9586424231529236, -0.8200353384017944, -0.6814281940460205, -0.5428210496902466, -0.40421396493911743, -0.2656068503856659, -0.12699973583221436, 0.01160740852355957, 0.15021449327468872, 0.28882157802581787, 0.4274282455444336, 0.5660353899002075, 0.7046424746513367, 0.8432495594024658, 0.9818567037582397, 1.1204638481140137, 1.259070873260498, 1.397678017616272, 1.536285161972046, 1.6748923063278198, 1.8134994506835938, 1.9521064758300781, 2.0907135009765625, 2.229320764541626, 2.3679277896881104, 2.506535053253174, 2.645142078399658, 2.7837491035461426, 2.922356367111206, 3.0609633922576904, 3.199570655822754, 3.3381776809692383, 3.4767847061157227, 3.615391731262207, 3.7539989948272705, 3.892606019973755, 4.031213283538818, 4.169820308685303, 4.308427333831787, 4.44703483581543, 4.585641860961914, 4.724248886108398, 4.862855911254883]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 20.0, 13.0, 18.0, 20.0, 20.0, 18.0, 29.0, 34.0, 53.0, 47.0, 38.0, 42.0, 44.0, 50.0, 47.0, 36.0, 39.0, 47.0, 34.0, 48.0, 34.0, 26.0, 44.0, 28.0, 35.0, 17.0, 17.0, 9.0, 10.0, 6.0, 14.0, 11.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0213634967803955, -1.9487606287002563, -1.8761577606201172, -1.803554892539978, -1.7309520244598389, -1.6583491563796997, -1.5857462882995605, -1.513143539428711, -1.4405405521392822, -1.367937684059143, -1.295334815979004, -1.2227319478988647, -1.1501290798187256, -1.0775262117385864, -1.0049233436584473, -0.9323205351829529, -0.8597177267074585, -0.7871148586273193, -0.7145119905471802, -0.641909122467041, -0.5693062543869019, -0.4967034161090851, -0.4241005778312683, -0.35149770975112915, -0.27889484167099, -0.20629197359085083, -0.13368912041187286, -0.0610862672328949, 0.011516600847244263, 0.08411946892738342, 0.1567223072052002, 0.22932517528533936, 0.3019280433654785, 0.3745309114456177, 0.44713377952575684, 0.519736647605896, 0.5923395156860352, 0.6649423837661743, 0.7375451922416687, 0.8101480603218079, 0.882750928401947, 0.9553537964820862, 1.0279566049575806, 1.1005594730377197, 1.1731623411178589, 1.245765209197998, 1.3183680772781372, 1.3909709453582764, 1.4635738134384155, 1.5361766815185547, 1.6087795495986938, 1.681382417678833, 1.7539852857589722, 1.8265881538391113, 1.899190902709961, 1.9717938899993896, 2.0443966388702393, 2.116999387741089, 2.1896023750305176, 2.262205123901367, 2.334808111190796, 2.4074108600616455, 2.480013847351074, 2.552616596221924, 2.6252195835113525]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 6.0, 6.0, 12.0, 12.0, 12.0, 16.0, 16.0, 24.0, 38.0, 49.0, 105.0, 161.0, 264.0, 410.0, 848.0, 1492.0, 3259.0, 7794.0, 24171.0, 137373.0, 744789.0, 94931.0, 19894.0, 6815.0, 2922.0, 1342.0, 744.0, 385.0, 219.0, 119.0, 88.0, 72.0, 44.0, 28.0, 19.0, 13.0, 12.0, 6.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.01171875, -2.9188232421875, -2.825927734375, -2.7330322265625, -2.64013671875, -2.5472412109375, -2.454345703125, -2.3614501953125, -2.2685546875, -2.1756591796875, -2.082763671875, -1.9898681640625, -1.89697265625, -1.8040771484375, -1.711181640625, -1.6182861328125, -1.525390625, -1.4324951171875, -1.339599609375, -1.2467041015625, -1.15380859375, -1.0609130859375, -0.968017578125, -0.8751220703125, -0.7822265625, -0.6893310546875, -0.596435546875, -0.5035400390625, -0.41064453125, -0.3177490234375, -0.224853515625, -0.1319580078125, -0.0390625, 0.0538330078125, 0.146728515625, 0.2396240234375, 0.33251953125, 0.4254150390625, 0.518310546875, 0.6112060546875, 0.7041015625, 0.7969970703125, 0.889892578125, 0.9827880859375, 1.07568359375, 1.1685791015625, 1.261474609375, 1.3543701171875, 1.447265625, 1.5401611328125, 1.633056640625, 1.7259521484375, 1.81884765625, 1.9117431640625, 2.004638671875, 2.0975341796875, 2.1904296875, 2.2833251953125, 2.376220703125, 2.4691162109375, 2.56201171875, 2.6549072265625, 2.747802734375, 2.8406982421875, 2.93359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 8.0, 7.0, 7.0, 13.0, 7.0, 15.0, 16.0, 19.0, 25.0, 20.0, 26.0, 43.0, 37.0, 33.0, 28.0, 43.0, 44.0, 45.0, 40.0, 46.0, 37.0, 56.0, 37.0, 47.0, 45.0, 39.0, 22.0, 31.0, 28.0, 28.0, 16.0, 15.0, 7.0, 7.0, 9.0, 12.0, 10.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9375, -3.80224609375, -3.6669921875, -3.53173828125, -3.396484375, -3.26123046875, -3.1259765625, -2.99072265625, -2.85546875, -2.72021484375, -2.5849609375, -2.44970703125, -2.314453125, -2.17919921875, -2.0439453125, -1.90869140625, -1.7734375, -1.63818359375, -1.5029296875, -1.36767578125, -1.232421875, -1.09716796875, -0.9619140625, -0.82666015625, -0.69140625, -0.55615234375, -0.4208984375, -0.28564453125, -0.150390625, -0.01513671875, 0.1201171875, 0.25537109375, 0.390625, 0.52587890625, 0.6611328125, 0.79638671875, 0.931640625, 1.06689453125, 1.2021484375, 1.33740234375, 1.47265625, 1.60791015625, 1.7431640625, 1.87841796875, 2.013671875, 2.14892578125, 2.2841796875, 2.41943359375, 2.5546875, 2.68994140625, 2.8251953125, 2.96044921875, 3.095703125, 3.23095703125, 3.3662109375, 3.50146484375, 3.63671875, 3.77197265625, 3.9072265625, 4.04248046875, 4.177734375, 4.31298828125, 4.4482421875, 4.58349609375, 4.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 9.0, 13.0, 17.0, 14.0, 21.0, 39.0, 30.0, 36.0, 59.0, 59.0, 76.0, 135.0, 334.0, 3081.0, 968722.0, 73829.0, 1373.0, 218.0, 103.0, 63.0, 51.0, 48.0, 34.0, 28.0, 18.0, 19.0, 23.0, 22.0, 14.0, 7.0, 5.0, 8.0, 6.0, 8.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.28125, -16.755126953125, -16.22900390625, -15.702880859375, -15.1767578125, -14.650634765625, -14.12451171875, -13.598388671875, -13.072265625, -12.546142578125, -12.02001953125, -11.493896484375, -10.9677734375, -10.441650390625, -9.91552734375, -9.389404296875, -8.86328125, -8.337158203125, -7.81103515625, -7.284912109375, -6.7587890625, -6.232666015625, -5.70654296875, -5.180419921875, -4.654296875, -4.128173828125, -3.60205078125, -3.075927734375, -2.5498046875, -2.023681640625, -1.49755859375, -0.971435546875, -0.4453125, 0.080810546875, 0.60693359375, 1.133056640625, 1.6591796875, 2.185302734375, 2.71142578125, 3.237548828125, 3.763671875, 4.289794921875, 4.81591796875, 5.342041015625, 5.8681640625, 6.394287109375, 6.92041015625, 7.446533203125, 7.97265625, 8.498779296875, 9.02490234375, 9.551025390625, 10.0771484375, 10.603271484375, 11.12939453125, 11.655517578125, 12.181640625, 12.707763671875, 13.23388671875, 13.760009765625, 14.2861328125, 14.812255859375, 15.33837890625, 15.864501953125, 16.390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 1.0, 2.0, 10.0, 8.0, 8.0, 12.0, 11.0, 18.0, 23.0, 35.0, 34.0, 38.0, 37.0, 47.0, 56.0, 48.0, 50.0, 61.0, 49.0, 63.0, 56.0, 53.0, 48.0, 36.0, 37.0, 20.0, 21.0, 17.0, 20.0, 15.0, 13.0, 14.0, 8.0, 6.0, 9.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.26666259765625, -6.0489501953125, -5.83123779296875, -5.613525390625, -5.39581298828125, -5.1781005859375, -4.96038818359375, -4.74267578125, -4.52496337890625, -4.3072509765625, -4.08953857421875, -3.871826171875, -3.65411376953125, -3.4364013671875, -3.21868896484375, -3.0009765625, -2.78326416015625, -2.5655517578125, -2.34783935546875, -2.130126953125, -1.91241455078125, -1.6947021484375, -1.47698974609375, -1.25927734375, -1.04156494140625, -0.8238525390625, -0.60614013671875, -0.388427734375, -0.17071533203125, 0.0469970703125, 0.26470947265625, 0.482421875, 0.70013427734375, 0.9178466796875, 1.13555908203125, 1.353271484375, 1.57098388671875, 1.7886962890625, 2.00640869140625, 2.22412109375, 2.44183349609375, 2.6595458984375, 2.87725830078125, 3.094970703125, 3.31268310546875, 3.5303955078125, 3.74810791015625, 3.9658203125, 4.18353271484375, 4.4012451171875, 4.61895751953125, 4.836669921875, 5.05438232421875, 5.2720947265625, 5.48980712890625, 5.70751953125, 5.92523193359375, 6.1429443359375, 6.36065673828125, 6.578369140625, 6.79608154296875, 7.0137939453125, 7.23150634765625, 7.44921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 13.0, 18.0, 23.0, 49.0, 70.0, 207.0, 1608.0, 496643.0, 547922.0, 1605.0, 214.0, 65.0, 33.0, 15.0, 15.0, 10.0, 10.0, 4.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.3203125, -8.1312255859375, -7.942138671875, -7.7530517578125, -7.56396484375, -7.3748779296875, -7.185791015625, -6.9967041015625, -6.8076171875, -6.6185302734375, -6.429443359375, -6.2403564453125, -6.05126953125, -5.8621826171875, -5.673095703125, -5.4840087890625, -5.294921875, -5.1058349609375, -4.916748046875, -4.7276611328125, -4.53857421875, -4.3494873046875, -4.160400390625, -3.9713134765625, -3.7822265625, -3.5931396484375, -3.404052734375, -3.2149658203125, -3.02587890625, -2.8367919921875, -2.647705078125, -2.4586181640625, -2.26953125, -2.0804443359375, -1.891357421875, -1.7022705078125, -1.51318359375, -1.3240966796875, -1.135009765625, -0.9459228515625, -0.7568359375, -0.5677490234375, -0.378662109375, -0.1895751953125, -0.00048828125, 0.1885986328125, 0.377685546875, 0.5667724609375, 0.755859375, 0.9449462890625, 1.134033203125, 1.3231201171875, 1.51220703125, 1.7012939453125, 1.890380859375, 2.0794677734375, 2.2685546875, 2.4576416015625, 2.646728515625, 2.8358154296875, 3.02490234375, 3.2139892578125, 3.403076171875, 3.5921630859375, 3.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 3.0, 2.0, 5.0, 14.0, 12.0, 26.0, 52.0, 84.0, 208.0, 302.0, 112.0, 61.0, 34.0, 16.0, 16.0, 16.0, 6.0, 9.0, 9.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002713203430175781, -0.00026234984397888184, -0.00025337934494018555, -0.00024440884590148926, -0.00023543834686279297, -0.00022646784782409668, -0.0002174973487854004, -0.0002085268497467041, -0.0001995563507080078, -0.00019058585166931152, -0.00018161535263061523, -0.00017264485359191895, -0.00016367435455322266, -0.00015470385551452637, -0.00014573335647583008, -0.0001367628574371338, -0.0001277923583984375, -0.00011882185935974121, -0.00010985136032104492, -0.00010088086128234863, -9.191036224365234e-05, -8.293986320495605e-05, -7.396936416625977e-05, -6.499886512756348e-05, -5.602836608886719e-05, -4.70578670501709e-05, -3.808736801147461e-05, -2.911686897277832e-05, -2.014636993408203e-05, -1.1175870895385742e-05, -2.205371856689453e-06, 6.765127182006836e-06, 1.5735626220703125e-05, 2.4706125259399414e-05, 3.36766242980957e-05, 4.264712333679199e-05, 5.161762237548828e-05, 6.058812141418457e-05, 6.955862045288086e-05, 7.852911949157715e-05, 8.749961853027344e-05, 9.647011756896973e-05, 0.00010544061660766602, 0.0001144111156463623, 0.0001233816146850586, 0.00013235211372375488, 0.00014132261276245117, 0.00015029311180114746, 0.00015926361083984375, 0.00016823410987854004, 0.00017720460891723633, 0.00018617510795593262, 0.0001951456069946289, 0.0002041161060333252, 0.00021308660507202148, 0.00022205710411071777, 0.00023102760314941406, 0.00023999810218811035, 0.00024896860122680664, 0.00025793910026550293, 0.0002669095993041992, 0.0002758800983428955, 0.0002848505973815918, 0.0002938210964202881, 0.0003027915954589844]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 9.0, 10.0, 3.0, 13.0, 14.0, 19.0, 22.0, 50.0, 116.0, 426.0, 2667.0, 47106.0, 975104.0, 20745.0, 1710.0, 305.0, 80.0, 43.0, 27.0, 18.0, 14.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.078125, -3.962890625, -3.84765625, -3.732421875, -3.6171875, -3.501953125, -3.38671875, -3.271484375, -3.15625, -3.041015625, -2.92578125, -2.810546875, -2.6953125, -2.580078125, -2.46484375, -2.349609375, -2.234375, -2.119140625, -2.00390625, -1.888671875, -1.7734375, -1.658203125, -1.54296875, -1.427734375, -1.3125, -1.197265625, -1.08203125, -0.966796875, -0.8515625, -0.736328125, -0.62109375, -0.505859375, -0.390625, -0.275390625, -0.16015625, -0.044921875, 0.0703125, 0.185546875, 0.30078125, 0.416015625, 0.53125, 0.646484375, 0.76171875, 0.876953125, 0.9921875, 1.107421875, 1.22265625, 1.337890625, 1.453125, 1.568359375, 1.68359375, 1.798828125, 1.9140625, 2.029296875, 2.14453125, 2.259765625, 2.375, 2.490234375, 2.60546875, 2.720703125, 2.8359375, 2.951171875, 3.06640625, 3.181640625, 3.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 7.0, 13.0, 20.0, 16.0, 28.0, 42.0, 36.0, 61.0, 98.0, 164.0, 157.0, 81.0, 55.0, 44.0, 36.0, 24.0, 17.0, 12.0, 16.0, 14.0, 8.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413330078125, -0.3984642028808594, -0.38359832763671875, -0.3687324523925781, -0.3538665771484375, -0.3390007019042969, -0.32413482666015625, -0.3092689514160156, -0.294403076171875, -0.2795372009277344, -0.26467132568359375, -0.24980545043945312, -0.2349395751953125, -0.22007369995117188, -0.20520782470703125, -0.19034194946289062, -0.17547607421875, -0.16061019897460938, -0.14574432373046875, -0.13087844848632812, -0.1160125732421875, -0.10114669799804688, -0.08628082275390625, -0.07141494750976562, -0.056549072265625, -0.041683197021484375, -0.02681732177734375, -0.011951446533203125, 0.0029144287109375, 0.017780303955078125, 0.03264617919921875, 0.047512054443359375, 0.0623779296875, 0.07724380493164062, 0.09210968017578125, 0.10697555541992188, 0.1218414306640625, 0.13670730590820312, 0.15157318115234375, 0.16643905639648438, 0.181304931640625, 0.19617080688476562, 0.21103668212890625, 0.22590255737304688, 0.2407684326171875, 0.2556343078613281, 0.27050018310546875, 0.2853660583496094, 0.30023193359375, 0.3150978088378906, 0.32996368408203125, 0.3448295593261719, 0.3596954345703125, 0.3745613098144531, 0.38942718505859375, 0.4042930603027344, 0.419158935546875, 0.4340248107910156, 0.44889068603515625, 0.4637565612792969, 0.4786224365234375, 0.4934883117675781, 0.5083541870117188, 0.5232200622558594, 0.5380859375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 11.0, 15.0, 14.0, 33.0, 38.0, 74.0, 84.0, 130.0, 111.0, 123.0, 87.0, 85.0, 53.0, 45.0, 31.0, 20.0, 12.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.201132774353027, -10.951082229614258, -10.701031684875488, -10.450981140136719, -10.200931549072266, -9.950881004333496, -9.700830459594727, -9.450779914855957, -9.200729370117188, -8.950678825378418, -8.700628280639648, -8.450578689575195, -8.200528144836426, -7.950477600097656, -7.700427055358887, -7.450376510620117, -7.200326442718506, -6.950275897979736, -6.700225830078125, -6.4501752853393555, -6.200124740600586, -5.950074195861816, -5.700024127960205, -5.4499735832214355, -5.199923515319824, -4.949872970581055, -4.699822902679443, -4.449772357940674, -4.199721813201904, -3.949671506881714, -3.6996212005615234, -3.449570655822754, -3.199519634246826, -2.9494693279266357, -2.699418783187866, -2.449368476867676, -2.1993179321289062, -1.9492676258087158, -1.6992173194885254, -1.4491668939590454, -1.1991164684295654, -0.9490660429000854, -0.6990156769752502, -0.44896531105041504, -0.19891488552093506, 0.05113554000854492, 0.30118584632873535, 0.5512362718582153, 0.8012866973876953, 1.0513371229171753, 1.3013875484466553, 1.5514378547668457, 1.8014882802963257, 2.0515387058258057, 2.301589012145996, 2.5516395568847656, 2.801689863204956, 3.0517401695251465, 3.301790714263916, 3.5518410205841064, 3.801891326904297, 4.051941871643066, 4.301992416381836, 4.552042484283447, 4.802093029022217]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 8.0, 10.0, 7.0, 13.0, 22.0, 24.0, 39.0, 31.0, 36.0, 36.0, 42.0, 38.0, 60.0, 53.0, 57.0, 52.0, 49.0, 50.0, 63.0, 38.0, 39.0, 40.0, 43.0, 24.0, 20.0, 15.0, 14.0, 17.0, 12.0, 8.0, 15.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.479508399963379, -9.19746208190918, -8.915416717529297, -8.633370399475098, -8.351324081420898, -8.0692777633667, -7.787231922149658, -7.505186080932617, -7.223139762878418, -6.941093444824219, -6.659047603607178, -6.377001762390137, -6.0949554443359375, -5.812909126281738, -5.530863285064697, -5.248817443847656, -4.966771125793457, -4.684724807739258, -4.402678966522217, -4.120633125305176, -3.8385868072509766, -3.5565407276153564, -3.2744946479797363, -2.992448568344116, -2.710402488708496, -2.428356409072876, -2.146310329437256, -1.8642642498016357, -1.5822181701660156, -1.3001720905303955, -1.0181260108947754, -0.7360799312591553, -0.45403480529785156, -0.17198872566223145, 0.11005735397338867, 0.3921034336090088, 0.6741495132446289, 0.956195592880249, 1.2382416725158691, 1.5202877521514893, 1.8023338317871094, 2.0843799114227295, 2.3664259910583496, 2.6484720706939697, 2.93051815032959, 3.21256422996521, 3.49461030960083, 3.77665638923645, 4.05870246887207, 4.3407487869262695, 4.6227946281433105, 4.904840469360352, 5.186886787414551, 5.46893310546875, 5.750978946685791, 6.033024787902832, 6.315071105957031, 6.5971174240112305, 6.8791632652282715, 7.1612091064453125, 7.443255424499512, 7.725301742553711, 8.007347106933594, 8.289393424987793, 8.571439743041992]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 8.0, 3.0, 5.0, 13.0, 14.0, 23.0, 29.0, 40.0, 56.0, 88.0, 110.0, 141.0, 235.0, 340.0, 599.0, 971.0, 1939.0, 3784.0, 8958.0, 26503.0, 166063.0, 1764941.0, 1994016.0, 179854.0, 28166.0, 8992.0, 3796.0, 1800.0, 1052.0, 589.0, 368.0, 241.0, 167.0, 102.0, 87.0, 50.0, 28.0, 38.0, 22.0, 17.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.36328125, -5.19580078125, -5.0283203125, -4.86083984375, -4.693359375, -4.52587890625, -4.3583984375, -4.19091796875, -4.0234375, -3.85595703125, -3.6884765625, -3.52099609375, -3.353515625, -3.18603515625, -3.0185546875, -2.85107421875, -2.68359375, -2.51611328125, -2.3486328125, -2.18115234375, -2.013671875, -1.84619140625, -1.6787109375, -1.51123046875, -1.34375, -1.17626953125, -1.0087890625, -0.84130859375, -0.673828125, -0.50634765625, -0.3388671875, -0.17138671875, -0.00390625, 0.16357421875, 0.3310546875, 0.49853515625, 0.666015625, 0.83349609375, 1.0009765625, 1.16845703125, 1.3359375, 1.50341796875, 1.6708984375, 1.83837890625, 2.005859375, 2.17333984375, 2.3408203125, 2.50830078125, 2.67578125, 2.84326171875, 3.0107421875, 3.17822265625, 3.345703125, 3.51318359375, 3.6806640625, 3.84814453125, 4.015625, 4.18310546875, 4.3505859375, 4.51806640625, 4.685546875, 4.85302734375, 5.0205078125, 5.18798828125, 5.35546875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 15.0, 16.0, 19.0, 26.0, 27.0, 40.0, 43.0, 35.0, 38.0, 44.0, 43.0, 69.0, 55.0, 67.0, 57.0, 43.0, 51.0, 39.0, 44.0, 48.0, 34.0, 24.0, 22.0, 24.0, 13.0, 8.0, 14.0, 8.0, 7.0, 11.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.06512451171875, -2.9642333984375, -2.86334228515625, -2.762451171875, -2.66156005859375, -2.5606689453125, -2.45977783203125, -2.35888671875, -2.25799560546875, -2.1571044921875, -2.05621337890625, -1.955322265625, -1.85443115234375, -1.7535400390625, -1.65264892578125, -1.5517578125, -1.45086669921875, -1.3499755859375, -1.24908447265625, -1.148193359375, -1.04730224609375, -0.9464111328125, -0.84552001953125, -0.74462890625, -0.64373779296875, -0.5428466796875, -0.44195556640625, -0.341064453125, -0.24017333984375, -0.1392822265625, -0.03839111328125, 0.0625, 0.16339111328125, 0.2642822265625, 0.36517333984375, 0.466064453125, 0.56695556640625, 0.6678466796875, 0.76873779296875, 0.86962890625, 0.97052001953125, 1.0714111328125, 1.17230224609375, 1.273193359375, 1.37408447265625, 1.4749755859375, 1.57586669921875, 1.6767578125, 1.77764892578125, 1.8785400390625, 1.97943115234375, 2.080322265625, 2.18121337890625, 2.2821044921875, 2.38299560546875, 2.48388671875, 2.58477783203125, 2.6856689453125, 2.78656005859375, 2.887451171875, 2.98834228515625, 3.0892333984375, 3.19012451171875, 3.291015625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 4.0, 4.0, 13.0, 12.0, 20.0, 34.0, 53.0, 89.0, 157.0, 370.0, 759.0, 2316.0, 13677.0, 553655.0, 3589196.0, 28526.0, 3491.0, 1012.0, 398.0, 200.0, 109.0, 64.0, 31.0, 27.0, 18.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.40625, -15.99755859375, -15.5888671875, -15.18017578125, -14.771484375, -14.36279296875, -13.9541015625, -13.54541015625, -13.13671875, -12.72802734375, -12.3193359375, -11.91064453125, -11.501953125, -11.09326171875, -10.6845703125, -10.27587890625, -9.8671875, -9.45849609375, -9.0498046875, -8.64111328125, -8.232421875, -7.82373046875, -7.4150390625, -7.00634765625, -6.59765625, -6.18896484375, -5.7802734375, -5.37158203125, -4.962890625, -4.55419921875, -4.1455078125, -3.73681640625, -3.328125, -2.91943359375, -2.5107421875, -2.10205078125, -1.693359375, -1.28466796875, -0.8759765625, -0.46728515625, -0.05859375, 0.35009765625, 0.7587890625, 1.16748046875, 1.576171875, 1.98486328125, 2.3935546875, 2.80224609375, 3.2109375, 3.61962890625, 4.0283203125, 4.43701171875, 4.845703125, 5.25439453125, 5.6630859375, 6.07177734375, 6.48046875, 6.88916015625, 7.2978515625, 7.70654296875, 8.115234375, 8.52392578125, 8.9326171875, 9.34130859375, 9.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 13.0, 20.0, 21.0, 26.0, 49.0, 69.0, 91.0, 129.0, 260.0, 462.0, 808.0, 844.0, 506.0, 295.0, 170.0, 80.0, 61.0, 38.0, 32.0, 25.0, 21.0, 13.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2890625, -2.22900390625, -2.1689453125, -2.10888671875, -2.048828125, -1.98876953125, -1.9287109375, -1.86865234375, -1.80859375, -1.74853515625, -1.6884765625, -1.62841796875, -1.568359375, -1.50830078125, -1.4482421875, -1.38818359375, -1.328125, -1.26806640625, -1.2080078125, -1.14794921875, -1.087890625, -1.02783203125, -0.9677734375, -0.90771484375, -0.84765625, -0.78759765625, -0.7275390625, -0.66748046875, -0.607421875, -0.54736328125, -0.4873046875, -0.42724609375, -0.3671875, -0.30712890625, -0.2470703125, -0.18701171875, -0.126953125, -0.06689453125, -0.0068359375, 0.05322265625, 0.11328125, 0.17333984375, 0.2333984375, 0.29345703125, 0.353515625, 0.41357421875, 0.4736328125, 0.53369140625, 0.59375, 0.65380859375, 0.7138671875, 0.77392578125, 0.833984375, 0.89404296875, 0.9541015625, 1.01416015625, 1.07421875, 1.13427734375, 1.1943359375, 1.25439453125, 1.314453125, 1.37451171875, 1.4345703125, 1.49462890625, 1.5546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 10.0, 14.0, 7.0, 19.0, 27.0, 29.0, 37.0, 41.0, 77.0, 77.0, 97.0, 92.0, 84.0, 77.0, 51.0, 66.0, 42.0, 38.0, 22.0, 21.0, 11.0, 13.0, 13.0, 7.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.749384880065918, -4.598608016967773, -4.447831630706787, -4.297054767608643, -4.146277904510498, -3.9955012798309326, -3.844724655151367, -3.6939477920532227, -3.5431711673736572, -3.392394542694092, -3.2416176795959473, -3.090841054916382, -2.9400644302368164, -2.789287567138672, -2.6385109424591064, -2.487734317779541, -2.3369574546813965, -2.186180830001831, -2.0354039669036865, -1.884627342224121, -1.7338505983352661, -1.5830738544464111, -1.4322972297668457, -1.2815204858779907, -1.1307437419891357, -0.9799669981002808, -0.8291903138160706, -0.6784136295318604, -0.5276368856430054, -0.3768601417541504, -0.22608345746994019, -0.07530677318572998, 0.075469970703125, 0.2262466847896576, 0.3770233988761902, 0.5278000831604004, 0.6785768270492554, 0.8293535709381104, 0.9801302552223206, 1.1309069395065308, 1.2816836833953857, 1.4324604272842407, 1.5832371711730957, 1.7340137958526611, 1.8847905397415161, 2.035567283630371, 2.1863439083099365, 2.337120532989502, 2.4878973960876465, 2.638674020767212, 2.7894508838653564, 2.940227508544922, 3.0910043716430664, 3.241780996322632, 3.3925576210021973, 3.543334484100342, 3.6941111087799072, 3.8448877334594727, 3.995664596557617, 4.146441459655762, 4.297217845916748, 4.447994709014893, 4.598771572113037, 4.749547958374023, 4.900324821472168]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 7.0, 1.0, 7.0, 12.0, 5.0, 10.0, 17.0, 19.0, 18.0, 28.0, 25.0, 31.0, 28.0, 40.0, 42.0, 39.0, 33.0, 46.0, 49.0, 32.0, 39.0, 33.0, 42.0, 34.0, 37.0, 36.0, 28.0, 27.0, 26.0, 25.0, 33.0, 32.0, 17.0, 18.0, 13.0, 11.0, 8.0, 13.0, 13.0, 10.0, 3.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5517444610595703, -2.4590368270874023, -2.3663289546966553, -2.2736213207244873, -2.1809134483337402, -2.0882058143615723, -1.9954981803894043, -1.9027904272079468, -1.8100826740264893, -1.7173749208450317, -1.6246671676635742, -1.5319595336914062, -1.4392517805099487, -1.3465440273284912, -1.2538363933563232, -1.1611286401748657, -1.0684208869934082, -0.9757131338119507, -0.8830054402351379, -0.7902977466583252, -0.6975899934768677, -0.6048822402954102, -0.5121745467185974, -0.41946685314178467, -0.32675909996032715, -0.23405137658119202, -0.14134365320205688, -0.04863592982292175, 0.04407179355621338, 0.1367795169353485, 0.22948724031448364, 0.3221949338912964, 0.4149026870727539, 0.5076104402542114, 0.6003181338310242, 0.6930258274078369, 0.7857335805892944, 0.878441333770752, 0.9711490273475647, 1.0638567209243774, 1.156564474105835, 1.2492722272872925, 1.34197998046875, 1.434687614440918, 1.5273953676223755, 1.620103120803833, 1.712810754776001, 1.8055185079574585, 1.898226261138916, 1.9909340143203735, 2.083641767501831, 2.176349401473999, 2.269057273864746, 2.361764907836914, 2.454472541809082, 2.54718017578125, 2.639888048171997, 2.732595682144165, 2.825303554534912, 2.91801118850708, 3.010718822479248, 3.103426694869995, 3.196134328842163, 3.28884220123291, 3.381549835205078]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 8.0, 7.0, 5.0, 19.0, 23.0, 18.0, 45.0, 70.0, 125.0, 213.0, 397.0, 764.0, 1481.0, 3241.0, 7701.0, 19770.0, 61296.0, 260682.0, 500706.0, 132744.0, 36419.0, 12838.0, 5220.0, 2330.0, 1172.0, 548.0, 262.0, 170.0, 100.0, 62.0, 38.0, 27.0, 12.0, 11.0, 15.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.017578125, -1.955078125, -1.892578125, -1.830078125, -1.767578125, -1.705078125, -1.642578125, -1.580078125, -1.517578125, -1.455078125, -1.392578125, -1.330078125, -1.267578125, -1.205078125, -1.142578125, -1.080078125, -1.017578125, -0.955078125, -0.892578125, -0.830078125, -0.767578125, -0.705078125, -0.642578125, -0.580078125, -0.517578125, -0.455078125, -0.392578125, -0.330078125, -0.267578125, -0.205078125, -0.142578125, -0.080078125, -0.017578125, 0.044921875, 0.107421875, 0.169921875, 0.232421875, 0.294921875, 0.357421875, 0.419921875, 0.482421875, 0.544921875, 0.607421875, 0.669921875, 0.732421875, 0.794921875, 0.857421875, 0.919921875, 0.982421875, 1.044921875, 1.107421875, 1.169921875, 1.232421875, 1.294921875, 1.357421875, 1.419921875, 1.482421875, 1.544921875, 1.607421875, 1.669921875, 1.732421875, 1.794921875, 1.857421875, 1.919921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 9.0, 13.0, 22.0, 21.0, 25.0, 29.0, 37.0, 40.0, 48.0, 48.0, 43.0, 56.0, 53.0, 49.0, 55.0, 38.0, 50.0, 48.0, 45.0, 41.0, 26.0, 31.0, 32.0, 23.0, 17.0, 11.0, 19.0, 15.0, 8.0, 10.0, 5.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9223175048828125, -1.853424072265625, -1.7845306396484375, -1.71563720703125, -1.6467437744140625, -1.577850341796875, -1.5089569091796875, -1.4400634765625, -1.3711700439453125, -1.302276611328125, -1.2333831787109375, -1.16448974609375, -1.0955963134765625, -1.026702880859375, -0.9578094482421875, -0.888916015625, -0.8200225830078125, -0.751129150390625, -0.6822357177734375, -0.61334228515625, -0.5444488525390625, -0.475555419921875, -0.4066619873046875, -0.3377685546875, -0.2688751220703125, -0.199981689453125, -0.1310882568359375, -0.06219482421875, 0.0066986083984375, 0.075592041015625, 0.1444854736328125, 0.21337890625, 0.2822723388671875, 0.351165771484375, 0.4200592041015625, 0.48895263671875, 0.5578460693359375, 0.626739501953125, 0.6956329345703125, 0.7645263671875, 0.8334197998046875, 0.902313232421875, 0.9712066650390625, 1.04010009765625, 1.1089935302734375, 1.177886962890625, 1.2467803955078125, 1.315673828125, 1.3845672607421875, 1.453460693359375, 1.5223541259765625, 1.59124755859375, 1.6601409912109375, 1.729034423828125, 1.7979278564453125, 1.8668212890625, 1.9357147216796875, 2.004608154296875, 2.0735015869140625, 2.14239501953125, 2.2112884521484375, 2.280181884765625, 2.3490753173828125, 2.41796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 12.0, 9.0, 7.0, 18.0, 45.0, 56.0, 79.0, 154.0, 287.0, 543.0, 1265.0, 3265.0, 9894.0, 38741.0, 230431.0, 615349.0, 114611.0, 22825.0, 6492.0, 2382.0, 944.0, 486.0, 249.0, 152.0, 83.0, 63.0, 42.0, 23.0, 17.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.623046875, -2.55633544921875, -2.4896240234375, -2.42291259765625, -2.356201171875, -2.28948974609375, -2.2227783203125, -2.15606689453125, -2.08935546875, -2.02264404296875, -1.9559326171875, -1.88922119140625, -1.822509765625, -1.75579833984375, -1.6890869140625, -1.62237548828125, -1.5556640625, -1.48895263671875, -1.4222412109375, -1.35552978515625, -1.288818359375, -1.22210693359375, -1.1553955078125, -1.08868408203125, -1.02197265625, -0.95526123046875, -0.8885498046875, -0.82183837890625, -0.755126953125, -0.68841552734375, -0.6217041015625, -0.55499267578125, -0.48828125, -0.42156982421875, -0.3548583984375, -0.28814697265625, -0.221435546875, -0.15472412109375, -0.0880126953125, -0.02130126953125, 0.04541015625, 0.11212158203125, 0.1788330078125, 0.24554443359375, 0.312255859375, 0.37896728515625, 0.4456787109375, 0.51239013671875, 0.5791015625, 0.64581298828125, 0.7125244140625, 0.77923583984375, 0.845947265625, 0.91265869140625, 0.9793701171875, 1.04608154296875, 1.11279296875, 1.17950439453125, 1.2462158203125, 1.31292724609375, 1.379638671875, 1.44635009765625, 1.5130615234375, 1.57977294921875, 1.646484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 13.0, 17.0, 20.0, 20.0, 31.0, 23.0, 31.0, 28.0, 42.0, 54.0, 49.0, 50.0, 55.0, 58.0, 65.0, 52.0, 40.0, 43.0, 38.0, 42.0, 34.0, 30.0, 22.0, 24.0, 19.0, 9.0, 10.0, 8.0, 16.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.19140625, -4.05816650390625, -3.9249267578125, -3.79168701171875, -3.658447265625, -3.52520751953125, -3.3919677734375, -3.25872802734375, -3.12548828125, -2.99224853515625, -2.8590087890625, -2.72576904296875, -2.592529296875, -2.45928955078125, -2.3260498046875, -2.19281005859375, -2.0595703125, -1.92633056640625, -1.7930908203125, -1.65985107421875, -1.526611328125, -1.39337158203125, -1.2601318359375, -1.12689208984375, -0.99365234375, -0.86041259765625, -0.7271728515625, -0.59393310546875, -0.460693359375, -0.32745361328125, -0.1942138671875, -0.06097412109375, 0.072265625, 0.20550537109375, 0.3387451171875, 0.47198486328125, 0.605224609375, 0.73846435546875, 0.8717041015625, 1.00494384765625, 1.13818359375, 1.27142333984375, 1.4046630859375, 1.53790283203125, 1.671142578125, 1.80438232421875, 1.9376220703125, 2.07086181640625, 2.2041015625, 2.33734130859375, 2.4705810546875, 2.60382080078125, 2.737060546875, 2.87030029296875, 3.0035400390625, 3.13677978515625, 3.27001953125, 3.40325927734375, 3.5364990234375, 3.66973876953125, 3.802978515625, 3.93621826171875, 4.0694580078125, 4.20269775390625, 4.3359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 11.0, 7.0, 8.0, 24.0, 43.0, 45.0, 74.0, 115.0, 190.0, 396.0, 725.0, 1423.0, 3506.0, 9936.0, 42035.0, 444161.0, 483081.0, 45559.0, 10358.0, 3622.0, 1593.0, 723.0, 362.0, 190.0, 145.0, 70.0, 42.0, 39.0, 21.0, 16.0, 10.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8359375, -0.8127288818359375, -0.789520263671875, -0.7663116455078125, -0.74310302734375, -0.7198944091796875, -0.696685791015625, -0.6734771728515625, -0.6502685546875, -0.6270599365234375, -0.603851318359375, -0.5806427001953125, -0.55743408203125, -0.5342254638671875, -0.511016845703125, -0.4878082275390625, -0.464599609375, -0.4413909912109375, -0.418182373046875, -0.3949737548828125, -0.37176513671875, -0.3485565185546875, -0.325347900390625, -0.3021392822265625, -0.2789306640625, -0.2557220458984375, -0.232513427734375, -0.2093048095703125, -0.18609619140625, -0.1628875732421875, -0.139678955078125, -0.1164703369140625, -0.09326171875, -0.0700531005859375, -0.046844482421875, -0.0236358642578125, -0.00042724609375, 0.0227813720703125, 0.045989990234375, 0.0691986083984375, 0.0924072265625, 0.1156158447265625, 0.138824462890625, 0.1620330810546875, 0.18524169921875, 0.2084503173828125, 0.231658935546875, 0.2548675537109375, 0.278076171875, 0.3012847900390625, 0.324493408203125, 0.3477020263671875, 0.37091064453125, 0.3941192626953125, 0.417327880859375, 0.4405364990234375, 0.4637451171875, 0.4869537353515625, 0.510162353515625, 0.5333709716796875, 0.55657958984375, 0.5797882080078125, 0.602996826171875, 0.6262054443359375, 0.6494140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 16.0, 21.0, 17.0, 45.0, 91.0, 245.0, 261.0, 147.0, 65.0, 29.0, 14.0, 14.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007615089416503906, -0.0007378607988357544, -0.0007142126560211182, -0.0006905645132064819, -0.0006669163703918457, -0.0006432682275772095, -0.0006196200847625732, -0.000595971941947937, -0.0005723237991333008, -0.0005486756563186646, -0.0005250275135040283, -0.0005013793706893921, -0.00047773122787475586, -0.00045408308506011963, -0.0004304349422454834, -0.00040678679943084717, -0.00038313865661621094, -0.0003594905138015747, -0.0003358423709869385, -0.00031219422817230225, -0.000288546085357666, -0.0002648979425430298, -0.00024124979972839355, -0.00021760165691375732, -0.0001939535140991211, -0.00017030537128448486, -0.00014665722846984863, -0.0001230090856552124, -9.936094284057617e-05, -7.571280002593994e-05, -5.206465721130371e-05, -2.841651439666748e-05, -4.76837158203125e-06, 1.887977123260498e-05, 4.252791404724121e-05, 6.617605686187744e-05, 8.982419967651367e-05, 0.0001134723424911499, 0.00013712048530578613, 0.00016076862812042236, 0.0001844167709350586, 0.00020806491374969482, 0.00023171305656433105, 0.0002553611993789673, 0.0002790093421936035, 0.00030265748500823975, 0.000326305627822876, 0.0003499537706375122, 0.00037360191345214844, 0.00039725005626678467, 0.0004208981990814209, 0.00044454634189605713, 0.00046819448471069336, 0.0004918426275253296, 0.0005154907703399658, 0.000539138913154602, 0.0005627870559692383, 0.0005864351987838745, 0.0006100833415985107, 0.000633731484413147, 0.0006573796272277832, 0.0006810277700424194, 0.0007046759128570557, 0.0007283240556716919, 0.0007519721984863281]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 2.0, 5.0, 7.0, 9.0, 10.0, 22.0, 35.0, 48.0, 67.0, 115.0, 142.0, 277.0, 417.0, 616.0, 859.0, 1639.0, 2773.0, 5432.0, 11644.0, 32765.0, 133909.0, 544002.0, 233640.0, 49136.0, 15757.0, 6835.0, 3360.0, 1898.0, 1130.0, 671.0, 461.0, 266.0, 190.0, 120.0, 81.0, 63.0, 46.0, 28.0, 15.0, 18.0, 5.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.486572265625, -0.4716758728027344, -0.45677947998046875, -0.4418830871582031, -0.4269866943359375, -0.4120903015136719, -0.39719390869140625, -0.3822975158691406, -0.367401123046875, -0.3525047302246094, -0.33760833740234375, -0.3227119445800781, -0.3078155517578125, -0.2929191589355469, -0.27802276611328125, -0.2631263732910156, -0.24822998046875, -0.23333358764648438, -0.21843719482421875, -0.20354080200195312, -0.1886444091796875, -0.17374801635742188, -0.15885162353515625, -0.14395523071289062, -0.129058837890625, -0.11416244506835938, -0.09926605224609375, -0.08436965942382812, -0.0694732666015625, -0.054576873779296875, -0.03968048095703125, -0.024784088134765625, -0.0098876953125, 0.005008697509765625, 0.01990509033203125, 0.034801483154296875, 0.0496978759765625, 0.06459426879882812, 0.07949066162109375, 0.09438705444335938, 0.109283447265625, 0.12417984008789062, 0.13907623291015625, 0.15397262573242188, 0.1688690185546875, 0.18376541137695312, 0.19866180419921875, 0.21355819702148438, 0.22845458984375, 0.24335098266601562, 0.25824737548828125, 0.2731437683105469, 0.2880401611328125, 0.3029365539550781, 0.31783294677734375, 0.3327293395996094, 0.347625732421875, 0.3625221252441406, 0.37741851806640625, 0.3923149108886719, 0.4072113037109375, 0.4221076965332031, 0.43700408935546875, 0.4519004821777344, 0.466796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 7.0, 16.0, 20.0, 20.0, 28.0, 39.0, 60.0, 61.0, 94.0, 102.0, 104.0, 98.0, 94.0, 58.0, 44.0, 33.0, 24.0, 16.0, 12.0, 10.0, 8.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.1349649429321289, -0.1308917999267578, -0.12681865692138672, -0.12274551391601562, -0.11867237091064453, -0.11459922790527344, -0.11052608489990234, -0.10645294189453125, -0.10237979888916016, -0.09830665588378906, -0.09423351287841797, -0.09016036987304688, -0.08608722686767578, -0.08201408386230469, -0.0779409408569336, -0.0738677978515625, -0.0697946548461914, -0.06572151184082031, -0.06164836883544922, -0.057575225830078125, -0.05350208282470703, -0.04942893981933594, -0.045355796813964844, -0.04128265380859375, -0.037209510803222656, -0.03313636779785156, -0.02906322479248047, -0.024990081787109375, -0.02091693878173828, -0.016843795776367188, -0.012770652770996094, -0.008697509765625, -0.004624366760253906, -0.0005512237548828125, 0.0035219192504882812, 0.007595062255859375, 0.011668205261230469, 0.015741348266601562, 0.019814491271972656, 0.02388763427734375, 0.027960777282714844, 0.03203392028808594, 0.03610706329345703, 0.040180206298828125, 0.04425334930419922, 0.04832649230957031, 0.052399635314941406, 0.0564727783203125, 0.060545921325683594, 0.06461906433105469, 0.06869220733642578, 0.07276535034179688, 0.07683849334716797, 0.08091163635253906, 0.08498477935791016, 0.08905792236328125, 0.09313106536865234, 0.09720420837402344, 0.10127735137939453, 0.10535049438476562, 0.10942363739013672, 0.11349678039550781, 0.1175699234008789, 0.12164306640625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 14.0, 11.0, 15.0, 29.0, 28.0, 44.0, 61.0, 85.0, 108.0, 119.0, 82.0, 80.0, 85.0, 40.0, 54.0, 40.0, 22.0, 15.0, 14.0, 12.0, 8.0, 6.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.452235221862793, -3.3555376529693604, -3.2588400840759277, -3.162142515182495, -3.0654449462890625, -2.96874737739563, -2.8720498085021973, -2.7753524780273438, -2.678654670715332, -2.5819571018218994, -2.485259532928467, -2.388561964035034, -2.2918643951416016, -2.195166826248169, -2.0984692573547363, -2.001771926879883, -1.9050743579864502, -1.8083767890930176, -1.711679220199585, -1.6149816513061523, -1.5182840824127197, -1.421586513519287, -1.324889063835144, -1.2281914949417114, -1.1314939260482788, -1.0347963571548462, -0.9380987882614136, -0.8414012789726257, -0.7447037100791931, -0.6480061411857605, -0.5513086318969727, -0.45461106300354004, -0.3579132556915283, -0.2612156867980957, -0.16451814770698547, -0.06782060861587524, 0.028876960277557373, 0.12557452917099, 0.22227203845977783, 0.31896960735321045, 0.41566717624664307, 0.5123647451400757, 0.6090623140335083, 0.7057598233222961, 0.8024573922157288, 0.8991549611091614, 0.9958524703979492, 1.0925500392913818, 1.1892476081848145, 1.285945177078247, 1.3826427459716797, 1.4793403148651123, 1.576037883758545, 1.6727354526519775, 1.7694329023361206, 1.8661304712295532, 1.9628280401229858, 2.059525489807129, 2.1562230587005615, 2.252920627593994, 2.3496181964874268, 2.4463157653808594, 2.543013334274292, 2.6397109031677246, 2.7364084720611572]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 9.0, 10.0, 14.0, 11.0, 22.0, 18.0, 21.0, 23.0, 25.0, 31.0, 34.0, 38.0, 43.0, 35.0, 50.0, 40.0, 44.0, 44.0, 48.0, 43.0, 28.0, 35.0, 39.0, 29.0, 28.0, 23.0, 26.0, 27.0, 26.0, 23.0, 17.0, 13.0, 10.0, 11.0, 11.0, 11.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.466634750366211, -1.4116249084472656, -1.3566149473190308, -1.3016051054000854, -1.2465951442718506, -1.1915853023529053, -1.13657546043396, -1.081565499305725, -1.0265555381774902, -0.9715456366539001, -0.9165357351303101, -0.8615258932113647, -0.8065159320831299, -0.7515060901641846, -0.6964961886405945, -0.6414862871170044, -0.5864764451980591, -0.531466543674469, -0.4764566421508789, -0.4214467704296112, -0.3664368689060211, -0.31142696738243103, -0.25641709566116333, -0.20140719413757324, -0.14639729261398315, -0.09138739854097366, -0.03637750446796417, 0.01863238215446472, 0.07364228367805481, 0.1286521852016449, 0.1836620569229126, 0.23867195844650269, 0.2936818599700928, 0.34869176149368286, 0.40370166301727295, 0.45871153473854065, 0.5137214660644531, 0.5687313079833984, 0.6237412095069885, 0.6787511110305786, 0.7337610125541687, 0.7887709140777588, 0.8437808156013489, 0.898790717124939, 0.9538005590438843, 1.0088105201721191, 1.0638203620910645, 1.1188302040100098, 1.1738401651382446, 1.22885000705719, 1.2838599681854248, 1.3388698101043701, 1.393879771232605, 1.4488896131515503, 1.5038995742797852, 1.5589094161987305, 1.6139192581176758, 1.668929100036621, 1.723939061164856, 1.7789489030838013, 1.8339588642120361, 1.8889687061309814, 1.9439785480499268, 1.9989885091781616, 2.0539984703063965]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 13.0, 20.0, 24.0, 41.0, 48.0, 73.0, 110.0, 158.0, 219.0, 359.0, 494.0, 704.0, 1111.0, 1684.0, 2869.0, 5376.0, 10567.0, 26837.0, 84821.0, 383901.0, 391552.0, 86399.0, 27003.0, 10953.0, 5218.0, 2919.0, 1689.0, 1129.0, 721.0, 488.0, 383.0, 198.0, 158.0, 104.0, 81.0, 43.0, 25.0, 28.0, 13.0, 6.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.8027496337890625, -1.733428955078125, -1.6641082763671875, -1.59478759765625, -1.5254669189453125, -1.456146240234375, -1.3868255615234375, -1.3175048828125, -1.2481842041015625, -1.178863525390625, -1.1095428466796875, -1.04022216796875, -0.9709014892578125, -0.901580810546875, -0.8322601318359375, -0.762939453125, -0.6936187744140625, -0.624298095703125, -0.5549774169921875, -0.48565673828125, -0.4163360595703125, -0.347015380859375, -0.2776947021484375, -0.2083740234375, -0.1390533447265625, -0.069732666015625, -0.0004119873046875, 0.06890869140625, 0.1382293701171875, 0.207550048828125, 0.2768707275390625, 0.34619140625, 0.4155120849609375, 0.484832763671875, 0.5541534423828125, 0.62347412109375, 0.6927947998046875, 0.762115478515625, 0.8314361572265625, 0.9007568359375, 0.9700775146484375, 1.039398193359375, 1.1087188720703125, 1.17803955078125, 1.2473602294921875, 1.316680908203125, 1.3860015869140625, 1.455322265625, 1.5246429443359375, 1.593963623046875, 1.6632843017578125, 1.73260498046875, 1.8019256591796875, 1.871246337890625, 1.9405670166015625, 2.0098876953125, 2.0792083740234375, 2.148529052734375, 2.2178497314453125, 2.28717041015625, 2.3564910888671875, 2.425811767578125, 2.4951324462890625, 2.564453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 8.0, 7.0, 9.0, 14.0, 17.0, 22.0, 31.0, 24.0, 36.0, 29.0, 28.0, 31.0, 45.0, 48.0, 41.0, 43.0, 47.0, 46.0, 49.0, 55.0, 33.0, 32.0, 33.0, 29.0, 23.0, 35.0, 27.0, 18.0, 21.0, 18.0, 17.0, 6.0, 17.0, 10.0, 9.0, 3.0, 10.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0625, -2.94573974609375, -2.8289794921875, -2.71221923828125, -2.595458984375, -2.47869873046875, -2.3619384765625, -2.24517822265625, -2.12841796875, -2.01165771484375, -1.8948974609375, -1.77813720703125, -1.661376953125, -1.54461669921875, -1.4278564453125, -1.31109619140625, -1.1943359375, -1.07757568359375, -0.9608154296875, -0.84405517578125, -0.727294921875, -0.61053466796875, -0.4937744140625, -0.37701416015625, -0.26025390625, -0.14349365234375, -0.0267333984375, 0.09002685546875, 0.206787109375, 0.32354736328125, 0.4403076171875, 0.55706787109375, 0.673828125, 0.79058837890625, 0.9073486328125, 1.02410888671875, 1.140869140625, 1.25762939453125, 1.3743896484375, 1.49114990234375, 1.60791015625, 1.72467041015625, 1.8414306640625, 1.95819091796875, 2.074951171875, 2.19171142578125, 2.3084716796875, 2.42523193359375, 2.5419921875, 2.65875244140625, 2.7755126953125, 2.89227294921875, 3.009033203125, 3.12579345703125, 3.2425537109375, 3.35931396484375, 3.47607421875, 3.59283447265625, 3.7095947265625, 3.82635498046875, 3.943115234375, 4.05987548828125, 4.1766357421875, 4.29339599609375, 4.41015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 13.0, 17.0, 23.0, 33.0, 51.0, 59.0, 89.0, 104.0, 256.0, 1749.0, 458610.0, 584857.0, 1912.0, 263.0, 109.0, 74.0, 58.0, 42.0, 33.0, 30.0, 24.0, 12.0, 20.0, 13.0, 17.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.859375, -22.24169921875, -21.6240234375, -21.00634765625, -20.388671875, -19.77099609375, -19.1533203125, -18.53564453125, -17.91796875, -17.30029296875, -16.6826171875, -16.06494140625, -15.447265625, -14.82958984375, -14.2119140625, -13.59423828125, -12.9765625, -12.35888671875, -11.7412109375, -11.12353515625, -10.505859375, -9.88818359375, -9.2705078125, -8.65283203125, -8.03515625, -7.41748046875, -6.7998046875, -6.18212890625, -5.564453125, -4.94677734375, -4.3291015625, -3.71142578125, -3.09375, -2.47607421875, -1.8583984375, -1.24072265625, -0.623046875, -0.00537109375, 0.6123046875, 1.22998046875, 1.84765625, 2.46533203125, 3.0830078125, 3.70068359375, 4.318359375, 4.93603515625, 5.5537109375, 6.17138671875, 6.7890625, 7.40673828125, 8.0244140625, 8.64208984375, 9.259765625, 9.87744140625, 10.4951171875, 11.11279296875, 11.73046875, 12.34814453125, 12.9658203125, 13.58349609375, 14.201171875, 14.81884765625, 15.4365234375, 16.05419921875, 16.671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 6.0, 5.0, 13.0, 19.0, 22.0, 25.0, 26.0, 43.0, 52.0, 61.0, 57.0, 65.0, 66.0, 73.0, 75.0, 47.0, 59.0, 48.0, 39.0, 36.0, 23.0, 34.0, 22.0, 14.0, 17.0, 8.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34375, -6.1463623046875, -5.948974609375, -5.7515869140625, -5.55419921875, -5.3568115234375, -5.159423828125, -4.9620361328125, -4.7646484375, -4.5672607421875, -4.369873046875, -4.1724853515625, -3.97509765625, -3.7777099609375, -3.580322265625, -3.3829345703125, -3.185546875, -2.9881591796875, -2.790771484375, -2.5933837890625, -2.39599609375, -2.1986083984375, -2.001220703125, -1.8038330078125, -1.6064453125, -1.4090576171875, -1.211669921875, -1.0142822265625, -0.81689453125, -0.6195068359375, -0.422119140625, -0.2247314453125, -0.02734375, 0.1700439453125, 0.367431640625, 0.5648193359375, 0.76220703125, 0.9595947265625, 1.156982421875, 1.3543701171875, 1.5517578125, 1.7491455078125, 1.946533203125, 2.1439208984375, 2.34130859375, 2.5386962890625, 2.736083984375, 2.9334716796875, 3.130859375, 3.3282470703125, 3.525634765625, 3.7230224609375, 3.92041015625, 4.1177978515625, 4.315185546875, 4.5125732421875, 4.7099609375, 4.9073486328125, 5.104736328125, 5.3021240234375, 5.49951171875, 5.6968994140625, 5.894287109375, 6.0916748046875, 6.2890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 24.0, 32.0, 83.0, 146.0, 376.0, 1283.0, 6796.0, 271516.0, 756734.0, 9070.0, 1559.0, 485.0, 181.0, 103.0, 51.0, 27.0, 24.0, 11.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69921875, -4.581939697265625, -4.46466064453125, -4.347381591796875, -4.2301025390625, -4.112823486328125, -3.99554443359375, -3.878265380859375, -3.760986328125, -3.643707275390625, -3.52642822265625, -3.409149169921875, -3.2918701171875, -3.174591064453125, -3.05731201171875, -2.940032958984375, -2.82275390625, -2.705474853515625, -2.58819580078125, -2.470916748046875, -2.3536376953125, -2.236358642578125, -2.11907958984375, -2.001800537109375, -1.884521484375, -1.767242431640625, -1.64996337890625, -1.532684326171875, -1.4154052734375, -1.298126220703125, -1.18084716796875, -1.063568115234375, -0.9462890625, -0.829010009765625, -0.71173095703125, -0.594451904296875, -0.4771728515625, -0.359893798828125, -0.24261474609375, -0.125335693359375, -0.008056640625, 0.109222412109375, 0.22650146484375, 0.343780517578125, 0.4610595703125, 0.578338623046875, 0.69561767578125, 0.812896728515625, 0.93017578125, 1.047454833984375, 1.16473388671875, 1.282012939453125, 1.3992919921875, 1.516571044921875, 1.63385009765625, 1.751129150390625, 1.868408203125, 1.985687255859375, 2.10296630859375, 2.220245361328125, 2.3375244140625, 2.454803466796875, 2.57208251953125, 2.689361572265625, 2.806640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 17.0, 21.0, 27.0, 56.0, 85.0, 157.0, 306.0, 127.0, 69.0, 38.0, 21.0, 15.0, 16.0, 8.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003025531768798828, -0.00029188767075538635, -0.0002812221646308899, -0.00027055665850639343, -0.00025989115238189697, -0.0002492256462574005, -0.00023856014013290405, -0.0002278946340084076, -0.00021722912788391113, -0.00020656362175941467, -0.0001958981156349182, -0.00018523260951042175, -0.0001745671033859253, -0.00016390159726142883, -0.00015323609113693237, -0.0001425705850124359, -0.00013190507888793945, -0.00012123957276344299, -0.00011057406663894653, -9.990856051445007e-05, -8.924305438995361e-05, -7.857754826545715e-05, -6.79120421409607e-05, -5.7246536016464233e-05, -4.6581029891967773e-05, -3.5915523767471313e-05, -2.5250017642974854e-05, -1.4584511518478394e-05, -3.919005393981934e-06, 6.746500730514526e-06, 1.7412006855010986e-05, 2.8077512979507446e-05, 3.8743019104003906e-05, 4.9408525228500366e-05, 6.0074031352996826e-05, 7.073953747749329e-05, 8.140504360198975e-05, 9.20705497264862e-05, 0.00010273605585098267, 0.00011340156197547913, 0.00012406706809997559, 0.00013473257422447205, 0.0001453980803489685, 0.00015606358647346497, 0.00016672909259796143, 0.00017739459872245789, 0.00018806010484695435, 0.0001987256109714508, 0.00020939111709594727, 0.00022005662322044373, 0.00023072212934494019, 0.00024138763546943665, 0.0002520531415939331, 0.00026271864771842957, 0.000273384153842926, 0.0002840496599674225, 0.00029471516609191895, 0.0003053806722164154, 0.00031604617834091187, 0.0003267116844654083, 0.0003373771905899048, 0.00034804269671440125, 0.0003587082028388977, 0.00036937370896339417, 0.0003800392150878906]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 9.0, 14.0, 26.0, 28.0, 35.0, 79.0, 120.0, 224.0, 443.0, 893.0, 1861.0, 4467.0, 13737.0, 88635.0, 838365.0, 78359.0, 13145.0, 4423.0, 1854.0, 862.0, 443.0, 226.0, 108.0, 72.0, 36.0, 21.0, 12.0, 16.0, 15.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.21484375, -2.1557464599609375, -2.096649169921875, -2.0375518798828125, -1.97845458984375, -1.9193572998046875, -1.860260009765625, -1.8011627197265625, -1.7420654296875, -1.6829681396484375, -1.623870849609375, -1.5647735595703125, -1.50567626953125, -1.4465789794921875, -1.387481689453125, -1.3283843994140625, -1.269287109375, -1.2101898193359375, -1.151092529296875, -1.0919952392578125, -1.03289794921875, -0.9738006591796875, -0.914703369140625, -0.8556060791015625, -0.7965087890625, -0.7374114990234375, -0.678314208984375, -0.6192169189453125, -0.56011962890625, -0.5010223388671875, -0.441925048828125, -0.3828277587890625, -0.32373046875, -0.2646331787109375, -0.205535888671875, -0.1464385986328125, -0.08734130859375, -0.0282440185546875, 0.030853271484375, 0.0899505615234375, 0.1490478515625, 0.2081451416015625, 0.267242431640625, 0.3263397216796875, 0.38543701171875, 0.4445343017578125, 0.503631591796875, 0.5627288818359375, 0.621826171875, 0.6809234619140625, 0.740020751953125, 0.7991180419921875, 0.85821533203125, 0.9173126220703125, 0.976409912109375, 1.0355072021484375, 1.0946044921875, 1.1537017822265625, 1.212799072265625, 1.2718963623046875, 1.33099365234375, 1.3900909423828125, 1.449188232421875, 1.5082855224609375, 1.5673828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 12.0, 21.0, 25.0, 34.0, 61.0, 75.0, 112.0, 260.0, 139.0, 79.0, 53.0, 32.0, 17.0, 14.0, 12.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.8726730346679688, -0.8449554443359375, -0.8172378540039062, -0.789520263671875, -0.7618026733398438, -0.7340850830078125, -0.7063674926757812, -0.67864990234375, -0.6509323120117188, -0.6232147216796875, -0.5954971313476562, -0.567779541015625, -0.5400619506835938, -0.5123443603515625, -0.48462677001953125, -0.4569091796875, -0.42919158935546875, -0.4014739990234375, -0.37375640869140625, -0.346038818359375, -0.31832122802734375, -0.2906036376953125, -0.26288604736328125, -0.23516845703125, -0.20745086669921875, -0.1797332763671875, -0.15201568603515625, -0.124298095703125, -0.09658050537109375, -0.0688629150390625, -0.04114532470703125, -0.013427734375, 0.01428985595703125, 0.0420074462890625, 0.06972503662109375, 0.097442626953125, 0.12516021728515625, 0.1528778076171875, 0.18059539794921875, 0.20831298828125, 0.23603057861328125, 0.2637481689453125, 0.29146575927734375, 0.319183349609375, 0.34690093994140625, 0.3746185302734375, 0.40233612060546875, 0.4300537109375, 0.45777130126953125, 0.4854888916015625, 0.5132064819335938, 0.540924072265625, 0.5686416625976562, 0.5963592529296875, 0.6240768432617188, 0.65179443359375, 0.6795120239257812, 0.7072296142578125, 0.7349472045898438, 0.762664794921875, 0.7903823852539062, 0.8180999755859375, 0.8458175659179688, 0.87353515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 16.0, 99.0, 300.0, 396.0, 145.0, 41.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.186899185180664, -6.3047194480896, -5.422539710998535, -4.540359973907471, -3.6581802368164062, -2.776000499725342, -1.8938207626342773, -1.011641025543213, -0.12946128845214844, 0.752718448638916, 1.6348981857299805, 2.517077922821045, 3.3992576599121094, 4.281437397003174, 5.163617134094238, 6.045796871185303, 6.927976608276367, 7.810156345367432, 8.692336082458496, 9.574516296386719, 10.456695556640625, 11.338874816894531, 12.221055030822754, 13.103235244750977, 13.985414505004883, 14.867593765258789, 15.749773979187012, 16.631954193115234, 17.51413345336914, 18.396312713623047, 19.278491973876953, 20.160673141479492, 21.042850494384766, 21.925029754638672, 22.807209014892578, 23.689390182495117, 24.571569442749023, 25.45374870300293, 26.33592987060547, 27.218109130859375, 28.10028839111328, 28.982467651367188, 29.864646911621094, 30.746828079223633, 31.62900733947754, 32.51118850708008, 33.393367767333984, 34.27554702758789, 35.1577262878418, 36.0399055480957, 36.92208480834961, 37.804264068603516, 38.68644714355469, 39.568626403808594, 40.4508056640625, 41.332984924316406, 42.21516418457031, 43.09734344482422, 43.979522705078125, 44.86170196533203, 45.74388122558594, 46.62606430053711, 47.508243560791016, 48.39042282104492, 49.27260208129883]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 3.0, 7.0, 4.0, 11.0, 10.0, 7.0, 17.0, 12.0, 24.0, 16.0, 21.0, 17.0, 30.0, 28.0, 31.0, 26.0, 31.0, 36.0, 30.0, 23.0, 28.0, 41.0, 40.0, 32.0, 34.0, 44.0, 36.0, 30.0, 26.0, 40.0, 22.0, 26.0, 28.0, 17.0, 20.0, 16.0, 13.0, 20.0, 12.0, 12.0, 12.0, 18.0, 8.0, 10.0, 4.0, 5.0, 2.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0], "bins": [-6.141655921936035, -5.9691162109375, -5.796576499938965, -5.62403678894043, -5.451497554779053, -5.278957843780518, -5.106418132781982, -4.933878421783447, -4.76133918762207, -4.588799476623535, -4.416259765625, -4.243720054626465, -4.071180820465088, -3.8986411094665527, -3.7261013984680176, -3.5535616874694824, -3.3810219764709473, -3.208482265472412, -3.035942792892456, -2.863403081893921, -2.690863609313965, -2.5183238983154297, -2.3457841873168945, -2.1732444763183594, -2.0007050037384033, -1.8281654119491577, -1.655625820159912, -1.483086109161377, -1.3105465173721313, -1.1380069255828857, -0.9654672145843506, -0.792927622795105, -0.6203885078430176, -0.4478488862514496, -0.2753092646598816, -0.10276961326599121, 0.0697699785232544, 0.2423095703125, 0.41484928131103516, 0.5873888731002808, 0.7599284648895264, 0.932468056678772, 1.1050076484680176, 1.2775473594665527, 1.4500869512557983, 1.622626543045044, 1.795166254043579, 1.9677058458328247, 2.1402454376220703, 2.3127851486206055, 2.4853246212005615, 2.6578643321990967, 2.8304038047790527, 3.002943515777588, 3.175483226776123, 3.348022937774658, 3.5205624103546143, 3.6931021213531494, 3.8656415939331055, 4.038181304931641, 4.210721015930176, 4.383260726928711, 4.555800437927246, 4.728339672088623, 4.900879383087158]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 3.0, 3.0, 3.0, 5.0, 11.0, 7.0, 10.0, 12.0, 20.0, 23.0, 24.0, 31.0, 29.0, 35.0, 61.0, 100.0, 231.0, 646.0, 1822.0, 7265.0, 132402.0, 3884452.0, 156175.0, 7779.0, 1892.0, 605.0, 248.0, 108.0, 47.0, 46.0, 27.0, 21.0, 25.0, 13.0, 19.0, 12.0, 14.0, 14.0, 6.0, 7.0, 8.0, 6.0, 1.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.8001708984375, -9.444091796875, -9.0880126953125, -8.73193359375, -8.3758544921875, -8.019775390625, -7.6636962890625, -7.3076171875, -6.9515380859375, -6.595458984375, -6.2393798828125, -5.88330078125, -5.5272216796875, -5.171142578125, -4.8150634765625, -4.458984375, -4.1029052734375, -3.746826171875, -3.3907470703125, -3.03466796875, -2.6785888671875, -2.322509765625, -1.9664306640625, -1.6103515625, -1.2542724609375, -0.898193359375, -0.5421142578125, -0.18603515625, 0.1700439453125, 0.526123046875, 0.8822021484375, 1.23828125, 1.5943603515625, 1.950439453125, 2.3065185546875, 2.66259765625, 3.0186767578125, 3.374755859375, 3.7308349609375, 4.0869140625, 4.4429931640625, 4.799072265625, 5.1551513671875, 5.51123046875, 5.8673095703125, 6.223388671875, 6.5794677734375, 6.935546875, 7.2916259765625, 7.647705078125, 8.0037841796875, 8.35986328125, 8.7159423828125, 9.072021484375, 9.4281005859375, 9.7841796875, 10.1402587890625, 10.496337890625, 10.8524169921875, 11.20849609375, 11.5645751953125, 11.920654296875, 12.2767333984375, 12.6328125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 7.0, 5.0, 9.0, 14.0, 11.0, 20.0, 25.0, 31.0, 21.0, 22.0, 29.0, 46.0, 36.0, 50.0, 47.0, 40.0, 49.0, 51.0, 40.0, 44.0, 49.0, 38.0, 35.0, 44.0, 34.0, 23.0, 28.0, 28.0, 20.0, 19.0, 12.0, 20.0, 8.0, 10.0, 7.0, 7.0, 10.0, 3.0, 0.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.685546875, -2.593017578125, -2.50048828125, -2.407958984375, -2.3154296875, -2.222900390625, -2.13037109375, -2.037841796875, -1.9453125, -1.852783203125, -1.76025390625, -1.667724609375, -1.5751953125, -1.482666015625, -1.39013671875, -1.297607421875, -1.205078125, -1.112548828125, -1.02001953125, -0.927490234375, -0.8349609375, -0.742431640625, -0.64990234375, -0.557373046875, -0.46484375, -0.372314453125, -0.27978515625, -0.187255859375, -0.0947265625, -0.002197265625, 0.09033203125, 0.182861328125, 0.275390625, 0.367919921875, 0.46044921875, 0.552978515625, 0.6455078125, 0.738037109375, 0.83056640625, 0.923095703125, 1.015625, 1.108154296875, 1.20068359375, 1.293212890625, 1.3857421875, 1.478271484375, 1.57080078125, 1.663330078125, 1.755859375, 1.848388671875, 1.94091796875, 2.033447265625, 2.1259765625, 2.218505859375, 2.31103515625, 2.403564453125, 2.49609375, 2.588623046875, 2.68115234375, 2.773681640625, 2.8662109375, 2.958740234375, 3.05126953125, 3.143798828125, 3.236328125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 6.0, 17.0, 28.0, 65.0, 162.0, 1233.0, 1914786.0, 2276412.0, 1284.0, 140.0, 60.0, 33.0, 20.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.068603515625, -16.21533203125, -15.362060546875, -14.5087890625, -13.655517578125, -12.80224609375, -11.948974609375, -11.095703125, -10.242431640625, -9.38916015625, -8.535888671875, -7.6826171875, -6.829345703125, -5.97607421875, -5.122802734375, -4.26953125, -3.416259765625, -2.56298828125, -1.709716796875, -0.8564453125, -0.003173828125, 0.85009765625, 1.703369140625, 2.556640625, 3.409912109375, 4.26318359375, 5.116455078125, 5.9697265625, 6.822998046875, 7.67626953125, 8.529541015625, 9.3828125, 10.236083984375, 11.08935546875, 11.942626953125, 12.7958984375, 13.649169921875, 14.50244140625, 15.355712890625, 16.208984375, 17.062255859375, 17.91552734375, 18.768798828125, 19.6220703125, 20.475341796875, 21.32861328125, 22.181884765625, 23.03515625, 23.888427734375, 24.74169921875, 25.594970703125, 26.4482421875, 27.301513671875, 28.15478515625, 29.008056640625, 29.861328125, 30.714599609375, 31.56787109375, 32.421142578125, 33.2744140625, 34.127685546875, 34.98095703125, 35.834228515625, 36.6875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 3.0, 10.0, 7.0, 11.0, 12.0, 21.0, 24.0, 31.0, 42.0, 65.0, 99.0, 162.0, 234.0, 452.0, 648.0, 724.0, 546.0, 326.0, 216.0, 138.0, 85.0, 57.0, 35.0, 24.0, 18.0, 18.0, 17.0, 14.0, 6.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3564453125, -1.3157806396484375, -1.275115966796875, -1.2344512939453125, -1.19378662109375, -1.1531219482421875, -1.112457275390625, -1.0717926025390625, -1.0311279296875, -0.9904632568359375, -0.949798583984375, -0.9091339111328125, -0.86846923828125, -0.8278045654296875, -0.787139892578125, -0.7464752197265625, -0.705810546875, -0.6651458740234375, -0.624481201171875, -0.5838165283203125, -0.54315185546875, -0.5024871826171875, -0.461822509765625, -0.4211578369140625, -0.3804931640625, -0.3398284912109375, -0.299163818359375, -0.2584991455078125, -0.21783447265625, -0.1771697998046875, -0.136505126953125, -0.0958404541015625, -0.05517578125, -0.0145111083984375, 0.026153564453125, 0.0668182373046875, 0.10748291015625, 0.1481475830078125, 0.188812255859375, 0.2294769287109375, 0.2701416015625, 0.3108062744140625, 0.351470947265625, 0.3921356201171875, 0.43280029296875, 0.4734649658203125, 0.514129638671875, 0.5547943115234375, 0.595458984375, 0.6361236572265625, 0.676788330078125, 0.7174530029296875, 0.75811767578125, 0.7987823486328125, 0.839447021484375, 0.8801116943359375, 0.9207763671875, 0.9614410400390625, 1.002105712890625, 1.0427703857421875, 1.08343505859375, 1.1240997314453125, 1.164764404296875, 1.2054290771484375, 1.24609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 6.0, 13.0, 16.0, 30.0, 30.0, 41.0, 53.0, 80.0, 89.0, 112.0, 106.0, 83.0, 90.0, 62.0, 46.0, 38.0, 25.0, 20.0, 23.0, 14.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.741819858551025, -4.590375900268555, -4.438931941986084, -4.287487983703613, -4.136043548583984, -3.9845998287200928, -3.833155632019043, -3.6817116737365723, -3.5302677154541016, -3.378823757171631, -3.22737979888916, -3.0759356021881104, -2.9244916439056396, -2.773047685623169, -2.621603488922119, -2.4701595306396484, -2.3187155723571777, -2.167271614074707, -2.0158276557922363, -1.8643834590911865, -1.7129395008087158, -1.5614955425262451, -1.4100514650344849, -1.2586073875427246, -1.107163429260254, -0.9557194113731384, -0.804275393486023, -0.6528313755989075, -0.501387357711792, -0.3499433398246765, -0.19849932193756104, -0.04705524444580078, 0.10438823699951172, 0.2558322548866272, 0.4072762727737427, 0.5587202906608582, 0.7101643085479736, 0.8616083264350891, 1.0130523443222046, 1.1644964218139648, 1.3159403800964355, 1.4673843383789062, 1.6188284158706665, 1.7702724933624268, 1.9217164516448975, 2.073160409927368, 2.224604606628418, 2.3760485649108887, 2.5274925231933594, 2.67893648147583, 2.830380439758301, 2.9818246364593506, 3.1332685947418213, 3.284712553024292, 3.436156749725342, 3.5876007080078125, 3.739044666290283, 3.890488624572754, 4.041932582855225, 4.193376541137695, 4.344820976257324, 4.496264934539795, 4.647708892822266, 4.799152851104736, 4.950596809387207]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 13.0, 4.0, 7.0, 7.0, 9.0, 16.0, 13.0, 18.0, 21.0, 28.0, 27.0, 25.0, 21.0, 39.0, 25.0, 43.0, 34.0, 34.0, 32.0, 30.0, 41.0, 43.0, 56.0, 44.0, 34.0, 36.0, 33.0, 45.0, 25.0, 24.0, 24.0, 28.0, 16.0, 17.0, 20.0, 8.0, 13.0, 13.0, 9.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5473122596740723, -2.4611082077026367, -2.374903917312622, -2.2886998653411865, -2.202495574951172, -2.1162915229797363, -2.030087471008301, -1.9438831806182861, -1.857679009437561, -1.771474838256836, -1.6852706670761108, -1.5990664958953857, -1.5128624439239502, -1.4266581535339355, -1.3404541015625, -1.254249930381775, -1.1680457592010498, -1.0818415880203247, -0.9956374168395996, -0.9094333052635193, -0.8232291340827942, -0.7370249629020691, -0.6508208513259888, -0.5646166801452637, -0.4784125089645386, -0.3922083377838135, -0.30600419640541077, -0.21980005502700806, -0.13359588384628296, -0.04739171266555786, 0.03881239891052246, 0.12501657009124756, 0.21122097969055176, 0.29742515087127686, 0.38362929224967957, 0.4698334336280823, 0.5560376048088074, 0.6422417759895325, 0.7284458875656128, 0.8146500587463379, 0.900854229927063, 0.9870584011077881, 1.0732625722885132, 1.1594667434692383, 1.2456707954406738, 1.3318750858306885, 1.418079137802124, 1.5042833089828491, 1.5904874801635742, 1.6766916513442993, 1.7628958225250244, 1.84909987449646, 1.9353041648864746, 2.02150821685791, 2.1077122688293457, 2.1939165592193604, 2.280120849609375, 2.3663249015808105, 2.452529191970825, 2.5387332439422607, 2.6249375343322754, 2.711141586303711, 2.7973456382751465, 2.883549928665161, 2.9697539806365967]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 13.0, 34.0, 40.0, 75.0, 159.0, 355.0, 692.0, 1581.0, 3567.0, 9215.0, 28983.0, 176187.0, 694278.0, 99775.0, 21171.0, 7130.0, 2953.0, 1224.0, 536.0, 266.0, 155.0, 59.0, 42.0, 16.0, 12.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9599609375, -1.8908843994140625, -1.821807861328125, -1.7527313232421875, -1.68365478515625, -1.6145782470703125, -1.545501708984375, -1.4764251708984375, -1.4073486328125, -1.3382720947265625, -1.269195556640625, -1.2001190185546875, -1.13104248046875, -1.0619659423828125, -0.992889404296875, -0.9238128662109375, -0.854736328125, -0.7856597900390625, -0.716583251953125, -0.6475067138671875, -0.57843017578125, -0.5093536376953125, -0.440277099609375, -0.3712005615234375, -0.3021240234375, -0.2330474853515625, -0.163970947265625, -0.0948944091796875, -0.02581787109375, 0.0432586669921875, 0.112335205078125, 0.1814117431640625, 0.25048828125, 0.3195648193359375, 0.388641357421875, 0.4577178955078125, 0.52679443359375, 0.5958709716796875, 0.664947509765625, 0.7340240478515625, 0.8031005859375, 0.8721771240234375, 0.941253662109375, 1.0103302001953125, 1.07940673828125, 1.1484832763671875, 1.217559814453125, 1.2866363525390625, 1.355712890625, 1.4247894287109375, 1.493865966796875, 1.5629425048828125, 1.63201904296875, 1.7010955810546875, 1.770172119140625, 1.8392486572265625, 1.9083251953125, 1.9774017333984375, 2.046478271484375, 2.1155548095703125, 2.18463134765625, 2.2537078857421875, 2.322784423828125, 2.3918609619140625, 2.4609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 4.0, 6.0, 7.0, 22.0, 22.0, 26.0, 17.0, 28.0, 32.0, 31.0, 38.0, 51.0, 42.0, 42.0, 30.0, 56.0, 46.0, 57.0, 62.0, 46.0, 41.0, 49.0, 32.0, 38.0, 20.0, 27.0, 18.0, 13.0, 13.0, 20.0, 13.0, 7.0, 8.0, 2.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.869140625, -1.8096466064453125, -1.750152587890625, -1.6906585693359375, -1.63116455078125, -1.5716705322265625, -1.512176513671875, -1.4526824951171875, -1.3931884765625, -1.3336944580078125, -1.274200439453125, -1.2147064208984375, -1.15521240234375, -1.0957183837890625, -1.036224365234375, -0.9767303466796875, -0.917236328125, -0.8577423095703125, -0.798248291015625, -0.7387542724609375, -0.67926025390625, -0.6197662353515625, -0.560272216796875, -0.5007781982421875, -0.4412841796875, -0.3817901611328125, -0.322296142578125, -0.2628021240234375, -0.20330810546875, -0.1438140869140625, -0.084320068359375, -0.0248260498046875, 0.03466796875, 0.0941619873046875, 0.153656005859375, 0.2131500244140625, 0.27264404296875, 0.3321380615234375, 0.391632080078125, 0.4511260986328125, 0.5106201171875, 0.5701141357421875, 0.629608154296875, 0.6891021728515625, 0.74859619140625, 0.8080902099609375, 0.867584228515625, 0.9270782470703125, 0.986572265625, 1.0460662841796875, 1.105560302734375, 1.1650543212890625, 1.22454833984375, 1.2840423583984375, 1.343536376953125, 1.4030303955078125, 1.4625244140625, 1.5220184326171875, 1.581512451171875, 1.6410064697265625, 1.70050048828125, 1.7599945068359375, 1.819488525390625, 1.8789825439453125, 1.9384765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 5.0, 8.0, 11.0, 7.0, 15.0, 36.0, 52.0, 82.0, 137.0, 223.0, 359.0, 699.0, 1510.0, 3513.0, 9142.0, 27974.0, 110216.0, 472121.0, 322210.0, 69474.0, 19178.0, 6488.0, 2594.0, 1176.0, 575.0, 297.0, 153.0, 94.0, 69.0, 44.0, 27.0, 13.0, 13.0, 7.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.0108489990234375, -0.975799560546875, -0.9407501220703125, -0.90570068359375, -0.8706512451171875, -0.835601806640625, -0.8005523681640625, -0.7655029296875, -0.7304534912109375, -0.695404052734375, -0.6603546142578125, -0.62530517578125, -0.5902557373046875, -0.555206298828125, -0.5201568603515625, -0.485107421875, -0.4500579833984375, -0.415008544921875, -0.3799591064453125, -0.34490966796875, -0.3098602294921875, -0.274810791015625, -0.2397613525390625, -0.2047119140625, -0.1696624755859375, -0.134613037109375, -0.0995635986328125, -0.06451416015625, -0.0294647216796875, 0.005584716796875, 0.0406341552734375, 0.07568359375, 0.1107330322265625, 0.145782470703125, 0.1808319091796875, 0.21588134765625, 0.2509307861328125, 0.285980224609375, 0.3210296630859375, 0.3560791015625, 0.3911285400390625, 0.426177978515625, 0.4612274169921875, 0.49627685546875, 0.5313262939453125, 0.566375732421875, 0.6014251708984375, 0.636474609375, 0.6715240478515625, 0.706573486328125, 0.7416229248046875, 0.77667236328125, 0.8117218017578125, 0.846771240234375, 0.8818206787109375, 0.9168701171875, 0.9519195556640625, 0.986968994140625, 1.0220184326171875, 1.05706787109375, 1.0921173095703125, 1.127166748046875, 1.1622161865234375, 1.197265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 9.0, 11.0, 14.0, 20.0, 23.0, 20.0, 19.0, 32.0, 35.0, 48.0, 43.0, 53.0, 63.0, 58.0, 51.0, 57.0, 47.0, 68.0, 45.0, 36.0, 44.0, 32.0, 32.0, 30.0, 27.0, 17.0, 15.0, 7.0, 5.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.6484375, -4.522735595703125, -4.39703369140625, -4.271331787109375, -4.1456298828125, -4.019927978515625, -3.89422607421875, -3.768524169921875, -3.642822265625, -3.517120361328125, -3.39141845703125, -3.265716552734375, -3.1400146484375, -3.014312744140625, -2.88861083984375, -2.762908935546875, -2.63720703125, -2.511505126953125, -2.38580322265625, -2.260101318359375, -2.1343994140625, -2.008697509765625, -1.88299560546875, -1.757293701171875, -1.631591796875, -1.505889892578125, -1.38018798828125, -1.254486083984375, -1.1287841796875, -1.003082275390625, -0.87738037109375, -0.751678466796875, -0.6259765625, -0.500274658203125, -0.37457275390625, -0.248870849609375, -0.1231689453125, 0.002532958984375, 0.12823486328125, 0.253936767578125, 0.379638671875, 0.505340576171875, 0.63104248046875, 0.756744384765625, 0.8824462890625, 1.008148193359375, 1.13385009765625, 1.259552001953125, 1.38525390625, 1.510955810546875, 1.63665771484375, 1.762359619140625, 1.8880615234375, 2.013763427734375, 2.13946533203125, 2.265167236328125, 2.390869140625, 2.516571044921875, 2.64227294921875, 2.767974853515625, 2.8936767578125, 3.019378662109375, 3.14508056640625, 3.270782470703125, 3.396484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 12.0, 12.0, 27.0, 21.0, 33.0, 55.0, 87.0, 122.0, 208.0, 305.0, 594.0, 901.0, 1611.0, 2898.0, 5855.0, 12897.0, 32606.0, 107625.0, 427764.0, 329510.0, 77564.0, 25652.0, 10888.0, 5062.0, 2635.0, 1378.0, 803.0, 491.0, 326.0, 188.0, 134.0, 80.0, 50.0, 38.0, 30.0, 21.0, 24.0, 10.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2734375, -0.2651214599609375, -0.256805419921875, -0.2484893798828125, -0.24017333984375, -0.2318572998046875, -0.223541259765625, -0.2152252197265625, -0.2069091796875, -0.1985931396484375, -0.190277099609375, -0.1819610595703125, -0.17364501953125, -0.1653289794921875, -0.157012939453125, -0.1486968994140625, -0.140380859375, -0.1320648193359375, -0.123748779296875, -0.1154327392578125, -0.10711669921875, -0.0988006591796875, -0.090484619140625, -0.0821685791015625, -0.0738525390625, -0.0655364990234375, -0.057220458984375, -0.0489044189453125, -0.04058837890625, -0.0322723388671875, -0.023956298828125, -0.0156402587890625, -0.00732421875, 0.0009918212890625, 0.009307861328125, 0.0176239013671875, 0.02593994140625, 0.0342559814453125, 0.042572021484375, 0.0508880615234375, 0.0592041015625, 0.0675201416015625, 0.075836181640625, 0.0841522216796875, 0.09246826171875, 0.1007843017578125, 0.109100341796875, 0.1174163818359375, 0.125732421875, 0.1340484619140625, 0.142364501953125, 0.1506805419921875, 0.15899658203125, 0.1673126220703125, 0.175628662109375, 0.1839447021484375, 0.1922607421875, 0.2005767822265625, 0.208892822265625, 0.2172088623046875, 0.22552490234375, 0.2338409423828125, 0.242156982421875, 0.2504730224609375, 0.2587890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 4.0, 10.0, 11.0, 14.0, 23.0, 20.0, 40.0, 62.0, 86.0, 102.0, 119.0, 122.0, 99.0, 60.0, 73.0, 38.0, 29.0, 16.0, 17.0, 8.0, 15.0, 5.0, 7.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002142190933227539, -0.00020805932581424713, -0.00020189955830574036, -0.00019573979079723358, -0.0001895800232887268, -0.00018342025578022003, -0.00017726048827171326, -0.00017110072076320648, -0.0001649409532546997, -0.00015878118574619293, -0.00015262141823768616, -0.00014646165072917938, -0.0001403018832206726, -0.00013414211571216583, -0.00012798234820365906, -0.00012182258069515228, -0.00011566281318664551, -0.00010950304567813873, -0.00010334327816963196, -9.718351066112518e-05, -9.102374315261841e-05, -8.486397564411163e-05, -7.870420813560486e-05, -7.254444062709808e-05, -6.638467311859131e-05, -6.0224905610084534e-05, -5.406513810157776e-05, -4.7905370593070984e-05, -4.174560308456421e-05, -3.5585835576057434e-05, -2.942606806755066e-05, -2.3266300559043884e-05, -1.710653305053711e-05, -1.0946765542030334e-05, -4.7869980335235596e-06, 1.3727694749832153e-06, 7.53253698348999e-06, 1.3692304491996765e-05, 1.985207200050354e-05, 2.6011839509010315e-05, 3.217160701751709e-05, 3.8331374526023865e-05, 4.449114203453064e-05, 5.0650909543037415e-05, 5.681067705154419e-05, 6.297044456005096e-05, 6.913021206855774e-05, 7.528997957706451e-05, 8.144974708557129e-05, 8.760951459407806e-05, 9.376928210258484e-05, 9.992904961109161e-05, 0.00010608881711959839, 0.00011224858462810516, 0.00011840835213661194, 0.0001245681196451187, 0.0001307278871536255, 0.00013688765466213226, 0.00014304742217063904, 0.0001492071896791458, 0.0001553669571876526, 0.00016152672469615936, 0.00016768649220466614, 0.0001738462597131729, 0.0001800060272216797]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 7.0, 15.0, 23.0, 35.0, 36.0, 66.0, 111.0, 173.0, 350.0, 590.0, 1081.0, 2301.0, 4979.0, 12266.0, 37143.0, 172300.0, 576190.0, 179589.0, 38497.0, 12692.0, 5179.0, 2314.0, 1113.0, 651.0, 300.0, 197.0, 121.0, 62.0, 47.0, 37.0, 22.0, 15.0, 8.0, 4.0, 3.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3439521789550781, -0.33267974853515625, -0.3214073181152344, -0.3101348876953125, -0.2988624572753906, -0.28759002685546875, -0.2763175964355469, -0.265045166015625, -0.2537727355957031, -0.24250030517578125, -0.23122787475585938, -0.2199554443359375, -0.20868301391601562, -0.19741058349609375, -0.18613815307617188, -0.17486572265625, -0.16359329223632812, -0.15232086181640625, -0.14104843139648438, -0.1297760009765625, -0.11850357055664062, -0.10723114013671875, -0.09595870971679688, -0.084686279296875, -0.07341384887695312, -0.06214141845703125, -0.050868988037109375, -0.0395965576171875, -0.028324127197265625, -0.01705169677734375, -0.005779266357421875, 0.0054931640625, 0.016765594482421875, 0.02803802490234375, 0.039310455322265625, 0.0505828857421875, 0.061855316162109375, 0.07312774658203125, 0.08440017700195312, 0.095672607421875, 0.10694503784179688, 0.11821746826171875, 0.12948989868164062, 0.1407623291015625, 0.15203475952148438, 0.16330718994140625, 0.17457962036132812, 0.18585205078125, 0.19712448120117188, 0.20839691162109375, 0.21966934204101562, 0.2309417724609375, 0.24221420288085938, 0.25348663330078125, 0.2647590637207031, 0.276031494140625, 0.2873039245605469, 0.29857635498046875, 0.3098487854003906, 0.3211212158203125, 0.3323936462402344, 0.34366607666015625, 0.3549385070800781, 0.3662109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 7.0, 4.0, 11.0, 7.0, 8.0, 13.0, 12.0, 11.0, 20.0, 25.0, 30.0, 36.0, 49.0, 43.0, 59.0, 60.0, 76.0, 73.0, 54.0, 66.0, 54.0, 38.0, 42.0, 29.0, 28.0, 18.0, 18.0, 14.0, 16.0, 11.0, 6.0, 8.0, 5.0, 6.0, 9.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.061725616455078125, -0.05960845947265625, -0.057491302490234375, -0.0553741455078125, -0.053256988525390625, -0.05113983154296875, -0.049022674560546875, -0.046905517578125, -0.044788360595703125, -0.04267120361328125, -0.040554046630859375, -0.0384368896484375, -0.036319732666015625, -0.03420257568359375, -0.032085418701171875, -0.02996826171875, -0.027851104736328125, -0.02573394775390625, -0.023616790771484375, -0.0214996337890625, -0.019382476806640625, -0.01726531982421875, -0.015148162841796875, -0.013031005859375, -0.010913848876953125, -0.00879669189453125, -0.006679534912109375, -0.0045623779296875, -0.002445220947265625, -0.00032806396484375, 0.001789093017578125, 0.00390625, 0.006023406982421875, 0.00814056396484375, 0.010257720947265625, 0.0123748779296875, 0.014492034912109375, 0.01660919189453125, 0.018726348876953125, 0.020843505859375, 0.022960662841796875, 0.02507781982421875, 0.027194976806640625, 0.0293121337890625, 0.031429290771484375, 0.03354644775390625, 0.035663604736328125, 0.03778076171875, 0.039897918701171875, 0.04201507568359375, 0.044132232666015625, 0.0462493896484375, 0.048366546630859375, 0.05048370361328125, 0.052600860595703125, 0.054718017578125, 0.056835174560546875, 0.05895233154296875, 0.061069488525390625, 0.0631866455078125, 0.06530380249023438, 0.06742095947265625, 0.06953811645507812, 0.0716552734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 4.0, 22.0, 46.0, 74.0, 120.0, 185.0, 192.0, 134.0, 98.0, 56.0, 26.0, 15.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.192495822906494, -6.042137622833252, -5.89177942276001, -5.741421222686768, -5.591063022613525, -5.440704822540283, -5.290346622467041, -5.139988422393799, -4.989630222320557, -4.8392720222473145, -4.688913822174072, -4.53855562210083, -4.388197422027588, -4.237839221954346, -4.0874810218811035, -3.9371228218078613, -3.78676438331604, -3.636406183242798, -3.4860479831695557, -3.3356897830963135, -3.1853315830230713, -3.034973382949829, -2.884614944458008, -2.7342567443847656, -2.5838985443115234, -2.4335403442382812, -2.283182144165039, -2.132823944091797, -1.9824657440185547, -1.8321075439453125, -1.6817492246627808, -1.5313910245895386, -1.381033182144165, -1.2306749820709229, -1.0803167819976807, -0.9299585223197937, -0.7796003222465515, -0.6292421221733093, -0.47888386249542236, -0.3285256624221802, -0.178167462348938, -0.027809247374534607, 0.12254896759986877, 0.27290719747543335, 0.42326539754867554, 0.5736235976219177, 0.7239818572998047, 0.8743400573730469, 1.024698257446289, 1.1750564575195312, 1.3254146575927734, 1.4757728576660156, 1.6261310577392578, 1.7764892578125, 1.9268475770950317, 2.0772056579589844, 2.2275638580322266, 2.3779220581054688, 2.528280258178711, 2.678638458251953, 2.8289966583251953, 2.9793548583984375, 3.1297130584716797, 3.280071258544922, 3.430429697036743]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 11.0, 4.0, 11.0, 15.0, 22.0, 24.0, 26.0, 30.0, 34.0, 37.0, 47.0, 48.0, 40.0, 42.0, 39.0, 62.0, 55.0, 66.0, 40.0, 54.0, 47.0, 35.0, 36.0, 31.0, 28.0, 20.0, 21.0, 17.0, 9.0, 6.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7920842170715332, -1.729731798171997, -1.667379379272461, -1.6050270795822144, -1.5426746606826782, -1.480322241783142, -1.4179699420928955, -1.3556175231933594, -1.2932651042938232, -1.230912685394287, -1.168560266494751, -1.1062079668045044, -1.0438555479049683, -0.9815031290054321, -0.9191507697105408, -0.8567984104156494, -0.7944459915161133, -0.7320935726165771, -0.6697412133216858, -0.6073888540267944, -0.5450364351272583, -0.48268404603004456, -0.4203316569328308, -0.35797926783561707, -0.2956268787384033, -0.23327448964118958, -0.17092210054397583, -0.10856971144676208, -0.04621732234954834, 0.016135066747665405, 0.07848745584487915, 0.1408398449420929, 0.20319223403930664, 0.2655446231365204, 0.32789701223373413, 0.3902494013309479, 0.4526017904281616, 0.5149542093276978, 0.5773065686225891, 0.6396589279174805, 0.7020113468170166, 0.7643637657165527, 0.8267161250114441, 0.8890684843063354, 0.9514209032058716, 1.0137733221054077, 1.0761256217956543, 1.1384780406951904, 1.2008304595947266, 1.2631828784942627, 1.3255352973937988, 1.3878875970840454, 1.4502400159835815, 1.5125924348831177, 1.5749447345733643, 1.6372971534729004, 1.6996495723724365, 1.7620019912719727, 1.8243544101715088, 1.8867067098617554, 1.9490591287612915, 2.011411428451538, 2.073763847351074, 2.1361162662506104, 2.1984686851501465]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 15.0, 16.0, 16.0, 21.0, 36.0, 52.0, 79.0, 95.0, 155.0, 170.0, 263.0, 398.0, 611.0, 919.0, 1448.0, 2377.0, 4394.0, 9430.0, 25617.0, 96092.0, 482904.0, 321889.0, 65475.0, 19050.0, 7530.0, 3668.0, 2012.0, 1267.0, 823.0, 501.0, 373.0, 220.0, 195.0, 115.0, 84.0, 67.0, 60.0, 28.0, 24.0, 12.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.5234375, -2.444244384765625, -2.36505126953125, -2.285858154296875, -2.2066650390625, -2.127471923828125, -2.04827880859375, -1.969085693359375, -1.889892578125, -1.810699462890625, -1.73150634765625, -1.652313232421875, -1.5731201171875, -1.493927001953125, -1.41473388671875, -1.335540771484375, -1.25634765625, -1.177154541015625, -1.09796142578125, -1.018768310546875, -0.9395751953125, -0.860382080078125, -0.78118896484375, -0.701995849609375, -0.622802734375, -0.543609619140625, -0.46441650390625, -0.385223388671875, -0.3060302734375, -0.226837158203125, -0.14764404296875, -0.068450927734375, 0.0107421875, 0.089935302734375, 0.16912841796875, 0.248321533203125, 0.3275146484375, 0.406707763671875, 0.48590087890625, 0.565093994140625, 0.644287109375, 0.723480224609375, 0.80267333984375, 0.881866455078125, 0.9610595703125, 1.040252685546875, 1.11944580078125, 1.198638916015625, 1.27783203125, 1.357025146484375, 1.43621826171875, 1.515411376953125, 1.5946044921875, 1.673797607421875, 1.75299072265625, 1.832183837890625, 1.911376953125, 1.990570068359375, 2.06976318359375, 2.148956298828125, 2.2281494140625, 2.307342529296875, 2.38653564453125, 2.465728759765625, 2.544921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 9.0, 7.0, 8.0, 14.0, 13.0, 20.0, 24.0, 22.0, 27.0, 31.0, 33.0, 41.0, 35.0, 42.0, 39.0, 43.0, 51.0, 49.0, 52.0, 50.0, 53.0, 53.0, 33.0, 35.0, 37.0, 30.0, 29.0, 22.0, 19.0, 18.0, 6.0, 11.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.764068603515625, -3.62774658203125, -3.491424560546875, -3.3551025390625, -3.218780517578125, -3.08245849609375, -2.946136474609375, -2.809814453125, -2.673492431640625, -2.53717041015625, -2.400848388671875, -2.2645263671875, -2.128204345703125, -1.99188232421875, -1.855560302734375, -1.71923828125, -1.582916259765625, -1.44659423828125, -1.310272216796875, -1.1739501953125, -1.037628173828125, -0.90130615234375, -0.764984130859375, -0.628662109375, -0.492340087890625, -0.35601806640625, -0.219696044921875, -0.0833740234375, 0.052947998046875, 0.18927001953125, 0.325592041015625, 0.4619140625, 0.598236083984375, 0.73455810546875, 0.870880126953125, 1.0072021484375, 1.143524169921875, 1.27984619140625, 1.416168212890625, 1.552490234375, 1.688812255859375, 1.82513427734375, 1.961456298828125, 2.0977783203125, 2.234100341796875, 2.37042236328125, 2.506744384765625, 2.64306640625, 2.779388427734375, 2.91571044921875, 3.052032470703125, 3.1883544921875, 3.324676513671875, 3.46099853515625, 3.597320556640625, 3.733642578125, 3.869964599609375, 4.00628662109375, 4.142608642578125, 4.2789306640625, 4.415252685546875, 4.55157470703125, 4.687896728515625, 4.82421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 14.0, 26.0, 33.0, 34.0, 49.0, 76.0, 125.0, 763.0, 1030158.0, 16682.0, 237.0, 110.0, 74.0, 45.0, 38.0, 25.0, 24.0, 9.0, 5.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.96875, -25.1513671875, -24.333984375, -23.5166015625, -22.69921875, -21.8818359375, -21.064453125, -20.2470703125, -19.4296875, -18.6123046875, -17.794921875, -16.9775390625, -16.16015625, -15.3427734375, -14.525390625, -13.7080078125, -12.890625, -12.0732421875, -11.255859375, -10.4384765625, -9.62109375, -8.8037109375, -7.986328125, -7.1689453125, -6.3515625, -5.5341796875, -4.716796875, -3.8994140625, -3.08203125, -2.2646484375, -1.447265625, -0.6298828125, 0.1875, 1.0048828125, 1.822265625, 2.6396484375, 3.45703125, 4.2744140625, 5.091796875, 5.9091796875, 6.7265625, 7.5439453125, 8.361328125, 9.1787109375, 9.99609375, 10.8134765625, 11.630859375, 12.4482421875, 13.265625, 14.0830078125, 14.900390625, 15.7177734375, 16.53515625, 17.3525390625, 18.169921875, 18.9873046875, 19.8046875, 20.6220703125, 21.439453125, 22.2568359375, 23.07421875, 23.8916015625, 24.708984375, 25.5263671875, 26.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 14.0, 18.0, 31.0, 41.0, 39.0, 68.0, 75.0, 87.0, 94.0, 88.0, 80.0, 78.0, 76.0, 62.0, 35.0, 29.0, 28.0, 18.0, 10.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.4029541015625, -7.165283203125, -6.9276123046875, -6.68994140625, -6.4522705078125, -6.214599609375, -5.9769287109375, -5.7392578125, -5.5015869140625, -5.263916015625, -5.0262451171875, -4.78857421875, -4.5509033203125, -4.313232421875, -4.0755615234375, -3.837890625, -3.6002197265625, -3.362548828125, -3.1248779296875, -2.88720703125, -2.6495361328125, -2.411865234375, -2.1741943359375, -1.9365234375, -1.6988525390625, -1.461181640625, -1.2235107421875, -0.98583984375, -0.7481689453125, -0.510498046875, -0.2728271484375, -0.03515625, 0.2025146484375, 0.440185546875, 0.6778564453125, 0.91552734375, 1.1531982421875, 1.390869140625, 1.6285400390625, 1.8662109375, 2.1038818359375, 2.341552734375, 2.5792236328125, 2.81689453125, 3.0545654296875, 3.292236328125, 3.5299072265625, 3.767578125, 4.0052490234375, 4.242919921875, 4.4805908203125, 4.71826171875, 4.9559326171875, 5.193603515625, 5.4312744140625, 5.6689453125, 5.9066162109375, 6.144287109375, 6.3819580078125, 6.61962890625, 6.8572998046875, 7.094970703125, 7.3326416015625, 7.5703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 3.0, 6.0, 7.0, 5.0, 12.0, 11.0, 20.0, 31.0, 34.0, 60.0, 85.0, 139.0, 306.0, 753.0, 2056.0, 7529.0, 51021.0, 815502.0, 152296.0, 13423.0, 3232.0, 1042.0, 468.0, 195.0, 97.0, 60.0, 46.0, 27.0, 18.0, 15.0, 21.0, 6.0, 12.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1182403564453125, -1.079254150390625, -1.0402679443359375, -1.00128173828125, -0.9622955322265625, -0.923309326171875, -0.8843231201171875, -0.8453369140625, -0.8063507080078125, -0.767364501953125, -0.7283782958984375, -0.68939208984375, -0.6504058837890625, -0.611419677734375, -0.5724334716796875, -0.533447265625, -0.4944610595703125, -0.455474853515625, -0.4164886474609375, -0.37750244140625, -0.3385162353515625, -0.299530029296875, -0.2605438232421875, -0.2215576171875, -0.1825714111328125, -0.143585205078125, -0.1045989990234375, -0.06561279296875, -0.0266265869140625, 0.012359619140625, 0.0513458251953125, 0.09033203125, 0.1293182373046875, 0.168304443359375, 0.2072906494140625, 0.24627685546875, 0.2852630615234375, 0.324249267578125, 0.3632354736328125, 0.4022216796875, 0.4412078857421875, 0.480194091796875, 0.5191802978515625, 0.55816650390625, 0.5971527099609375, 0.636138916015625, 0.6751251220703125, 0.714111328125, 0.7530975341796875, 0.792083740234375, 0.8310699462890625, 0.87005615234375, 0.9090423583984375, 0.948028564453125, 0.9870147705078125, 1.0260009765625, 1.0649871826171875, 1.103973388671875, 1.1429595947265625, 1.18194580078125, 1.2209320068359375, 1.259918212890625, 1.2989044189453125, 1.337890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 10.0, 16.0, 16.0, 24.0, 44.0, 57.0, 71.0, 87.0, 123.0, 142.0, 110.0, 56.0, 47.0, 47.0, 35.0, 17.0, 19.0, 15.0, 14.0, 3.0, 8.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012755393981933594, -0.00012391898781061172, -0.00012028403580188751, -0.0001166490837931633, -0.00011301413178443909, -0.00010937917977571487, -0.00010574422776699066, -0.00010210927575826645, -9.847432374954224e-05, -9.483937174081802e-05, -9.120441973209381e-05, -8.75694677233696e-05, -8.393451571464539e-05, -8.029956370592117e-05, -7.666461169719696e-05, -7.302965968847275e-05, -6.939470767974854e-05, -6.575975567102432e-05, -6.212480366230011e-05, -5.84898516535759e-05, -5.4854899644851685e-05, -5.121994763612747e-05, -4.758499562740326e-05, -4.395004361867905e-05, -4.0315091609954834e-05, -3.668013960123062e-05, -3.304518759250641e-05, -2.9410235583782196e-05, -2.5775283575057983e-05, -2.214033156633377e-05, -1.8505379557609558e-05, -1.4870427548885345e-05, -1.1235475540161133e-05, -7.60052353143692e-06, -3.9655715227127075e-06, -3.3061951398849487e-07, 3.3043324947357178e-06, 6.93928450345993e-06, 1.0574236512184143e-05, 1.4209188520908356e-05, 1.784414052963257e-05, 2.147909253835678e-05, 2.5114044547080994e-05, 2.8748996555805206e-05, 3.238394856452942e-05, 3.601890057325363e-05, 3.9653852581977844e-05, 4.328880459070206e-05, 4.692375659942627e-05, 5.055870860815048e-05, 5.4193660616874695e-05, 5.782861262559891e-05, 6.146356463432312e-05, 6.509851664304733e-05, 6.873346865177155e-05, 7.236842066049576e-05, 7.600337266921997e-05, 7.963832467794418e-05, 8.32732766866684e-05, 8.690822869539261e-05, 9.054318070411682e-05, 9.417813271284103e-05, 9.781308472156525e-05, 0.00010144803673028946, 0.00010508298873901367]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 3.0, 4.0, 19.0, 23.0, 42.0, 73.0, 86.0, 180.0, 311.0, 584.0, 1226.0, 3374.0, 13594.0, 126782.0, 807415.0, 79485.0, 10268.0, 2775.0, 1163.0, 476.0, 300.0, 140.0, 72.0, 43.0, 33.0, 24.0, 10.0, 9.0, 10.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0078125, -0.9710540771484375, -0.934295654296875, -0.8975372314453125, -0.86077880859375, -0.8240203857421875, -0.787261962890625, -0.7505035400390625, -0.7137451171875, -0.6769866943359375, -0.640228271484375, -0.6034698486328125, -0.56671142578125, -0.5299530029296875, -0.493194580078125, -0.4564361572265625, -0.419677734375, -0.3829193115234375, -0.346160888671875, -0.3094024658203125, -0.27264404296875, -0.2358856201171875, -0.199127197265625, -0.1623687744140625, -0.1256103515625, -0.0888519287109375, -0.052093505859375, -0.0153350830078125, 0.02142333984375, 0.0581817626953125, 0.094940185546875, 0.1316986083984375, 0.16845703125, 0.2052154541015625, 0.241973876953125, 0.2787322998046875, 0.31549072265625, 0.3522491455078125, 0.389007568359375, 0.4257659912109375, 0.4625244140625, 0.4992828369140625, 0.536041259765625, 0.5727996826171875, 0.60955810546875, 0.6463165283203125, 0.683074951171875, 0.7198333740234375, 0.756591796875, 0.7933502197265625, 0.830108642578125, 0.8668670654296875, 0.90362548828125, 0.9403839111328125, 0.977142333984375, 1.0139007568359375, 1.0506591796875, 1.0874176025390625, 1.124176025390625, 1.1609344482421875, 1.19769287109375, 1.2344512939453125, 1.271209716796875, 1.3079681396484375, 1.3447265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 5.0, 12.0, 10.0, 18.0, 32.0, 59.0, 42.0, 92.0, 105.0, 147.0, 141.0, 106.0, 71.0, 40.0, 29.0, 20.0, 18.0, 11.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.55517578125, -0.5415534973144531, -0.5279312133789062, -0.5143089294433594, -0.5006866455078125, -0.4870643615722656, -0.47344207763671875, -0.4598197937011719, -0.446197509765625, -0.4325752258300781, -0.41895294189453125, -0.4053306579589844, -0.3917083740234375, -0.3780860900878906, -0.36446380615234375, -0.3508415222167969, -0.33721923828125, -0.3235969543457031, -0.30997467041015625, -0.2963523864746094, -0.2827301025390625, -0.2691078186035156, -0.25548553466796875, -0.24186325073242188, -0.228240966796875, -0.21461868286132812, -0.20099639892578125, -0.18737411499023438, -0.1737518310546875, -0.16012954711914062, -0.14650726318359375, -0.13288497924804688, -0.1192626953125, -0.10564041137695312, -0.09201812744140625, -0.07839584350585938, -0.0647735595703125, -0.051151275634765625, -0.03752899169921875, -0.023906707763671875, -0.010284423828125, 0.003337860107421875, 0.01696014404296875, 0.030582427978515625, 0.0442047119140625, 0.057826995849609375, 0.07144927978515625, 0.08507156372070312, 0.09869384765625, 0.11231613159179688, 0.12593841552734375, 0.13956069946289062, 0.1531829833984375, 0.16680526733398438, 0.18042755126953125, 0.19404983520507812, 0.207672119140625, 0.22129440307617188, 0.23491668701171875, 0.24853897094726562, 0.2621612548828125, 0.2757835388183594, 0.28940582275390625, 0.3030281066894531, 0.316650390625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 15.0, 61.0, 274.0, 410.0, 177.0, 49.0, 16.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.86382484436035, -31.20501708984375, -30.54620933532715, -29.887399673461914, -29.228591918945312, -28.56978416442871, -27.91097640991211, -27.252168655395508, -26.593360900878906, -25.934553146362305, -25.275745391845703, -24.61693572998047, -23.958127975463867, -23.299320220947266, -22.640512466430664, -21.981704711914062, -21.322895050048828, -20.664087295532227, -20.005279541015625, -19.34646987915039, -18.68766212463379, -18.028854370117188, -17.370046615600586, -16.711238861083984, -16.05242919921875, -15.393621444702148, -14.73481273651123, -14.076004981994629, -13.417196273803711, -12.75838851928711, -12.099580764770508, -11.440773010253906, -10.781966209411621, -10.12315845489502, -9.464349746704102, -8.8055419921875, -8.146734237670898, -7.4879255294799805, -6.829117774963379, -6.170309543609619, -5.511501312255859, -4.8526930809021, -4.19388484954834, -3.5350770950317383, -2.8762688636779785, -2.2174606323242188, -1.558652639389038, -0.8998446464538574, -0.24103641510009766, 0.41777169704437256, 1.0765798091888428, 1.735387921333313, 2.394196033477783, 3.053004264831543, 3.7118122577667236, 4.370620250701904, 5.029428482055664, 5.688236713409424, 6.347044944763184, 7.005852699279785, 7.664660930633545, 8.323469161987305, 8.982276916503906, 9.641084671020508, 10.299893379211426]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 3.0, 4.0, 10.0, 10.0, 8.0, 14.0, 10.0, 18.0, 28.0, 26.0, 24.0, 31.0, 35.0, 23.0, 29.0, 31.0, 35.0, 34.0, 49.0, 44.0, 45.0, 45.0, 42.0, 53.0, 42.0, 36.0, 38.0, 27.0, 23.0, 24.0, 22.0, 22.0, 27.0, 22.0, 19.0, 7.0, 12.0, 12.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.298618316650391, -6.077427864074707, -5.856236934661865, -5.635046482086182, -5.41385555267334, -5.192665100097656, -4.971474647521973, -4.750284194946289, -4.529093265533447, -4.307902812957764, -4.086711883544922, -3.8655214309692383, -3.6443307399749756, -3.423140048980713, -3.2019495964050293, -2.9807589054107666, -2.759568214416504, -2.538377523422241, -2.3171868324279785, -2.095996379852295, -1.8748056888580322, -1.6536149978637695, -1.4324244260787964, -1.2112338542938232, -0.9900431632995605, -0.7688525319099426, -0.5476619005203247, -0.3264712691307068, -0.10528063774108887, 0.11591005325317383, 0.337100625038147, 0.5582911968231201, 0.7794818878173828, 1.0006725788116455, 1.2218631505966187, 1.4430537223815918, 1.6642444133758545, 1.8854351043701172, 2.106625556945801, 2.3278162479400635, 2.549006938934326, 2.770197629928589, 2.9913883209228516, 3.212578773498535, 3.433769464492798, 3.6549601554870605, 3.876150608062744, 4.097341537475586, 4.3185319900512695, 4.539722442626953, 4.760913372039795, 4.9821038246154785, 5.20329475402832, 5.424485206604004, 5.6456756591796875, 5.866866111755371, 6.088057041168213, 6.3092474937438965, 6.530438423156738, 6.751628875732422, 6.9728193283081055, 7.194010257720947, 7.415200710296631, 7.636391639709473, 7.857582092285156]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 10.0, 15.0, 20.0, 32.0, 41.0, 64.0, 91.0, 90.0, 170.0, 220.0, 304.0, 503.0, 744.0, 1271.0, 2290.0, 4498.0, 10221.0, 33625.0, 254272.0, 2258578.0, 1446590.0, 140333.0, 23734.0, 8042.0, 3664.0, 1986.0, 1055.0, 641.0, 373.0, 257.0, 170.0, 111.0, 68.0, 60.0, 42.0, 17.0, 22.0, 9.0, 16.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.62109375, -3.507476806640625, -3.39385986328125, -3.280242919921875, -3.1666259765625, -3.053009033203125, -2.93939208984375, -2.825775146484375, -2.712158203125, -2.598541259765625, -2.48492431640625, -2.371307373046875, -2.2576904296875, -2.144073486328125, -2.03045654296875, -1.916839599609375, -1.80322265625, -1.689605712890625, -1.57598876953125, -1.462371826171875, -1.3487548828125, -1.235137939453125, -1.12152099609375, -1.007904052734375, -0.894287109375, -0.780670166015625, -0.66705322265625, -0.553436279296875, -0.4398193359375, -0.326202392578125, -0.21258544921875, -0.098968505859375, 0.0146484375, 0.128265380859375, 0.24188232421875, 0.355499267578125, 0.4691162109375, 0.582733154296875, 0.69635009765625, 0.809967041015625, 0.923583984375, 1.037200927734375, 1.15081787109375, 1.264434814453125, 1.3780517578125, 1.491668701171875, 1.60528564453125, 1.718902587890625, 1.83251953125, 1.946136474609375, 2.05975341796875, 2.173370361328125, 2.2869873046875, 2.400604248046875, 2.51422119140625, 2.627838134765625, 2.741455078125, 2.855072021484375, 2.96868896484375, 3.082305908203125, 3.1959228515625, 3.309539794921875, 3.42315673828125, 3.536773681640625, 3.650390625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 2.0, 8.0, 10.0, 7.0, 16.0, 15.0, 11.0, 26.0, 18.0, 26.0, 39.0, 33.0, 51.0, 41.0, 38.0, 48.0, 48.0, 49.0, 60.0, 39.0, 48.0, 52.0, 44.0, 34.0, 45.0, 25.0, 22.0, 32.0, 15.0, 11.0, 14.0, 12.0, 12.0, 15.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.298828125, -2.231048583984375, -2.16326904296875, -2.095489501953125, -2.0277099609375, -1.959930419921875, -1.89215087890625, -1.824371337890625, -1.756591796875, -1.688812255859375, -1.62103271484375, -1.553253173828125, -1.4854736328125, -1.417694091796875, -1.34991455078125, -1.282135009765625, -1.21435546875, -1.146575927734375, -1.07879638671875, -1.011016845703125, -0.9432373046875, -0.875457763671875, -0.80767822265625, -0.739898681640625, -0.672119140625, -0.604339599609375, -0.53656005859375, -0.468780517578125, -0.4010009765625, -0.333221435546875, -0.26544189453125, -0.197662353515625, -0.1298828125, -0.062103271484375, 0.00567626953125, 0.073455810546875, 0.1412353515625, 0.209014892578125, 0.27679443359375, 0.344573974609375, 0.412353515625, 0.480133056640625, 0.54791259765625, 0.615692138671875, 0.6834716796875, 0.751251220703125, 0.81903076171875, 0.886810302734375, 0.95458984375, 1.022369384765625, 1.09014892578125, 1.157928466796875, 1.2257080078125, 1.293487548828125, 1.36126708984375, 1.429046630859375, 1.496826171875, 1.564605712890625, 1.63238525390625, 1.700164794921875, 1.7679443359375, 1.835723876953125, 1.90350341796875, 1.971282958984375, 2.0390625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 11.0, 19.0, 15.0, 23.0, 28.0, 44.0, 29.0, 65.0, 131.0, 307.0, 963.0, 6257.0, 258682.0, 3905977.0, 18883.0, 1915.0, 441.0, 168.0, 69.0, 51.0, 36.0, 32.0, 23.0, 21.0, 13.0, 10.0, 12.0, 12.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2740478515625, -7.969970703125, -7.6658935546875, -7.36181640625, -7.0577392578125, -6.753662109375, -6.4495849609375, -6.1455078125, -5.8414306640625, -5.537353515625, -5.2332763671875, -4.92919921875, -4.6251220703125, -4.321044921875, -4.0169677734375, -3.712890625, -3.4088134765625, -3.104736328125, -2.8006591796875, -2.49658203125, -2.1925048828125, -1.888427734375, -1.5843505859375, -1.2802734375, -0.9761962890625, -0.672119140625, -0.3680419921875, -0.06396484375, 0.2401123046875, 0.544189453125, 0.8482666015625, 1.15234375, 1.4564208984375, 1.760498046875, 2.0645751953125, 2.36865234375, 2.6727294921875, 2.976806640625, 3.2808837890625, 3.5849609375, 3.8890380859375, 4.193115234375, 4.4971923828125, 4.80126953125, 5.1053466796875, 5.409423828125, 5.7135009765625, 6.017578125, 6.3216552734375, 6.625732421875, 6.9298095703125, 7.23388671875, 7.5379638671875, 7.842041015625, 8.1461181640625, 8.4501953125, 8.7542724609375, 9.058349609375, 9.3624267578125, 9.66650390625, 9.9705810546875, 10.274658203125, 10.5787353515625, 10.8828125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 13.0, 6.0, 17.0, 17.0, 37.0, 56.0, 90.0, 135.0, 278.0, 464.0, 799.0, 819.0, 557.0, 317.0, 165.0, 84.0, 69.0, 45.0, 21.0, 20.0, 15.0, 14.0, 4.0, 4.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0156707763671875, -0.979583740234375, -0.9434967041015625, -0.90740966796875, -0.8713226318359375, -0.835235595703125, -0.7991485595703125, -0.7630615234375, -0.7269744873046875, -0.690887451171875, -0.6548004150390625, -0.61871337890625, -0.5826263427734375, -0.546539306640625, -0.5104522705078125, -0.474365234375, -0.4382781982421875, -0.402191162109375, -0.3661041259765625, -0.33001708984375, -0.2939300537109375, -0.257843017578125, -0.2217559814453125, -0.1856689453125, -0.1495819091796875, -0.113494873046875, -0.0774078369140625, -0.04132080078125, -0.0052337646484375, 0.030853271484375, 0.0669403076171875, 0.10302734375, 0.1391143798828125, 0.175201416015625, 0.2112884521484375, 0.24737548828125, 0.2834625244140625, 0.319549560546875, 0.3556365966796875, 0.3917236328125, 0.4278106689453125, 0.463897705078125, 0.4999847412109375, 0.53607177734375, 0.5721588134765625, 0.608245849609375, 0.6443328857421875, 0.680419921875, 0.7165069580078125, 0.752593994140625, 0.7886810302734375, 0.82476806640625, 0.8608551025390625, 0.896942138671875, 0.9330291748046875, 0.9691162109375, 1.0052032470703125, 1.041290283203125, 1.0773773193359375, 1.11346435546875, 1.1495513916015625, 1.185638427734375, 1.2217254638671875, 1.2578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 6.0, 17.0, 18.0, 27.0, 36.0, 38.0, 61.0, 79.0, 100.0, 87.0, 101.0, 97.0, 71.0, 48.0, 47.0, 39.0, 19.0, 32.0, 13.0, 9.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.512279748916626, -3.4101383686065674, -3.3079967498779297, -3.205855369567871, -3.1037137508392334, -3.001572370529175, -2.899430751800537, -2.7972893714904785, -2.69514799118042, -2.5930066108703613, -2.4908649921417236, -2.388723611831665, -2.2865819931030273, -2.1844406127929688, -2.08229923248291, -1.9801576137542725, -1.8780161142349243, -1.7758746147155762, -1.673733115196228, -1.5715916156768799, -1.4694502353668213, -1.3673087358474731, -1.265167236328125, -1.1630258560180664, -1.0608842372894287, -0.9587427377700806, -0.8566012978553772, -0.754459798336029, -0.6523183584213257, -0.5501768589019775, -0.4480353593826294, -0.345893919467926, -0.24375247955322266, -0.1416110098361969, -0.03946952521800995, 0.062671959400177, 0.16481342911720276, 0.2669548988342285, 0.36909639835357666, 0.47123783826828003, 0.5733793377876282, 0.6755208373069763, 0.7776622772216797, 0.8798037767410278, 0.981945276260376, 1.0840866565704346, 1.1862282752990723, 1.2883696556091309, 1.390511155128479, 1.4926526546478271, 1.5947941541671753, 1.6969356536865234, 1.799077033996582, 1.9012185335159302, 2.0033600330352783, 2.105501413345337, 2.2076430320739746, 2.309784412384033, 2.411926031112671, 2.5140674114227295, 2.616209030151367, 2.718350410461426, 2.8204917907714844, 2.922633409500122, 3.0247747898101807]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 6.0, 7.0, 6.0, 6.0, 12.0, 10.0, 7.0, 11.0, 13.0, 18.0, 25.0, 23.0, 23.0, 32.0, 25.0, 28.0, 46.0, 31.0, 46.0, 31.0, 49.0, 44.0, 41.0, 35.0, 44.0, 41.0, 35.0, 34.0, 32.0, 29.0, 29.0, 24.0, 21.0, 23.0, 18.0, 15.0, 22.0, 11.0, 8.0, 6.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.1568896770477295, -2.0957131385803223, -2.034536838531494, -1.973360300064087, -1.9121837615966797, -1.851007342338562, -1.7898309230804443, -1.728654384613037, -1.6674779653549194, -1.6063015460968018, -1.5451250076293945, -1.4839485883712769, -1.4227721691131592, -1.361595630645752, -1.3004192113876343, -1.2392427921295166, -1.1780662536621094, -1.1168898344039917, -1.0557132959365845, -0.9945368766784668, -0.9333603978157043, -0.8721839189529419, -0.8110074996948242, -0.7498310208320618, -0.6886545419692993, -0.6274780631065369, -0.5663015842437744, -0.5051251649856567, -0.4439486861228943, -0.38277220726013184, -0.3215957581996918, -0.2604193091392517, -0.1992427110671997, -0.13806624710559845, -0.07688978314399719, -0.015713319182395935, 0.04546314477920532, 0.10663962364196777, 0.16781607270240784, 0.2289925217628479, 0.29016900062561035, 0.3513454794883728, 0.41252192854881287, 0.47369837760925293, 0.5348748564720154, 0.5960513353347778, 0.6572277545928955, 0.718404233455658, 0.7795807123184204, 0.8407571911811829, 0.9019336700439453, 0.963110089302063, 1.0242865085601807, 1.085463047027588, 1.1466394662857056, 1.2078158855438232, 1.2689924240112305, 1.3301688432693481, 1.3913453817367554, 1.452521800994873, 1.5136983394622803, 1.574874758720398, 1.6360511779785156, 1.6972277164459229, 1.7584041357040405]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 13.0, 9.0, 13.0, 11.0, 28.0, 36.0, 56.0, 90.0, 168.0, 306.0, 567.0, 1229.0, 2831.0, 7105.0, 19735.0, 65555.0, 254670.0, 459815.0, 168323.0, 44524.0, 14126.0, 5137.0, 2193.0, 904.0, 470.0, 250.0, 140.0, 85.0, 56.0, 33.0, 17.0, 10.0, 13.0, 10.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5935287475585938, -0.5757293701171875, -0.5579299926757812, -0.540130615234375, -0.5223312377929688, -0.5045318603515625, -0.48673248291015625, -0.46893310546875, -0.45113372802734375, -0.4333343505859375, -0.41553497314453125, -0.397735595703125, -0.37993621826171875, -0.3621368408203125, -0.34433746337890625, -0.3265380859375, -0.30873870849609375, -0.2909393310546875, -0.27313995361328125, -0.255340576171875, -0.23754119873046875, -0.2197418212890625, -0.20194244384765625, -0.18414306640625, -0.16634368896484375, -0.1485443115234375, -0.13074493408203125, -0.112945556640625, -0.09514617919921875, -0.0773468017578125, -0.05954742431640625, -0.041748046875, -0.02394866943359375, -0.0061492919921875, 0.01165008544921875, 0.029449462890625, 0.04724884033203125, 0.0650482177734375, 0.08284759521484375, 0.10064697265625, 0.11844635009765625, 0.1362457275390625, 0.15404510498046875, 0.171844482421875, 0.18964385986328125, 0.2074432373046875, 0.22524261474609375, 0.2430419921875, 0.26084136962890625, 0.2786407470703125, 0.29644012451171875, 0.314239501953125, 0.33203887939453125, 0.3498382568359375, 0.36763763427734375, 0.38543701171875, 0.40323638916015625, 0.4210357666015625, 0.43883514404296875, 0.456634521484375, 0.47443389892578125, 0.4922332763671875, 0.5100326538085938, 0.52783203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 2.0, 7.0, 10.0, 4.0, 9.0, 6.0, 14.0, 15.0, 17.0, 25.0, 27.0, 34.0, 32.0, 37.0, 43.0, 54.0, 36.0, 39.0, 41.0, 57.0, 53.0, 49.0, 33.0, 36.0, 48.0, 33.0, 24.0, 29.0, 25.0, 25.0, 16.0, 21.0, 19.0, 15.0, 9.0, 6.0, 11.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.4345703125, -1.3919525146484375, -1.349334716796875, -1.3067169189453125, -1.26409912109375, -1.2214813232421875, -1.178863525390625, -1.1362457275390625, -1.0936279296875, -1.0510101318359375, -1.008392333984375, -0.9657745361328125, -0.92315673828125, -0.8805389404296875, -0.837921142578125, -0.7953033447265625, -0.752685546875, -0.7100677490234375, -0.667449951171875, -0.6248321533203125, -0.58221435546875, -0.5395965576171875, -0.496978759765625, -0.4543609619140625, -0.4117431640625, -0.3691253662109375, -0.326507568359375, -0.2838897705078125, -0.24127197265625, -0.1986541748046875, -0.156036376953125, -0.1134185791015625, -0.07080078125, -0.0281829833984375, 0.014434814453125, 0.0570526123046875, 0.09967041015625, 0.1422882080078125, 0.184906005859375, 0.2275238037109375, 0.2701416015625, 0.3127593994140625, 0.355377197265625, 0.3979949951171875, 0.44061279296875, 0.4832305908203125, 0.525848388671875, 0.5684661865234375, 0.611083984375, 0.6537017822265625, 0.696319580078125, 0.7389373779296875, 0.78155517578125, 0.8241729736328125, 0.866790771484375, 0.9094085693359375, 0.9520263671875, 0.9946441650390625, 1.037261962890625, 1.0798797607421875, 1.12249755859375, 1.1651153564453125, 1.207733154296875, 1.2503509521484375, 1.29296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 18.0, 19.0, 35.0, 45.0, 78.0, 117.0, 245.0, 445.0, 948.0, 2244.0, 6250.0, 20776.0, 85611.0, 365542.0, 422089.0, 106729.0, 25023.0, 7502.0, 2548.0, 1121.0, 483.0, 241.0, 143.0, 96.0, 50.0, 38.0, 28.0, 16.0, 13.0, 12.0, 6.0, 8.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6161346435546875, -0.597503662109375, -0.5788726806640625, -0.56024169921875, -0.5416107177734375, -0.522979736328125, -0.5043487548828125, -0.4857177734375, -0.4670867919921875, -0.448455810546875, -0.4298248291015625, -0.41119384765625, -0.3925628662109375, -0.373931884765625, -0.3553009033203125, -0.336669921875, -0.3180389404296875, -0.299407958984375, -0.2807769775390625, -0.26214599609375, -0.2435150146484375, -0.224884033203125, -0.2062530517578125, -0.1876220703125, -0.1689910888671875, -0.150360107421875, -0.1317291259765625, -0.11309814453125, -0.0944671630859375, -0.075836181640625, -0.0572052001953125, -0.03857421875, -0.0199432373046875, -0.001312255859375, 0.0173187255859375, 0.03594970703125, 0.0545806884765625, 0.073211669921875, 0.0918426513671875, 0.1104736328125, 0.1291046142578125, 0.147735595703125, 0.1663665771484375, 0.18499755859375, 0.2036285400390625, 0.222259521484375, 0.2408905029296875, 0.259521484375, 0.2781524658203125, 0.296783447265625, 0.3154144287109375, 0.33404541015625, 0.3526763916015625, 0.371307373046875, 0.3899383544921875, 0.4085693359375, 0.4272003173828125, 0.445831298828125, 0.4644622802734375, 0.48309326171875, 0.5017242431640625, 0.520355224609375, 0.5389862060546875, 0.5576171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 10.0, 14.0, 13.0, 16.0, 20.0, 21.0, 21.0, 20.0, 27.0, 34.0, 32.0, 29.0, 42.0, 29.0, 47.0, 50.0, 52.0, 41.0, 54.0, 43.0, 26.0, 38.0, 35.0, 34.0, 25.0, 30.0, 25.0, 29.0, 21.0, 17.0, 14.0, 9.0, 9.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.224609375, -2.149017333984375, -2.07342529296875, -1.997833251953125, -1.9222412109375, -1.846649169921875, -1.77105712890625, -1.695465087890625, -1.619873046875, -1.544281005859375, -1.46868896484375, -1.393096923828125, -1.3175048828125, -1.241912841796875, -1.16632080078125, -1.090728759765625, -1.01513671875, -0.939544677734375, -0.86395263671875, -0.788360595703125, -0.7127685546875, -0.637176513671875, -0.56158447265625, -0.485992431640625, -0.410400390625, -0.334808349609375, -0.25921630859375, -0.183624267578125, -0.1080322265625, -0.032440185546875, 0.04315185546875, 0.118743896484375, 0.1943359375, 0.269927978515625, 0.34552001953125, 0.421112060546875, 0.4967041015625, 0.572296142578125, 0.64788818359375, 0.723480224609375, 0.799072265625, 0.874664306640625, 0.95025634765625, 1.025848388671875, 1.1014404296875, 1.177032470703125, 1.25262451171875, 1.328216552734375, 1.40380859375, 1.479400634765625, 1.55499267578125, 1.630584716796875, 1.7061767578125, 1.781768798828125, 1.85736083984375, 1.932952880859375, 2.008544921875, 2.084136962890625, 2.15972900390625, 2.235321044921875, 2.3109130859375, 2.386505126953125, 2.46209716796875, 2.537689208984375, 2.61328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 6.0, 9.0, 6.0, 25.0, 38.0, 44.0, 65.0, 101.0, 171.0, 283.0, 493.0, 846.0, 1644.0, 3394.0, 7290.0, 17327.0, 51126.0, 197217.0, 480864.0, 202412.0, 52717.0, 17983.0, 7221.0, 3398.0, 1687.0, 958.0, 482.0, 286.0, 159.0, 116.0, 69.0, 30.0, 31.0, 22.0, 15.0, 5.0, 2.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.152191162109375, -0.14703369140625, -0.141876220703125, -0.13671875, -0.131561279296875, -0.12640380859375, -0.121246337890625, -0.1160888671875, -0.110931396484375, -0.10577392578125, -0.100616455078125, -0.095458984375, -0.090301513671875, -0.08514404296875, -0.079986572265625, -0.0748291015625, -0.069671630859375, -0.06451416015625, -0.059356689453125, -0.05419921875, -0.049041748046875, -0.04388427734375, -0.038726806640625, -0.0335693359375, -0.028411865234375, -0.02325439453125, -0.018096923828125, -0.012939453125, -0.007781982421875, -0.00262451171875, 0.002532958984375, 0.0076904296875, 0.012847900390625, 0.01800537109375, 0.023162841796875, 0.0283203125, 0.033477783203125, 0.03863525390625, 0.043792724609375, 0.0489501953125, 0.054107666015625, 0.05926513671875, 0.064422607421875, 0.069580078125, 0.074737548828125, 0.07989501953125, 0.085052490234375, 0.0902099609375, 0.095367431640625, 0.10052490234375, 0.105682373046875, 0.11083984375, 0.115997314453125, 0.12115478515625, 0.126312255859375, 0.1314697265625, 0.136627197265625, 0.14178466796875, 0.146942138671875, 0.152099609375, 0.157257080078125, 0.16241455078125, 0.167572021484375, 0.1727294921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 16.0, 11.0, 33.0, 48.0, 62.0, 123.0, 157.0, 175.0, 143.0, 84.0, 50.0, 25.0, 20.0, 12.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014579296112060547, -0.00014017336070537567, -0.00013455376029014587, -0.00012893415987491608, -0.00012331455945968628, -0.00011769495904445648, -0.00011207535862922668, -0.00010645575821399689, -0.00010083615779876709, -9.521655738353729e-05, -8.95969569683075e-05, -8.39773565530777e-05, -7.83577561378479e-05, -7.27381557226181e-05, -6.71185553073883e-05, -6.149895489215851e-05, -5.587935447692871e-05, -5.0259754061698914e-05, -4.4640153646469116e-05, -3.902055323123932e-05, -3.340095281600952e-05, -2.7781352400779724e-05, -2.2161751985549927e-05, -1.654215157032013e-05, -1.0922551155090332e-05, -5.302950739860535e-06, 3.166496753692627e-07, 5.93625009059906e-06, 1.1555850505828857e-05, 1.7175450921058655e-05, 2.2795051336288452e-05, 2.841465175151825e-05, 3.403425216674805e-05, 3.9653852581977844e-05, 4.527345299720764e-05, 5.089305341243744e-05, 5.6512653827667236e-05, 6.213225424289703e-05, 6.775185465812683e-05, 7.337145507335663e-05, 7.899105548858643e-05, 8.461065590381622e-05, 9.023025631904602e-05, 9.584985673427582e-05, 0.00010146945714950562, 0.00010708905756473541, 0.00011270865797996521, 0.00011832825839519501, 0.0001239478588104248, 0.0001295674592256546, 0.0001351870596408844, 0.0001408066600561142, 0.000146426260471344, 0.0001520458608865738, 0.0001576654613018036, 0.00016328506171703339, 0.00016890466213226318, 0.00017452426254749298, 0.00018014386296272278, 0.00018576346337795258, 0.00019138306379318237, 0.00019700266420841217, 0.00020262226462364197, 0.00020824186503887177, 0.00021386146545410156]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 21.0, 35.0, 54.0, 79.0, 153.0, 302.0, 615.0, 1244.0, 2876.0, 7211.0, 21969.0, 85860.0, 390688.0, 409904.0, 91299.0, 23125.0, 7545.0, 2993.0, 1266.0, 597.0, 297.0, 156.0, 104.0, 56.0, 26.0, 18.0, 11.0, 10.0, 11.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2193603515625, -0.21309661865234375, -0.2068328857421875, -0.20056915283203125, -0.194305419921875, -0.18804168701171875, -0.1817779541015625, -0.17551422119140625, -0.16925048828125, -0.16298675537109375, -0.1567230224609375, -0.15045928955078125, -0.144195556640625, -0.13793182373046875, -0.1316680908203125, -0.12540435791015625, -0.119140625, -0.11287689208984375, -0.1066131591796875, -0.10034942626953125, -0.094085693359375, -0.08782196044921875, -0.0815582275390625, -0.07529449462890625, -0.06903076171875, -0.06276702880859375, -0.0565032958984375, -0.05023956298828125, -0.043975830078125, -0.03771209716796875, -0.0314483642578125, -0.02518463134765625, -0.0189208984375, -0.01265716552734375, -0.0063934326171875, -0.00012969970703125, 0.006134033203125, 0.01239776611328125, 0.0186614990234375, 0.02492523193359375, 0.03118896484375, 0.03745269775390625, 0.0437164306640625, 0.04998016357421875, 0.056243896484375, 0.06250762939453125, 0.0687713623046875, 0.07503509521484375, 0.081298828125, 0.08756256103515625, 0.0938262939453125, 0.10009002685546875, 0.106353759765625, 0.11261749267578125, 0.1188812255859375, 0.12514495849609375, 0.13140869140625, 0.13767242431640625, 0.1439361572265625, 0.15019989013671875, 0.156463623046875, 0.16272735595703125, 0.1689910888671875, 0.17525482177734375, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 9.0, 5.0, 4.0, 10.0, 10.0, 12.0, 16.0, 24.0, 21.0, 19.0, 34.0, 36.0, 35.0, 44.0, 55.0, 55.0, 64.0, 62.0, 77.0, 75.0, 53.0, 39.0, 34.0, 39.0, 36.0, 21.0, 18.0, 12.0, 20.0, 12.0, 8.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04046630859375, -0.039258480072021484, -0.03805065155029297, -0.03684282302856445, -0.03563499450683594, -0.03442716598510742, -0.033219337463378906, -0.03201150894165039, -0.030803680419921875, -0.02959585189819336, -0.028388023376464844, -0.027180194854736328, -0.025972366333007812, -0.024764537811279297, -0.02355670928955078, -0.022348880767822266, -0.02114105224609375, -0.019933223724365234, -0.01872539520263672, -0.017517566680908203, -0.016309738159179688, -0.015101909637451172, -0.013894081115722656, -0.01268625259399414, -0.011478424072265625, -0.01027059555053711, -0.009062767028808594, -0.007854938507080078, -0.0066471099853515625, -0.005439281463623047, -0.004231452941894531, -0.0030236244201660156, -0.0018157958984375, -0.0006079673767089844, 0.0005998611450195312, 0.0018076896667480469, 0.0030155181884765625, 0.004223346710205078, 0.005431175231933594, 0.006639003753662109, 0.007846832275390625, 0.00905466079711914, 0.010262489318847656, 0.011470317840576172, 0.012678146362304688, 0.013885974884033203, 0.015093803405761719, 0.016301631927490234, 0.01750946044921875, 0.018717288970947266, 0.01992511749267578, 0.021132946014404297, 0.022340774536132812, 0.023548603057861328, 0.024756431579589844, 0.02596426010131836, 0.027172088623046875, 0.02837991714477539, 0.029587745666503906, 0.030795574188232422, 0.03200340270996094, 0.03321123123168945, 0.03441905975341797, 0.035626888275146484, 0.036834716796875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 11.0, 19.0, 44.0, 75.0, 165.0, 233.0, 216.0, 113.0, 62.0, 26.0, 13.0, 12.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6535491943359375, -6.5019450187683105, -6.350340843200684, -6.198736667633057, -6.04713249206543, -5.8955278396606445, -5.743924140930176, -5.592319488525391, -5.440715312957764, -5.289111137390137, -5.13750696182251, -4.985902786254883, -4.834298610687256, -4.682694435119629, -4.531089782714844, -4.379485607147217, -4.22788143157959, -4.076277256011963, -3.924673080444336, -3.773068904876709, -3.621464490890503, -3.469860315322876, -3.318256139755249, -3.166651725769043, -3.015048027038574, -2.8634438514709473, -2.7118396759033203, -2.5602355003356934, -2.4086310863494873, -2.2570269107818604, -2.1054227352142334, -1.953818440437317, -1.8022143840789795, -1.6506102085113525, -1.499005913734436, -1.347401738166809, -1.1957974433898926, -1.0441932678222656, -0.8925890922546387, -0.7409847974777222, -0.5893806219100952, -0.4377763867378235, -0.28617218136787415, -0.1345679759979248, 0.017036259174346924, 0.16864049434661865, 0.3202446699142456, 0.4718489646911621, 0.6234531402587891, 0.7750573754310608, 0.9266616106033325, 1.0782657861709595, 1.229870080947876, 1.381474256515503, 1.5330784320831299, 1.6846827268600464, 1.8362869024276733, 1.9878910779953003, 2.139495372772217, 2.2910995483398438, 2.4427037239074707, 2.5943078994750977, 2.7459120750427246, 2.8975164890289307, 3.0491206645965576]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 9.0, 11.0, 6.0, 9.0, 11.0, 15.0, 19.0, 16.0, 31.0, 33.0, 41.0, 35.0, 33.0, 50.0, 42.0, 46.0, 53.0, 53.0, 48.0, 49.0, 45.0, 42.0, 31.0, 34.0, 34.0, 33.0, 37.0, 16.0, 19.0, 16.0, 17.0, 11.0, 7.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5565255880355835, -1.5122787952423096, -1.4680320024490356, -1.4237852096557617, -1.3795382976531982, -1.3352915048599243, -1.2910447120666504, -1.2467979192733765, -1.2025511264801025, -1.1583043336868286, -1.1140575408935547, -1.0698106288909912, -1.0255638360977173, -0.9813170433044434, -0.9370702505111694, -0.8928234577178955, -0.848576545715332, -0.8043297529220581, -0.7600829005241394, -0.7158361077308655, -0.6715892553329468, -0.6273424625396729, -0.5830956697463989, -0.538848876953125, -0.4946020245552063, -0.45035520195961, -0.40610837936401367, -0.36186158657073975, -0.31761476397514343, -0.2733679413795471, -0.2291211485862732, -0.18487432599067688, -0.14062738418579102, -0.0963805690407753, -0.05213375389575958, -0.007886946201324463, 0.03635987639427185, 0.08060669898986816, 0.12485349178314209, 0.1691003143787384, 0.21334713697433472, 0.25759395956993103, 0.30184078216552734, 0.34608757495880127, 0.3903343975543976, 0.4345812201499939, 0.4788280129432678, 0.5230748653411865, 0.5673216581344604, 0.6115684509277344, 0.6558153033256531, 0.700062096118927, 0.7443089485168457, 0.7885557413101196, 0.8328025341033936, 0.8770493268966675, 0.9212961792945862, 0.9655429720878601, 1.0097898244857788, 1.0540366172790527, 1.0982834100723267, 1.1425302028656006, 1.186777114868164, 1.231023907661438, 1.275270700454712]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 14.0, 10.0, 14.0, 15.0, 25.0, 25.0, 30.0, 56.0, 122.0, 327.0, 1040.0, 6851.0, 91040.0, 842071.0, 98057.0, 7081.0, 1127.0, 336.0, 108.0, 47.0, 29.0, 32.0, 15.0, 9.0, 9.0, 12.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.24908447265625, -3.1309814453125, -3.01287841796875, -2.894775390625, -2.77667236328125, -2.6585693359375, -2.54046630859375, -2.42236328125, -2.30426025390625, -2.1861572265625, -2.06805419921875, -1.949951171875, -1.83184814453125, -1.7137451171875, -1.59564208984375, -1.4775390625, -1.35943603515625, -1.2413330078125, -1.12322998046875, -1.005126953125, -0.88702392578125, -0.7689208984375, -0.65081787109375, -0.53271484375, -0.41461181640625, -0.2965087890625, -0.17840576171875, -0.060302734375, 0.05780029296875, 0.1759033203125, 0.29400634765625, 0.412109375, 0.53021240234375, 0.6483154296875, 0.76641845703125, 0.884521484375, 1.00262451171875, 1.1207275390625, 1.23883056640625, 1.35693359375, 1.47503662109375, 1.5931396484375, 1.71124267578125, 1.829345703125, 1.94744873046875, 2.0655517578125, 2.18365478515625, 2.3017578125, 2.41986083984375, 2.5379638671875, 2.65606689453125, 2.774169921875, 2.89227294921875, 3.0103759765625, 3.12847900390625, 3.24658203125, 3.36468505859375, 3.4827880859375, 3.60089111328125, 3.718994140625, 3.83709716796875, 3.9552001953125, 4.07330322265625, 4.19140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 7.0, 9.0, 14.0, 15.0, 14.0, 13.0, 23.0, 28.0, 30.0, 33.0, 40.0, 41.0, 50.0, 42.0, 49.0, 42.0, 46.0, 51.0, 39.0, 54.0, 36.0, 35.0, 30.0, 38.0, 27.0, 28.0, 20.0, 19.0, 20.0, 19.0, 9.0, 10.0, 10.0, 11.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.6875, -2.60198974609375, -2.5164794921875, -2.43096923828125, -2.345458984375, -2.25994873046875, -2.1744384765625, -2.08892822265625, -2.00341796875, -1.91790771484375, -1.8323974609375, -1.74688720703125, -1.661376953125, -1.57586669921875, -1.4903564453125, -1.40484619140625, -1.3193359375, -1.23382568359375, -1.1483154296875, -1.06280517578125, -0.977294921875, -0.89178466796875, -0.8062744140625, -0.72076416015625, -0.63525390625, -0.54974365234375, -0.4642333984375, -0.37872314453125, -0.293212890625, -0.20770263671875, -0.1221923828125, -0.03668212890625, 0.048828125, 0.13433837890625, 0.2198486328125, 0.30535888671875, 0.390869140625, 0.47637939453125, 0.5618896484375, 0.64739990234375, 0.73291015625, 0.81842041015625, 0.9039306640625, 0.98944091796875, 1.074951171875, 1.16046142578125, 1.2459716796875, 1.33148193359375, 1.4169921875, 1.50250244140625, 1.5880126953125, 1.67352294921875, 1.759033203125, 1.84454345703125, 1.9300537109375, 2.01556396484375, 2.10107421875, 2.18658447265625, 2.2720947265625, 2.35760498046875, 2.443115234375, 2.52862548828125, 2.6141357421875, 2.69964599609375, 2.78515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 11.0, 8.0, 10.0, 12.0, 11.0, 17.0, 20.0, 34.0, 45.0, 57.0, 54.0, 81.0, 118.0, 141.0, 219.0, 395.0, 1100.0, 6292.0, 219450.0, 801583.0, 15572.0, 1819.0, 583.0, 261.0, 152.0, 107.0, 89.0, 71.0, 38.0, 43.0, 31.0, 27.0, 24.0, 19.0, 7.0, 15.0, 7.0, 4.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.35546875, -4.2061767578125, -4.056884765625, -3.9075927734375, -3.75830078125, -3.6090087890625, -3.459716796875, -3.3104248046875, -3.1611328125, -3.0118408203125, -2.862548828125, -2.7132568359375, -2.56396484375, -2.4146728515625, -2.265380859375, -2.1160888671875, -1.966796875, -1.8175048828125, -1.668212890625, -1.5189208984375, -1.36962890625, -1.2203369140625, -1.071044921875, -0.9217529296875, -0.7724609375, -0.6231689453125, -0.473876953125, -0.3245849609375, -0.17529296875, -0.0260009765625, 0.123291015625, 0.2725830078125, 0.421875, 0.5711669921875, 0.720458984375, 0.8697509765625, 1.01904296875, 1.1683349609375, 1.317626953125, 1.4669189453125, 1.6162109375, 1.7655029296875, 1.914794921875, 2.0640869140625, 2.21337890625, 2.3626708984375, 2.511962890625, 2.6612548828125, 2.810546875, 2.9598388671875, 3.109130859375, 3.2584228515625, 3.40771484375, 3.5570068359375, 3.706298828125, 3.8555908203125, 4.0048828125, 4.1541748046875, 4.303466796875, 4.4527587890625, 4.60205078125, 4.7513427734375, 4.900634765625, 5.0499267578125, 5.19921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 5.0, 10.0, 8.0, 10.0, 12.0, 16.0, 21.0, 29.0, 34.0, 35.0, 30.0, 25.0, 46.0, 56.0, 43.0, 56.0, 49.0, 53.0, 51.0, 57.0, 47.0, 42.0, 42.0, 32.0, 22.0, 31.0, 24.0, 23.0, 19.0, 14.0, 12.0, 8.0, 7.0, 8.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.36932373046875, -3.2679443359375, -3.16656494140625, -3.065185546875, -2.96380615234375, -2.8624267578125, -2.76104736328125, -2.65966796875, -2.55828857421875, -2.4569091796875, -2.35552978515625, -2.254150390625, -2.15277099609375, -2.0513916015625, -1.95001220703125, -1.8486328125, -1.74725341796875, -1.6458740234375, -1.54449462890625, -1.443115234375, -1.34173583984375, -1.2403564453125, -1.13897705078125, -1.03759765625, -0.93621826171875, -0.8348388671875, -0.73345947265625, -0.632080078125, -0.53070068359375, -0.4293212890625, -0.32794189453125, -0.2265625, -0.12518310546875, -0.0238037109375, 0.07757568359375, 0.178955078125, 0.28033447265625, 0.3817138671875, 0.48309326171875, 0.58447265625, 0.68585205078125, 0.7872314453125, 0.88861083984375, 0.989990234375, 1.09136962890625, 1.1927490234375, 1.29412841796875, 1.3955078125, 1.49688720703125, 1.5982666015625, 1.69964599609375, 1.801025390625, 1.90240478515625, 2.0037841796875, 2.10516357421875, 2.20654296875, 2.30792236328125, 2.4093017578125, 2.51068115234375, 2.612060546875, 2.71343994140625, 2.8148193359375, 2.91619873046875, 3.017578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 11.0, 9.0, 28.0, 43.0, 72.0, 146.0, 402.0, 1251.0, 6887.0, 133196.0, 875043.0, 27163.0, 3065.0, 751.0, 245.0, 100.0, 55.0, 28.0, 17.0, 15.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.8959197998046875, -0.849456787109375, -0.8029937744140625, -0.75653076171875, -0.7100677490234375, -0.663604736328125, -0.6171417236328125, -0.5706787109375, -0.5242156982421875, -0.477752685546875, -0.4312896728515625, -0.38482666015625, -0.3383636474609375, -0.291900634765625, -0.2454376220703125, -0.198974609375, -0.1525115966796875, -0.106048583984375, -0.0595855712890625, -0.01312255859375, 0.0333404541015625, 0.079803466796875, 0.1262664794921875, 0.1727294921875, 0.2191925048828125, 0.265655517578125, 0.3121185302734375, 0.35858154296875, 0.4050445556640625, 0.451507568359375, 0.4979705810546875, 0.54443359375, 0.5908966064453125, 0.637359619140625, 0.6838226318359375, 0.73028564453125, 0.7767486572265625, 0.823211669921875, 0.8696746826171875, 0.9161376953125, 0.9626007080078125, 1.009063720703125, 1.0555267333984375, 1.10198974609375, 1.1484527587890625, 1.194915771484375, 1.2413787841796875, 1.287841796875, 1.3343048095703125, 1.380767822265625, 1.4272308349609375, 1.47369384765625, 1.5201568603515625, 1.566619873046875, 1.6130828857421875, 1.6595458984375, 1.7060089111328125, 1.752471923828125, 1.7989349365234375, 1.84539794921875, 1.8918609619140625, 1.938323974609375, 1.9847869873046875, 2.03125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 14.0, 15.0, 18.0, 20.0, 33.0, 58.0, 77.0, 62.0, 94.0, 106.0, 95.0, 90.0, 57.0, 70.0, 48.0, 27.0, 17.0, 25.0, 11.0, 10.0, 8.0, 3.0, 1.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.821487426757812e-05, -8.533988147974014e-05, -8.246488869190216e-05, -7.958989590406418e-05, -7.67149031162262e-05, -7.383991032838821e-05, -7.096491754055023e-05, -6.808992475271225e-05, -6.521493196487427e-05, -6.233993917703629e-05, -5.94649463891983e-05, -5.658995360136032e-05, -5.371496081352234e-05, -5.083996802568436e-05, -4.7964975237846375e-05, -4.508998245000839e-05, -4.221498966217041e-05, -3.933999687433243e-05, -3.6465004086494446e-05, -3.3590011298656464e-05, -3.071501851081848e-05, -2.78400257229805e-05, -2.4965032935142517e-05, -2.2090040147304535e-05, -1.9215047359466553e-05, -1.634005457162857e-05, -1.3465061783790588e-05, -1.0590068995952606e-05, -7.715076208114624e-06, -4.840083420276642e-06, -1.9650906324386597e-06, 9.099021553993225e-07, 3.7848949432373047e-06, 6.659887731075287e-06, 9.534880518913269e-06, 1.2409873306751251e-05, 1.5284866094589233e-05, 1.8159858882427216e-05, 2.1034851670265198e-05, 2.390984445810318e-05, 2.6784837245941162e-05, 2.9659830033779144e-05, 3.2534822821617126e-05, 3.540981560945511e-05, 3.828480839729309e-05, 4.115980118513107e-05, 4.4034793972969055e-05, 4.690978676080704e-05, 4.978477954864502e-05, 5.2659772336483e-05, 5.5534765124320984e-05, 5.8409757912158966e-05, 6.128475069999695e-05, 6.415974348783493e-05, 6.703473627567291e-05, 6.99097290635109e-05, 7.278472185134888e-05, 7.565971463918686e-05, 7.853470742702484e-05, 8.140970021486282e-05, 8.42846930027008e-05, 8.715968579053879e-05, 9.003467857837677e-05, 9.290967136621475e-05, 9.578466415405273e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 15.0, 20.0, 44.0, 64.0, 124.0, 247.0, 838.0, 3195.0, 22855.0, 607687.0, 392667.0, 16901.0, 2595.0, 716.0, 269.0, 104.0, 69.0, 33.0, 30.0, 10.0, 12.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.508575439453125, -1.46539306640625, -1.422210693359375, -1.3790283203125, -1.335845947265625, -1.29266357421875, -1.249481201171875, -1.206298828125, -1.163116455078125, -1.11993408203125, -1.076751708984375, -1.0335693359375, -0.990386962890625, -0.94720458984375, -0.904022216796875, -0.86083984375, -0.817657470703125, -0.77447509765625, -0.731292724609375, -0.6881103515625, -0.644927978515625, -0.60174560546875, -0.558563232421875, -0.515380859375, -0.472198486328125, -0.42901611328125, -0.385833740234375, -0.3426513671875, -0.299468994140625, -0.25628662109375, -0.213104248046875, -0.169921875, -0.126739501953125, -0.08355712890625, -0.040374755859375, 0.0028076171875, 0.045989990234375, 0.08917236328125, 0.132354736328125, 0.175537109375, 0.218719482421875, 0.26190185546875, 0.305084228515625, 0.3482666015625, 0.391448974609375, 0.43463134765625, 0.477813720703125, 0.52099609375, 0.564178466796875, 0.60736083984375, 0.650543212890625, 0.6937255859375, 0.736907958984375, 0.78009033203125, 0.823272705078125, 0.866455078125, 0.909637451171875, 0.95281982421875, 0.996002197265625, 1.0391845703125, 1.082366943359375, 1.12554931640625, 1.168731689453125, 1.2119140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 21.0, 28.0, 26.0, 54.0, 76.0, 98.0, 117.0, 96.0, 131.0, 91.0, 80.0, 42.0, 34.0, 27.0, 17.0, 14.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.41259765625, -0.4003028869628906, -0.38800811767578125, -0.3757133483886719, -0.3634185791015625, -0.3511238098144531, -0.33882904052734375, -0.3265342712402344, -0.314239501953125, -0.3019447326660156, -0.28964996337890625, -0.2773551940917969, -0.2650604248046875, -0.2527656555175781, -0.24047088623046875, -0.22817611694335938, -0.21588134765625, -0.20358657836914062, -0.19129180908203125, -0.17899703979492188, -0.1667022705078125, -0.15440750122070312, -0.14211273193359375, -0.12981796264648438, -0.117523193359375, -0.10522842407226562, -0.09293365478515625, -0.08063888549804688, -0.0683441162109375, -0.056049346923828125, -0.04375457763671875, -0.031459808349609375, -0.0191650390625, -0.006870269775390625, 0.00542449951171875, 0.017719268798828125, 0.0300140380859375, 0.042308807373046875, 0.05460357666015625, 0.06689834594726562, 0.079193115234375, 0.09148788452148438, 0.10378265380859375, 0.11607742309570312, 0.1283721923828125, 0.14066696166992188, 0.15296173095703125, 0.16525650024414062, 0.17755126953125, 0.18984603881835938, 0.20214080810546875, 0.21443557739257812, 0.2267303466796875, 0.23902511596679688, 0.25131988525390625, 0.2636146545410156, 0.275909423828125, 0.2882041931152344, 0.30049896240234375, 0.3127937316894531, 0.3250885009765625, 0.3373832702636719, 0.34967803955078125, 0.3619728088378906, 0.374267578125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 14.0, 10.0, 39.0, 53.0, 77.0, 146.0, 208.0, 168.0, 122.0, 65.0, 32.0, 27.0, 13.0, 11.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4694671630859375, -6.219242095947266, -5.969017028808594, -5.718791961669922, -5.46856689453125, -5.218341827392578, -4.968116283416748, -4.717891216278076, -4.467666149139404, -4.217441082000732, -3.9672160148620605, -3.7169907093048096, -3.4667656421661377, -3.216540575027466, -2.966315269470215, -2.716090202331543, -2.465865135192871, -2.215640068054199, -1.9654148817062378, -1.7151896953582764, -1.4649646282196045, -1.2147395610809326, -0.9645143747329712, -0.7142891883850098, -0.4640641212463379, -0.21383899450302124, 0.03638613224029541, 0.28661125898361206, 0.5368363857269287, 0.7870614528656006, 1.037286639213562, 1.2875118255615234, 1.537735939025879, 1.7879610061645508, 2.0381860733032227, 2.2884113788604736, 2.5386364459991455, 2.7888615131378174, 3.0390868186950684, 3.2893118858337402, 3.539536952972412, 3.789762020111084, 4.039987087249756, 4.290212154388428, 4.540437698364258, 4.79066276550293, 5.040887832641602, 5.291112899780273, 5.541337966918945, 5.791563034057617, 6.041788101196289, 6.292013168334961, 6.542238235473633, 6.792463302612305, 7.042688846588135, 7.292913913726807, 7.5431389808654785, 7.79336404800415, 8.04358959197998, 8.293814659118652, 8.544039726257324, 8.794264793395996, 9.044489860534668, 9.29471492767334, 9.544939994812012]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 7.0, 4.0, 15.0, 12.0, 11.0, 12.0, 18.0, 23.0, 22.0, 29.0, 26.0, 31.0, 37.0, 30.0, 45.0, 34.0, 44.0, 44.0, 46.0, 36.0, 43.0, 49.0, 42.0, 37.0, 35.0, 35.0, 39.0, 26.0, 31.0, 21.0, 21.0, 16.0, 13.0, 13.0, 18.0, 5.0, 6.0, 5.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.964559555053711, -4.807905197143555, -4.651251316070557, -4.4945969581604, -4.337943077087402, -4.181288719177246, -4.024634838104248, -3.867980480194092, -3.7113263607025146, -3.5546722412109375, -3.3980181217193604, -3.241364002227783, -3.084709644317627, -2.928055763244629, -2.7714014053344727, -2.6147472858428955, -2.4580931663513184, -2.301439046859741, -2.144784927368164, -1.9881306886672974, -1.8314765691757202, -1.674822449684143, -1.5181682109832764, -1.3615140914916992, -1.204859972000122, -1.048205852508545, -0.891551673412323, -0.7348974943161011, -0.5782433748245239, -0.4215892553329468, -0.26493507623672485, -0.10828089714050293, 0.04837322235107422, 0.20502737164497375, 0.3616815209388733, 0.5183357000350952, 0.6749898195266724, 0.8316439390182495, 0.9882981181144714, 1.1449522972106934, 1.3016064167022705, 1.4582605361938477, 1.6149146556854248, 1.7715688943862915, 1.9282230138778687, 2.0848770141601562, 2.2415313720703125, 2.3981854915618896, 2.554839611053467, 2.711493730545044, 2.868147850036621, 3.0248019695281982, 3.1814560890197754, 3.3381104469299316, 3.494764566421509, 3.651418685913086, 3.808072805404663, 3.9647269248962402, 4.1213812828063965, 4.2780351638793945, 4.434689521789551, 4.591343402862549, 4.747997760772705, 4.904651641845703, 5.061305999755859]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 14.0, 18.0, 21.0, 16.0, 47.0, 53.0, 71.0, 139.0, 197.0, 371.0, 566.0, 1190.0, 2626.0, 7066.0, 33444.0, 688273.0, 3215887.0, 216516.0, 19184.0, 4644.0, 1862.0, 883.0, 440.0, 247.0, 166.0, 111.0, 69.0, 43.0, 33.0, 21.0, 14.0, 8.0, 9.0, 8.0, 2.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87188720703125, -3.7398681640625, -3.60784912109375, -3.475830078125, -3.34381103515625, -3.2117919921875, -3.07977294921875, -2.94775390625, -2.81573486328125, -2.6837158203125, -2.55169677734375, -2.419677734375, -2.28765869140625, -2.1556396484375, -2.02362060546875, -1.8916015625, -1.75958251953125, -1.6275634765625, -1.49554443359375, -1.363525390625, -1.23150634765625, -1.0994873046875, -0.96746826171875, -0.83544921875, -0.70343017578125, -0.5714111328125, -0.43939208984375, -0.307373046875, -0.17535400390625, -0.0433349609375, 0.08868408203125, 0.220703125, 0.35272216796875, 0.4847412109375, 0.61676025390625, 0.748779296875, 0.88079833984375, 1.0128173828125, 1.14483642578125, 1.27685546875, 1.40887451171875, 1.5408935546875, 1.67291259765625, 1.804931640625, 1.93695068359375, 2.0689697265625, 2.20098876953125, 2.3330078125, 2.46502685546875, 2.5970458984375, 2.72906494140625, 2.861083984375, 2.99310302734375, 3.1251220703125, 3.25714111328125, 3.38916015625, 3.52117919921875, 3.6531982421875, 3.78521728515625, 3.917236328125, 4.04925537109375, 4.1812744140625, 4.31329345703125, 4.4453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 5.0, 8.0, 9.0, 11.0, 13.0, 12.0, 15.0, 18.0, 35.0, 31.0, 34.0, 39.0, 55.0, 44.0, 55.0, 55.0, 61.0, 62.0, 56.0, 50.0, 51.0, 49.0, 36.0, 37.0, 37.0, 26.0, 15.0, 16.0, 16.0, 12.0, 14.0, 2.0, 6.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.3637847900390625, -2.295928955078125, -2.2280731201171875, -2.16021728515625, -2.0923614501953125, -2.024505615234375, -1.9566497802734375, -1.8887939453125, -1.8209381103515625, -1.753082275390625, -1.6852264404296875, -1.61737060546875, -1.5495147705078125, -1.481658935546875, -1.4138031005859375, -1.345947265625, -1.2780914306640625, -1.210235595703125, -1.1423797607421875, -1.07452392578125, -1.0066680908203125, -0.938812255859375, -0.8709564208984375, -0.8031005859375, -0.7352447509765625, -0.667388916015625, -0.5995330810546875, -0.53167724609375, -0.4638214111328125, -0.395965576171875, -0.3281097412109375, -0.26025390625, -0.1923980712890625, -0.124542236328125, -0.0566864013671875, 0.01116943359375, 0.0790252685546875, 0.146881103515625, 0.2147369384765625, 0.2825927734375, 0.3504486083984375, 0.418304443359375, 0.4861602783203125, 0.55401611328125, 0.6218719482421875, 0.689727783203125, 0.7575836181640625, 0.825439453125, 0.8932952880859375, 0.961151123046875, 1.0290069580078125, 1.09686279296875, 1.1647186279296875, 1.232574462890625, 1.3004302978515625, 1.3682861328125, 1.4361419677734375, 1.503997802734375, 1.5718536376953125, 1.63970947265625, 1.7075653076171875, 1.775421142578125, 1.8432769775390625, 1.9111328125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 32.0, 22.0, 38.0, 50.0, 93.0, 162.0, 444.0, 1210.0, 4801.0, 32389.0, 2231363.0, 1887254.0, 30040.0, 4418.0, 1123.0, 409.0, 171.0, 76.0, 43.0, 27.0, 24.0, 6.0, 8.0, 5.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.55859375, -5.39971923828125, -5.2408447265625, -5.08197021484375, -4.923095703125, -4.76422119140625, -4.6053466796875, -4.44647216796875, -4.28759765625, -4.12872314453125, -3.9698486328125, -3.81097412109375, -3.652099609375, -3.49322509765625, -3.3343505859375, -3.17547607421875, -3.0166015625, -2.85772705078125, -2.6988525390625, -2.53997802734375, -2.381103515625, -2.22222900390625, -2.0633544921875, -1.90447998046875, -1.74560546875, -1.58673095703125, -1.4278564453125, -1.26898193359375, -1.110107421875, -0.95123291015625, -0.7923583984375, -0.63348388671875, -0.474609375, -0.31573486328125, -0.1568603515625, 0.00201416015625, 0.160888671875, 0.31976318359375, 0.4786376953125, 0.63751220703125, 0.79638671875, 0.95526123046875, 1.1141357421875, 1.27301025390625, 1.431884765625, 1.59075927734375, 1.7496337890625, 1.90850830078125, 2.0673828125, 2.22625732421875, 2.3851318359375, 2.54400634765625, 2.702880859375, 2.86175537109375, 3.0206298828125, 3.17950439453125, 3.33837890625, 3.49725341796875, 3.6561279296875, 3.81500244140625, 3.973876953125, 4.13275146484375, 4.2916259765625, 4.45050048828125, 4.609375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 10.0, 10.0, 10.0, 19.0, 18.0, 22.0, 36.0, 54.0, 92.0, 155.0, 243.0, 415.0, 666.0, 781.0, 531.0, 410.0, 172.0, 126.0, 73.0, 45.0, 46.0, 30.0, 24.0, 24.0, 15.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.677734375, -0.6519393920898438, -0.6261444091796875, -0.6003494262695312, -0.574554443359375, -0.5487594604492188, -0.5229644775390625, -0.49716949462890625, -0.47137451171875, -0.44557952880859375, -0.4197845458984375, -0.39398956298828125, -0.368194580078125, -0.34239959716796875, -0.3166046142578125, -0.29080963134765625, -0.2650146484375, -0.23921966552734375, -0.2134246826171875, -0.18762969970703125, -0.161834716796875, -0.13603973388671875, -0.1102447509765625, -0.08444976806640625, -0.05865478515625, -0.03285980224609375, -0.0070648193359375, 0.01873016357421875, 0.044525146484375, 0.07032012939453125, 0.0961151123046875, 0.12191009521484375, 0.147705078125, 0.17350006103515625, 0.1992950439453125, 0.22509002685546875, 0.250885009765625, 0.27667999267578125, 0.3024749755859375, 0.32826995849609375, 0.35406494140625, 0.37985992431640625, 0.4056549072265625, 0.43144989013671875, 0.457244873046875, 0.48303985595703125, 0.5088348388671875, 0.5346298217773438, 0.5604248046875, 0.5862197875976562, 0.6120147705078125, 0.6378097534179688, 0.663604736328125, 0.6893997192382812, 0.7151947021484375, 0.7409896850585938, 0.76678466796875, 0.7925796508789062, 0.8183746337890625, 0.8441696166992188, 0.869964599609375, 0.8957595825195312, 0.9215545654296875, 0.9473495483398438, 0.97314453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 12.0, 8.0, 8.0, 11.0, 21.0, 45.0, 70.0, 87.0, 139.0, 135.0, 122.0, 98.0, 72.0, 56.0, 31.0, 34.0, 17.0, 15.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0], "bins": [-6.173605442047119, -6.041611671447754, -5.909617900848389, -5.777623653411865, -5.6456298828125, -5.513636112213135, -5.3816423416137695, -5.249648571014404, -5.117654800415039, -4.985661029815674, -4.853667259216309, -4.721673011779785, -4.58967924118042, -4.457685470581055, -4.3256916999816895, -4.193697929382324, -4.061703681945801, -3.9297099113464355, -3.797715902328491, -3.665722131729126, -3.5337281227111816, -3.4017343521118164, -3.269740581512451, -3.137746810913086, -3.0057528018951416, -2.8737590312957764, -2.741765022277832, -2.609771251678467, -2.4777774810791016, -2.3457834720611572, -2.213789701461792, -2.0817956924438477, -1.9498019218444824, -1.8178080320358276, -1.6858141422271729, -1.5538203716278076, -1.4218264818191528, -1.289832592010498, -1.1578388214111328, -1.025844931602478, -0.8938510417938232, -0.7618571519851685, -0.6298633217811584, -0.49786946177482605, -0.36587560176849365, -0.23388171195983887, -0.10188788175582886, 0.030105948448181152, 0.16209983825683594, 0.29409369826316833, 0.42608755826950073, 0.5580813884735107, 0.6900752782821655, 0.8220691680908203, 0.9540629982948303, 1.0860568284988403, 1.2180507183074951, 1.35004460811615, 1.4820384979248047, 1.61403226852417, 1.7460261583328247, 1.8780200481414795, 2.0100138187408447, 2.142007827758789, 2.2740015983581543]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 7.0, 4.0, 9.0, 9.0, 14.0, 12.0, 12.0, 19.0, 28.0, 23.0, 38.0, 43.0, 38.0, 45.0, 53.0, 53.0, 47.0, 43.0, 49.0, 57.0, 61.0, 41.0, 40.0, 29.0, 40.0, 38.0, 35.0, 22.0, 24.0, 11.0, 10.0, 11.0, 8.0, 8.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.113801956176758, -2.0458667278289795, -1.9779313802719116, -1.9099961519241333, -1.8420608043670654, -1.774125576019287, -1.7061903476715088, -1.6382551193237305, -1.5703197717666626, -1.5023845434188843, -1.4344491958618164, -1.366513967514038, -1.2985787391662598, -1.230643391609192, -1.1627081632614136, -1.0947728157043457, -1.0268375873565674, -0.9589022994041443, -0.8909670114517212, -0.8230317831039429, -0.7550964951515198, -0.6871612071990967, -0.6192259788513184, -0.5512906908988953, -0.48335540294647217, -0.4154201149940491, -0.34748485684394836, -0.27954959869384766, -0.21161431074142456, -0.14367902278900146, -0.07574376463890076, -0.007808506488800049, 0.06012701988220215, 0.12806229293346405, 0.19599756598472595, 0.26393282413482666, 0.33186811208724976, 0.39980340003967285, 0.46773865818977356, 0.5356739163398743, 0.6036092042922974, 0.6715444922447205, 0.7394797801971436, 0.8074150085449219, 0.875350296497345, 0.9432855844497681, 1.0112208127975464, 1.0791561603546143, 1.1470913887023926, 1.215026617050171, 1.2829619646072388, 1.350897192955017, 1.418832540512085, 1.4867677688598633, 1.5547029972076416, 1.62263822555542, 1.6905735731124878, 1.7585088014602661, 1.826444149017334, 1.8943793773651123, 1.9623146057128906, 2.030250072479248, 2.0981853008270264, 2.1661205291748047, 2.234055757522583]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 5.0, 15.0, 37.0, 77.0, 154.0, 507.0, 1654.0, 5493.0, 32664.0, 639243.0, 343442.0, 19281.0, 4065.0, 1242.0, 383.0, 143.0, 59.0, 32.0, 9.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.085968017578125, -1.04400634765625, -1.002044677734375, -0.9600830078125, -0.918121337890625, -0.87615966796875, -0.834197998046875, -0.792236328125, -0.750274658203125, -0.70831298828125, -0.666351318359375, -0.6243896484375, -0.582427978515625, -0.54046630859375, -0.498504638671875, -0.45654296875, -0.414581298828125, -0.37261962890625, -0.330657958984375, -0.2886962890625, -0.246734619140625, -0.20477294921875, -0.162811279296875, -0.120849609375, -0.078887939453125, -0.03692626953125, 0.005035400390625, 0.0469970703125, 0.088958740234375, 0.13092041015625, 0.172882080078125, 0.21484375, 0.256805419921875, 0.29876708984375, 0.340728759765625, 0.3826904296875, 0.424652099609375, 0.46661376953125, 0.508575439453125, 0.550537109375, 0.592498779296875, 0.63446044921875, 0.676422119140625, 0.7183837890625, 0.760345458984375, 0.80230712890625, 0.844268798828125, 0.88623046875, 0.928192138671875, 0.97015380859375, 1.012115478515625, 1.0540771484375, 1.096038818359375, 1.13800048828125, 1.179962158203125, 1.221923828125, 1.263885498046875, 1.30584716796875, 1.347808837890625, 1.3897705078125, 1.431732177734375, 1.47369384765625, 1.515655517578125, 1.5576171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 8.0, 8.0, 13.0, 21.0, 21.0, 20.0, 22.0, 45.0, 53.0, 67.0, 64.0, 64.0, 81.0, 69.0, 60.0, 80.0, 56.0, 61.0, 47.0, 34.0, 27.0, 25.0, 15.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.9755859375, -1.912109375, -1.8486328125, -1.78515625, -1.7216796875, -1.658203125, -1.5947265625, -1.53125, -1.4677734375, -1.404296875, -1.3408203125, -1.27734375, -1.2138671875, -1.150390625, -1.0869140625, -1.0234375, -0.9599609375, -0.896484375, -0.8330078125, -0.76953125, -0.7060546875, -0.642578125, -0.5791015625, -0.515625, -0.4521484375, -0.388671875, -0.3251953125, -0.26171875, -0.1982421875, -0.134765625, -0.0712890625, -0.0078125, 0.0556640625, 0.119140625, 0.1826171875, 0.24609375, 0.3095703125, 0.373046875, 0.4365234375, 0.5, 0.5634765625, 0.626953125, 0.6904296875, 0.75390625, 0.8173828125, 0.880859375, 0.9443359375, 1.0078125, 1.0712890625, 1.134765625, 1.1982421875, 1.26171875, 1.3251953125, 1.388671875, 1.4521484375, 1.515625, 1.5791015625, 1.642578125, 1.7060546875, 1.76953125, 1.8330078125, 1.896484375, 1.9599609375, 2.0234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 4.0, 4.0, 8.0, 6.0, 14.0, 19.0, 43.0, 73.0, 104.0, 213.0, 431.0, 870.0, 2188.0, 6428.0, 26575.0, 189160.0, 635188.0, 154636.0, 22976.0, 5863.0, 1984.0, 847.0, 393.0, 203.0, 120.0, 59.0, 32.0, 24.0, 13.0, 21.0, 7.0, 4.0, 6.0, 6.0, 3.0, 9.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.79833984375, -0.7751693725585938, -0.7519989013671875, -0.7288284301757812, -0.705657958984375, -0.6824874877929688, -0.6593170166015625, -0.6361465454101562, -0.61297607421875, -0.5898056030273438, -0.5666351318359375, -0.5434646606445312, -0.520294189453125, -0.49712371826171875, -0.4739532470703125, -0.45078277587890625, -0.4276123046875, -0.40444183349609375, -0.3812713623046875, -0.35810089111328125, -0.334930419921875, -0.31175994873046875, -0.2885894775390625, -0.26541900634765625, -0.24224853515625, -0.21907806396484375, -0.1959075927734375, -0.17273712158203125, -0.149566650390625, -0.12639617919921875, -0.1032257080078125, -0.08005523681640625, -0.056884765625, -0.03371429443359375, -0.0105438232421875, 0.01262664794921875, 0.035797119140625, 0.05896759033203125, 0.0821380615234375, 0.10530853271484375, 0.12847900390625, 0.15164947509765625, 0.1748199462890625, 0.19799041748046875, 0.221160888671875, 0.24433135986328125, 0.2675018310546875, 0.29067230224609375, 0.3138427734375, 0.33701324462890625, 0.3601837158203125, 0.38335418701171875, 0.406524658203125, 0.42969512939453125, 0.4528656005859375, 0.47603607177734375, 0.49920654296875, 0.5223770141601562, 0.5455474853515625, 0.5687179565429688, 0.591888427734375, 0.6150588989257812, 0.6382293701171875, 0.6613998413085938, 0.6845703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 8.0, 13.0, 10.0, 13.0, 12.0, 19.0, 24.0, 20.0, 24.0, 37.0, 35.0, 38.0, 42.0, 57.0, 46.0, 55.0, 55.0, 49.0, 45.0, 46.0, 51.0, 33.0, 44.0, 39.0, 29.0, 32.0, 24.0, 16.0, 15.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.265625, -3.171539306640625, -3.07745361328125, -2.983367919921875, -2.8892822265625, -2.795196533203125, -2.70111083984375, -2.607025146484375, -2.512939453125, -2.418853759765625, -2.32476806640625, -2.230682373046875, -2.1365966796875, -2.042510986328125, -1.94842529296875, -1.854339599609375, -1.76025390625, -1.666168212890625, -1.57208251953125, -1.477996826171875, -1.3839111328125, -1.289825439453125, -1.19573974609375, -1.101654052734375, -1.007568359375, -0.913482666015625, -0.81939697265625, -0.725311279296875, -0.6312255859375, -0.537139892578125, -0.44305419921875, -0.348968505859375, -0.2548828125, -0.160797119140625, -0.06671142578125, 0.027374267578125, 0.1214599609375, 0.215545654296875, 0.30963134765625, 0.403717041015625, 0.497802734375, 0.591888427734375, 0.68597412109375, 0.780059814453125, 0.8741455078125, 0.968231201171875, 1.06231689453125, 1.156402587890625, 1.25048828125, 1.344573974609375, 1.43865966796875, 1.532745361328125, 1.6268310546875, 1.720916748046875, 1.81500244140625, 1.909088134765625, 2.003173828125, 2.097259521484375, 2.19134521484375, 2.285430908203125, 2.3795166015625, 2.473602294921875, 2.56768798828125, 2.661773681640625, 2.755859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 9.0, 12.0, 7.0, 21.0, 22.0, 37.0, 62.0, 77.0, 114.0, 186.0, 320.0, 564.0, 1117.0, 2309.0, 4963.0, 13112.0, 45818.0, 243828.0, 535264.0, 152204.0, 30653.0, 9774.0, 3948.0, 1870.0, 953.0, 517.0, 288.0, 162.0, 101.0, 67.0, 47.0, 32.0, 21.0, 28.0, 13.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1739501953125, -0.16840362548828125, -0.1628570556640625, -0.15731048583984375, -0.151763916015625, -0.14621734619140625, -0.1406707763671875, -0.13512420654296875, -0.12957763671875, -0.12403106689453125, -0.1184844970703125, -0.11293792724609375, -0.107391357421875, -0.10184478759765625, -0.0962982177734375, -0.09075164794921875, -0.085205078125, -0.07965850830078125, -0.0741119384765625, -0.06856536865234375, -0.063018798828125, -0.05747222900390625, -0.0519256591796875, -0.04637908935546875, -0.04083251953125, -0.03528594970703125, -0.0297393798828125, -0.02419281005859375, -0.018646240234375, -0.01309967041015625, -0.0075531005859375, -0.00200653076171875, 0.0035400390625, 0.00908660888671875, 0.0146331787109375, 0.02017974853515625, 0.025726318359375, 0.03127288818359375, 0.0368194580078125, 0.04236602783203125, 0.04791259765625, 0.05345916748046875, 0.0590057373046875, 0.06455230712890625, 0.070098876953125, 0.07564544677734375, 0.0811920166015625, 0.08673858642578125, 0.09228515625, 0.09783172607421875, 0.1033782958984375, 0.10892486572265625, 0.114471435546875, 0.12001800537109375, 0.1255645751953125, 0.13111114501953125, 0.13665771484375, 0.14220428466796875, 0.1477508544921875, 0.15329742431640625, 0.158843994140625, 0.16439056396484375, 0.1699371337890625, 0.17548370361328125, 0.1810302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 10.0, 0.0, 3.0, 13.0, 13.0, 10.0, 15.0, 21.0, 42.0, 72.0, 91.0, 105.0, 125.0, 127.0, 95.0, 79.0, 55.0, 38.0, 28.0, 17.0, 14.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00011205673217773438, -0.00010787695646286011, -0.00010369718074798584, -9.951740503311157e-05, -9.53376293182373e-05, -9.115785360336304e-05, -8.697807788848877e-05, -8.27983021736145e-05, -7.861852645874023e-05, -7.443875074386597e-05, -7.02589750289917e-05, -6.607919931411743e-05, -6.189942359924316e-05, -5.7719647884368896e-05, -5.353987216949463e-05, -4.936009645462036e-05, -4.5180320739746094e-05, -4.1000545024871826e-05, -3.682076930999756e-05, -3.264099359512329e-05, -2.8461217880249023e-05, -2.4281442165374756e-05, -2.0101666450500488e-05, -1.592189073562622e-05, -1.1742115020751953e-05, -7.5623393058776855e-06, -3.382563591003418e-06, 7.972121238708496e-07, 4.976987838745117e-06, 9.156763553619385e-06, 1.3336539268493652e-05, 1.751631498336792e-05, 2.1696090698242188e-05, 2.5875866413116455e-05, 3.0055642127990723e-05, 3.423541784286499e-05, 3.841519355773926e-05, 4.2594969272613525e-05, 4.677474498748779e-05, 5.095452070236206e-05, 5.513429641723633e-05, 5.9314072132110596e-05, 6.349384784698486e-05, 6.767362356185913e-05, 7.18533992767334e-05, 7.603317499160767e-05, 8.021295070648193e-05, 8.43927264213562e-05, 8.857250213623047e-05, 9.275227785110474e-05, 9.6932053565979e-05, 0.00010111182928085327, 0.00010529160499572754, 0.0001094713807106018, 0.00011365115642547607, 0.00011783093214035034, 0.00012201070785522461, 0.00012619048357009888, 0.00013037025928497314, 0.0001345500349998474, 0.00013872981071472168, 0.00014290958642959595, 0.00014708936214447021, 0.00015126913785934448, 0.00015544891357421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 11.0, 19.0, 23.0, 38.0, 60.0, 95.0, 179.0, 333.0, 667.0, 1347.0, 3083.0, 9314.0, 38101.0, 239151.0, 570649.0, 148483.0, 25279.0, 6770.0, 2510.0, 1101.0, 557.0, 304.0, 174.0, 92.0, 54.0, 50.0, 21.0, 24.0, 12.0, 9.0, 14.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2291259765625, -0.22299575805664062, -0.21686553955078125, -0.21073532104492188, -0.2046051025390625, -0.19847488403320312, -0.19234466552734375, -0.18621444702148438, -0.180084228515625, -0.17395401000976562, -0.16782379150390625, -0.16169357299804688, -0.1555633544921875, -0.14943313598632812, -0.14330291748046875, -0.13717269897460938, -0.13104248046875, -0.12491226196289062, -0.11878204345703125, -0.11265182495117188, -0.1065216064453125, -0.10039138793945312, -0.09426116943359375, -0.08813095092773438, -0.082000732421875, -0.07587051391601562, -0.06974029541015625, -0.06361007690429688, -0.0574798583984375, -0.051349639892578125, -0.04521942138671875, -0.039089202880859375, -0.032958984375, -0.026828765869140625, -0.02069854736328125, -0.014568328857421875, -0.0084381103515625, -0.002307891845703125, 0.00382232666015625, 0.009952545166015625, 0.016082763671875, 0.022212982177734375, 0.02834320068359375, 0.034473419189453125, 0.0406036376953125, 0.046733856201171875, 0.05286407470703125, 0.058994293212890625, 0.06512451171875, 0.07125473022460938, 0.07738494873046875, 0.08351516723632812, 0.0896453857421875, 0.09577560424804688, 0.10190582275390625, 0.10803604125976562, 0.114166259765625, 0.12029647827148438, 0.12642669677734375, 0.13255691528320312, 0.1386871337890625, 0.14481735229492188, 0.15094757080078125, 0.15707778930664062, 0.1632080078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 19.0, 12.0, 25.0, 29.0, 33.0, 49.0, 65.0, 71.0, 102.0, 92.0, 117.0, 88.0, 94.0, 62.0, 39.0, 28.0, 14.0, 6.0, 9.0, 8.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04456472396850586, -0.04277324676513672, -0.04098176956176758, -0.03919029235839844, -0.0373988151550293, -0.035607337951660156, -0.033815860748291016, -0.032024383544921875, -0.030232906341552734, -0.028441429138183594, -0.026649951934814453, -0.024858474731445312, -0.023066997528076172, -0.02127552032470703, -0.01948404312133789, -0.01769256591796875, -0.01590108871459961, -0.014109611511230469, -0.012318134307861328, -0.010526657104492188, -0.008735179901123047, -0.006943702697753906, -0.005152225494384766, -0.003360748291015625, -0.0015692710876464844, 0.00022220611572265625, 0.002013683319091797, 0.0038051605224609375, 0.005596637725830078, 0.007388114929199219, 0.00917959213256836, 0.0109710693359375, 0.01276254653930664, 0.014554023742675781, 0.016345500946044922, 0.018136978149414062, 0.019928455352783203, 0.021719932556152344, 0.023511409759521484, 0.025302886962890625, 0.027094364166259766, 0.028885841369628906, 0.030677318572998047, 0.03246879577636719, 0.03426027297973633, 0.03605175018310547, 0.03784322738647461, 0.03963470458984375, 0.04142618179321289, 0.04321765899658203, 0.04500913619995117, 0.04680061340332031, 0.04859209060668945, 0.050383567810058594, 0.052175045013427734, 0.053966522216796875, 0.055757999420166016, 0.057549476623535156, 0.0593409538269043, 0.06113243103027344, 0.06292390823364258, 0.06471538543701172, 0.06650686264038086, 0.06829833984375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 19.0, 22.0, 138.0, 360.0, 312.0, 94.0, 45.0, 9.0, 3.0, 6.0, 4.0, 2.0], "bins": [-13.570354461669922, -13.327719688415527, -13.08508586883545, -12.842451095581055, -12.59981632232666, -12.357182502746582, -12.114547729492188, -11.871912956237793, -11.629279136657715, -11.38664436340332, -11.144010543823242, -10.901375770568848, -10.658740997314453, -10.416107177734375, -10.17347240447998, -9.930837631225586, -9.688203811645508, -9.445569038391113, -9.202935218811035, -8.96030044555664, -8.717665672302246, -8.475031852722168, -8.232397079467773, -7.989762783050537, -7.747127532958984, -7.504493236541748, -7.2618584632873535, -7.019224166870117, -6.776589870452881, -6.5339555740356445, -6.29132080078125, -6.048686504364014, -5.8060526847839355, -5.563418388366699, -5.320783615112305, -5.078149318695068, -4.835515022277832, -4.5928802490234375, -4.350245952606201, -4.107611656188965, -3.8649768829345703, -3.622342348098755, -3.3797080516815186, -3.137073516845703, -2.894439220428467, -2.6518046855926514, -2.409170150756836, -2.1665358543395996, -1.9239014387130737, -1.6812670230865479, -1.4386324882507324, -1.1959980726242065, -0.9533636569976807, -0.7107292413711548, -0.46809470653533936, -0.22546029090881348, 0.017174124717712402, 0.25980857014656067, 0.5024430155754089, 0.7450774908065796, 0.9877119064331055, 1.2303463220596313, 1.4729808568954468, 1.7156152725219727, 1.9582496881484985]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 16.0, 9.0, 13.0, 15.0, 18.0, 32.0, 32.0, 38.0, 64.0, 46.0, 64.0, 63.0, 63.0, 55.0, 72.0, 65.0, 53.0, 52.0, 39.0, 38.0, 33.0, 34.0, 22.0, 13.0, 12.0, 8.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6528923511505127, -1.597794771194458, -1.5426971912384033, -1.4875996112823486, -1.4325021505355835, -1.3774045705795288, -1.3223069906234741, -1.2672094106674194, -1.2121119499206543, -1.1570143699645996, -1.101916790008545, -1.0468192100524902, -0.9917217493057251, -0.9366241693496704, -0.8815265893936157, -0.826429009437561, -0.7713314294815063, -0.7162338495254517, -0.6611363291740417, -0.6060387492179871, -0.5509412288665771, -0.49584364891052246, -0.4407460689544678, -0.3856485188007355, -0.3305509686470032, -0.2754534184932709, -0.22035585343837738, -0.1652582883834839, -0.11016073822975159, -0.05506318807601929, 3.439188003540039e-05, 0.0551319420337677, 0.11022937297821045, 0.16532692313194275, 0.22042448818683624, 0.27552205324172974, 0.33061960339546204, 0.38571715354919434, 0.440814733505249, 0.4959122836589813, 0.5510098338127136, 0.6061074137687683, 0.6612049341201782, 0.7163025140762329, 0.7714000940322876, 0.8264976143836975, 0.8815951943397522, 0.9366927146911621, 0.9917902946472168, 1.0468878746032715, 1.1019854545593262, 1.1570830345153809, 1.212180495262146, 1.2672780752182007, 1.3223756551742554, 1.37747323513031, 1.4325706958770752, 1.4876682758331299, 1.5427658557891846, 1.5978634357452393, 1.6529608964920044, 1.708058476448059, 1.7631560564041138, 1.8182536363601685, 1.8733512163162231]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 9.0, 4.0, 11.0, 3.0, 7.0, 19.0, 29.0, 93.0, 171.0, 528.0, 2241.0, 10988.0, 103601.0, 865497.0, 55416.0, 7573.0, 1672.0, 427.0, 134.0, 53.0, 25.0, 11.0, 10.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.85546875, -4.725616455078125, -4.59576416015625, -4.465911865234375, -4.3360595703125, -4.206207275390625, -4.07635498046875, -3.946502685546875, -3.816650390625, -3.686798095703125, -3.55694580078125, -3.427093505859375, -3.2972412109375, -3.167388916015625, -3.03753662109375, -2.907684326171875, -2.77783203125, -2.647979736328125, -2.51812744140625, -2.388275146484375, -2.2584228515625, -2.128570556640625, -1.99871826171875, -1.868865966796875, -1.739013671875, -1.609161376953125, -1.47930908203125, -1.349456787109375, -1.2196044921875, -1.089752197265625, -0.95989990234375, -0.830047607421875, -0.7001953125, -0.570343017578125, -0.44049072265625, -0.310638427734375, -0.1807861328125, -0.050933837890625, 0.07891845703125, 0.208770751953125, 0.338623046875, 0.468475341796875, 0.59832763671875, 0.728179931640625, 0.8580322265625, 0.987884521484375, 1.11773681640625, 1.247589111328125, 1.37744140625, 1.507293701171875, 1.63714599609375, 1.766998291015625, 1.8968505859375, 2.026702880859375, 2.15655517578125, 2.286407470703125, 2.416259765625, 2.546112060546875, 2.67596435546875, 2.805816650390625, 2.9356689453125, 3.065521240234375, 3.19537353515625, 3.325225830078125, 3.455078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 22.0, 34.0, 45.0, 66.0, 84.0, 110.0, 125.0, 120.0, 107.0, 76.0, 73.0, 45.0, 36.0, 26.0, 10.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.816009521484375, -2.61444091796875, -2.412872314453125, -2.2113037109375, -2.009735107421875, -1.80816650390625, -1.606597900390625, -1.405029296875, -1.203460693359375, -1.00189208984375, -0.800323486328125, -0.5987548828125, -0.397186279296875, -0.19561767578125, 0.005950927734375, 0.20751953125, 0.409088134765625, 0.61065673828125, 0.812225341796875, 1.0137939453125, 1.215362548828125, 1.41693115234375, 1.618499755859375, 1.820068359375, 2.021636962890625, 2.22320556640625, 2.424774169921875, 2.6263427734375, 2.827911376953125, 3.02947998046875, 3.231048583984375, 3.4326171875, 3.634185791015625, 3.83575439453125, 4.037322998046875, 4.2388916015625, 4.440460205078125, 4.64202880859375, 4.843597412109375, 5.045166015625, 5.246734619140625, 5.44830322265625, 5.649871826171875, 5.8514404296875, 6.053009033203125, 6.25457763671875, 6.456146240234375, 6.65771484375, 6.859283447265625, 7.06085205078125, 7.262420654296875, 7.4639892578125, 7.665557861328125, 7.86712646484375, 8.068695068359375, 8.270263671875, 8.471832275390625, 8.67340087890625, 8.874969482421875, 9.0765380859375, 9.278106689453125, 9.47967529296875, 9.681243896484375, 9.8828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 7.0, 6.0, 9.0, 11.0, 24.0, 35.0, 41.0, 61.0, 105.0, 213.0, 622.0, 2541.0, 25203.0, 928669.0, 84492.0, 4918.0, 962.0, 289.0, 133.0, 65.0, 45.0, 23.0, 21.0, 9.0, 10.0, 8.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4140625, -5.2532958984375, -5.092529296875, -4.9317626953125, -4.77099609375, -4.6102294921875, -4.449462890625, -4.2886962890625, -4.1279296875, -3.9671630859375, -3.806396484375, -3.6456298828125, -3.48486328125, -3.3240966796875, -3.163330078125, -3.0025634765625, -2.841796875, -2.6810302734375, -2.520263671875, -2.3594970703125, -2.19873046875, -2.0379638671875, -1.877197265625, -1.7164306640625, -1.5556640625, -1.3948974609375, -1.234130859375, -1.0733642578125, -0.91259765625, -0.7518310546875, -0.591064453125, -0.4302978515625, -0.26953125, -0.1087646484375, 0.052001953125, 0.2127685546875, 0.37353515625, 0.5343017578125, 0.695068359375, 0.8558349609375, 1.0166015625, 1.1773681640625, 1.338134765625, 1.4989013671875, 1.65966796875, 1.8204345703125, 1.981201171875, 2.1419677734375, 2.302734375, 2.4635009765625, 2.624267578125, 2.7850341796875, 2.94580078125, 3.1065673828125, 3.267333984375, 3.4281005859375, 3.5888671875, 3.7496337890625, 3.910400390625, 4.0711669921875, 4.23193359375, 4.3927001953125, 4.553466796875, 4.7142333984375, 4.875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 3.0, 12.0, 3.0, 11.0, 11.0, 14.0, 14.0, 10.0, 22.0, 15.0, 20.0, 22.0, 28.0, 27.0, 25.0, 33.0, 24.0, 36.0, 41.0, 45.0, 37.0, 42.0, 46.0, 34.0, 41.0, 31.0, 45.0, 24.0, 39.0, 28.0, 27.0, 22.0, 26.0, 18.0, 19.0, 18.0, 14.0, 12.0, 12.0, 4.0, 16.0, 7.0, 1.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.534393310546875, -2.44964599609375, -2.364898681640625, -2.2801513671875, -2.195404052734375, -2.11065673828125, -2.025909423828125, -1.941162109375, -1.856414794921875, -1.77166748046875, -1.686920166015625, -1.6021728515625, -1.517425537109375, -1.43267822265625, -1.347930908203125, -1.26318359375, -1.178436279296875, -1.09368896484375, -1.008941650390625, -0.9241943359375, -0.839447021484375, -0.75469970703125, -0.669952392578125, -0.585205078125, -0.500457763671875, -0.41571044921875, -0.330963134765625, -0.2462158203125, -0.161468505859375, -0.07672119140625, 0.008026123046875, 0.0927734375, 0.177520751953125, 0.26226806640625, 0.347015380859375, 0.4317626953125, 0.516510009765625, 0.60125732421875, 0.686004638671875, 0.770751953125, 0.855499267578125, 0.94024658203125, 1.024993896484375, 1.1097412109375, 1.194488525390625, 1.27923583984375, 1.363983154296875, 1.44873046875, 1.533477783203125, 1.61822509765625, 1.702972412109375, 1.7877197265625, 1.872467041015625, 1.95721435546875, 2.041961669921875, 2.126708984375, 2.211456298828125, 2.29620361328125, 2.380950927734375, 2.4656982421875, 2.550445556640625, 2.63519287109375, 2.719940185546875, 2.8046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 6.0, 6.0, 5.0, 9.0, 12.0, 13.0, 21.0, 30.0, 35.0, 47.0, 73.0, 122.0, 201.0, 286.0, 527.0, 1355.0, 4038.0, 18145.0, 192445.0, 755165.0, 62187.0, 9389.0, 2385.0, 919.0, 420.0, 236.0, 162.0, 85.0, 79.0, 41.0, 33.0, 18.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73583984375, -0.7123260498046875, -0.688812255859375, -0.6652984619140625, -0.64178466796875, -0.6182708740234375, -0.594757080078125, -0.5712432861328125, -0.5477294921875, -0.5242156982421875, -0.500701904296875, -0.4771881103515625, -0.45367431640625, -0.4301605224609375, -0.406646728515625, -0.3831329345703125, -0.359619140625, -0.3361053466796875, -0.312591552734375, -0.2890777587890625, -0.26556396484375, -0.2420501708984375, -0.218536376953125, -0.1950225830078125, -0.1715087890625, -0.1479949951171875, -0.124481201171875, -0.1009674072265625, -0.07745361328125, -0.0539398193359375, -0.030426025390625, -0.0069122314453125, 0.0166015625, 0.0401153564453125, 0.063629150390625, 0.0871429443359375, 0.11065673828125, 0.1341705322265625, 0.157684326171875, 0.1811981201171875, 0.2047119140625, 0.2282257080078125, 0.251739501953125, 0.2752532958984375, 0.29876708984375, 0.3222808837890625, 0.345794677734375, 0.3693084716796875, 0.392822265625, 0.4163360595703125, 0.439849853515625, 0.4633636474609375, 0.48687744140625, 0.5103912353515625, 0.533905029296875, 0.5574188232421875, 0.5809326171875, 0.6044464111328125, 0.627960205078125, 0.6514739990234375, 0.67498779296875, 0.6985015869140625, 0.722015380859375, 0.7455291748046875, 0.76904296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 13.0, 23.0, 49.0, 80.0, 134.0, 243.0, 194.0, 110.0, 63.0, 29.0, 21.0, 12.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00012878701090812683, -0.00012334436178207397, -0.00011790171265602112, -0.00011245906352996826, -0.0001070164144039154, -0.00010157376527786255, -9.613111615180969e-05, -9.068846702575684e-05, -8.524581789970398e-05, -7.980316877365112e-05, -7.436051964759827e-05, -6.891787052154541e-05, -6.347522139549255e-05, -5.80325722694397e-05, -5.258992314338684e-05, -4.7147274017333984e-05, -4.170462489128113e-05, -3.626197576522827e-05, -3.0819326639175415e-05, -2.537667751312256e-05, -1.9934028387069702e-05, -1.4491379261016846e-05, -9.04873013496399e-06, -3.606081008911133e-06, 1.8365681171417236e-06, 7.27921724319458e-06, 1.2721866369247437e-05, 1.8164515495300293e-05, 2.360716462135315e-05, 2.9049813747406006e-05, 3.449246287345886e-05, 3.993511199951172e-05, 4.5377761125564575e-05, 5.082041025161743e-05, 5.626305937767029e-05, 6.170570850372314e-05, 6.7148357629776e-05, 7.259100675582886e-05, 7.803365588188171e-05, 8.347630500793457e-05, 8.891895413398743e-05, 9.436160326004028e-05, 9.980425238609314e-05, 0.000105246901512146, 0.00011068955063819885, 0.00011613219976425171, 0.00012157484889030457, 0.00012701749801635742, 0.00013246014714241028, 0.00013790279626846313, 0.000143345445394516, 0.00014878809452056885, 0.0001542307436466217, 0.00015967339277267456, 0.00016511604189872742, 0.00017055869102478027, 0.00017600134015083313, 0.00018144398927688599, 0.00018688663840293884, 0.0001923292875289917, 0.00019777193665504456, 0.0002032145857810974, 0.00020865723490715027, 0.00021409988403320312]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 9.0, 25.0, 27.0, 56.0, 77.0, 179.0, 393.0, 872.0, 2929.0, 14668.0, 236375.0, 754638.0, 31094.0, 4833.0, 1335.0, 502.0, 245.0, 101.0, 73.0, 31.0, 25.0, 19.0, 7.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2939453125, -1.2609176635742188, -1.2278900146484375, -1.1948623657226562, -1.161834716796875, -1.1288070678710938, -1.0957794189453125, -1.0627517700195312, -1.02972412109375, -0.9966964721679688, -0.9636688232421875, -0.9306411743164062, -0.897613525390625, -0.8645858764648438, -0.8315582275390625, -0.7985305786132812, -0.7655029296875, -0.7324752807617188, -0.6994476318359375, -0.6664199829101562, -0.633392333984375, -0.6003646850585938, -0.5673370361328125, -0.5343093872070312, -0.50128173828125, -0.46825408935546875, -0.4352264404296875, -0.40219879150390625, -0.369171142578125, -0.33614349365234375, -0.3031158447265625, -0.27008819580078125, -0.237060546875, -0.20403289794921875, -0.1710052490234375, -0.13797760009765625, -0.104949951171875, -0.07192230224609375, -0.0388946533203125, -0.00586700439453125, 0.02716064453125, 0.06018829345703125, 0.0932159423828125, 0.12624359130859375, 0.159271240234375, 0.19229888916015625, 0.2253265380859375, 0.25835418701171875, 0.2913818359375, 0.32440948486328125, 0.3574371337890625, 0.39046478271484375, 0.423492431640625, 0.45652008056640625, 0.4895477294921875, 0.5225753784179688, 0.55560302734375, 0.5886306762695312, 0.6216583251953125, 0.6546859741210938, 0.687713623046875, 0.7207412719726562, 0.7537689208984375, 0.7867965698242188, 0.81982421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 7.0, 4.0, 20.0, 17.0, 30.0, 35.0, 53.0, 88.0, 121.0, 134.0, 121.0, 110.0, 79.0, 57.0, 24.0, 18.0, 24.0, 16.0, 11.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2421875, -0.23244857788085938, -0.22270965576171875, -0.21297073364257812, -0.2032318115234375, -0.19349288940429688, -0.18375396728515625, -0.17401504516601562, -0.164276123046875, -0.15453720092773438, -0.14479827880859375, -0.13505935668945312, -0.1253204345703125, -0.11558151245117188, -0.10584259033203125, -0.09610366821289062, -0.08636474609375, -0.07662582397460938, -0.06688690185546875, -0.057147979736328125, -0.0474090576171875, -0.037670135498046875, -0.02793121337890625, -0.018192291259765625, -0.008453369140625, 0.001285552978515625, 0.01102447509765625, 0.020763397216796875, 0.0305023193359375, 0.040241241455078125, 0.04998016357421875, 0.059719085693359375, 0.0694580078125, 0.07919692993164062, 0.08893585205078125, 0.09867477416992188, 0.1084136962890625, 0.11815261840820312, 0.12789154052734375, 0.13763046264648438, 0.147369384765625, 0.15710830688476562, 0.16684722900390625, 0.17658615112304688, 0.1863250732421875, 0.19606399536132812, 0.20580291748046875, 0.21554183959960938, 0.22528076171875, 0.23501968383789062, 0.24475860595703125, 0.2544975280761719, 0.2642364501953125, 0.2739753723144531, 0.28371429443359375, 0.2934532165527344, 0.303192138671875, 0.3129310607910156, 0.32266998291015625, 0.3324089050292969, 0.3421478271484375, 0.3518867492675781, 0.36162567138671875, 0.3713645935058594, 0.381103515625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 13.0, 19.0, 42.0, 103.0, 177.0, 179.0, 191.0, 125.0, 63.0, 35.0, 22.0, 8.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0], "bins": [-12.65359878540039, -12.409100532531738, -12.16460132598877, -11.920103073120117, -11.675603866577148, -11.431105613708496, -11.186606407165527, -10.942108154296875, -10.697608947753906, -10.453110694885254, -10.208611488342285, -9.964113235473633, -9.719614028930664, -9.475115776062012, -9.230616569519043, -8.98611831665039, -8.741619110107422, -8.49712085723877, -8.2526216506958, -8.008123397827148, -7.76362419128418, -7.519125461578369, -7.274626731872559, -7.030128479003906, -6.785630226135254, -6.541131496429443, -6.296632766723633, -6.052134037017822, -5.807635307312012, -5.563136577606201, -5.318637847900391, -5.074139595031738, -4.8296403884887695, -4.585141658782959, -4.340642929077148, -4.096144199371338, -3.8516454696655273, -3.607146739959717, -3.3626482486724854, -3.118149518966675, -2.873650550842285, -2.6291518211364746, -2.384653091430664, -2.1401543617248535, -1.8956557512283325, -1.651157021522522, -1.406658411026001, -1.1621596813201904, -0.9176609516143799, -0.6731622219085693, -0.42866355180740356, -0.1841648817062378, 0.060333847999572754, 0.3048325777053833, 0.5493311882019043, 0.7938299179077148, 1.0383286476135254, 1.282827377319336, 1.5273261070251465, 1.7718247175216675, 2.0163235664367676, 2.260822296142578, 2.5053207874298096, 2.74981951713562, 2.9943182468414307]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 6.0, 10.0, 9.0, 16.0, 23.0, 19.0, 17.0, 33.0, 32.0, 34.0, 37.0, 39.0, 66.0, 56.0, 58.0, 52.0, 52.0, 49.0, 49.0, 37.0, 39.0, 40.0, 46.0, 35.0, 32.0, 25.0, 26.0, 20.0, 11.0, 9.0, 11.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.553948402404785, -6.3491692543029785, -6.144390106201172, -5.939610958099365, -5.734831809997559, -5.530052661895752, -5.325273513793945, -5.120494842529297, -4.915715217590332, -4.710936069488525, -4.506156921386719, -4.301377773284912, -4.0965986251831055, -3.891819477081299, -3.6870405673980713, -3.4822614192962646, -3.277482509613037, -3.0727033615112305, -2.867924213409424, -2.663145065307617, -2.4583659172058105, -2.253586769104004, -2.0488078594207764, -1.8440287113189697, -1.639249563217163, -1.4344704151153564, -1.2296912670135498, -1.0249122381210327, -0.8201330900192261, -0.6153539419174194, -0.41057491302490234, -0.2057957649230957, -0.0010161399841308594, 0.2037629783153534, 0.40854209661483765, 0.6133211851119995, 0.8181003332138062, 1.0228794813156128, 1.2276585102081299, 1.4324376583099365, 1.6372168064117432, 1.8419959545135498, 2.0467751026153564, 2.251554012298584, 2.4563331604003906, 2.6611123085021973, 2.865891456604004, 3.0706706047058105, 3.275449752807617, 3.480228900909424, 3.6850080490112305, 3.889787197113037, 4.094566345214844, 4.29934549331665, 4.504124641418457, 4.7089033126831055, 4.91368293762207, 5.118462085723877, 5.323241233825684, 5.52802038192749, 5.732799530029297, 5.9375786781311035, 6.14235782623291, 6.347136497497559, 6.551915645599365]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 10.0, 10.0, 18.0, 22.0, 31.0, 35.0, 54.0, 103.0, 144.0, 201.0, 306.0, 440.0, 785.0, 1285.0, 2459.0, 5787.0, 19854.0, 233444.0, 3220875.0, 653699.0, 39839.0, 7907.0, 3019.0, 1516.0, 851.0, 518.0, 331.0, 238.0, 115.0, 112.0, 66.0, 39.0, 30.0, 37.0, 23.0, 5.0, 12.0, 10.0, 5.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-3.5078125, -3.403594970703125, -3.29937744140625, -3.195159912109375, -3.0909423828125, -2.986724853515625, -2.88250732421875, -2.778289794921875, -2.674072265625, -2.569854736328125, -2.46563720703125, -2.361419677734375, -2.2572021484375, -2.152984619140625, -2.04876708984375, -1.944549560546875, -1.84033203125, -1.736114501953125, -1.63189697265625, -1.527679443359375, -1.4234619140625, -1.319244384765625, -1.21502685546875, -1.110809326171875, -1.006591796875, -0.902374267578125, -0.79815673828125, -0.693939208984375, -0.5897216796875, -0.485504150390625, -0.38128662109375, -0.277069091796875, -0.1728515625, -0.068634033203125, 0.03558349609375, 0.139801025390625, 0.2440185546875, 0.348236083984375, 0.45245361328125, 0.556671142578125, 0.660888671875, 0.765106201171875, 0.86932373046875, 0.973541259765625, 1.0777587890625, 1.181976318359375, 1.28619384765625, 1.390411376953125, 1.49462890625, 1.598846435546875, 1.70306396484375, 1.807281494140625, 1.9114990234375, 2.015716552734375, 2.11993408203125, 2.224151611328125, 2.328369140625, 2.432586669921875, 2.53680419921875, 2.641021728515625, 2.7452392578125, 2.849456787109375, 2.95367431640625, 3.057891845703125, 3.162109375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 10.0, 15.0, 10.0, 20.0, 20.0, 29.0, 35.0, 26.0, 49.0, 35.0, 59.0, 59.0, 59.0, 49.0, 69.0, 52.0, 58.0, 37.0, 54.0, 38.0, 39.0, 29.0, 24.0, 31.0, 25.0, 14.0, 15.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.1484375, -2.087158203125, -2.02587890625, -1.964599609375, -1.9033203125, -1.842041015625, -1.78076171875, -1.719482421875, -1.658203125, -1.596923828125, -1.53564453125, -1.474365234375, -1.4130859375, -1.351806640625, -1.29052734375, -1.229248046875, -1.16796875, -1.106689453125, -1.04541015625, -0.984130859375, -0.9228515625, -0.861572265625, -0.80029296875, -0.739013671875, -0.677734375, -0.616455078125, -0.55517578125, -0.493896484375, -0.4326171875, -0.371337890625, -0.31005859375, -0.248779296875, -0.1875, -0.126220703125, -0.06494140625, -0.003662109375, 0.0576171875, 0.118896484375, 0.18017578125, 0.241455078125, 0.302734375, 0.364013671875, 0.42529296875, 0.486572265625, 0.5478515625, 0.609130859375, 0.67041015625, 0.731689453125, 0.79296875, 0.854248046875, 0.91552734375, 0.976806640625, 1.0380859375, 1.099365234375, 1.16064453125, 1.221923828125, 1.283203125, 1.344482421875, 1.40576171875, 1.467041015625, 1.5283203125, 1.589599609375, 1.65087890625, 1.712158203125, 1.7734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 12.0, 18.0, 28.0, 32.0, 42.0, 77.0, 109.0, 184.0, 334.0, 603.0, 1356.0, 3005.0, 8403.0, 33214.0, 340196.0, 3549643.0, 216852.0, 27278.0, 7414.0, 2692.0, 1283.0, 623.0, 320.0, 179.0, 104.0, 70.0, 62.0, 34.0, 30.0, 17.0, 13.0, 13.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.9532470703125, -1.873291015625, -1.7933349609375, -1.71337890625, -1.6334228515625, -1.553466796875, -1.4735107421875, -1.3935546875, -1.3135986328125, -1.233642578125, -1.1536865234375, -1.07373046875, -0.9937744140625, -0.913818359375, -0.8338623046875, -0.75390625, -0.6739501953125, -0.593994140625, -0.5140380859375, -0.43408203125, -0.3541259765625, -0.274169921875, -0.1942138671875, -0.1142578125, -0.0343017578125, 0.045654296875, 0.1256103515625, 0.20556640625, 0.2855224609375, 0.365478515625, 0.4454345703125, 0.525390625, 0.6053466796875, 0.685302734375, 0.7652587890625, 0.84521484375, 0.9251708984375, 1.005126953125, 1.0850830078125, 1.1650390625, 1.2449951171875, 1.324951171875, 1.4049072265625, 1.48486328125, 1.5648193359375, 1.644775390625, 1.7247314453125, 1.8046875, 1.8846435546875, 1.964599609375, 2.0445556640625, 2.12451171875, 2.2044677734375, 2.284423828125, 2.3643798828125, 2.4443359375, 2.5242919921875, 2.604248046875, 2.6842041015625, 2.76416015625, 2.8441162109375, 2.924072265625, 3.0040283203125, 3.083984375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 3.0, 7.0, 8.0, 12.0, 16.0, 18.0, 30.0, 39.0, 54.0, 83.0, 160.0, 231.0, 434.0, 663.0, 774.0, 617.0, 335.0, 225.0, 136.0, 69.0, 48.0, 27.0, 14.0, 16.0, 9.0, 12.0, 3.0, 9.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85400390625, -0.8317108154296875, -0.809417724609375, -0.7871246337890625, -0.76483154296875, -0.7425384521484375, -0.720245361328125, -0.6979522705078125, -0.6756591796875, -0.6533660888671875, -0.631072998046875, -0.6087799072265625, -0.58648681640625, -0.5641937255859375, -0.541900634765625, -0.5196075439453125, -0.497314453125, -0.4750213623046875, -0.452728271484375, -0.4304351806640625, -0.40814208984375, -0.3858489990234375, -0.363555908203125, -0.3412628173828125, -0.3189697265625, -0.2966766357421875, -0.274383544921875, -0.2520904541015625, -0.22979736328125, -0.2075042724609375, -0.185211181640625, -0.1629180908203125, -0.140625, -0.1183319091796875, -0.096038818359375, -0.0737457275390625, -0.05145263671875, -0.0291595458984375, -0.006866455078125, 0.0154266357421875, 0.0377197265625, 0.0600128173828125, 0.082305908203125, 0.1045989990234375, 0.12689208984375, 0.1491851806640625, 0.171478271484375, 0.1937713623046875, 0.216064453125, 0.2383575439453125, 0.260650634765625, 0.2829437255859375, 0.30523681640625, 0.3275299072265625, 0.349822998046875, 0.3721160888671875, 0.3944091796875, 0.4167022705078125, 0.438995361328125, 0.4612884521484375, 0.48358154296875, 0.5058746337890625, 0.528167724609375, 0.5504608154296875, 0.57275390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 10.0, 17.0, 29.0, 35.0, 59.0, 97.0, 126.0, 154.0, 148.0, 114.0, 81.0, 40.0, 30.0, 26.0, 12.0, 11.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.09392786026001, -4.971735000610352, -4.849541664123535, -4.727348804473877, -4.605155944824219, -4.482962608337402, -4.360769748687744, -4.238576889038086, -4.1163835525512695, -3.9941904544830322, -3.871997594833374, -3.7498044967651367, -3.6276113986968994, -3.505418300628662, -3.383225440979004, -3.2610323429107666, -3.1388392448425293, -3.016646146774292, -2.894453287124634, -2.7722601890563965, -2.650067090988159, -2.527873992919922, -2.4056811332702637, -2.2834880352020264, -2.161295175552368, -2.039102077484131, -1.916909098625183, -1.7947161197662354, -1.672523021697998, -1.5503300428390503, -1.4281370639801025, -1.3059439659118652, -1.183750867843628, -1.0615578889846802, -0.9393647909164429, -0.8171718120574951, -0.6949787139892578, -0.5727857351303101, -0.45059269666671753, -0.328399658203125, -0.20620661973953247, -0.08401358872652054, 0.038179442286491394, 0.16037246584892273, 0.28256550431251526, 0.4047585129737854, 0.5269515514373779, 0.6491445899009705, 0.771337628364563, 0.8935306668281555, 1.015723705291748, 1.1379166841506958, 1.260109782218933, 1.3823027610778809, 1.5044958591461182, 1.626688838005066, 1.7488818168640137, 1.8710747957229614, 1.9932678937911987, 2.1154608726501465, 2.237653970718384, 2.359847068786621, 2.4820399284362793, 2.6042330265045166, 2.726426124572754]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 7.0, 4.0, 8.0, 7.0, 14.0, 16.0, 16.0, 21.0, 24.0, 30.0, 28.0, 33.0, 39.0, 40.0, 52.0, 58.0, 50.0, 62.0, 55.0, 34.0, 54.0, 52.0, 37.0, 26.0, 35.0, 37.0, 30.0, 21.0, 20.0, 18.0, 16.0, 10.0, 7.0, 8.0, 6.0, 6.0, 3.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8892580270767212, -1.8325881958007812, -1.7759183645248413, -1.7192485332489014, -1.6625787019729614, -1.6059088706970215, -1.549239158630371, -1.4925692081451416, -1.4358994960784912, -1.3792296648025513, -1.3225598335266113, -1.2658900022506714, -1.2092201709747314, -1.1525503396987915, -1.0958805084228516, -1.0392107963562012, -0.9825408458709717, -0.9258710145950317, -0.8692011833190918, -0.8125313520431519, -0.7558615207672119, -0.699191689491272, -0.6425219178199768, -0.5858520865440369, -0.5291822552680969, -0.472512423992157, -0.41584259271621704, -0.3591727912425995, -0.30250295996665955, -0.2458331286907196, -0.18916332721710205, -0.1324934959411621, -0.07582378387451172, -0.019153960049152374, 0.03751586377620697, 0.09418568015098572, 0.15085551142692566, 0.2075253427028656, 0.26419514417648315, 0.3208649754524231, 0.37753480672836304, 0.434204638004303, 0.4908744692802429, 0.5475442409515381, 0.604214072227478, 0.660883903503418, 0.7175537347793579, 0.7742235660552979, 0.8308933973312378, 0.8875632286071777, 0.9442330598831177, 1.0009028911590576, 1.0575727224349976, 1.1142425537109375, 1.170912265777588, 1.2275822162628174, 1.2842519283294678, 1.3409217596054077, 1.3975915908813477, 1.4542614221572876, 1.5109312534332275, 1.5676010847091675, 1.6242709159851074, 1.6809406280517578, 1.7376105785369873]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 11.0, 9.0, 10.0, 21.0, 17.0, 29.0, 41.0, 65.0, 85.0, 142.0, 201.0, 322.0, 567.0, 881.0, 1616.0, 3035.0, 6261.0, 12995.0, 28984.0, 68501.0, 157692.0, 284755.0, 256448.0, 126449.0, 54091.0, 23581.0, 10702.0, 5023.0, 2608.0, 1316.0, 793.0, 459.0, 272.0, 180.0, 125.0, 78.0, 38.0, 37.0, 20.0, 22.0, 13.0, 13.0, 12.0, 10.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.23876953125, -0.2315044403076172, -0.22423934936523438, -0.21697425842285156, -0.20970916748046875, -0.20244407653808594, -0.19517898559570312, -0.1879138946533203, -0.1806488037109375, -0.1733837127685547, -0.16611862182617188, -0.15885353088378906, -0.15158843994140625, -0.14432334899902344, -0.13705825805664062, -0.1297931671142578, -0.122528076171875, -0.11526298522949219, -0.10799789428710938, -0.10073280334472656, -0.09346771240234375, -0.08620262145996094, -0.07893753051757812, -0.07167243957519531, -0.0644073486328125, -0.05714225769042969, -0.049877166748046875, -0.04261207580566406, -0.03534698486328125, -0.028081893920898438, -0.020816802978515625, -0.013551712036132812, -0.00628662109375, 0.0009784698486328125, 0.008243560791015625, 0.015508651733398438, 0.02277374267578125, 0.030038833618164062, 0.037303924560546875, 0.04456901550292969, 0.0518341064453125, 0.05909919738769531, 0.06636428833007812, 0.07362937927246094, 0.08089447021484375, 0.08815956115722656, 0.09542465209960938, 0.10268974304199219, 0.109954833984375, 0.11721992492675781, 0.12448501586914062, 0.13175010681152344, 0.13901519775390625, 0.14628028869628906, 0.15354537963867188, 0.1608104705810547, 0.1680755615234375, 0.1753406524658203, 0.18260574340820312, 0.18987083435058594, 0.19713592529296875, 0.20440101623535156, 0.21166610717773438, 0.2189311981201172, 0.2261962890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 6.0, 6.0, 13.0, 17.0, 26.0, 24.0, 32.0, 45.0, 43.0, 59.0, 55.0, 55.0, 65.0, 87.0, 65.0, 51.0, 64.0, 41.0, 47.0, 35.0, 32.0, 30.0, 18.0, 21.0, 13.0, 7.0, 10.0, 5.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.396881103515625, -1.34942626953125, -1.301971435546875, -1.2545166015625, -1.207061767578125, -1.15960693359375, -1.112152099609375, -1.064697265625, -1.017242431640625, -0.96978759765625, -0.922332763671875, -0.8748779296875, -0.827423095703125, -0.77996826171875, -0.732513427734375, -0.68505859375, -0.637603759765625, -0.59014892578125, -0.542694091796875, -0.4952392578125, -0.447784423828125, -0.40032958984375, -0.352874755859375, -0.305419921875, -0.257965087890625, -0.21051025390625, -0.163055419921875, -0.1156005859375, -0.068145751953125, -0.02069091796875, 0.026763916015625, 0.07421875, 0.121673583984375, 0.16912841796875, 0.216583251953125, 0.2640380859375, 0.311492919921875, 0.35894775390625, 0.406402587890625, 0.453857421875, 0.501312255859375, 0.54876708984375, 0.596221923828125, 0.6436767578125, 0.691131591796875, 0.73858642578125, 0.786041259765625, 0.83349609375, 0.880950927734375, 0.92840576171875, 0.975860595703125, 1.0233154296875, 1.070770263671875, 1.11822509765625, 1.165679931640625, 1.213134765625, 1.260589599609375, 1.30804443359375, 1.355499267578125, 1.4029541015625, 1.450408935546875, 1.49786376953125, 1.545318603515625, 1.5927734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 21.0, 16.0, 30.0, 40.0, 58.0, 72.0, 136.0, 153.0, 267.0, 399.0, 719.0, 1282.0, 2276.0, 4661.0, 9969.0, 23402.0, 58281.0, 141933.0, 277450.0, 279295.0, 144589.0, 58832.0, 24136.0, 10244.0, 4669.0, 2386.0, 1252.0, 705.0, 426.0, 291.0, 191.0, 95.0, 95.0, 54.0, 36.0, 20.0, 19.0, 6.0, 7.0, 8.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2198467254638672, -0.21252059936523438, -0.20519447326660156, -0.19786834716796875, -0.19054222106933594, -0.18321609497070312, -0.1758899688720703, -0.1685638427734375, -0.1612377166748047, -0.15391159057617188, -0.14658546447753906, -0.13925933837890625, -0.13193321228027344, -0.12460708618164062, -0.11728096008300781, -0.109954833984375, -0.10262870788574219, -0.09530258178710938, -0.08797645568847656, -0.08065032958984375, -0.07332420349121094, -0.06599807739257812, -0.05867195129394531, -0.0513458251953125, -0.04401969909667969, -0.036693572998046875, -0.029367446899414062, -0.02204132080078125, -0.014715194702148438, -0.007389068603515625, -6.29425048828125e-05, 0.00726318359375, 0.014589309692382812, 0.021915435791015625, 0.029241561889648438, 0.03656768798828125, 0.04389381408691406, 0.051219940185546875, 0.05854606628417969, 0.0658721923828125, 0.07319831848144531, 0.08052444458007812, 0.08785057067871094, 0.09517669677734375, 0.10250282287597656, 0.10982894897460938, 0.11715507507324219, 0.124481201171875, 0.1318073272705078, 0.13913345336914062, 0.14645957946777344, 0.15378570556640625, 0.16111183166503906, 0.16843795776367188, 0.1757640838623047, 0.1830902099609375, 0.1904163360595703, 0.19774246215820312, 0.20506858825683594, 0.21239471435546875, 0.21972084045410156, 0.22704696655273438, 0.2343730926513672, 0.24169921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 13.0, 14.0, 16.0, 16.0, 20.0, 22.0, 34.0, 32.0, 38.0, 32.0, 62.0, 45.0, 60.0, 58.0, 41.0, 54.0, 67.0, 51.0, 63.0, 43.0, 56.0, 30.0, 24.0, 19.0, 17.0, 16.0, 14.0, 14.0, 7.0, 10.0, 6.0, 4.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.240234375, -3.156494140625, -3.07275390625, -2.989013671875, -2.9052734375, -2.821533203125, -2.73779296875, -2.654052734375, -2.5703125, -2.486572265625, -2.40283203125, -2.319091796875, -2.2353515625, -2.151611328125, -2.06787109375, -1.984130859375, -1.900390625, -1.816650390625, -1.73291015625, -1.649169921875, -1.5654296875, -1.481689453125, -1.39794921875, -1.314208984375, -1.23046875, -1.146728515625, -1.06298828125, -0.979248046875, -0.8955078125, -0.811767578125, -0.72802734375, -0.644287109375, -0.560546875, -0.476806640625, -0.39306640625, -0.309326171875, -0.2255859375, -0.141845703125, -0.05810546875, 0.025634765625, 0.109375, 0.193115234375, 0.27685546875, 0.360595703125, 0.4443359375, 0.528076171875, 0.61181640625, 0.695556640625, 0.779296875, 0.863037109375, 0.94677734375, 1.030517578125, 1.1142578125, 1.197998046875, 1.28173828125, 1.365478515625, 1.44921875, 1.532958984375, 1.61669921875, 1.700439453125, 1.7841796875, 1.867919921875, 1.95166015625, 2.035400390625, 2.119140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 4.0, 10.0, 17.0, 24.0, 28.0, 41.0, 67.0, 91.0, 140.0, 233.0, 388.0, 628.0, 1084.0, 2144.0, 4485.0, 10473.0, 29760.0, 102105.0, 362801.0, 375136.0, 107228.0, 30828.0, 11058.0, 4627.0, 2239.0, 1163.0, 665.0, 395.0, 243.0, 182.0, 88.0, 50.0, 34.0, 26.0, 19.0, 15.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1158447265625, -0.11279773712158203, -0.10975074768066406, -0.1067037582397461, -0.10365676879882812, -0.10060977935791016, -0.09756278991699219, -0.09451580047607422, -0.09146881103515625, -0.08842182159423828, -0.08537483215332031, -0.08232784271240234, -0.07928085327148438, -0.0762338638305664, -0.07318687438964844, -0.07013988494873047, -0.0670928955078125, -0.06404590606689453, -0.06099891662597656, -0.057951927185058594, -0.054904937744140625, -0.051857948303222656, -0.04881095886230469, -0.04576396942138672, -0.04271697998046875, -0.03966999053955078, -0.03662300109863281, -0.033576011657714844, -0.030529022216796875, -0.027482032775878906, -0.024435043334960938, -0.02138805389404297, -0.018341064453125, -0.015294075012207031, -0.012247085571289062, -0.009200096130371094, -0.006153106689453125, -0.0031061172485351562, -5.91278076171875e-05, 0.0029878616333007812, 0.00603485107421875, 0.009081840515136719, 0.012128829956054688, 0.015175819396972656, 0.018222808837890625, 0.021269798278808594, 0.024316787719726562, 0.02736377716064453, 0.0304107666015625, 0.03345775604248047, 0.03650474548339844, 0.039551734924316406, 0.042598724365234375, 0.045645713806152344, 0.04869270324707031, 0.05173969268798828, 0.05478668212890625, 0.05783367156982422, 0.06088066101074219, 0.06392765045166016, 0.06697463989257812, 0.0700216293334961, 0.07306861877441406, 0.07611560821533203, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 1.0, 7.0, 8.0, 12.0, 13.0, 27.0, 30.0, 39.0, 60.0, 85.0, 73.0, 104.0, 111.0, 110.0, 80.0, 78.0, 48.0, 33.0, 19.0, 22.0, 9.0, 10.0, 5.0, 11.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.605552673339844e-05, -7.4019655585289e-05, -7.198378443717957e-05, -6.994791328907013e-05, -6.79120421409607e-05, -6.587617099285126e-05, -6.384029984474182e-05, -6.180442869663239e-05, -5.976855754852295e-05, -5.773268640041351e-05, -5.569681525230408e-05, -5.366094410419464e-05, -5.1625072956085205e-05, -4.958920180797577e-05, -4.755333065986633e-05, -4.55174595117569e-05, -4.348158836364746e-05, -4.1445717215538025e-05, -3.940984606742859e-05, -3.737397491931915e-05, -3.533810377120972e-05, -3.330223262310028e-05, -3.1266361474990845e-05, -2.923049032688141e-05, -2.7194619178771973e-05, -2.5158748030662537e-05, -2.31228768825531e-05, -2.1087005734443665e-05, -1.905113458633423e-05, -1.7015263438224792e-05, -1.4979392290115356e-05, -1.294352114200592e-05, -1.0907649993896484e-05, -8.871778845787048e-06, -6.835907697677612e-06, -4.800036549568176e-06, -2.7641654014587402e-06, -7.282942533493042e-07, 1.3075768947601318e-06, 3.343448042869568e-06, 5.379319190979004e-06, 7.41519033908844e-06, 9.451061487197876e-06, 1.1486932635307312e-05, 1.3522803783416748e-05, 1.5558674931526184e-05, 1.759454607963562e-05, 1.9630417227745056e-05, 2.1666288375854492e-05, 2.3702159523963928e-05, 2.5738030672073364e-05, 2.77739018201828e-05, 2.9809772968292236e-05, 3.184564411640167e-05, 3.388151526451111e-05, 3.5917386412620544e-05, 3.795325756072998e-05, 3.9989128708839417e-05, 4.202499985694885e-05, 4.406087100505829e-05, 4.6096742153167725e-05, 4.813261330127716e-05, 5.01684844493866e-05, 5.220435559749603e-05, 5.424022674560547e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 11.0, 4.0, 12.0, 23.0, 19.0, 46.0, 40.0, 67.0, 95.0, 154.0, 269.0, 421.0, 859.0, 1803.0, 3648.0, 8900.0, 22712.0, 61142.0, 163696.0, 323017.0, 272956.0, 116962.0, 43080.0, 16222.0, 6511.0, 2871.0, 1364.0, 681.0, 365.0, 212.0, 110.0, 76.0, 51.0, 42.0, 31.0, 24.0, 17.0, 5.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08977890014648438, -0.08727264404296875, -0.08476638793945312, -0.0822601318359375, -0.07975387573242188, -0.07724761962890625, -0.07474136352539062, -0.072235107421875, -0.06972885131835938, -0.06722259521484375, -0.06471633911132812, -0.0622100830078125, -0.059703826904296875, -0.05719757080078125, -0.054691314697265625, -0.05218505859375, -0.049678802490234375, -0.04717254638671875, -0.044666290283203125, -0.0421600341796875, -0.039653778076171875, -0.03714752197265625, -0.034641265869140625, -0.032135009765625, -0.029628753662109375, -0.02712249755859375, -0.024616241455078125, -0.0221099853515625, -0.019603729248046875, -0.01709747314453125, -0.014591217041015625, -0.0120849609375, -0.009578704833984375, -0.00707244873046875, -0.004566192626953125, -0.0020599365234375, 0.000446319580078125, 0.00295257568359375, 0.005458831787109375, 0.007965087890625, 0.010471343994140625, 0.01297760009765625, 0.015483856201171875, 0.0179901123046875, 0.020496368408203125, 0.02300262451171875, 0.025508880615234375, 0.02801513671875, 0.030521392822265625, 0.03302764892578125, 0.035533905029296875, 0.0380401611328125, 0.040546417236328125, 0.04305267333984375, 0.045558929443359375, 0.048065185546875, 0.050571441650390625, 0.05307769775390625, 0.055583953857421875, 0.0580902099609375, 0.060596466064453125, 0.06310272216796875, 0.06560897827148438, 0.068115234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 8.0, 5.0, 12.0, 15.0, 14.0, 14.0, 22.0, 31.0, 35.0, 40.0, 32.0, 31.0, 48.0, 48.0, 58.0, 38.0, 50.0, 55.0, 31.0, 54.0, 42.0, 35.0, 33.0, 35.0, 28.0, 19.0, 27.0, 23.0, 23.0, 14.0, 8.0, 9.0, 5.0, 4.0, 7.0, 9.0, 3.0, 3.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0198822021484375, -0.01922130584716797, -0.018560409545898438, -0.017899513244628906, -0.017238616943359375, -0.016577720642089844, -0.015916824340820312, -0.015255928039550781, -0.01459503173828125, -0.013934135437011719, -0.013273239135742188, -0.012612342834472656, -0.011951446533203125, -0.011290550231933594, -0.010629653930664062, -0.009968757629394531, -0.009307861328125, -0.008646965026855469, -0.007986068725585938, -0.007325172424316406, -0.006664276123046875, -0.006003379821777344, -0.0053424835205078125, -0.004681587219238281, -0.00402069091796875, -0.0033597946166992188, -0.0026988983154296875, -0.0020380020141601562, -0.001377105712890625, -0.0007162094116210938, -5.53131103515625e-05, 0.0006055831909179688, 0.0012664794921875, 0.0019273757934570312, 0.0025882720947265625, 0.0032491683959960938, 0.003910064697265625, 0.004570960998535156, 0.0052318572998046875, 0.005892753601074219, 0.00655364990234375, 0.007214546203613281, 0.007875442504882812, 0.008536338806152344, 0.009197235107421875, 0.009858131408691406, 0.010519027709960938, 0.011179924011230469, 0.0118408203125, 0.012501716613769531, 0.013162612915039062, 0.013823509216308594, 0.014484405517578125, 0.015145301818847656, 0.015806198120117188, 0.01646709442138672, 0.01712799072265625, 0.01778888702392578, 0.018449783325195312, 0.019110679626464844, 0.019771575927734375, 0.020432472229003906, 0.021093368530273438, 0.02175426483154297, 0.0224151611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 14.0, 49.0, 171.0, 381.0, 276.0, 88.0, 15.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.666704177856445, -10.464189529418945, -10.261674880981445, -10.059160232543945, -9.856645584106445, -9.654130935668945, -9.451616287231445, -9.249101638793945, -9.046586990356445, -8.844072341918945, -8.641557693481445, -8.439043045043945, -8.236528396606445, -8.034013748168945, -7.831499099731445, -7.6289849281311035, -7.426470756530762, -7.223956108093262, -7.021441459655762, -6.818926811218262, -6.616412162780762, -6.413897514343262, -6.211382865905762, -6.00886869430542, -5.806353569030762, -5.603838920593262, -5.401324272155762, -5.198809623718262, -4.996294975280762, -4.793780326843262, -4.591265678405762, -4.38875150680542, -4.186237335205078, -3.983722686767578, -3.781208038330078, -3.578693389892578, -3.3761789798736572, -3.1736643314361572, -2.9711496829986572, -2.7686352729797363, -2.566120147705078, -2.363605499267578, -2.161090850830078, -1.9585763216018677, -1.7560617923736572, -1.5535471439361572, -1.3510324954986572, -1.1485179662704468, -0.9460034370422363, -0.7434888482093811, -0.5409742593765259, -0.3384596109390259, -0.13594502210617065, 0.06656956672668457, 0.26908421516418457, 0.471598744392395, 0.674113392829895, 0.8766279816627502, 1.0791425704956055, 1.2816572189331055, 1.4841718673706055, 1.686686396598816, 1.889201045036316, 2.0917155742645264, 2.2942302227020264]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 4.0, 5.0, 14.0, 16.0, 21.0, 25.0, 19.0, 45.0, 32.0, 52.0, 38.0, 68.0, 68.0, 70.0, 61.0, 65.0, 62.0, 52.0, 39.0, 39.0, 41.0, 31.0, 27.0, 19.0, 22.0, 16.0, 7.0, 6.0, 8.0, 2.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4718071222305298, -1.427551031112671, -1.383294939994812, -1.3390388488769531, -1.2947826385498047, -1.2505265474319458, -1.206270456314087, -1.162014365196228, -1.1177582740783691, -1.0735021829605103, -1.0292460918426514, -0.9849899411201477, -0.940733790397644, -0.8964776992797852, -0.8522216081619263, -0.8079655170440674, -0.763709306716919, -0.7194532155990601, -0.6751970648765564, -0.6309409737586975, -0.5866848230361938, -0.542428731918335, -0.4981726408004761, -0.4539165198802948, -0.4096603989601135, -0.36540427803993225, -0.321148157119751, -0.2768920660018921, -0.23263594508171082, -0.18837982416152954, -0.14412373304367065, -0.09986761212348938, -0.055611491203308105, -0.011355377733707428, 0.03290073573589325, 0.07715684175491333, 0.1214129626750946, 0.16566908359527588, 0.20992517471313477, 0.25418129563331604, 0.2984374165534973, 0.3426935374736786, 0.38694965839385986, 0.43120574951171875, 0.4754618704319, 0.5197179913520813, 0.5639740824699402, 0.6082302331924438, 0.6524863243103027, 0.6967424154281616, 0.7409985661506653, 0.7852546572685242, 0.8295108079910278, 0.8737668991088867, 0.9180229902267456, 0.9622790813446045, 1.006535291671753, 1.0507913827896118, 1.0950474739074707, 1.1393036842346191, 1.183559775352478, 1.227815866470337, 1.2720719575881958, 1.3163280487060547, 1.3605841398239136]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 7.0, 10.0, 11.0, 13.0, 19.0, 33.0, 54.0, 82.0, 102.0, 183.0, 286.0, 492.0, 836.0, 1671.0, 2993.0, 6337.0, 15389.0, 45099.0, 172870.0, 501834.0, 213574.0, 54279.0, 17589.0, 7229.0, 3506.0, 1725.0, 922.0, 550.0, 328.0, 203.0, 110.0, 59.0, 51.0, 43.0, 18.0, 13.0, 12.0, 5.0, 2.0, 9.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.1519622802734375, -1.108612060546875, -1.0652618408203125, -1.02191162109375, -0.9785614013671875, -0.935211181640625, -0.8918609619140625, -0.8485107421875, -0.8051605224609375, -0.761810302734375, -0.7184600830078125, -0.67510986328125, -0.6317596435546875, -0.588409423828125, -0.5450592041015625, -0.501708984375, -0.4583587646484375, -0.415008544921875, -0.3716583251953125, -0.32830810546875, -0.2849578857421875, -0.241607666015625, -0.1982574462890625, -0.1549072265625, -0.1115570068359375, -0.068206787109375, -0.0248565673828125, 0.01849365234375, 0.0618438720703125, 0.105194091796875, 0.1485443115234375, 0.19189453125, 0.2352447509765625, 0.278594970703125, 0.3219451904296875, 0.36529541015625, 0.4086456298828125, 0.451995849609375, 0.4953460693359375, 0.5386962890625, 0.5820465087890625, 0.625396728515625, 0.6687469482421875, 0.71209716796875, 0.7554473876953125, 0.798797607421875, 0.8421478271484375, 0.885498046875, 0.9288482666015625, 0.972198486328125, 1.0155487060546875, 1.05889892578125, 1.1022491455078125, 1.145599365234375, 1.1889495849609375, 1.2322998046875, 1.2756500244140625, 1.319000244140625, 1.3623504638671875, 1.40570068359375, 1.4490509033203125, 1.492401123046875, 1.5357513427734375, 1.5791015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 8.0, 4.0, 6.0, 3.0, 6.0, 8.0, 17.0, 21.0, 20.0, 24.0, 23.0, 27.0, 34.0, 46.0, 48.0, 47.0, 55.0, 61.0, 65.0, 57.0, 49.0, 54.0, 48.0, 46.0, 39.0, 32.0, 29.0, 30.0, 20.0, 22.0, 9.0, 18.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.98828125, -2.906890869140625, -2.82550048828125, -2.744110107421875, -2.6627197265625, -2.581329345703125, -2.49993896484375, -2.418548583984375, -2.337158203125, -2.255767822265625, -2.17437744140625, -2.092987060546875, -2.0115966796875, -1.930206298828125, -1.84881591796875, -1.767425537109375, -1.68603515625, -1.604644775390625, -1.52325439453125, -1.441864013671875, -1.3604736328125, -1.279083251953125, -1.19769287109375, -1.116302490234375, -1.034912109375, -0.953521728515625, -0.87213134765625, -0.790740966796875, -0.7093505859375, -0.627960205078125, -0.54656982421875, -0.465179443359375, -0.3837890625, -0.302398681640625, -0.22100830078125, -0.139617919921875, -0.0582275390625, 0.023162841796875, 0.10455322265625, 0.185943603515625, 0.267333984375, 0.348724365234375, 0.43011474609375, 0.511505126953125, 0.5928955078125, 0.674285888671875, 0.75567626953125, 0.837066650390625, 0.91845703125, 0.999847412109375, 1.08123779296875, 1.162628173828125, 1.2440185546875, 1.325408935546875, 1.40679931640625, 1.488189697265625, 1.569580078125, 1.650970458984375, 1.73236083984375, 1.813751220703125, 1.8951416015625, 1.976531982421875, 2.05792236328125, 2.139312744140625, 2.220703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 2.0, 9.0, 11.0, 5.0, 13.0, 21.0, 23.0, 44.0, 50.0, 62.0, 93.0, 165.0, 315.0, 708.0, 2352.0, 13045.0, 157503.0, 792875.0, 70614.0, 7691.0, 1572.0, 566.0, 283.0, 141.0, 109.0, 66.0, 57.0, 33.0, 26.0, 17.0, 19.0, 11.0, 7.0, 6.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.51483154296875, -2.4320068359375, -2.34918212890625, -2.266357421875, -2.18353271484375, -2.1007080078125, -2.01788330078125, -1.93505859375, -1.85223388671875, -1.7694091796875, -1.68658447265625, -1.603759765625, -1.52093505859375, -1.4381103515625, -1.35528564453125, -1.2724609375, -1.18963623046875, -1.1068115234375, -1.02398681640625, -0.941162109375, -0.85833740234375, -0.7755126953125, -0.69268798828125, -0.60986328125, -0.52703857421875, -0.4442138671875, -0.36138916015625, -0.278564453125, -0.19573974609375, -0.1129150390625, -0.03009033203125, 0.052734375, 0.13555908203125, 0.2183837890625, 0.30120849609375, 0.384033203125, 0.46685791015625, 0.5496826171875, 0.63250732421875, 0.71533203125, 0.79815673828125, 0.8809814453125, 0.96380615234375, 1.046630859375, 1.12945556640625, 1.2122802734375, 1.29510498046875, 1.3779296875, 1.46075439453125, 1.5435791015625, 1.62640380859375, 1.709228515625, 1.79205322265625, 1.8748779296875, 1.95770263671875, 2.04052734375, 2.12335205078125, 2.2061767578125, 2.28900146484375, 2.371826171875, 2.45465087890625, 2.5374755859375, 2.62030029296875, 2.703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 8.0, 10.0, 4.0, 7.0, 19.0, 6.0, 14.0, 10.0, 16.0, 25.0, 17.0, 25.0, 30.0, 34.0, 25.0, 29.0, 37.0, 35.0, 38.0, 47.0, 34.0, 47.0, 39.0, 50.0, 29.0, 36.0, 34.0, 32.0, 19.0, 30.0, 20.0, 20.0, 28.0, 17.0, 18.0, 15.0, 12.0, 13.0, 11.0, 14.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.1328125, -2.065338134765625, -1.99786376953125, -1.930389404296875, -1.8629150390625, -1.795440673828125, -1.72796630859375, -1.660491943359375, -1.593017578125, -1.525543212890625, -1.45806884765625, -1.390594482421875, -1.3231201171875, -1.255645751953125, -1.18817138671875, -1.120697021484375, -1.05322265625, -0.985748291015625, -0.91827392578125, -0.850799560546875, -0.7833251953125, -0.715850830078125, -0.64837646484375, -0.580902099609375, -0.513427734375, -0.445953369140625, -0.37847900390625, -0.311004638671875, -0.2435302734375, -0.176055908203125, -0.10858154296875, -0.041107177734375, 0.0263671875, 0.093841552734375, 0.16131591796875, 0.228790283203125, 0.2962646484375, 0.363739013671875, 0.43121337890625, 0.498687744140625, 0.566162109375, 0.633636474609375, 0.70111083984375, 0.768585205078125, 0.8360595703125, 0.903533935546875, 0.97100830078125, 1.038482666015625, 1.10595703125, 1.173431396484375, 1.24090576171875, 1.308380126953125, 1.3758544921875, 1.443328857421875, 1.51080322265625, 1.578277587890625, 1.645751953125, 1.713226318359375, 1.78070068359375, 1.848175048828125, 1.9156494140625, 1.983123779296875, 2.05059814453125, 2.118072509765625, 2.185546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 20.0, 53.0, 135.0, 324.0, 1213.0, 9161.0, 805208.0, 226375.0, 4700.0, 837.0, 260.0, 102.0, 59.0, 24.0, 17.0, 6.0, 3.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3018646240234375, -1.239471435546875, -1.1770782470703125, -1.11468505859375, -1.0522918701171875, -0.989898681640625, -0.9275054931640625, -0.8651123046875, -0.8027191162109375, -0.740325927734375, -0.6779327392578125, -0.61553955078125, -0.5531463623046875, -0.490753173828125, -0.4283599853515625, -0.365966796875, -0.3035736083984375, -0.241180419921875, -0.1787872314453125, -0.11639404296875, -0.0540008544921875, 0.008392333984375, 0.0707855224609375, 0.1331787109375, 0.1955718994140625, 0.257965087890625, 0.3203582763671875, 0.38275146484375, 0.4451446533203125, 0.507537841796875, 0.5699310302734375, 0.63232421875, 0.6947174072265625, 0.757110595703125, 0.8195037841796875, 0.88189697265625, 0.9442901611328125, 1.006683349609375, 1.0690765380859375, 1.1314697265625, 1.1938629150390625, 1.256256103515625, 1.3186492919921875, 1.38104248046875, 1.4434356689453125, 1.505828857421875, 1.5682220458984375, 1.630615234375, 1.6930084228515625, 1.755401611328125, 1.8177947998046875, 1.88018798828125, 1.9425811767578125, 2.004974365234375, 2.0673675537109375, 2.1297607421875, 2.1921539306640625, 2.254547119140625, 2.3169403076171875, 2.37933349609375, 2.4417266845703125, 2.504119873046875, 2.5665130615234375, 2.62890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 18.0, 28.0, 39.0, 70.0, 99.0, 165.0, 149.0, 135.0, 101.0, 70.0, 38.0, 24.0, 15.0, 11.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001862049102783203, -0.00018125027418136597, -0.00017629563808441162, -0.00017134100198745728, -0.00016638636589050293, -0.00016143172979354858, -0.00015647709369659424, -0.0001515224575996399, -0.00014656782150268555, -0.0001416131854057312, -0.00013665854930877686, -0.0001317039132118225, -0.00012674927711486816, -0.00012179464101791382, -0.00011684000492095947, -0.00011188536882400513, -0.00010693073272705078, -0.00010197609663009644, -9.702146053314209e-05, -9.206682443618774e-05, -8.71121883392334e-05, -8.215755224227905e-05, -7.720291614532471e-05, -7.224828004837036e-05, -6.729364395141602e-05, -6.233900785446167e-05, -5.7384371757507324e-05, -5.242973566055298e-05, -4.747509956359863e-05, -4.252046346664429e-05, -3.756582736968994e-05, -3.2611191272735596e-05, -2.765655517578125e-05, -2.2701919078826904e-05, -1.774728298187256e-05, -1.2792646884918213e-05, -7.838010787963867e-06, -2.8833746910095215e-06, 2.0712614059448242e-06, 7.02589750289917e-06, 1.1980533599853516e-05, 1.693516969680786e-05, 2.1889805793762207e-05, 2.6844441890716553e-05, 3.17990779876709e-05, 3.6753714084625244e-05, 4.170835018157959e-05, 4.6662986278533936e-05, 5.161762237548828e-05, 5.657225847244263e-05, 6.152689456939697e-05, 6.648153066635132e-05, 7.143616676330566e-05, 7.639080286026001e-05, 8.134543895721436e-05, 8.63000750541687e-05, 9.125471115112305e-05, 9.620934724807739e-05, 0.00010116398334503174, 0.00010611861944198608, 0.00011107325553894043, 0.00011602789163589478, 0.00012098252773284912, 0.00012593716382980347, 0.0001308917999267578]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 12.0, 14.0, 13.0, 31.0, 65.0, 115.0, 378.0, 1297.0, 5811.0, 102971.0, 901717.0, 31304.0, 3435.0, 856.0, 253.0, 111.0, 67.0, 32.0, 15.0, 11.0, 4.0, 4.0, 5.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.8105316162109375, -1.760711669921875, -1.7108917236328125, -1.66107177734375, -1.6112518310546875, -1.561431884765625, -1.5116119384765625, -1.4617919921875, -1.4119720458984375, -1.362152099609375, -1.3123321533203125, -1.26251220703125, -1.2126922607421875, -1.162872314453125, -1.1130523681640625, -1.063232421875, -1.0134124755859375, -0.963592529296875, -0.9137725830078125, -0.86395263671875, -0.8141326904296875, -0.764312744140625, -0.7144927978515625, -0.6646728515625, -0.6148529052734375, -0.565032958984375, -0.5152130126953125, -0.46539306640625, -0.4155731201171875, -0.365753173828125, -0.3159332275390625, -0.26611328125, -0.2162933349609375, -0.166473388671875, -0.1166534423828125, -0.06683349609375, -0.0170135498046875, 0.032806396484375, 0.0826263427734375, 0.1324462890625, 0.1822662353515625, 0.232086181640625, 0.2819061279296875, 0.33172607421875, 0.3815460205078125, 0.431365966796875, 0.4811859130859375, 0.531005859375, 0.5808258056640625, 0.630645751953125, 0.6804656982421875, 0.73028564453125, 0.7801055908203125, 0.829925537109375, 0.8797454833984375, 0.9295654296875, 0.9793853759765625, 1.029205322265625, 1.0790252685546875, 1.12884521484375, 1.1786651611328125, 1.228485107421875, 1.2783050537109375, 1.328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 10.0, 12.0, 18.0, 31.0, 35.0, 51.0, 72.0, 78.0, 97.0, 113.0, 129.0, 90.0, 61.0, 49.0, 51.0, 20.0, 22.0, 11.0, 7.0, 10.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2725791931152344, -0.26146697998046875, -0.2503547668457031, -0.2392425537109375, -0.22813034057617188, -0.21701812744140625, -0.20590591430664062, -0.194793701171875, -0.18368148803710938, -0.17256927490234375, -0.16145706176757812, -0.1503448486328125, -0.13923263549804688, -0.12812042236328125, -0.11700820922851562, -0.10589599609375, -0.09478378295898438, -0.08367156982421875, -0.07255935668945312, -0.0614471435546875, -0.050334930419921875, -0.03922271728515625, -0.028110504150390625, -0.016998291015625, -0.005886077880859375, 0.00522613525390625, 0.016338348388671875, 0.0274505615234375, 0.038562774658203125, 0.04967498779296875, 0.060787200927734375, 0.0718994140625, 0.08301162719726562, 0.09412384033203125, 0.10523605346679688, 0.1163482666015625, 0.12746047973632812, 0.13857269287109375, 0.14968490600585938, 0.160797119140625, 0.17190933227539062, 0.18302154541015625, 0.19413375854492188, 0.2052459716796875, 0.21635818481445312, 0.22747039794921875, 0.23858261108398438, 0.24969482421875, 0.2608070373535156, 0.27191925048828125, 0.2830314636230469, 0.2941436767578125, 0.3052558898925781, 0.31636810302734375, 0.3274803161621094, 0.338592529296875, 0.3497047424316406, 0.36081695556640625, 0.3719291687011719, 0.3830413818359375, 0.3941535949707031, 0.40526580810546875, 0.4163780212402344, 0.427490234375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 16.0, 36.0, 115.0, 277.0, 293.0, 171.0, 53.0, 14.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1150007247924805, -2.805588960647583, -2.4961771965026855, -2.186765432357788, -1.8773536682128906, -1.5679419040679932, -1.2585301399230957, -0.9491183757781982, -0.6397066116333008, -0.3302948474884033, -0.02088308334350586, 0.2885286808013916, 0.5979404449462891, 0.9073522090911865, 1.216763973236084, 1.5261757373809814, 1.835587501525879, 2.1449992656707764, 2.454411029815674, 2.7638227939605713, 3.0732345581054688, 3.382646322250366, 3.6920580863952637, 4.001469612121582, 4.310881614685059, 4.620293617248535, 4.9297051429748535, 5.239116668701172, 5.548528671264648, 5.857940673828125, 6.167352199554443, 6.476763725280762, 6.786176681518555, 7.095588684082031, 7.40500020980835, 7.714411735534668, 8.023823738098145, 8.333235740661621, 8.642646789550781, 8.952058792114258, 9.261470794677734, 9.570882797241211, 9.880294799804688, 10.189705848693848, 10.499117851257324, 10.8085298538208, 11.117940902709961, 11.427352905273438, 11.736764907836914, 12.04617691040039, 12.355588912963867, 12.664999961853027, 12.974411964416504, 13.28382396697998, 13.59323501586914, 13.902647018432617, 14.212059020996094, 14.52147102355957, 14.830883026123047, 15.140294075012207, 15.449706077575684, 15.75911808013916, 16.06852912902832, 16.377941131591797, 16.687353134155273]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 10.0, 14.0, 14.0, 16.0, 28.0, 19.0, 32.0, 29.0, 35.0, 25.0, 30.0, 48.0, 42.0, 34.0, 42.0, 53.0, 44.0, 26.0, 43.0, 36.0, 35.0, 45.0, 44.0, 22.0, 34.0, 26.0, 14.0, 25.0, 20.0, 19.0, 9.0, 14.0, 9.0, 11.0, 9.0, 4.0, 10.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.420687675476074, -4.2850847244262695, -4.149481773376465, -4.013878345489502, -3.8782753944396973, -3.7426724433898926, -3.607069253921509, -3.471466064453125, -3.3358631134033203, -3.2002601623535156, -3.064656972885132, -2.929053783416748, -2.7934508323669434, -2.6578478813171387, -2.522244691848755, -2.386641502380371, -2.2510385513305664, -2.1154356002807617, -1.979832410812378, -1.8442293405532837, -1.7086262702941895, -1.5730232000350952, -1.437420129776001, -1.3018170595169067, -1.1662139892578125, -1.0306109189987183, -0.895007848739624, -0.7594047784805298, -0.6238017082214355, -0.4881986379623413, -0.35259556770324707, -0.21699249744415283, -0.0813894271850586, 0.054213643074035645, 0.18981671333312988, 0.3254197835922241, 0.46102285385131836, 0.5966259241104126, 0.7322289943695068, 0.8678320646286011, 1.0034351348876953, 1.1390382051467896, 1.2746412754058838, 1.410244345664978, 1.5458474159240723, 1.6814504861831665, 1.8170535564422607, 1.952656626701355, 2.088259696960449, 2.223862648010254, 2.3594658374786377, 2.4950690269470215, 2.630671977996826, 2.766274929046631, 2.9018781185150146, 3.0374813079833984, 3.173084259033203, 3.308687210083008, 3.4442903995513916, 3.5798935890197754, 3.71549654006958, 3.8510994911193848, 3.9867026805877686, 4.122305870056152, 4.257908821105957]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 10.0, 13.0, 22.0, 36.0, 43.0, 78.0, 128.0, 168.0, 320.0, 512.0, 975.0, 1951.0, 4312.0, 12065.0, 69731.0, 1435698.0, 2513885.0, 128222.0, 16401.0, 5022.0, 2153.0, 1085.0, 579.0, 311.0, 192.0, 121.0, 77.0, 48.0, 29.0, 27.0, 14.0, 13.0, 12.0, 4.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.73046875, -2.639801025390625, -2.54913330078125, -2.458465576171875, -2.3677978515625, -2.277130126953125, -2.18646240234375, -2.095794677734375, -2.005126953125, -1.914459228515625, -1.82379150390625, -1.733123779296875, -1.6424560546875, -1.551788330078125, -1.46112060546875, -1.370452880859375, -1.27978515625, -1.189117431640625, -1.09844970703125, -1.007781982421875, -0.9171142578125, -0.826446533203125, -0.73577880859375, -0.645111083984375, -0.554443359375, -0.463775634765625, -0.37310791015625, -0.282440185546875, -0.1917724609375, -0.101104736328125, -0.01043701171875, 0.080230712890625, 0.1708984375, 0.261566162109375, 0.35223388671875, 0.442901611328125, 0.5335693359375, 0.624237060546875, 0.71490478515625, 0.805572509765625, 0.896240234375, 0.986907958984375, 1.07757568359375, 1.168243408203125, 1.2589111328125, 1.349578857421875, 1.44024658203125, 1.530914306640625, 1.62158203125, 1.712249755859375, 1.80291748046875, 1.893585205078125, 1.9842529296875, 2.074920654296875, 2.16558837890625, 2.256256103515625, 2.346923828125, 2.437591552734375, 2.52825927734375, 2.618927001953125, 2.7095947265625, 2.800262451171875, 2.89093017578125, 2.981597900390625, 3.072265625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 1.0, 10.0, 7.0, 9.0, 19.0, 15.0, 17.0, 22.0, 17.0, 31.0, 29.0, 45.0, 49.0, 39.0, 60.0, 69.0, 54.0, 58.0, 65.0, 60.0, 45.0, 47.0, 49.0, 29.0, 39.0, 23.0, 15.0, 18.0, 9.0, 13.0, 6.0, 5.0, 14.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.7452850341796875, -1.693695068359375, -1.6421051025390625, -1.59051513671875, -1.5389251708984375, -1.487335205078125, -1.4357452392578125, -1.3841552734375, -1.3325653076171875, -1.280975341796875, -1.2293853759765625, -1.17779541015625, -1.1262054443359375, -1.074615478515625, -1.0230255126953125, -0.971435546875, -0.9198455810546875, -0.868255615234375, -0.8166656494140625, -0.76507568359375, -0.7134857177734375, -0.661895751953125, -0.6103057861328125, -0.5587158203125, -0.5071258544921875, -0.455535888671875, -0.4039459228515625, -0.35235595703125, -0.3007659912109375, -0.249176025390625, -0.1975860595703125, -0.14599609375, -0.0944061279296875, -0.042816162109375, 0.0087738037109375, 0.06036376953125, 0.1119537353515625, 0.163543701171875, 0.2151336669921875, 0.2667236328125, 0.3183135986328125, 0.369903564453125, 0.4214935302734375, 0.47308349609375, 0.5246734619140625, 0.576263427734375, 0.6278533935546875, 0.679443359375, 0.7310333251953125, 0.782623291015625, 0.8342132568359375, 0.88580322265625, 0.9373931884765625, 0.988983154296875, 1.0405731201171875, 1.0921630859375, 1.1437530517578125, 1.195343017578125, 1.2469329833984375, 1.29852294921875, 1.3501129150390625, 1.401702880859375, 1.4532928466796875, 1.5048828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 9.0, 9.0, 13.0, 11.0, 22.0, 25.0, 27.0, 51.0, 92.0, 135.0, 204.0, 337.0, 736.0, 1493.0, 3547.0, 10588.0, 45461.0, 497350.0, 3403216.0, 189905.0, 27829.0, 7684.0, 2800.0, 1183.0, 599.0, 332.0, 171.0, 126.0, 85.0, 52.0, 46.0, 24.0, 22.0, 17.0, 19.0, 11.0, 14.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9287109375, -1.8581695556640625, -1.787628173828125, -1.7170867919921875, -1.64654541015625, -1.5760040283203125, -1.505462646484375, -1.4349212646484375, -1.3643798828125, -1.2938385009765625, -1.223297119140625, -1.1527557373046875, -1.08221435546875, -1.0116729736328125, -0.941131591796875, -0.8705902099609375, -0.800048828125, -0.7295074462890625, -0.658966064453125, -0.5884246826171875, -0.51788330078125, -0.4473419189453125, -0.376800537109375, -0.3062591552734375, -0.2357177734375, -0.1651763916015625, -0.094635009765625, -0.0240936279296875, 0.04644775390625, 0.1169891357421875, 0.187530517578125, 0.2580718994140625, 0.32861328125, 0.3991546630859375, 0.469696044921875, 0.5402374267578125, 0.61077880859375, 0.6813201904296875, 0.751861572265625, 0.8224029541015625, 0.8929443359375, 0.9634857177734375, 1.034027099609375, 1.1045684814453125, 1.17510986328125, 1.2456512451171875, 1.316192626953125, 1.3867340087890625, 1.457275390625, 1.5278167724609375, 1.598358154296875, 1.6688995361328125, 1.73944091796875, 1.8099822998046875, 1.880523681640625, 1.9510650634765625, 2.0216064453125, 2.0921478271484375, 2.162689208984375, 2.2332305908203125, 2.30377197265625, 2.3743133544921875, 2.444854736328125, 2.5153961181640625, 2.5859375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 8.0, 5.0, 3.0, 5.0, 5.0, 14.0, 9.0, 21.0, 21.0, 28.0, 32.0, 59.0, 59.0, 120.0, 186.0, 321.0, 504.0, 665.0, 683.0, 507.0, 293.0, 164.0, 117.0, 71.0, 49.0, 34.0, 17.0, 21.0, 9.0, 8.0, 11.0, 6.0, 2.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67529296875, -0.65594482421875, -0.6365966796875, -0.61724853515625, -0.597900390625, -0.57855224609375, -0.5592041015625, -0.53985595703125, -0.5205078125, -0.50115966796875, -0.4818115234375, -0.46246337890625, -0.443115234375, -0.42376708984375, -0.4044189453125, -0.38507080078125, -0.36572265625, -0.34637451171875, -0.3270263671875, -0.30767822265625, -0.288330078125, -0.26898193359375, -0.2496337890625, -0.23028564453125, -0.2109375, -0.19158935546875, -0.1722412109375, -0.15289306640625, -0.133544921875, -0.11419677734375, -0.0948486328125, -0.07550048828125, -0.05615234375, -0.03680419921875, -0.0174560546875, 0.00189208984375, 0.021240234375, 0.04058837890625, 0.0599365234375, 0.07928466796875, 0.0986328125, 0.11798095703125, 0.1373291015625, 0.15667724609375, 0.176025390625, 0.19537353515625, 0.2147216796875, 0.23406982421875, 0.25341796875, 0.27276611328125, 0.2921142578125, 0.31146240234375, 0.330810546875, 0.35015869140625, 0.3695068359375, 0.38885498046875, 0.408203125, 0.42755126953125, 0.4468994140625, 0.46624755859375, 0.485595703125, 0.50494384765625, 0.5242919921875, 0.54364013671875, 0.56298828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 7.0, 10.0, 26.0, 32.0, 57.0, 62.0, 97.0, 105.0, 121.0, 121.0, 97.0, 72.0, 55.0, 32.0, 27.0, 24.0, 12.0, 8.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.478421688079834, -2.3924384117126465, -2.30645489692688, -2.2204716205596924, -2.134488105773926, -2.0485048294067383, -1.9625215530395508, -1.8765381574630737, -1.7905547618865967, -1.7045713663101196, -1.6185879707336426, -1.532604694366455, -1.446621298789978, -1.360637903213501, -1.2746546268463135, -1.1886712312698364, -1.1026878356933594, -1.0167044401168823, -0.93072110414505, -0.8447377681732178, -0.7587543725967407, -0.6727709770202637, -0.5867876410484314, -0.5008043050765991, -0.41482090950012207, -0.3288375437259674, -0.24285417795181274, -0.15687081217765808, -0.07088744640350342, 0.015095919370651245, 0.10107928514480591, 0.18706262111663818, 0.27304577827453613, 0.3590291440486908, 0.44501250982284546, 0.5309958457946777, 0.6169792413711548, 0.7029626369476318, 0.7889459729194641, 0.8749293088912964, 0.9609127044677734, 1.0468961000442505, 1.1328794956207275, 1.218862771987915, 1.304846167564392, 1.3908295631408691, 1.4768128395080566, 1.5627962350845337, 1.6487796306610107, 1.7347630262374878, 1.8207464218139648, 1.9067296981811523, 1.9927130937576294, 2.0786964893341064, 2.164679765701294, 2.2506632804870605, 2.336646556854248, 2.4226298332214355, 2.508613348007202, 2.5945966243743896, 2.6805801391601562, 2.7665634155273438, 2.8525466918945312, 2.9385299682617188, 3.0245134830474854]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 12.0, 9.0, 8.0, 13.0, 18.0, 20.0, 19.0, 24.0, 27.0, 35.0, 35.0, 33.0, 41.0, 39.0, 38.0, 37.0, 38.0, 45.0, 45.0, 44.0, 38.0, 40.0, 42.0, 44.0, 29.0, 28.0, 22.0, 21.0, 22.0, 22.0, 15.0, 25.0, 9.0, 10.0, 8.0, 13.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2231305837631226, -1.1789320707321167, -1.1347335577011108, -1.0905351638793945, -1.0463366508483887, -1.0021381378173828, -0.957939624786377, -0.9137411117553711, -0.8695425987243652, -0.8253440856933594, -0.7811456322669983, -0.7369471192359924, -0.6927486062049866, -0.6485501527786255, -0.6043516397476196, -0.5601531267166138, -0.5159546732902527, -0.4717561900615692, -0.42755767703056335, -0.3833591938018799, -0.339160680770874, -0.29496219754219055, -0.2507637143135071, -0.20656520128250122, -0.16236671805381775, -0.11816821992397308, -0.07396972924470901, -0.029771238565444946, 0.01442725956439972, 0.058625757694244385, 0.10282424092292786, 0.14702275395393372, 0.1912212371826172, 0.23541973531246185, 0.2796182334423065, 0.32381671667099, 0.36801522970199585, 0.4122137129306793, 0.4564121961593628, 0.5006107091903687, 0.5448092222213745, 0.5890077352523804, 0.6332061886787415, 0.6774047017097473, 0.7216032147407532, 0.7658016681671143, 0.8100001811981201, 0.854198694229126, 0.8983971476554871, 0.9425956606864929, 0.986794114112854, 1.0309926271438599, 1.0751911401748657, 1.1193896532058716, 1.163588047027588, 1.2077865600585938, 1.2519850730895996, 1.2961835861206055, 1.3403820991516113, 1.3845806121826172, 1.4287790060043335, 1.4729775190353394, 1.5171760320663452, 1.561374545097351, 1.605573058128357]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 9.0, 20.0, 25.0, 31.0, 36.0, 46.0, 68.0, 105.0, 180.0, 280.0, 485.0, 805.0, 1462.0, 3062.0, 6794.0, 16657.0, 46084.0, 129914.0, 300637.0, 315434.0, 142843.0, 50730.0, 18527.0, 7322.0, 3165.0, 1602.0, 823.0, 453.0, 280.0, 210.0, 134.0, 92.0, 65.0, 48.0, 28.0, 23.0, 8.0, 10.0, 6.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.251708984375, -0.2433319091796875, -0.234954833984375, -0.2265777587890625, -0.21820068359375, -0.2098236083984375, -0.201446533203125, -0.1930694580078125, -0.1846923828125, -0.1763153076171875, -0.167938232421875, -0.1595611572265625, -0.15118408203125, -0.1428070068359375, -0.134429931640625, -0.1260528564453125, -0.11767578125, -0.1092987060546875, -0.100921630859375, -0.0925445556640625, -0.08416748046875, -0.0757904052734375, -0.067413330078125, -0.0590362548828125, -0.0506591796875, -0.0422821044921875, -0.033905029296875, -0.0255279541015625, -0.01715087890625, -0.0087738037109375, -0.000396728515625, 0.0079803466796875, 0.016357421875, 0.0247344970703125, 0.033111572265625, 0.0414886474609375, 0.04986572265625, 0.0582427978515625, 0.066619873046875, 0.0749969482421875, 0.0833740234375, 0.0917510986328125, 0.100128173828125, 0.1085052490234375, 0.11688232421875, 0.1252593994140625, 0.133636474609375, 0.1420135498046875, 0.150390625, 0.1587677001953125, 0.167144775390625, 0.1755218505859375, 0.18389892578125, 0.1922760009765625, 0.200653076171875, 0.2090301513671875, 0.2174072265625, 0.2257843017578125, 0.234161376953125, 0.2425384521484375, 0.25091552734375, 0.2592926025390625, 0.267669677734375, 0.2760467529296875, 0.284423828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 7.0, 8.0, 15.0, 15.0, 14.0, 16.0, 29.0, 34.0, 40.0, 39.0, 36.0, 62.0, 37.0, 57.0, 50.0, 65.0, 50.0, 64.0, 53.0, 48.0, 38.0, 33.0, 22.0, 39.0, 20.0, 15.0, 16.0, 14.0, 10.0, 14.0, 9.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0068359375, -0.968353271484375, -0.92987060546875, -0.891387939453125, -0.8529052734375, -0.814422607421875, -0.77593994140625, -0.737457275390625, -0.698974609375, -0.660491943359375, -0.62200927734375, -0.583526611328125, -0.5450439453125, -0.506561279296875, -0.46807861328125, -0.429595947265625, -0.39111328125, -0.352630615234375, -0.31414794921875, -0.275665283203125, -0.2371826171875, -0.198699951171875, -0.16021728515625, -0.121734619140625, -0.083251953125, -0.044769287109375, -0.00628662109375, 0.032196044921875, 0.0706787109375, 0.109161376953125, 0.14764404296875, 0.186126708984375, 0.224609375, 0.263092041015625, 0.30157470703125, 0.340057373046875, 0.3785400390625, 0.417022705078125, 0.45550537109375, 0.493988037109375, 0.532470703125, 0.570953369140625, 0.60943603515625, 0.647918701171875, 0.6864013671875, 0.724884033203125, 0.76336669921875, 0.801849365234375, 0.84033203125, 0.878814697265625, 0.91729736328125, 0.955780029296875, 0.9942626953125, 1.032745361328125, 1.07122802734375, 1.109710693359375, 1.148193359375, 1.186676025390625, 1.22515869140625, 1.263641357421875, 1.3021240234375, 1.340606689453125, 1.37908935546875, 1.417572021484375, 1.4560546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 8.0, 6.0, 4.0, 6.0, 14.0, 19.0, 23.0, 38.0, 49.0, 79.0, 87.0, 149.0, 231.0, 404.0, 729.0, 1540.0, 3271.0, 7853.0, 20239.0, 59133.0, 173736.0, 354552.0, 269623.0, 101209.0, 33912.0, 12101.0, 4808.0, 2206.0, 1065.0, 558.0, 333.0, 173.0, 115.0, 74.0, 59.0, 39.0, 29.0, 17.0, 19.0, 7.0, 11.0, 10.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.262451171875, -0.25391387939453125, -0.2453765869140625, -0.23683929443359375, -0.228302001953125, -0.21976470947265625, -0.2112274169921875, -0.20269012451171875, -0.19415283203125, -0.18561553955078125, -0.1770782470703125, -0.16854095458984375, -0.160003662109375, -0.15146636962890625, -0.1429290771484375, -0.13439178466796875, -0.1258544921875, -0.11731719970703125, -0.1087799072265625, -0.10024261474609375, -0.091705322265625, -0.08316802978515625, -0.0746307373046875, -0.06609344482421875, -0.05755615234375, -0.04901885986328125, -0.0404815673828125, -0.03194427490234375, -0.023406982421875, -0.01486968994140625, -0.0063323974609375, 0.00220489501953125, 0.0107421875, 0.01927947998046875, 0.0278167724609375, 0.03635406494140625, 0.044891357421875, 0.05342864990234375, 0.0619659423828125, 0.07050323486328125, 0.07904052734375, 0.08757781982421875, 0.0961151123046875, 0.10465240478515625, 0.113189697265625, 0.12172698974609375, 0.1302642822265625, 0.13880157470703125, 0.1473388671875, 0.15587615966796875, 0.1644134521484375, 0.17295074462890625, 0.181488037109375, 0.19002532958984375, 0.1985626220703125, 0.20709991455078125, 0.21563720703125, 0.22417449951171875, 0.2327117919921875, 0.24124908447265625, 0.249786376953125, 0.25832366943359375, 0.2668609619140625, 0.27539825439453125, 0.283935546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 1.0, 10.0, 14.0, 17.0, 16.0, 20.0, 28.0, 27.0, 36.0, 42.0, 54.0, 31.0, 53.0, 56.0, 41.0, 46.0, 57.0, 47.0, 51.0, 51.0, 37.0, 53.0, 23.0, 34.0, 25.0, 19.0, 16.0, 14.0, 8.0, 14.0, 8.0, 13.0, 8.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-2.509765625, -2.4396209716796875, -2.369476318359375, -2.2993316650390625, -2.22918701171875, -2.1590423583984375, -2.088897705078125, -2.0187530517578125, -1.9486083984375, -1.8784637451171875, -1.808319091796875, -1.7381744384765625, -1.66802978515625, -1.5978851318359375, -1.527740478515625, -1.4575958251953125, -1.387451171875, -1.3173065185546875, -1.247161865234375, -1.1770172119140625, -1.10687255859375, -1.0367279052734375, -0.966583251953125, -0.8964385986328125, -0.8262939453125, -0.7561492919921875, -0.686004638671875, -0.6158599853515625, -0.54571533203125, -0.4755706787109375, -0.405426025390625, -0.3352813720703125, -0.26513671875, -0.1949920654296875, -0.124847412109375, -0.0547027587890625, 0.01544189453125, 0.0855865478515625, 0.155731201171875, 0.2258758544921875, 0.2960205078125, 0.3661651611328125, 0.436309814453125, 0.5064544677734375, 0.57659912109375, 0.6467437744140625, 0.716888427734375, 0.7870330810546875, 0.857177734375, 0.9273223876953125, 0.997467041015625, 1.0676116943359375, 1.13775634765625, 1.2079010009765625, 1.278045654296875, 1.3481903076171875, 1.4183349609375, 1.4884796142578125, 1.558624267578125, 1.6287689208984375, 1.69891357421875, 1.7690582275390625, 1.839202880859375, 1.9093475341796875, 1.9794921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 23.0, 20.0, 33.0, 32.0, 40.0, 90.0, 118.0, 172.0, 232.0, 407.0, 667.0, 1252.0, 2334.0, 4994.0, 12666.0, 37252.0, 128534.0, 353099.0, 334610.0, 116026.0, 34362.0, 11679.0, 4774.0, 2175.0, 1151.0, 661.0, 378.0, 240.0, 154.0, 112.0, 78.0, 43.0, 42.0, 19.0, 19.0, 8.0, 10.0, 7.0, 7.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0888671875, -0.08625030517578125, -0.0836334228515625, -0.08101654052734375, -0.078399658203125, -0.07578277587890625, -0.0731658935546875, -0.07054901123046875, -0.06793212890625, -0.06531524658203125, -0.0626983642578125, -0.06008148193359375, -0.057464599609375, -0.05484771728515625, -0.0522308349609375, -0.04961395263671875, -0.0469970703125, -0.04438018798828125, -0.0417633056640625, -0.03914642333984375, -0.036529541015625, -0.03391265869140625, -0.0312957763671875, -0.02867889404296875, -0.02606201171875, -0.02344512939453125, -0.0208282470703125, -0.01821136474609375, -0.015594482421875, -0.01297760009765625, -0.0103607177734375, -0.00774383544921875, -0.005126953125, -0.00251007080078125, 0.0001068115234375, 0.00272369384765625, 0.005340576171875, 0.00795745849609375, 0.0105743408203125, 0.01319122314453125, 0.01580810546875, 0.01842498779296875, 0.0210418701171875, 0.02365875244140625, 0.026275634765625, 0.02889251708984375, 0.0315093994140625, 0.03412628173828125, 0.0367431640625, 0.03936004638671875, 0.0419769287109375, 0.04459381103515625, 0.047210693359375, 0.04982757568359375, 0.0524444580078125, 0.05506134033203125, 0.05767822265625, 0.06029510498046875, 0.0629119873046875, 0.06552886962890625, 0.068145751953125, 0.07076263427734375, 0.0733795166015625, 0.07599639892578125, 0.07861328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 8.0, 9.0, 9.0, 10.0, 25.0, 34.0, 42.0, 47.0, 60.0, 69.0, 94.0, 87.0, 95.0, 72.0, 70.0, 65.0, 48.0, 40.0, 28.0, 22.0, 23.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.2751431465148926e-05, -4.1097402572631836e-05, -3.9443373680114746e-05, -3.7789344787597656e-05, -3.6135315895080566e-05, -3.4481287002563477e-05, -3.282725811004639e-05, -3.11732292175293e-05, -2.9519200325012207e-05, -2.7865171432495117e-05, -2.6211142539978027e-05, -2.4557113647460938e-05, -2.2903084754943848e-05, -2.1249055862426758e-05, -1.9595026969909668e-05, -1.7940998077392578e-05, -1.6286969184875488e-05, -1.4632940292358398e-05, -1.2978911399841309e-05, -1.1324882507324219e-05, -9.670853614807129e-06, -8.016824722290039e-06, -6.362795829772949e-06, -4.708766937255859e-06, -3.0547380447387695e-06, -1.4007091522216797e-06, 2.5331974029541016e-07, 1.9073486328125e-06, 3.56137752532959e-06, 5.21540641784668e-06, 6.8694353103637695e-06, 8.52346420288086e-06, 1.017749309539795e-05, 1.1831521987915039e-05, 1.3485550880432129e-05, 1.5139579772949219e-05, 1.679360866546631e-05, 1.84476375579834e-05, 2.0101666450500488e-05, 2.1755695343017578e-05, 2.3409724235534668e-05, 2.5063753128051758e-05, 2.6717782020568848e-05, 2.8371810913085938e-05, 3.0025839805603027e-05, 3.167986869812012e-05, 3.333389759063721e-05, 3.49879264831543e-05, 3.664195537567139e-05, 3.8295984268188477e-05, 3.9950013160705566e-05, 4.1604042053222656e-05, 4.3258070945739746e-05, 4.4912099838256836e-05, 4.6566128730773926e-05, 4.8220157623291016e-05, 4.9874186515808105e-05, 5.1528215408325195e-05, 5.3182244300842285e-05, 5.4836273193359375e-05, 5.6490302085876465e-05, 5.8144330978393555e-05, 5.9798359870910645e-05, 6.145238876342773e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 10.0, 16.0, 19.0, 24.0, 41.0, 61.0, 96.0, 167.0, 302.0, 531.0, 1260.0, 3830.0, 14089.0, 65045.0, 290215.0, 465575.0, 161862.0, 33321.0, 7849.0, 2422.0, 921.0, 364.0, 217.0, 106.0, 69.0, 45.0, 24.0, 18.0, 15.0, 16.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.131591796875, -0.12815475463867188, -0.12471771240234375, -0.12128067016601562, -0.1178436279296875, -0.11440658569335938, -0.11096954345703125, -0.10753250122070312, -0.104095458984375, -0.10065841674804688, -0.09722137451171875, -0.09378433227539062, -0.0903472900390625, -0.08691024780273438, -0.08347320556640625, -0.08003616333007812, -0.07659912109375, -0.07316207885742188, -0.06972503662109375, -0.06628799438476562, -0.0628509521484375, -0.059413909912109375, -0.05597686767578125, -0.052539825439453125, -0.049102783203125, -0.045665740966796875, -0.04222869873046875, -0.038791656494140625, -0.0353546142578125, -0.031917572021484375, -0.02848052978515625, -0.025043487548828125, -0.0216064453125, -0.018169403076171875, -0.01473236083984375, -0.011295318603515625, -0.0078582763671875, -0.004421234130859375, -0.00098419189453125, 0.002452850341796875, 0.005889892578125, 0.009326934814453125, 0.01276397705078125, 0.016201019287109375, 0.0196380615234375, 0.023075103759765625, 0.02651214599609375, 0.029949188232421875, 0.03338623046875, 0.036823272705078125, 0.04026031494140625, 0.043697357177734375, 0.0471343994140625, 0.050571441650390625, 0.05400848388671875, 0.057445526123046875, 0.060882568359375, 0.06431961059570312, 0.06775665283203125, 0.07119369506835938, 0.0746307373046875, 0.07806777954101562, 0.08150482177734375, 0.08494186401367188, 0.08837890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 12.0, 8.0, 12.0, 10.0, 15.0, 22.0, 23.0, 24.0, 43.0, 30.0, 42.0, 66.0, 61.0, 59.0, 62.0, 47.0, 58.0, 53.0, 59.0, 47.0, 47.0, 29.0, 27.0, 20.0, 24.0, 18.0, 10.0, 17.0, 13.0, 7.0, 6.0, 3.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02105712890625, -0.020326614379882812, -0.019596099853515625, -0.018865585327148438, -0.01813507080078125, -0.017404556274414062, -0.016674041748046875, -0.015943527221679688, -0.0152130126953125, -0.014482498168945312, -0.013751983642578125, -0.013021469116210938, -0.01229095458984375, -0.011560440063476562, -0.010829925537109375, -0.010099411010742188, -0.009368896484375, -0.008638381958007812, -0.007907867431640625, -0.0071773529052734375, -0.00644683837890625, -0.0057163238525390625, -0.004985809326171875, -0.0042552947998046875, -0.0035247802734375, -0.0027942657470703125, -0.002063751220703125, -0.0013332366943359375, -0.00060272216796875, 0.0001277923583984375, 0.000858306884765625, 0.0015888214111328125, 0.0023193359375, 0.0030498504638671875, 0.003780364990234375, 0.0045108795166015625, 0.00524139404296875, 0.0059719085693359375, 0.006702423095703125, 0.0074329376220703125, 0.0081634521484375, 0.008893966674804688, 0.009624481201171875, 0.010354995727539062, 0.01108551025390625, 0.011816024780273438, 0.012546539306640625, 0.013277053833007812, 0.014007568359375, 0.014738082885742188, 0.015468597412109375, 0.016199111938476562, 0.01692962646484375, 0.017660140991210938, 0.018390655517578125, 0.019121170043945312, 0.0198516845703125, 0.020582199096679688, 0.021312713623046875, 0.022043228149414062, 0.02277374267578125, 0.023504257202148438, 0.024234771728515625, 0.024965286254882812, 0.02569580078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 14.0, 46.0, 173.0, 390.0, 269.0, 73.0, 21.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.299095630645752, -5.120827674865723, -4.942559719085693, -4.764291763305664, -4.586023330688477, -4.407755374908447, -4.229487419128418, -4.051219463348389, -3.8729512691497803, -3.694683313369751, -3.5164151191711426, -3.3381471633911133, -3.159879207611084, -2.9816110134124756, -2.8033430576324463, -2.625074863433838, -2.4468069076538086, -2.2685389518737793, -2.090270757675171, -1.9120028018951416, -1.7337347269058228, -1.555466651916504, -1.3771986961364746, -1.1989306211471558, -1.020662546157837, -0.8423944711685181, -0.664126455783844, -0.4858584403991699, -0.3075903654098511, -0.12932229042053223, 0.04894566535949707, 0.22721374034881592, 0.40548181533813477, 0.5837498903274536, 0.7620179057121277, 0.9402859210968018, 1.1185539960861206, 1.2968220710754395, 1.4750900268554688, 1.6533581018447876, 1.8316261768341064, 2.0098941326141357, 2.188162326812744, 2.3664302825927734, 2.5446982383728027, 2.722966432571411, 2.9012343883514404, 3.079502582550049, 3.257770538330078, 3.4360384941101074, 3.614306688308716, 3.792574644088745, 3.9708428382873535, 4.149110794067383, 4.327378749847412, 4.505646705627441, 4.683915138244629, 4.862183094024658, 5.0404510498046875, 5.218719482421875, 5.396987438201904, 5.575255393981934, 5.753523349761963, 5.931791305541992, 6.1100592613220215]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 9.0, 5.0, 8.0, 17.0, 16.0, 20.0, 15.0, 35.0, 19.0, 46.0, 38.0, 41.0, 56.0, 49.0, 40.0, 45.0, 57.0, 51.0, 49.0, 52.0, 47.0, 53.0, 38.0, 25.0, 23.0, 24.0, 25.0, 18.0, 20.0, 12.0, 11.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9607269167900085, -0.9244585633277893, -0.8881902098655701, -0.8519218564033508, -0.8156535029411316, -0.7793851494789124, -0.7431167364120483, -0.7068483829498291, -0.6705800294876099, -0.6343116760253906, -0.5980433225631714, -0.5617749691009521, -0.5255066156387329, -0.48923826217651367, -0.45296987891197205, -0.4167015254497528, -0.38043320178985596, -0.3441648483276367, -0.3078964948654175, -0.27162814140319824, -0.2353597730398178, -0.19909141957759857, -0.16282305121421814, -0.1265546977519989, -0.09028634428977966, -0.054017987102270126, -0.01774962991476059, 0.018518730998039246, 0.054787084460258484, 0.09105543792247772, 0.12732380628585815, 0.1635921597480774, 0.1998605728149414, 0.23612892627716064, 0.2723972797393799, 0.3086656332015991, 0.34493398666381836, 0.3812023401260376, 0.4174707233905792, 0.45373907685279846, 0.4900074303150177, 0.5262758135795593, 0.5625441670417786, 0.5988125205039978, 0.635080873966217, 0.6713492274284363, 0.7076175808906555, 0.7438859343528748, 0.780154287815094, 0.8164226412773132, 0.8526909947395325, 0.8889593482017517, 0.925227701663971, 0.9614960551261902, 0.9977644681930542, 1.0340328216552734, 1.0703011751174927, 1.106569528579712, 1.1428378820419312, 1.1791062355041504, 1.2153745889663696, 1.2516429424285889, 1.287911295890808, 1.3241796493530273, 1.3604480028152466]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 8.0, 21.0, 23.0, 22.0, 36.0, 69.0, 120.0, 152.0, 261.0, 405.0, 721.0, 1453.0, 3134.0, 7638.0, 22445.0, 88508.0, 471496.0, 355365.0, 66835.0, 17948.0, 6284.0, 2627.0, 1276.0, 685.0, 389.0, 221.0, 125.0, 91.0, 54.0, 36.0, 22.0, 28.0, 8.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1845703125, -1.1474456787109375, -1.110321044921875, -1.0731964111328125, -1.03607177734375, -0.9989471435546875, -0.961822509765625, -0.9246978759765625, -0.8875732421875, -0.8504486083984375, -0.813323974609375, -0.7761993408203125, -0.73907470703125, -0.7019500732421875, -0.664825439453125, -0.6277008056640625, -0.590576171875, -0.5534515380859375, -0.516326904296875, -0.4792022705078125, -0.44207763671875, -0.4049530029296875, -0.367828369140625, -0.3307037353515625, -0.2935791015625, -0.2564544677734375, -0.219329833984375, -0.1822052001953125, -0.14508056640625, -0.1079559326171875, -0.070831298828125, -0.0337066650390625, 0.00341796875, 0.0405426025390625, 0.077667236328125, 0.1147918701171875, 0.15191650390625, 0.1890411376953125, 0.226165771484375, 0.2632904052734375, 0.3004150390625, 0.3375396728515625, 0.374664306640625, 0.4117889404296875, 0.44891357421875, 0.4860382080078125, 0.523162841796875, 0.5602874755859375, 0.597412109375, 0.6345367431640625, 0.671661376953125, 0.7087860107421875, 0.74591064453125, 0.7830352783203125, 0.820159912109375, 0.8572845458984375, 0.8944091796875, 0.9315338134765625, 0.968658447265625, 1.0057830810546875, 1.04290771484375, 1.0800323486328125, 1.117156982421875, 1.1542816162109375, 1.19140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 6.0, 10.0, 12.0, 16.0, 10.0, 26.0, 23.0, 21.0, 30.0, 36.0, 38.0, 42.0, 40.0, 47.0, 45.0, 46.0, 51.0, 49.0, 45.0, 53.0, 45.0, 34.0, 43.0, 31.0, 23.0, 31.0, 20.0, 24.0, 16.0, 13.0, 17.0, 11.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.041015625, -1.974334716796875, -1.90765380859375, -1.840972900390625, -1.7742919921875, -1.707611083984375, -1.64093017578125, -1.574249267578125, -1.507568359375, -1.440887451171875, -1.37420654296875, -1.307525634765625, -1.2408447265625, -1.174163818359375, -1.10748291015625, -1.040802001953125, -0.97412109375, -0.907440185546875, -0.84075927734375, -0.774078369140625, -0.7073974609375, -0.640716552734375, -0.57403564453125, -0.507354736328125, -0.440673828125, -0.373992919921875, -0.30731201171875, -0.240631103515625, -0.1739501953125, -0.107269287109375, -0.04058837890625, 0.026092529296875, 0.0927734375, 0.159454345703125, 0.22613525390625, 0.292816162109375, 0.3594970703125, 0.426177978515625, 0.49285888671875, 0.559539794921875, 0.626220703125, 0.692901611328125, 0.75958251953125, 0.826263427734375, 0.8929443359375, 0.959625244140625, 1.02630615234375, 1.092987060546875, 1.15966796875, 1.226348876953125, 1.29302978515625, 1.359710693359375, 1.4263916015625, 1.493072509765625, 1.55975341796875, 1.626434326171875, 1.693115234375, 1.759796142578125, 1.82647705078125, 1.893157958984375, 1.9598388671875, 2.026519775390625, 2.09320068359375, 2.159881591796875, 2.2265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 6.0, 21.0, 25.0, 40.0, 65.0, 148.0, 375.0, 1141.0, 7902.0, 806319.0, 227088.0, 4121.0, 730.0, 257.0, 134.0, 57.0, 39.0, 25.0, 19.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.182525634765625, -5.05255126953125, -4.922576904296875, -4.7926025390625, -4.662628173828125, -4.53265380859375, -4.402679443359375, -4.272705078125, -4.142730712890625, -4.01275634765625, -3.882781982421875, -3.7528076171875, -3.622833251953125, -3.49285888671875, -3.362884521484375, -3.23291015625, -3.102935791015625, -2.97296142578125, -2.842987060546875, -2.7130126953125, -2.583038330078125, -2.45306396484375, -2.323089599609375, -2.193115234375, -2.063140869140625, -1.93316650390625, -1.803192138671875, -1.6732177734375, -1.543243408203125, -1.41326904296875, -1.283294677734375, -1.1533203125, -1.023345947265625, -0.89337158203125, -0.763397216796875, -0.6334228515625, -0.503448486328125, -0.37347412109375, -0.243499755859375, -0.113525390625, 0.016448974609375, 0.14642333984375, 0.276397705078125, 0.4063720703125, 0.536346435546875, 0.66632080078125, 0.796295166015625, 0.92626953125, 1.056243896484375, 1.18621826171875, 1.316192626953125, 1.4461669921875, 1.576141357421875, 1.70611572265625, 1.836090087890625, 1.966064453125, 2.096038818359375, 2.22601318359375, 2.355987548828125, 2.4859619140625, 2.615936279296875, 2.74591064453125, 2.875885009765625, 3.005859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 14.0, 20.0, 14.0, 27.0, 30.0, 33.0, 41.0, 52.0, 39.0, 47.0, 80.0, 56.0, 71.0, 55.0, 47.0, 56.0, 46.0, 40.0, 34.0, 29.0, 31.0, 18.0, 31.0, 12.0, 15.0, 9.0, 4.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.904266357421875, -3.79681396484375, -3.689361572265625, -3.5819091796875, -3.474456787109375, -3.36700439453125, -3.259552001953125, -3.152099609375, -3.044647216796875, -2.93719482421875, -2.829742431640625, -2.7222900390625, -2.614837646484375, -2.50738525390625, -2.399932861328125, -2.29248046875, -2.185028076171875, -2.07757568359375, -1.970123291015625, -1.8626708984375, -1.755218505859375, -1.64776611328125, -1.540313720703125, -1.432861328125, -1.325408935546875, -1.21795654296875, -1.110504150390625, -1.0030517578125, -0.895599365234375, -0.78814697265625, -0.680694580078125, -0.5732421875, -0.465789794921875, -0.35833740234375, -0.250885009765625, -0.1434326171875, -0.035980224609375, 0.07147216796875, 0.178924560546875, 0.286376953125, 0.393829345703125, 0.50128173828125, 0.608734130859375, 0.7161865234375, 0.823638916015625, 0.93109130859375, 1.038543701171875, 1.14599609375, 1.253448486328125, 1.36090087890625, 1.468353271484375, 1.5758056640625, 1.683258056640625, 1.79071044921875, 1.898162841796875, 2.005615234375, 2.113067626953125, 2.22052001953125, 2.327972412109375, 2.4354248046875, 2.542877197265625, 2.65032958984375, 2.757781982421875, 2.865234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 11.0, 28.0, 53.0, 144.0, 441.0, 1918.0, 92640.0, 947005.0, 5223.0, 702.0, 201.0, 85.0, 45.0, 15.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.603546142578125, -2.52740478515625, -2.451263427734375, -2.3751220703125, -2.298980712890625, -2.22283935546875, -2.146697998046875, -2.070556640625, -1.994415283203125, -1.91827392578125, -1.842132568359375, -1.7659912109375, -1.689849853515625, -1.61370849609375, -1.537567138671875, -1.46142578125, -1.385284423828125, -1.30914306640625, -1.233001708984375, -1.1568603515625, -1.080718994140625, -1.00457763671875, -0.928436279296875, -0.852294921875, -0.776153564453125, -0.70001220703125, -0.623870849609375, -0.5477294921875, -0.471588134765625, -0.39544677734375, -0.319305419921875, -0.2431640625, -0.167022705078125, -0.09088134765625, -0.014739990234375, 0.0614013671875, 0.137542724609375, 0.21368408203125, 0.289825439453125, 0.365966796875, 0.442108154296875, 0.51824951171875, 0.594390869140625, 0.6705322265625, 0.746673583984375, 0.82281494140625, 0.898956298828125, 0.97509765625, 1.051239013671875, 1.12738037109375, 1.203521728515625, 1.2796630859375, 1.355804443359375, 1.43194580078125, 1.508087158203125, 1.584228515625, 1.660369873046875, 1.73651123046875, 1.812652587890625, 1.8887939453125, 1.964935302734375, 2.04107666015625, 2.117218017578125, 2.193359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 16.0, 26.0, 61.0, 103.0, 214.0, 292.0, 142.0, 68.0, 28.0, 27.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001742839813232422, -0.00016739219427108765, -0.0001605004072189331, -0.00015360862016677856, -0.00014671683311462402, -0.00013982504606246948, -0.00013293325901031494, -0.0001260414719581604, -0.00011914968490600586, -0.00011225789785385132, -0.00010536611080169678, -9.847432374954224e-05, -9.15825366973877e-05, -8.469074964523315e-05, -7.779896259307861e-05, -7.090717554092407e-05, -6.401538848876953e-05, -5.712360143661499e-05, -5.023181438446045e-05, -4.334002733230591e-05, -3.644824028015137e-05, -2.9556453227996826e-05, -2.2664666175842285e-05, -1.5772879123687744e-05, -8.881092071533203e-06, -1.989305019378662e-06, 4.902482032775879e-06, 1.179426908493042e-05, 1.868605613708496e-05, 2.5577843189239502e-05, 3.246963024139404e-05, 3.9361417293548584e-05, 4.6253204345703125e-05, 5.3144991397857666e-05, 6.003677845001221e-05, 6.692856550216675e-05, 7.382035255432129e-05, 8.071213960647583e-05, 8.760392665863037e-05, 9.449571371078491e-05, 0.00010138750076293945, 0.000108279287815094, 0.00011517107486724854, 0.00012206286191940308, 0.00012895464897155762, 0.00013584643602371216, 0.0001427382230758667, 0.00014963001012802124, 0.00015652179718017578, 0.00016341358423233032, 0.00017030537128448486, 0.0001771971583366394, 0.00018408894538879395, 0.00019098073244094849, 0.00019787251949310303, 0.00020476430654525757, 0.0002116560935974121, 0.00021854788064956665, 0.0002254396677017212, 0.00023233145475387573, 0.00023922324180603027, 0.0002461150288581848, 0.00025300681591033936, 0.0002598986029624939, 0.00026679039001464844]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 15.0, 14.0, 16.0, 24.0, 68.0, 120.0, 338.0, 915.0, 3894.0, 55646.0, 957130.0, 26353.0, 2741.0, 787.0, 239.0, 101.0, 39.0, 28.0, 21.0, 10.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.669921875, -1.6167449951171875, -1.563568115234375, -1.5103912353515625, -1.45721435546875, -1.4040374755859375, -1.350860595703125, -1.2976837158203125, -1.2445068359375, -1.1913299560546875, -1.138153076171875, -1.0849761962890625, -1.03179931640625, -0.9786224365234375, -0.925445556640625, -0.8722686767578125, -0.819091796875, -0.7659149169921875, -0.712738037109375, -0.6595611572265625, -0.60638427734375, -0.5532073974609375, -0.500030517578125, -0.4468536376953125, -0.3936767578125, -0.3404998779296875, -0.287322998046875, -0.2341461181640625, -0.18096923828125, -0.1277923583984375, -0.074615478515625, -0.0214385986328125, 0.03173828125, 0.0849151611328125, 0.138092041015625, 0.1912689208984375, 0.24444580078125, 0.2976226806640625, 0.350799560546875, 0.4039764404296875, 0.4571533203125, 0.5103302001953125, 0.563507080078125, 0.6166839599609375, 0.66986083984375, 0.7230377197265625, 0.776214599609375, 0.8293914794921875, 0.882568359375, 0.9357452392578125, 0.988922119140625, 1.0420989990234375, 1.09527587890625, 1.1484527587890625, 1.201629638671875, 1.2548065185546875, 1.3079833984375, 1.3611602783203125, 1.414337158203125, 1.4675140380859375, 1.52069091796875, 1.5738677978515625, 1.627044677734375, 1.6802215576171875, 1.7333984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 1.0, 17.0, 12.0, 17.0, 41.0, 39.0, 74.0, 137.0, 176.0, 152.0, 98.0, 61.0, 50.0, 29.0, 22.0, 15.0, 14.0, 6.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.443115234375, -0.42999267578125, -0.4168701171875, -0.40374755859375, -0.390625, -0.37750244140625, -0.3643798828125, -0.35125732421875, -0.338134765625, -0.32501220703125, -0.3118896484375, -0.29876708984375, -0.28564453125, -0.27252197265625, -0.2593994140625, -0.24627685546875, -0.233154296875, -0.22003173828125, -0.2069091796875, -0.19378662109375, -0.1806640625, -0.16754150390625, -0.1544189453125, -0.14129638671875, -0.128173828125, -0.11505126953125, -0.1019287109375, -0.08880615234375, -0.07568359375, -0.06256103515625, -0.0494384765625, -0.03631591796875, -0.023193359375, -0.01007080078125, 0.0030517578125, 0.01617431640625, 0.029296875, 0.04241943359375, 0.0555419921875, 0.06866455078125, 0.081787109375, 0.09490966796875, 0.1080322265625, 0.12115478515625, 0.13427734375, 0.14739990234375, 0.1605224609375, 0.17364501953125, 0.186767578125, 0.19989013671875, 0.2130126953125, 0.22613525390625, 0.2392578125, 0.25238037109375, 0.2655029296875, 0.27862548828125, 0.291748046875, 0.30487060546875, 0.3179931640625, 0.33111572265625, 0.34423828125, 0.35736083984375, 0.3704833984375, 0.38360595703125, 0.396728515625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 15.0, 39.0, 124.0, 280.0, 338.0, 136.0, 41.0, 18.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2233095169067383, -2.903202533721924, -2.5830955505371094, -2.262988567352295, -1.9428815841674805, -1.622774600982666, -1.3026676177978516, -0.9825606346130371, -0.6624536514282227, -0.3423466682434082, -0.02223968505859375, 0.2978672981262207, 0.6179742813110352, 0.9380812644958496, 1.258188247680664, 1.5782952308654785, 1.898402214050293, 2.2185091972351074, 2.538616180419922, 2.8587231636047363, 3.178830146789551, 3.4989371299743652, 3.8190441131591797, 4.139151096343994, 4.459258079528809, 4.779365062713623, 5.0994720458984375, 5.419579029083252, 5.739686012268066, 6.059792995452881, 6.379899978637695, 6.70000696182251, 7.020114898681641, 7.340221881866455, 7.6603288650512695, 7.980435848236084, 8.300542831420898, 8.620649337768555, 8.940756797790527, 9.2608642578125, 9.580970764160156, 9.901077270507812, 10.221184730529785, 10.541292190551758, 10.861398696899414, 11.18150520324707, 11.501612663269043, 11.821720123291016, 12.141826629638672, 12.461933135986328, 12.7820405960083, 13.102148056030273, 13.42225456237793, 13.742361068725586, 14.062468528747559, 14.382575988769531, 14.702682495117188, 15.022789001464844, 15.342896461486816, 15.663003921508789, 15.983110427856445, 16.3032169342041, 16.62332534790039, 16.943431854248047, 17.263538360595703]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 8.0, 16.0, 15.0, 18.0, 23.0, 27.0, 40.0, 31.0, 32.0, 49.0, 35.0, 44.0, 49.0, 59.0, 58.0, 37.0, 56.0, 63.0, 47.0, 48.0, 47.0, 45.0, 21.0, 30.0, 22.0, 11.0, 12.0, 9.0, 8.0, 14.0, 9.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.598597049713135, -4.434200286865234, -4.269803524017334, -4.105406761169434, -3.9410102367401123, -3.776613473892212, -3.6122167110443115, -3.4478201866149902, -3.28342342376709, -3.1190266609191895, -2.954629898071289, -2.7902331352233887, -2.6258366107940674, -2.461439847946167, -2.2970430850982666, -2.1326465606689453, -1.9682495594024658, -1.8038527965545654, -1.6394561529159546, -1.4750593900680542, -1.3106627464294434, -1.146265983581543, -0.9818692207336426, -0.8174725770950317, -0.6530758142471313, -0.48867911100387573, -0.32428237795829773, -0.15988564491271973, 0.004511058330535889, 0.1689077615737915, 0.3333045244216919, 0.49770116806030273, 0.6620979309082031, 0.8264946341514587, 0.9908913373947144, 1.1552881002426147, 1.3196847438812256, 1.484081506729126, 1.6484782695770264, 1.8128749132156372, 1.9772716760635376, 2.1416683197021484, 2.306065082550049, 2.470461845397949, 2.6348586082458496, 2.79925537109375, 2.9636521339416504, 3.1280486583709717, 3.292445421218872, 3.4568421840667725, 3.621238946914673, 3.785635471343994, 3.9500322341918945, 4.114428997039795, 4.278825759887695, 4.443222522735596, 4.607619285583496, 4.7720160484313965, 4.936412811279297, 5.100809574127197, 5.265206336975098, 5.42960262298584, 5.593999862670898, 5.758396148681641, 5.922792911529541]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 8.0, 22.0, 36.0, 46.0, 96.0, 129.0, 233.0, 453.0, 790.0, 1773.0, 4879.0, 23247.0, 455687.0, 3532464.0, 154586.0, 13305.0, 3621.0, 1348.0, 644.0, 341.0, 189.0, 110.0, 83.0, 55.0, 35.0, 27.0, 11.0, 9.0, 7.0, 7.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.83984375, -3.737060546875, -3.63427734375, -3.531494140625, -3.4287109375, -3.325927734375, -3.22314453125, -3.120361328125, -3.017578125, -2.914794921875, -2.81201171875, -2.709228515625, -2.6064453125, -2.503662109375, -2.40087890625, -2.298095703125, -2.1953125, -2.092529296875, -1.98974609375, -1.886962890625, -1.7841796875, -1.681396484375, -1.57861328125, -1.475830078125, -1.373046875, -1.270263671875, -1.16748046875, -1.064697265625, -0.9619140625, -0.859130859375, -0.75634765625, -0.653564453125, -0.55078125, -0.447998046875, -0.34521484375, -0.242431640625, -0.1396484375, -0.036865234375, 0.06591796875, 0.168701171875, 0.271484375, 0.374267578125, 0.47705078125, 0.579833984375, 0.6826171875, 0.785400390625, 0.88818359375, 0.990966796875, 1.09375, 1.196533203125, 1.29931640625, 1.402099609375, 1.5048828125, 1.607666015625, 1.71044921875, 1.813232421875, 1.916015625, 2.018798828125, 2.12158203125, 2.224365234375, 2.3271484375, 2.429931640625, 2.53271484375, 2.635498046875, 2.73828125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 8.0, 9.0, 17.0, 11.0, 18.0, 23.0, 28.0, 49.0, 63.0, 84.0, 74.0, 60.0, 87.0, 63.0, 80.0, 70.0, 51.0, 49.0, 44.0, 32.0, 25.0, 13.0, 19.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.7922210693359375, -1.731903076171875, -1.6715850830078125, -1.61126708984375, -1.5509490966796875, -1.490631103515625, -1.4303131103515625, -1.3699951171875, -1.3096771240234375, -1.249359130859375, -1.1890411376953125, -1.12872314453125, -1.0684051513671875, -1.008087158203125, -0.9477691650390625, -0.887451171875, -0.8271331787109375, -0.766815185546875, -0.7064971923828125, -0.64617919921875, -0.5858612060546875, -0.525543212890625, -0.4652252197265625, -0.4049072265625, -0.3445892333984375, -0.284271240234375, -0.2239532470703125, -0.16363525390625, -0.1033172607421875, -0.042999267578125, 0.0173187255859375, 0.07763671875, 0.1379547119140625, 0.198272705078125, 0.2585906982421875, 0.31890869140625, 0.3792266845703125, 0.439544677734375, 0.4998626708984375, 0.5601806640625, 0.6204986572265625, 0.680816650390625, 0.7411346435546875, 0.80145263671875, 0.8617706298828125, 0.922088623046875, 0.9824066162109375, 1.042724609375, 1.1030426025390625, 1.163360595703125, 1.2236785888671875, 1.28399658203125, 1.3443145751953125, 1.404632568359375, 1.4649505615234375, 1.5252685546875, 1.5855865478515625, 1.645904541015625, 1.7062225341796875, 1.76654052734375, 1.8268585205078125, 1.887176513671875, 1.9474945068359375, 2.0078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 17.0, 20.0, 19.0, 33.0, 39.0, 82.0, 154.0, 222.0, 442.0, 1107.0, 3198.0, 13087.0, 128088.0, 3771760.0, 251112.0, 18566.0, 3898.0, 1263.0, 559.0, 247.0, 133.0, 73.0, 36.0, 32.0, 20.0, 8.0, 11.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0625, -2.971343994140625, -2.88018798828125, -2.789031982421875, -2.6978759765625, -2.606719970703125, -2.51556396484375, -2.424407958984375, -2.333251953125, -2.242095947265625, -2.15093994140625, -2.059783935546875, -1.9686279296875, -1.877471923828125, -1.78631591796875, -1.695159912109375, -1.60400390625, -1.512847900390625, -1.42169189453125, -1.330535888671875, -1.2393798828125, -1.148223876953125, -1.05706787109375, -0.965911865234375, -0.874755859375, -0.783599853515625, -0.69244384765625, -0.601287841796875, -0.5101318359375, -0.418975830078125, -0.32781982421875, -0.236663818359375, -0.1455078125, -0.054351806640625, 0.03680419921875, 0.127960205078125, 0.2191162109375, 0.310272216796875, 0.40142822265625, 0.492584228515625, 0.583740234375, 0.674896240234375, 0.76605224609375, 0.857208251953125, 0.9483642578125, 1.039520263671875, 1.13067626953125, 1.221832275390625, 1.31298828125, 1.404144287109375, 1.49530029296875, 1.586456298828125, 1.6776123046875, 1.768768310546875, 1.85992431640625, 1.951080322265625, 2.042236328125, 2.133392333984375, 2.22454833984375, 2.315704345703125, 2.4068603515625, 2.498016357421875, 2.58917236328125, 2.680328369140625, 2.771484375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 8.0, 5.0, 18.0, 6.0, 19.0, 29.0, 38.0, 44.0, 94.0, 147.0, 219.0, 386.0, 629.0, 779.0, 602.0, 391.0, 228.0, 124.0, 83.0, 54.0, 37.0, 30.0, 24.0, 14.0, 19.0, 6.0, 10.0, 3.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5908203125, -0.572662353515625, -0.55450439453125, -0.536346435546875, -0.5181884765625, -0.500030517578125, -0.48187255859375, -0.463714599609375, -0.445556640625, -0.427398681640625, -0.40924072265625, -0.391082763671875, -0.3729248046875, -0.354766845703125, -0.33660888671875, -0.318450927734375, -0.30029296875, -0.282135009765625, -0.26397705078125, -0.245819091796875, -0.2276611328125, -0.209503173828125, -0.19134521484375, -0.173187255859375, -0.155029296875, -0.136871337890625, -0.11871337890625, -0.100555419921875, -0.0823974609375, -0.064239501953125, -0.04608154296875, -0.027923583984375, -0.009765625, 0.008392333984375, 0.02655029296875, 0.044708251953125, 0.0628662109375, 0.081024169921875, 0.09918212890625, 0.117340087890625, 0.135498046875, 0.153656005859375, 0.17181396484375, 0.189971923828125, 0.2081298828125, 0.226287841796875, 0.24444580078125, 0.262603759765625, 0.28076171875, 0.298919677734375, 0.31707763671875, 0.335235595703125, 0.3533935546875, 0.371551513671875, 0.38970947265625, 0.407867431640625, 0.426025390625, 0.444183349609375, 0.46234130859375, 0.480499267578125, 0.4986572265625, 0.516815185546875, 0.53497314453125, 0.553131103515625, 0.5712890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 12.0, 24.0, 35.0, 63.0, 101.0, 101.0, 149.0, 140.0, 125.0, 94.0, 56.0, 39.0, 15.0, 13.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3596158027648926, -3.261350154876709, -3.1630845069885254, -3.064818859100342, -2.966552972793579, -2.8682873249053955, -2.770021677017212, -2.6717560291290283, -2.5734901428222656, -2.475224494934082, -2.3769588470458984, -2.278693199157715, -2.180427312850952, -2.0821616649627686, -1.983896017074585, -1.8856303691864014, -1.7873647212982178, -1.6890990734100342, -1.590833306312561, -1.4925676584243774, -1.3943018913269043, -1.2960362434387207, -1.197770595550537, -1.0995049476623535, -1.0012391805648804, -0.902973473072052, -0.8047077655792236, -0.70644211769104, -0.6081764101982117, -0.5099107027053833, -0.4116450548171997, -0.31337934732437134, -0.21511340141296387, -0.11684770882129669, -0.018582016229629517, 0.07968366146087646, 0.17794936895370483, 0.2762150764465332, 0.3744807243347168, 0.47274643182754517, 0.5710121393203735, 0.6692778468132019, 0.7675435543060303, 0.8658092021942139, 0.9640749096870422, 1.0623406171798706, 1.1606062650680542, 1.2588720321655273, 1.357137680053711, 1.4554033279418945, 1.5536690950393677, 1.6519347429275513, 1.7502005100250244, 1.848466157913208, 1.9467318058013916, 2.044997453689575, 2.143263339996338, 2.2415289878845215, 2.339794635772705, 2.4380602836608887, 2.5363261699676514, 2.634591817855835, 2.7328574657440186, 2.831123113632202, 2.9293887615203857]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 12.0, 19.0, 22.0, 21.0, 29.0, 30.0, 38.0, 50.0, 54.0, 57.0, 68.0, 74.0, 68.0, 52.0, 52.0, 49.0, 63.0, 40.0, 39.0, 24.0, 38.0, 19.0, 18.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.286694884300232, -1.23004150390625, -1.1733882427215576, -1.1167348623275757, -1.0600814819335938, -1.0034282207489014, -0.9467748403549194, -0.8901214599609375, -0.8334681391716003, -0.7768148183822632, -0.7201614379882812, -0.6635081171989441, -0.6068547964096069, -0.550201416015625, -0.49354809522628784, -0.4368947446346283, -0.38024139404296875, -0.3235880434513092, -0.26693469285964966, -0.2102813720703125, -0.15362802147865295, -0.09697467088699341, -0.04032135009765625, 0.016332000494003296, 0.07298535108566284, 0.1296387016773224, 0.18629203736782074, 0.2429453730583191, 0.29959872364997864, 0.3562520742416382, 0.41290539503097534, 0.4695587456226349, 0.526212215423584, 0.5828655362129211, 0.6395189166069031, 0.6961722373962402, 0.7528256177902222, 0.8094789385795593, 0.8661322593688965, 0.9227856397628784, 0.9794389605522156, 1.0360922813415527, 1.0927456617355347, 1.1493990421295166, 1.206052303314209, 1.262705683708191, 1.3193590641021729, 1.3760123252868652, 1.4326657056808472, 1.489319086074829, 1.5459723472595215, 1.6026257276535034, 1.6592791080474854, 1.7159323692321777, 1.7725857496261597, 1.8292391300201416, 1.885892391204834, 1.942545771598816, 1.9991990327835083, 2.0558524131774902, 2.1125056743621826, 2.169159173965454, 2.2258124351501465, 2.282465696334839, 2.3391191959381104]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 16.0, 30.0, 54.0, 116.0, 278.0, 735.0, 2487.0, 9853.0, 85642.0, 817063.0, 116424.0, 11564.0, 2879.0, 844.0, 294.0, 125.0, 60.0, 24.0, 15.0, 10.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7107925415039062, -0.6818389892578125, -0.6528854370117188, -0.623931884765625, -0.5949783325195312, -0.5660247802734375, -0.5370712280273438, -0.50811767578125, -0.47916412353515625, -0.4502105712890625, -0.42125701904296875, -0.392303466796875, -0.36334991455078125, -0.3343963623046875, -0.30544281005859375, -0.2764892578125, -0.24753570556640625, -0.2185821533203125, -0.18962860107421875, -0.160675048828125, -0.13172149658203125, -0.1027679443359375, -0.07381439208984375, -0.04486083984375, -0.01590728759765625, 0.0130462646484375, 0.04199981689453125, 0.070953369140625, 0.09990692138671875, 0.1288604736328125, 0.15781402587890625, 0.186767578125, 0.21572113037109375, 0.2446746826171875, 0.27362823486328125, 0.302581787109375, 0.33153533935546875, 0.3604888916015625, 0.38944244384765625, 0.41839599609375, 0.44734954833984375, 0.4763031005859375, 0.5052566528320312, 0.534210205078125, 0.5631637573242188, 0.5921173095703125, 0.6210708618164062, 0.6500244140625, 0.6789779663085938, 0.7079315185546875, 0.7368850708007812, 0.765838623046875, 0.7947921752929688, 0.8237457275390625, 0.8526992797851562, 0.88165283203125, 0.9106063842773438, 0.9395599365234375, 0.9685134887695312, 0.997467041015625, 1.0264205932617188, 1.0553741455078125, 1.0843276977539062, 1.11328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 19.0, 26.0, 31.0, 61.0, 83.0, 106.0, 108.0, 133.0, 116.0, 100.0, 67.0, 55.0, 41.0, 28.0, 12.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.604522705078125, -1.53326416015625, -1.462005615234375, -1.3907470703125, -1.319488525390625, -1.24822998046875, -1.176971435546875, -1.105712890625, -1.034454345703125, -0.96319580078125, -0.891937255859375, -0.8206787109375, -0.749420166015625, -0.67816162109375, -0.606903076171875, -0.53564453125, -0.464385986328125, -0.39312744140625, -0.321868896484375, -0.2506103515625, -0.179351806640625, -0.10809326171875, -0.036834716796875, 0.034423828125, 0.105682373046875, 0.17694091796875, 0.248199462890625, 0.3194580078125, 0.390716552734375, 0.46197509765625, 0.533233642578125, 0.6044921875, 0.675750732421875, 0.74700927734375, 0.818267822265625, 0.8895263671875, 0.960784912109375, 1.03204345703125, 1.103302001953125, 1.174560546875, 1.245819091796875, 1.31707763671875, 1.388336181640625, 1.4595947265625, 1.530853271484375, 1.60211181640625, 1.673370361328125, 1.74462890625, 1.815887451171875, 1.88714599609375, 1.958404541015625, 2.0296630859375, 2.100921630859375, 2.17218017578125, 2.243438720703125, 2.314697265625, 2.385955810546875, 2.45721435546875, 2.528472900390625, 2.5997314453125, 2.670989990234375, 2.74224853515625, 2.813507080078125, 2.884765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 11.0, 8.0, 16.0, 37.0, 57.0, 95.0, 200.0, 466.0, 1135.0, 3698.0, 15202.0, 163085.0, 757475.0, 91503.0, 10963.0, 2930.0, 931.0, 353.0, 165.0, 92.0, 41.0, 34.0, 20.0, 13.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7821044921875, -0.760009765625, -0.7379150390625, -0.7158203125, -0.6937255859375, -0.671630859375, -0.6495361328125, -0.62744140625, -0.6053466796875, -0.583251953125, -0.5611572265625, -0.5390625, -0.5169677734375, -0.494873046875, -0.4727783203125, -0.45068359375, -0.4285888671875, -0.406494140625, -0.3843994140625, -0.3623046875, -0.3402099609375, -0.318115234375, -0.2960205078125, -0.27392578125, -0.2518310546875, -0.229736328125, -0.2076416015625, -0.185546875, -0.1634521484375, -0.141357421875, -0.1192626953125, -0.09716796875, -0.0750732421875, -0.052978515625, -0.0308837890625, -0.0087890625, 0.0133056640625, 0.035400390625, 0.0574951171875, 0.07958984375, 0.1016845703125, 0.123779296875, 0.1458740234375, 0.16796875, 0.1900634765625, 0.212158203125, 0.2342529296875, 0.25634765625, 0.2784423828125, 0.300537109375, 0.3226318359375, 0.3447265625, 0.3668212890625, 0.388916015625, 0.4110107421875, 0.43310546875, 0.4552001953125, 0.477294921875, 0.4993896484375, 0.521484375, 0.5435791015625, 0.565673828125, 0.5877685546875, 0.60986328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 0.0, 5.0, 1.0, 6.0, 6.0, 8.0, 12.0, 16.0, 6.0, 9.0, 15.0, 15.0, 23.0, 27.0, 26.0, 28.0, 34.0, 32.0, 37.0, 41.0, 34.0, 45.0, 32.0, 58.0, 34.0, 38.0, 35.0, 45.0, 40.0, 45.0, 30.0, 30.0, 34.0, 20.0, 18.0, 24.0, 14.0, 15.0, 14.0, 11.0, 7.0, 6.0, 4.0, 3.0, 3.0, 6.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.265960693359375, -1.21649169921875, -1.167022705078125, -1.1175537109375, -1.068084716796875, -1.01861572265625, -0.969146728515625, -0.919677734375, -0.870208740234375, -0.82073974609375, -0.771270751953125, -0.7218017578125, -0.672332763671875, -0.62286376953125, -0.573394775390625, -0.52392578125, -0.474456787109375, -0.42498779296875, -0.375518798828125, -0.3260498046875, -0.276580810546875, -0.22711181640625, -0.177642822265625, -0.128173828125, -0.078704833984375, -0.02923583984375, 0.020233154296875, 0.0697021484375, 0.119171142578125, 0.16864013671875, 0.218109130859375, 0.267578125, 0.317047119140625, 0.36651611328125, 0.415985107421875, 0.4654541015625, 0.514923095703125, 0.56439208984375, 0.613861083984375, 0.663330078125, 0.712799072265625, 0.76226806640625, 0.811737060546875, 0.8612060546875, 0.910675048828125, 0.96014404296875, 1.009613037109375, 1.05908203125, 1.108551025390625, 1.15802001953125, 1.207489013671875, 1.2569580078125, 1.306427001953125, 1.35589599609375, 1.405364990234375, 1.454833984375, 1.504302978515625, 1.55377197265625, 1.603240966796875, 1.6527099609375, 1.702178955078125, 1.75164794921875, 1.801116943359375, 1.8505859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 10.0, 7.0, 7.0, 19.0, 28.0, 28.0, 53.0, 88.0, 137.0, 181.0, 331.0, 528.0, 981.0, 1819.0, 4022.0, 9844.0, 30669.0, 118214.0, 382578.0, 352703.0, 102193.0, 27208.0, 9274.0, 3711.0, 1671.0, 832.0, 518.0, 315.0, 188.0, 124.0, 86.0, 56.0, 38.0, 27.0, 24.0, 7.0, 13.0, 4.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08819580078125, -0.08534622192382812, -0.08249664306640625, -0.07964706420898438, -0.0767974853515625, -0.07394790649414062, -0.07109832763671875, -0.06824874877929688, -0.065399169921875, -0.06254959106445312, -0.05970001220703125, -0.056850433349609375, -0.0540008544921875, -0.051151275634765625, -0.04830169677734375, -0.045452117919921875, -0.0426025390625, -0.039752960205078125, -0.03690338134765625, -0.034053802490234375, -0.0312042236328125, -0.028354644775390625, -0.02550506591796875, -0.022655487060546875, -0.019805908203125, -0.016956329345703125, -0.01410675048828125, -0.011257171630859375, -0.0084075927734375, -0.005558013916015625, -0.00270843505859375, 0.000141143798828125, 0.00299072265625, 0.005840301513671875, 0.00868988037109375, 0.011539459228515625, 0.0143890380859375, 0.017238616943359375, 0.02008819580078125, 0.022937774658203125, 0.025787353515625, 0.028636932373046875, 0.03148651123046875, 0.034336090087890625, 0.0371856689453125, 0.040035247802734375, 0.04288482666015625, 0.045734405517578125, 0.048583984375, 0.051433563232421875, 0.05428314208984375, 0.057132720947265625, 0.0599822998046875, 0.06283187866210938, 0.06568145751953125, 0.06853103637695312, 0.071380615234375, 0.07423019409179688, 0.07707977294921875, 0.07992935180664062, 0.0827789306640625, 0.08562850952148438, 0.08847808837890625, 0.09132766723632812, 0.09417724609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 0.0, 4.0, 7.0, 13.0, 21.0, 30.0, 46.0, 60.0, 73.0, 91.0, 108.0, 130.0, 109.0, 85.0, 63.0, 52.0, 30.0, 21.0, 17.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.131431579589844e-05, -8.903536945581436e-05, -8.675642311573029e-05, -8.447747677564621e-05, -8.219853043556213e-05, -7.991958409547806e-05, -7.764063775539398e-05, -7.53616914153099e-05, -7.308274507522583e-05, -7.080379873514175e-05, -6.852485239505768e-05, -6.62459060549736e-05, -6.396695971488953e-05, -6.168801337480545e-05, -5.9409067034721375e-05, -5.71301206946373e-05, -5.485117435455322e-05, -5.257222801446915e-05, -5.029328167438507e-05, -4.8014335334300995e-05, -4.573538899421692e-05, -4.345644265413284e-05, -4.117749631404877e-05, -3.889854997396469e-05, -3.6619603633880615e-05, -3.434065729379654e-05, -3.206171095371246e-05, -2.9782764613628387e-05, -2.750381827354431e-05, -2.5224871933460236e-05, -2.294592559337616e-05, -2.0666979253292084e-05, -1.8388032913208008e-05, -1.6109086573123932e-05, -1.3830140233039856e-05, -1.155119389295578e-05, -9.272247552871704e-06, -6.993301212787628e-06, -4.714354872703552e-06, -2.4354085326194763e-06, -1.564621925354004e-07, 2.1224841475486755e-06, 4.4014304876327515e-06, 6.680376827716827e-06, 8.959323167800903e-06, 1.123826950788498e-05, 1.3517215847969055e-05, 1.579616218805313e-05, 1.8075108528137207e-05, 2.0354054868221283e-05, 2.263300120830536e-05, 2.4911947548389435e-05, 2.719089388847351e-05, 2.9469840228557587e-05, 3.174878656864166e-05, 3.402773290872574e-05, 3.6306679248809814e-05, 3.858562558889389e-05, 4.0864571928977966e-05, 4.314351826906204e-05, 4.542246460914612e-05, 4.7701410949230194e-05, 4.998035728931427e-05, 5.2259303629398346e-05, 5.453824996948242e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 11.0, 17.0, 36.0, 51.0, 67.0, 99.0, 166.0, 256.0, 419.0, 725.0, 1187.0, 2162.0, 4373.0, 9041.0, 21550.0, 58881.0, 166653.0, 332703.0, 272401.0, 110412.0, 38471.0, 14848.0, 6596.0, 3247.0, 1692.0, 898.0, 560.0, 333.0, 228.0, 146.0, 104.0, 64.0, 42.0, 25.0, 16.0, 8.0, 10.0, 4.0, 7.0, 5.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0740966796875, -0.07169055938720703, -0.06928443908691406, -0.0668783187866211, -0.06447219848632812, -0.062066078186035156, -0.05965995788574219, -0.05725383758544922, -0.05484771728515625, -0.05244159698486328, -0.05003547668457031, -0.047629356384277344, -0.045223236083984375, -0.042817115783691406, -0.04041099548339844, -0.03800487518310547, -0.0355987548828125, -0.03319263458251953, -0.030786514282226562, -0.028380393981933594, -0.025974273681640625, -0.023568153381347656, -0.021162033081054688, -0.01875591278076172, -0.01634979248046875, -0.013943672180175781, -0.011537551879882812, -0.009131431579589844, -0.006725311279296875, -0.004319190979003906, -0.0019130706787109375, 0.0004930496215820312, 0.002899169921875, 0.005305290222167969, 0.0077114105224609375, 0.010117530822753906, 0.012523651123046875, 0.014929771423339844, 0.017335891723632812, 0.01974201202392578, 0.02214813232421875, 0.02455425262451172, 0.026960372924804688, 0.029366493225097656, 0.031772613525390625, 0.034178733825683594, 0.03658485412597656, 0.03899097442626953, 0.0413970947265625, 0.04380321502685547, 0.04620933532714844, 0.048615455627441406, 0.051021575927734375, 0.053427696228027344, 0.05583381652832031, 0.05823993682861328, 0.06064605712890625, 0.06305217742919922, 0.06545829772949219, 0.06786441802978516, 0.07027053833007812, 0.0726766586303711, 0.07508277893066406, 0.07748889923095703, 0.07989501953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 3.0, 5.0, 6.0, 3.0, 8.0, 9.0, 10.0, 10.0, 25.0, 25.0, 27.0, 37.0, 31.0, 38.0, 51.0, 51.0, 62.0, 60.0, 49.0, 57.0, 54.0, 56.0, 60.0, 48.0, 32.0, 25.0, 27.0, 34.0, 16.0, 13.0, 17.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0215301513671875, -0.020805835723876953, -0.020081520080566406, -0.01935720443725586, -0.018632888793945312, -0.017908573150634766, -0.01718425750732422, -0.016459941864013672, -0.015735626220703125, -0.015011310577392578, -0.014286994934082031, -0.013562679290771484, -0.012838363647460938, -0.01211404800415039, -0.011389732360839844, -0.010665416717529297, -0.00994110107421875, -0.009216785430908203, -0.008492469787597656, -0.007768154144287109, -0.0070438385009765625, -0.006319522857666016, -0.005595207214355469, -0.004870891571044922, -0.004146575927734375, -0.003422260284423828, -0.0026979446411132812, -0.0019736289978027344, -0.0012493133544921875, -0.0005249977111816406, 0.00019931793212890625, 0.0009236335754394531, 0.00164794921875, 0.002372264862060547, 0.0030965805053710938, 0.0038208961486816406, 0.0045452117919921875, 0.005269527435302734, 0.005993843078613281, 0.006718158721923828, 0.007442474365234375, 0.008166790008544922, 0.008891105651855469, 0.009615421295166016, 0.010339736938476562, 0.01106405258178711, 0.011788368225097656, 0.012512683868408203, 0.01323699951171875, 0.013961315155029297, 0.014685630798339844, 0.01540994644165039, 0.016134262084960938, 0.016858577728271484, 0.01758289337158203, 0.018307209014892578, 0.019031524658203125, 0.019755840301513672, 0.02048015594482422, 0.021204471588134766, 0.021928787231445312, 0.02265310287475586, 0.023377418518066406, 0.024101734161376953, 0.0248260498046875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 12.0, 20.0, 48.0, 133.0, 263.0, 266.0, 158.0, 72.0, 26.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.386814594268799, -4.2717509269714355, -4.156687259674072, -4.041623592376709, -3.9265599250793457, -3.8114962577819824, -3.69643235206604, -3.5813686847686768, -3.4663050174713135, -3.35124135017395, -3.236177682876587, -3.1211140155792236, -3.0060501098632812, -2.890986442565918, -2.7759227752685547, -2.6608591079711914, -2.545795440673828, -2.430731773376465, -2.3156681060791016, -2.2006044387817383, -2.085540771484375, -1.9704769849777222, -1.8554131984710693, -1.740349531173706, -1.6252858638763428, -1.5102221965789795, -1.3951585292816162, -1.2800947427749634, -1.1650310754776, -1.0499674081802368, -0.9349036812782288, -0.8198399543762207, -0.7047765254974365, -0.5897128582000732, -0.4746491312980652, -0.3595854341983795, -0.24452173709869385, -0.12945806980133057, -0.01439434289932251, 0.10066938400268555, 0.21573305130004883, 0.3307967483997345, 0.44586044549942017, 0.5609241724014282, 0.6759878396987915, 0.7910515069961548, 0.9061152338981628, 1.021178960800171, 1.1362426280975342, 1.2513062953948975, 1.3663699626922607, 1.4814337491989136, 1.5964974164962769, 1.7115610837936401, 1.826624870300293, 1.9416885375976562, 2.0567522048950195, 2.171815872192383, 2.286879539489746, 2.4019432067871094, 2.5170068740844727, 2.632070541381836, 2.7471344470977783, 2.8621981143951416, 2.977261781692505]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 12.0, 21.0, 30.0, 26.0, 43.0, 67.0, 66.0, 94.0, 98.0, 101.0, 78.0, 84.0, 75.0, 48.0, 48.0, 40.0, 30.0, 15.0, 6.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0811282396316528, -1.0282928943634033, -0.9754575490951538, -0.9226221442222595, -0.86978679895401, -0.8169514536857605, -0.7641160488128662, -0.7112807035446167, -0.6584453582763672, -0.6056100130081177, -0.5527746677398682, -0.4999392628669739, -0.44710391759872437, -0.39426857233047485, -0.34143319725990295, -0.28859782218933105, -0.23576247692108154, -0.18292711675167084, -0.13009175658226013, -0.07725639641284943, -0.02442103624343872, 0.02841430902481079, 0.08124968409538269, 0.1340850591659546, 0.1869204044342041, 0.2397557646036148, 0.2925911247730255, 0.3454264998435974, 0.3982618451118469, 0.45109719038009644, 0.5039325952529907, 0.5567679405212402, 0.6096031665802002, 0.6624385118484497, 0.7152738571166992, 0.7681092619895935, 0.820944607257843, 0.8737799525260925, 0.9266153573989868, 0.9794507026672363, 1.0322860479354858, 1.0851213932037354, 1.1379567384719849, 1.1907920837402344, 1.2436275482177734, 1.2964627742767334, 1.3492982387542725, 1.402133584022522, 1.4549689292907715, 1.507804274559021, 1.5606396198272705, 1.61347496509552, 1.6663103103637695, 1.7191457748413086, 1.771981120109558, 1.8248164653778076, 1.8776518106460571, 1.9304871559143066, 1.9833225011825562, 2.0361578464508057, 2.0889933109283447, 2.1418285369873047, 2.1946640014648438, 2.247499465942383, 2.3003346920013428]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 14.0, 15.0, 20.0, 23.0, 29.0, 50.0, 62.0, 76.0, 115.0, 152.0, 264.0, 361.0, 664.0, 1118.0, 1983.0, 3941.0, 8717.0, 21787.0, 63580.0, 247542.0, 505501.0, 127163.0, 38138.0, 14216.0, 6174.0, 2898.0, 1497.0, 878.0, 520.0, 347.0, 202.0, 126.0, 111.0, 73.0, 49.0, 28.0, 21.0, 14.0, 16.0, 15.0, 11.0, 10.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-0.80908203125, -0.7847671508789062, -0.7604522705078125, -0.7361373901367188, -0.711822509765625, -0.6875076293945312, -0.6631927490234375, -0.6388778686523438, -0.61456298828125, -0.5902481079101562, -0.5659332275390625, -0.5416183471679688, -0.517303466796875, -0.49298858642578125, -0.4686737060546875, -0.44435882568359375, -0.4200439453125, -0.39572906494140625, -0.3714141845703125, -0.34709930419921875, -0.322784423828125, -0.29846954345703125, -0.2741546630859375, -0.24983978271484375, -0.22552490234375, -0.20121002197265625, -0.1768951416015625, -0.15258026123046875, -0.128265380859375, -0.10395050048828125, -0.0796356201171875, -0.05532073974609375, -0.031005859375, -0.00669097900390625, 0.0176239013671875, 0.04193878173828125, 0.066253662109375, 0.09056854248046875, 0.1148834228515625, 0.13919830322265625, 0.16351318359375, 0.18782806396484375, 0.2121429443359375, 0.23645782470703125, 0.260772705078125, 0.28508758544921875, 0.3094024658203125, 0.33371734619140625, 0.3580322265625, 0.38234710693359375, 0.4066619873046875, 0.43097686767578125, 0.455291748046875, 0.47960662841796875, 0.5039215087890625, 0.5282363891601562, 0.55255126953125, 0.5768661499023438, 0.6011810302734375, 0.6254959106445312, 0.649810791015625, 0.6741256713867188, 0.6984405517578125, 0.7227554321289062, 0.7470703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 16.0, 11.0, 4.0, 10.0, 15.0, 17.0, 16.0, 23.0, 32.0, 37.0, 28.0, 35.0, 40.0, 53.0, 50.0, 52.0, 54.0, 55.0, 44.0, 49.0, 53.0, 41.0, 33.0, 43.0, 29.0, 35.0, 20.0, 19.0, 17.0, 14.0, 7.0, 9.0, 4.0, 2.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7734375, -1.71551513671875, -1.6575927734375, -1.59967041015625, -1.541748046875, -1.48382568359375, -1.4259033203125, -1.36798095703125, -1.31005859375, -1.25213623046875, -1.1942138671875, -1.13629150390625, -1.078369140625, -1.02044677734375, -0.9625244140625, -0.90460205078125, -0.8466796875, -0.78875732421875, -0.7308349609375, -0.67291259765625, -0.614990234375, -0.55706787109375, -0.4991455078125, -0.44122314453125, -0.38330078125, -0.32537841796875, -0.2674560546875, -0.20953369140625, -0.151611328125, -0.09368896484375, -0.0357666015625, 0.02215576171875, 0.080078125, 0.13800048828125, 0.1959228515625, 0.25384521484375, 0.311767578125, 0.36968994140625, 0.4276123046875, 0.48553466796875, 0.54345703125, 0.60137939453125, 0.6593017578125, 0.71722412109375, 0.775146484375, 0.83306884765625, 0.8909912109375, 0.94891357421875, 1.0068359375, 1.06475830078125, 1.1226806640625, 1.18060302734375, 1.238525390625, 1.29644775390625, 1.3543701171875, 1.41229248046875, 1.47021484375, 1.52813720703125, 1.5860595703125, 1.64398193359375, 1.701904296875, 1.75982666015625, 1.8177490234375, 1.87567138671875, 1.93359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 10.0, 10.0, 10.0, 11.0, 16.0, 24.0, 34.0, 45.0, 62.0, 64.0, 78.0, 121.0, 125.0, 167.0, 241.0, 339.0, 615.0, 1392.0, 11021.0, 803987.0, 221606.0, 5705.0, 1063.0, 490.0, 312.0, 219.0, 148.0, 145.0, 106.0, 81.0, 63.0, 55.0, 31.0, 38.0, 20.0, 21.0, 12.0, 18.0, 9.0, 8.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.93359375, -2.8443603515625, -2.755126953125, -2.6658935546875, -2.57666015625, -2.4874267578125, -2.398193359375, -2.3089599609375, -2.2197265625, -2.1304931640625, -2.041259765625, -1.9520263671875, -1.86279296875, -1.7735595703125, -1.684326171875, -1.5950927734375, -1.505859375, -1.4166259765625, -1.327392578125, -1.2381591796875, -1.14892578125, -1.0596923828125, -0.970458984375, -0.8812255859375, -0.7919921875, -0.7027587890625, -0.613525390625, -0.5242919921875, -0.43505859375, -0.3458251953125, -0.256591796875, -0.1673583984375, -0.078125, 0.0111083984375, 0.100341796875, 0.1895751953125, 0.27880859375, 0.3680419921875, 0.457275390625, 0.5465087890625, 0.6357421875, 0.7249755859375, 0.814208984375, 0.9034423828125, 0.99267578125, 1.0819091796875, 1.171142578125, 1.2603759765625, 1.349609375, 1.4388427734375, 1.528076171875, 1.6173095703125, 1.70654296875, 1.7957763671875, 1.885009765625, 1.9742431640625, 2.0634765625, 2.1527099609375, 2.241943359375, 2.3311767578125, 2.42041015625, 2.5096435546875, 2.598876953125, 2.6881103515625, 2.77734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 10.0, 4.0, 4.0, 14.0, 16.0, 19.0, 13.0, 15.0, 26.0, 30.0, 23.0, 30.0, 44.0, 48.0, 48.0, 49.0, 54.0, 45.0, 40.0, 51.0, 58.0, 60.0, 47.0, 42.0, 32.0, 30.0, 25.0, 20.0, 20.0, 17.0, 7.0, 9.0, 6.0, 8.0, 7.0, 6.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.075439453125, -2.00048828125, -1.925537109375, -1.8505859375, -1.775634765625, -1.70068359375, -1.625732421875, -1.55078125, -1.475830078125, -1.40087890625, -1.325927734375, -1.2509765625, -1.176025390625, -1.10107421875, -1.026123046875, -0.951171875, -0.876220703125, -0.80126953125, -0.726318359375, -0.6513671875, -0.576416015625, -0.50146484375, -0.426513671875, -0.3515625, -0.276611328125, -0.20166015625, -0.126708984375, -0.0517578125, 0.023193359375, 0.09814453125, 0.173095703125, 0.248046875, 0.322998046875, 0.39794921875, 0.472900390625, 0.5478515625, 0.622802734375, 0.69775390625, 0.772705078125, 0.84765625, 0.922607421875, 0.99755859375, 1.072509765625, 1.1474609375, 1.222412109375, 1.29736328125, 1.372314453125, 1.447265625, 1.522216796875, 1.59716796875, 1.672119140625, 1.7470703125, 1.822021484375, 1.89697265625, 1.971923828125, 2.046875, 2.121826171875, 2.19677734375, 2.271728515625, 2.3466796875, 2.421630859375, 2.49658203125, 2.571533203125, 2.646484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 11.0, 21.0, 29.0, 51.0, 139.0, 306.0, 883.0, 3876.0, 154517.0, 879004.0, 7694.0, 1241.0, 415.0, 171.0, 89.0, 37.0, 15.0, 13.0, 7.0, 10.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.703125, -1.6617279052734375, -1.620330810546875, -1.5789337158203125, -1.53753662109375, -1.4961395263671875, -1.454742431640625, -1.4133453369140625, -1.3719482421875, -1.3305511474609375, -1.289154052734375, -1.2477569580078125, -1.20635986328125, -1.1649627685546875, -1.123565673828125, -1.0821685791015625, -1.040771484375, -0.9993743896484375, -0.957977294921875, -0.9165802001953125, -0.87518310546875, -0.8337860107421875, -0.792388916015625, -0.7509918212890625, -0.7095947265625, -0.6681976318359375, -0.626800537109375, -0.5854034423828125, -0.54400634765625, -0.5026092529296875, -0.461212158203125, -0.4198150634765625, -0.37841796875, -0.3370208740234375, -0.295623779296875, -0.2542266845703125, -0.21282958984375, -0.1714324951171875, -0.130035400390625, -0.0886383056640625, -0.0472412109375, -0.0058441162109375, 0.035552978515625, 0.0769500732421875, 0.11834716796875, 0.1597442626953125, 0.201141357421875, 0.2425384521484375, 0.283935546875, 0.3253326416015625, 0.366729736328125, 0.4081268310546875, 0.44952392578125, 0.4909210205078125, 0.532318115234375, 0.5737152099609375, 0.6151123046875, 0.6565093994140625, 0.697906494140625, 0.7393035888671875, 0.78070068359375, 0.8220977783203125, 0.863494873046875, 0.9048919677734375, 0.9462890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 10.0, 26.0, 47.0, 130.0, 449.0, 188.0, 76.0, 43.0, 16.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001373291015625, -0.00013101845979690552, -0.00012470781803131104, -0.00011839717626571655, -0.00011208653450012207, -0.00010577589273452759, -9.94652509689331e-05, -9.315460920333862e-05, -8.684396743774414e-05, -8.053332567214966e-05, -7.422268390655518e-05, -6.79120421409607e-05, -6.160140037536621e-05, -5.529075860977173e-05, -4.8980116844177246e-05, -4.2669475078582764e-05, -3.635883331298828e-05, -3.00481915473938e-05, -2.3737549781799316e-05, -1.7426908016204834e-05, -1.1116266250610352e-05, -4.805624485015869e-06, 1.5050172805786133e-06, 7.815659046173096e-06, 1.4126300811767578e-05, 2.043694257736206e-05, 2.6747584342956543e-05, 3.3058226108551025e-05, 3.936886787414551e-05, 4.567950963973999e-05, 5.199015140533447e-05, 5.8300793170928955e-05, 6.461143493652344e-05, 7.092207670211792e-05, 7.72327184677124e-05, 8.354336023330688e-05, 8.985400199890137e-05, 9.616464376449585e-05, 0.00010247528553009033, 0.00010878592729568481, 0.0001150965690612793, 0.00012140721082687378, 0.00012771785259246826, 0.00013402849435806274, 0.00014033913612365723, 0.0001466497778892517, 0.0001529604196548462, 0.00015927106142044067, 0.00016558170318603516, 0.00017189234495162964, 0.00017820298671722412, 0.0001845136284828186, 0.00019082427024841309, 0.00019713491201400757, 0.00020344555377960205, 0.00020975619554519653, 0.00021606683731079102, 0.0002223774790763855, 0.00022868812084197998, 0.00023499876260757446, 0.00024130940437316895, 0.00024762004613876343, 0.0002539306879043579, 0.0002602413296699524, 0.0002665519714355469]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 12.0, 15.0, 13.0, 27.0, 37.0, 71.0, 118.0, 183.0, 307.0, 584.0, 1371.0, 7129.0, 514620.0, 514220.0, 7102.0, 1376.0, 579.0, 309.0, 160.0, 95.0, 65.0, 46.0, 25.0, 24.0, 19.0, 11.0, 2.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.30078125, -1.2601318359375, -1.219482421875, -1.1788330078125, -1.13818359375, -1.0975341796875, -1.056884765625, -1.0162353515625, -0.9755859375, -0.9349365234375, -0.894287109375, -0.8536376953125, -0.81298828125, -0.7723388671875, -0.731689453125, -0.6910400390625, -0.650390625, -0.6097412109375, -0.569091796875, -0.5284423828125, -0.48779296875, -0.4471435546875, -0.406494140625, -0.3658447265625, -0.3251953125, -0.2845458984375, -0.243896484375, -0.2032470703125, -0.16259765625, -0.1219482421875, -0.081298828125, -0.0406494140625, 0.0, 0.0406494140625, 0.081298828125, 0.1219482421875, 0.16259765625, 0.2032470703125, 0.243896484375, 0.2845458984375, 0.3251953125, 0.3658447265625, 0.406494140625, 0.4471435546875, 0.48779296875, 0.5284423828125, 0.569091796875, 0.6097412109375, 0.650390625, 0.6910400390625, 0.731689453125, 0.7723388671875, 0.81298828125, 0.8536376953125, 0.894287109375, 0.9349365234375, 0.9755859375, 1.0162353515625, 1.056884765625, 1.0975341796875, 1.13818359375, 1.1788330078125, 1.219482421875, 1.2601318359375, 1.30078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 18.0, 45.0, 52.0, 112.0, 273.0, 275.0, 91.0, 54.0, 24.0, 16.0, 16.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5168571472167969, -0.5039291381835938, -0.4910011291503906, -0.4780731201171875, -0.4651451110839844, -0.45221710205078125, -0.4392890930175781, -0.426361083984375, -0.4134330749511719, -0.40050506591796875, -0.3875770568847656, -0.3746490478515625, -0.3617210388183594, -0.34879302978515625, -0.3358650207519531, -0.32293701171875, -0.3100090026855469, -0.29708099365234375, -0.2841529846191406, -0.2712249755859375, -0.2582969665527344, -0.24536895751953125, -0.23244094848632812, -0.219512939453125, -0.20658493041992188, -0.19365692138671875, -0.18072891235351562, -0.1678009033203125, -0.15487289428710938, -0.14194488525390625, -0.12901687622070312, -0.1160888671875, -0.10316085815429688, -0.09023284912109375, -0.07730484008789062, -0.0643768310546875, -0.051448822021484375, -0.03852081298828125, -0.025592803955078125, -0.012664794921875, 0.000263214111328125, 0.01319122314453125, 0.026119232177734375, 0.0390472412109375, 0.051975250244140625, 0.06490325927734375, 0.07783126831054688, 0.09075927734375, 0.10368728637695312, 0.11661529541015625, 0.12954330444335938, 0.1424713134765625, 0.15539932250976562, 0.16832733154296875, 0.18125534057617188, 0.194183349609375, 0.20711135864257812, 0.22003936767578125, 0.23296737670898438, 0.2458953857421875, 0.2588233947753906, 0.27175140380859375, 0.2846794128417969, 0.297607421875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 13.0, 39.0, 117.0, 300.0, 297.0, 167.0, 49.0, 16.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.533207893371582, -11.25961685180664, -10.986024856567383, -10.712432861328125, -10.438841819763184, -10.165250778198242, -9.891658782958984, -9.618066787719727, -9.344475746154785, -9.070884704589844, -8.797292709350586, -8.523700714111328, -8.250109672546387, -7.976518154144287, -7.7029266357421875, -7.429335117340088, -7.155743598937988, -6.882152080535889, -6.608560562133789, -6.3349690437316895, -6.06137752532959, -5.78778600692749, -5.514194488525391, -5.240602970123291, -4.967011451721191, -4.693419933319092, -4.419828414916992, -4.146236896514893, -3.872645378112793, -3.5990538597106934, -3.3254623413085938, -3.051870822906494, -2.778278350830078, -2.5046868324279785, -2.231095314025879, -1.9575037956237793, -1.6839122772216797, -1.41032075881958, -1.1367292404174805, -0.8631377220153809, -0.5895462036132812, -0.31595468521118164, -0.04236316680908203, 0.23122835159301758, 0.5048198699951172, 0.7784113883972168, 1.0520029067993164, 1.325594425201416, 1.5991859436035156, 1.8727774620056152, 2.146368980407715, 2.4199604988098145, 2.693552017211914, 2.9671435356140137, 3.2407350540161133, 3.514326572418213, 3.7879180908203125, 4.061509609222412, 4.335101127624512, 4.608692646026611, 4.882284164428711, 5.1558756828308105, 5.42946720123291, 5.70305871963501, 5.976650238037109]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 4.0, 6.0, 5.0, 13.0, 23.0, 14.0, 23.0, 20.0, 17.0, 36.0, 33.0, 32.0, 41.0, 47.0, 53.0, 42.0, 36.0, 36.0, 40.0, 50.0, 28.0, 41.0, 30.0, 32.0, 36.0, 29.0, 19.0, 27.0, 29.0, 17.0, 15.0, 19.0, 24.0, 9.0, 19.0, 5.0, 5.0, 12.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.07650089263916, -2.976104736328125, -2.875708818435669, -2.775312662124634, -2.6749167442321777, -2.5745205879211426, -2.4741244316101074, -2.3737282752990723, -2.273332357406616, -2.172936201095581, -2.072540283203125, -1.9721441268920898, -1.8717480897903442, -1.7713520526885986, -1.6709558963775635, -1.5705598592758179, -1.4701638221740723, -1.3697677850723267, -1.269371747970581, -1.168975591659546, -1.0685795545578003, -0.9681835174560547, -0.8677874207496643, -0.7673913240432739, -0.6669952869415283, -0.5665992498397827, -0.46620315313339233, -0.36580708622932434, -0.26541101932525635, -0.16501498222351074, -0.06461888551712036, 0.03577721118927002, 0.13617300987243652, 0.23656907677650452, 0.3369651436805725, 0.4373612105846405, 0.5377572774887085, 0.6381533145904541, 0.7385494112968445, 0.8389455080032349, 0.9393415451049805, 1.039737582206726, 1.1401336193084717, 1.2405297756195068, 1.3409258127212524, 1.441321849822998, 1.5417180061340332, 1.6421140432357788, 1.7425100803375244, 1.84290611743927, 1.9433021545410156, 2.043698310852051, 2.144094467163086, 2.244490385055542, 2.344886541366577, 2.445282459259033, 2.5456786155700684, 2.6460747718811035, 2.7464706897735596, 2.8468668460845947, 2.947262763977051, 3.047658920288086, 3.148055076599121, 3.2484512329101562, 3.3488471508026123]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 8.0, 6.0, 13.0, 15.0, 16.0, 18.0, 16.0, 26.0, 31.0, 35.0, 47.0, 46.0, 69.0, 207.0, 929.0, 10475.0, 4122446.0, 57471.0, 1646.0, 308.0, 120.0, 69.0, 43.0, 42.0, 26.0, 14.0, 29.0, 17.0, 16.0, 12.0, 5.0, 11.0, 14.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.68609619140625, -6.4151611328125, -6.14422607421875, -5.873291015625, -5.60235595703125, -5.3314208984375, -5.06048583984375, -4.78955078125, -4.51861572265625, -4.2476806640625, -3.97674560546875, -3.705810546875, -3.43487548828125, -3.1639404296875, -2.89300537109375, -2.6220703125, -2.35113525390625, -2.0802001953125, -1.80926513671875, -1.538330078125, -1.26739501953125, -0.9964599609375, -0.72552490234375, -0.45458984375, -0.18365478515625, 0.0872802734375, 0.35821533203125, 0.629150390625, 0.90008544921875, 1.1710205078125, 1.44195556640625, 1.712890625, 1.98382568359375, 2.2547607421875, 2.52569580078125, 2.796630859375, 3.06756591796875, 3.3385009765625, 3.60943603515625, 3.88037109375, 4.15130615234375, 4.4222412109375, 4.69317626953125, 4.964111328125, 5.23504638671875, 5.5059814453125, 5.77691650390625, 6.0478515625, 6.31878662109375, 6.5897216796875, 6.86065673828125, 7.131591796875, 7.40252685546875, 7.6734619140625, 7.94439697265625, 8.21533203125, 8.48626708984375, 8.7572021484375, 9.02813720703125, 9.299072265625, 9.57000732421875, 9.8409423828125, 10.11187744140625, 10.3828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 16.0, 12.0, 17.0, 9.0, 28.0, 20.0, 25.0, 32.0, 31.0, 43.0, 59.0, 55.0, 57.0, 69.0, 60.0, 57.0, 59.0, 53.0, 45.0, 51.0, 46.0, 27.0, 17.0, 22.0, 19.0, 17.0, 13.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0420379638671875, -1.004974365234375, -0.9679107666015625, -0.93084716796875, -0.8937835693359375, -0.856719970703125, -0.8196563720703125, -0.7825927734375, -0.7455291748046875, -0.708465576171875, -0.6714019775390625, -0.63433837890625, -0.5972747802734375, -0.560211181640625, -0.5231475830078125, -0.486083984375, -0.4490203857421875, -0.411956787109375, -0.3748931884765625, -0.33782958984375, -0.3007659912109375, -0.263702392578125, -0.2266387939453125, -0.1895751953125, -0.1525115966796875, -0.115447998046875, -0.0783843994140625, -0.04132080078125, -0.0042572021484375, 0.032806396484375, 0.0698699951171875, 0.10693359375, 0.1439971923828125, 0.181060791015625, 0.2181243896484375, 0.25518798828125, 0.2922515869140625, 0.329315185546875, 0.3663787841796875, 0.4034423828125, 0.4405059814453125, 0.477569580078125, 0.5146331787109375, 0.55169677734375, 0.5887603759765625, 0.625823974609375, 0.6628875732421875, 0.699951171875, 0.7370147705078125, 0.774078369140625, 0.8111419677734375, 0.84820556640625, 0.8852691650390625, 0.922332763671875, 0.9593963623046875, 0.9964599609375, 1.0335235595703125, 1.070587158203125, 1.1076507568359375, 1.14471435546875, 1.1817779541015625, 1.218841552734375, 1.2559051513671875, 1.29296875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 9.0, 20.0, 16.0, 41.0, 69.0, 174.0, 457.0, 1911.0, 21160.0, 3871774.0, 290933.0, 6233.0, 980.0, 268.0, 114.0, 44.0, 30.0, 14.0, 9.0, 6.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.372344970703125, -2.23101806640625, -2.089691162109375, -1.9483642578125, -1.807037353515625, -1.66571044921875, -1.524383544921875, -1.383056640625, -1.241729736328125, -1.10040283203125, -0.959075927734375, -0.8177490234375, -0.676422119140625, -0.53509521484375, -0.393768310546875, -0.25244140625, -0.111114501953125, 0.03021240234375, 0.171539306640625, 0.3128662109375, 0.454193115234375, 0.59552001953125, 0.736846923828125, 0.878173828125, 1.019500732421875, 1.16082763671875, 1.302154541015625, 1.4434814453125, 1.584808349609375, 1.72613525390625, 1.867462158203125, 2.0087890625, 2.150115966796875, 2.29144287109375, 2.432769775390625, 2.5740966796875, 2.715423583984375, 2.85675048828125, 2.998077392578125, 3.139404296875, 3.280731201171875, 3.42205810546875, 3.563385009765625, 3.7047119140625, 3.846038818359375, 3.98736572265625, 4.128692626953125, 4.27001953125, 4.411346435546875, 4.55267333984375, 4.694000244140625, 4.8353271484375, 4.976654052734375, 5.11798095703125, 5.259307861328125, 5.400634765625, 5.541961669921875, 5.68328857421875, 5.824615478515625, 5.9659423828125, 6.107269287109375, 6.24859619140625, 6.389923095703125, 6.53125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 9.0, 18.0, 19.0, 39.0, 48.0, 92.0, 153.0, 232.0, 450.0, 790.0, 872.0, 563.0, 284.0, 194.0, 86.0, 53.0, 46.0, 37.0, 22.0, 19.0, 6.0, 4.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6034622192382812, -0.5858306884765625, -0.5681991577148438, -0.550567626953125, -0.5329360961914062, -0.5153045654296875, -0.49767303466796875, -0.48004150390625, -0.46240997314453125, -0.4447784423828125, -0.42714691162109375, -0.409515380859375, -0.39188385009765625, -0.3742523193359375, -0.35662078857421875, -0.3389892578125, -0.32135772705078125, -0.3037261962890625, -0.28609466552734375, -0.268463134765625, -0.25083160400390625, -0.2332000732421875, -0.21556854248046875, -0.19793701171875, -0.18030548095703125, -0.1626739501953125, -0.14504241943359375, -0.127410888671875, -0.10977935791015625, -0.0921478271484375, -0.07451629638671875, -0.056884765625, -0.03925323486328125, -0.0216217041015625, -0.00399017333984375, 0.013641357421875, 0.03127288818359375, 0.0489044189453125, 0.06653594970703125, 0.08416748046875, 0.10179901123046875, 0.1194305419921875, 0.13706207275390625, 0.154693603515625, 0.17232513427734375, 0.1899566650390625, 0.20758819580078125, 0.2252197265625, 0.24285125732421875, 0.2604827880859375, 0.27811431884765625, 0.295745849609375, 0.31337738037109375, 0.3310089111328125, 0.34864044189453125, 0.36627197265625, 0.38390350341796875, 0.4015350341796875, 0.41916656494140625, 0.436798095703125, 0.45442962646484375, 0.4720611572265625, 0.48969268798828125, 0.50732421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 5.0, 10.0, 10.0, 15.0, 27.0, 37.0, 60.0, 79.0, 65.0, 100.0, 118.0, 111.0, 100.0, 93.0, 50.0, 36.0, 24.0, 18.0, 14.0, 10.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0975778102874756, -1.0359746217727661, -0.9743713736534119, -0.9127681851387024, -0.8511649370193481, -0.7895617485046387, -0.7279585599899292, -0.6663553714752197, -0.6047521233558655, -0.543148934841156, -0.48154568672180176, -0.4199424982070923, -0.3583392798900604, -0.29673606157302856, -0.2351328730583191, -0.17352965474128723, -0.11192643642425537, -0.05032322555780411, 0.011279985308647156, 0.07288318872451782, 0.13448640704154968, 0.19608962535858154, 0.257692813873291, 0.3192960321903229, 0.38089925050735474, 0.4425024688243866, 0.5041056871414185, 0.5657088756561279, 0.6273120641708374, 0.6889153122901917, 0.7505185008049011, 0.8121217489242554, 0.8737249374389648, 0.9353281259536743, 0.9969313740730286, 1.0585346221923828, 1.1201378107070923, 1.1817409992218018, 1.2433441877365112, 1.3049473762512207, 1.3665506839752197, 1.4281538724899292, 1.4897570610046387, 1.5513603687286377, 1.6129635572433472, 1.6745667457580566, 1.7361699342727661, 1.7977731227874756, 1.859376311302185, 1.9209794998168945, 1.982582688331604, 2.0441858768463135, 2.1057891845703125, 2.1673922538757324, 2.2289955615997314, 2.2905988693237305, 2.3522019386291504, 2.4138052463531494, 2.4754083156585693, 2.5370116233825684, 2.5986146926879883, 2.6602180004119873, 2.7218213081359863, 2.7834243774414062, 2.8450276851654053]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 9.0, 6.0, 12.0, 7.0, 15.0, 22.0, 29.0, 15.0, 30.0, 37.0, 34.0, 53.0, 48.0, 38.0, 41.0, 56.0, 60.0, 51.0, 48.0, 39.0, 57.0, 52.0, 36.0, 38.0, 26.0, 25.0, 18.0, 18.0, 21.0, 17.0, 11.0, 6.0, 5.0, 9.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1894696950912476, -1.1517117023468018, -1.1139538288116455, -1.0761959552764893, -1.0384379625320435, -1.0006799697875977, -0.9629220962524414, -0.9251641631126404, -0.8874062299728394, -0.8496482968330383, -0.8118903636932373, -0.7741324305534363, -0.7363744974136353, -0.6986165642738342, -0.6608586311340332, -0.6231006979942322, -0.5853427648544312, -0.5475848317146301, -0.5098268985748291, -0.4720689654350281, -0.43431103229522705, -0.396553099155426, -0.358795166015625, -0.321037232875824, -0.28327929973602295, -0.24552136659622192, -0.2077634334564209, -0.17000550031661987, -0.13224756717681885, -0.09448963403701782, -0.0567317008972168, -0.01897376775741577, 0.018784165382385254, 0.05654209852218628, 0.0943000316619873, 0.13205796480178833, 0.16981589794158936, 0.20757383108139038, 0.2453317642211914, 0.28308969736099243, 0.32084763050079346, 0.3586055636405945, 0.3963634967803955, 0.43412142992019653, 0.47187936305999756, 0.5096372961997986, 0.5473952293395996, 0.5851531624794006, 0.6229110956192017, 0.6606690287590027, 0.6984269618988037, 0.7361848950386047, 0.7739428281784058, 0.8117007613182068, 0.8494586944580078, 0.8872166275978088, 0.9249745607376099, 0.9627324938774109, 1.000490427017212, 1.0382483005523682, 1.076006293296814, 1.1137642860412598, 1.151522159576416, 1.1892800331115723, 1.227038025856018]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 12.0, 21.0, 35.0, 56.0, 119.0, 253.0, 534.0, 1554.0, 4424.0, 14478.0, 81353.0, 762027.0, 155333.0, 19403.0, 5725.0, 1892.0, 718.0, 258.0, 157.0, 66.0, 30.0, 16.0, 13.0, 11.0, 9.0, 9.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.146484375, -1.118255615234375, -1.09002685546875, -1.061798095703125, -1.0335693359375, -1.005340576171875, -0.97711181640625, -0.948883056640625, -0.920654296875, -0.892425537109375, -0.86419677734375, -0.835968017578125, -0.8077392578125, -0.779510498046875, -0.75128173828125, -0.723052978515625, -0.69482421875, -0.666595458984375, -0.63836669921875, -0.610137939453125, -0.5819091796875, -0.553680419921875, -0.52545166015625, -0.497222900390625, -0.468994140625, -0.440765380859375, -0.41253662109375, -0.384307861328125, -0.3560791015625, -0.327850341796875, -0.29962158203125, -0.271392822265625, -0.2431640625, -0.214935302734375, -0.18670654296875, -0.158477783203125, -0.1302490234375, -0.102020263671875, -0.07379150390625, -0.045562744140625, -0.017333984375, 0.010894775390625, 0.03912353515625, 0.067352294921875, 0.0955810546875, 0.123809814453125, 0.15203857421875, 0.180267333984375, 0.20849609375, 0.236724853515625, 0.26495361328125, 0.293182373046875, 0.3214111328125, 0.349639892578125, 0.37786865234375, 0.406097412109375, 0.434326171875, 0.462554931640625, 0.49078369140625, 0.519012451171875, 0.5472412109375, 0.575469970703125, 0.60369873046875, 0.631927490234375, 0.66015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 10.0, 7.0, 14.0, 25.0, 23.0, 16.0, 36.0, 33.0, 45.0, 56.0, 60.0, 44.0, 64.0, 66.0, 48.0, 62.0, 55.0, 54.0, 49.0, 36.0, 39.0, 28.0, 32.0, 20.0, 18.0, 13.0, 14.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.998046875, -0.966949462890625, -0.93585205078125, -0.904754638671875, -0.8736572265625, -0.842559814453125, -0.81146240234375, -0.780364990234375, -0.749267578125, -0.718170166015625, -0.68707275390625, -0.655975341796875, -0.6248779296875, -0.593780517578125, -0.56268310546875, -0.531585693359375, -0.50048828125, -0.469390869140625, -0.43829345703125, -0.407196044921875, -0.3760986328125, -0.345001220703125, -0.31390380859375, -0.282806396484375, -0.251708984375, -0.220611572265625, -0.18951416015625, -0.158416748046875, -0.1273193359375, -0.096221923828125, -0.06512451171875, -0.034027099609375, -0.0029296875, 0.028167724609375, 0.05926513671875, 0.090362548828125, 0.1214599609375, 0.152557373046875, 0.18365478515625, 0.214752197265625, 0.245849609375, 0.276947021484375, 0.30804443359375, 0.339141845703125, 0.3702392578125, 0.401336669921875, 0.43243408203125, 0.463531494140625, 0.49462890625, 0.525726318359375, 0.55682373046875, 0.587921142578125, 0.6190185546875, 0.650115966796875, 0.68121337890625, 0.712310791015625, 0.743408203125, 0.774505615234375, 0.80560302734375, 0.836700439453125, 0.8677978515625, 0.898895263671875, 0.92999267578125, 0.961090087890625, 0.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 10.0, 10.0, 17.0, 16.0, 30.0, 37.0, 57.0, 52.0, 97.0, 161.0, 302.0, 553.0, 1136.0, 2439.0, 6053.0, 17527.0, 72819.0, 402646.0, 433517.0, 80247.0, 19020.0, 6574.0, 2640.0, 1158.0, 524.0, 346.0, 183.0, 97.0, 75.0, 50.0, 29.0, 36.0, 21.0, 11.0, 8.0, 8.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43359375, -0.4196205139160156, -0.40564727783203125, -0.3916740417480469, -0.3777008056640625, -0.3637275695800781, -0.34975433349609375, -0.3357810974121094, -0.321807861328125, -0.3078346252441406, -0.29386138916015625, -0.2798881530761719, -0.2659149169921875, -0.2519416809082031, -0.23796844482421875, -0.22399520874023438, -0.21002197265625, -0.19604873657226562, -0.18207550048828125, -0.16810226440429688, -0.1541290283203125, -0.14015579223632812, -0.12618255615234375, -0.11220932006835938, -0.098236083984375, -0.08426284790039062, -0.07028961181640625, -0.056316375732421875, -0.0423431396484375, -0.028369903564453125, -0.01439666748046875, -0.000423431396484375, 0.0135498046875, 0.027523040771484375, 0.04149627685546875, 0.055469512939453125, 0.0694427490234375, 0.08341598510742188, 0.09738922119140625, 0.11136245727539062, 0.125335693359375, 0.13930892944335938, 0.15328216552734375, 0.16725540161132812, 0.1812286376953125, 0.19520187377929688, 0.20917510986328125, 0.22314834594726562, 0.23712158203125, 0.2510948181152344, 0.26506805419921875, 0.2790412902832031, 0.2930145263671875, 0.3069877624511719, 0.32096099853515625, 0.3349342346191406, 0.348907470703125, 0.3628807067871094, 0.37685394287109375, 0.3908271789550781, 0.4048004150390625, 0.4187736511230469, 0.43274688720703125, 0.4467201232910156, 0.460693359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 9.0, 11.0, 14.0, 17.0, 13.0, 19.0, 23.0, 26.0, 36.0, 34.0, 32.0, 49.0, 60.0, 51.0, 51.0, 51.0, 51.0, 40.0, 44.0, 60.0, 37.0, 28.0, 38.0, 32.0, 28.0, 28.0, 14.0, 27.0, 18.0, 13.0, 14.0, 2.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.9767303466796875, -1.920257568359375, -1.8637847900390625, -1.80731201171875, -1.7508392333984375, -1.694366455078125, -1.6378936767578125, -1.5814208984375, -1.5249481201171875, -1.468475341796875, -1.4120025634765625, -1.35552978515625, -1.2990570068359375, -1.242584228515625, -1.1861114501953125, -1.129638671875, -1.0731658935546875, -1.016693115234375, -0.9602203369140625, -0.90374755859375, -0.8472747802734375, -0.790802001953125, -0.7343292236328125, -0.6778564453125, -0.6213836669921875, -0.564910888671875, -0.5084381103515625, -0.45196533203125, -0.3954925537109375, -0.339019775390625, -0.2825469970703125, -0.22607421875, -0.1696014404296875, -0.113128662109375, -0.0566558837890625, -0.00018310546875, 0.0562896728515625, 0.112762451171875, 0.1692352294921875, 0.2257080078125, 0.2821807861328125, 0.338653564453125, 0.3951263427734375, 0.45159912109375, 0.5080718994140625, 0.564544677734375, 0.6210174560546875, 0.677490234375, 0.7339630126953125, 0.790435791015625, 0.8469085693359375, 0.90338134765625, 0.9598541259765625, 1.016326904296875, 1.0727996826171875, 1.1292724609375, 1.1857452392578125, 1.242218017578125, 1.2986907958984375, 1.35516357421875, 1.4116363525390625, 1.468109130859375, 1.5245819091796875, 1.5810546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 10.0, 7.0, 25.0, 31.0, 35.0, 47.0, 72.0, 123.0, 181.0, 280.0, 409.0, 725.0, 1248.0, 2186.0, 4538.0, 10196.0, 35536.0, 332514.0, 573208.0, 61095.0, 14127.0, 5579.0, 2728.0, 1481.0, 774.0, 499.0, 309.0, 182.0, 122.0, 77.0, 53.0, 45.0, 32.0, 21.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.16605567932128906, -0.16035842895507812, -0.1546611785888672, -0.14896392822265625, -0.1432666778564453, -0.13756942749023438, -0.13187217712402344, -0.1261749267578125, -0.12047767639160156, -0.11478042602539062, -0.10908317565917969, -0.10338592529296875, -0.09768867492675781, -0.09199142456054688, -0.08629417419433594, -0.080596923828125, -0.07489967346191406, -0.06920242309570312, -0.06350517272949219, -0.05780792236328125, -0.05211067199707031, -0.046413421630859375, -0.04071617126464844, -0.0350189208984375, -0.029321670532226562, -0.023624420166015625, -0.017927169799804688, -0.01222991943359375, -0.0065326690673828125, -0.000835418701171875, 0.0048618316650390625, 0.01055908203125, 0.016256332397460938, 0.021953582763671875, 0.027650833129882812, 0.03334808349609375, 0.03904533386230469, 0.044742584228515625, 0.05043983459472656, 0.0561370849609375, 0.06183433532714844, 0.06753158569335938, 0.07322883605957031, 0.07892608642578125, 0.08462333679199219, 0.09032058715820312, 0.09601783752441406, 0.101715087890625, 0.10741233825683594, 0.11310958862304688, 0.11880683898925781, 0.12450408935546875, 0.1302013397216797, 0.13589859008789062, 0.14159584045410156, 0.1472930908203125, 0.15299034118652344, 0.15868759155273438, 0.1643848419189453, 0.17008209228515625, 0.1757793426513672, 0.18147659301757812, 0.18717384338378906, 0.19287109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 13.0, 21.0, 39.0, 60.0, 123.0, 162.0, 182.0, 137.0, 85.0, 62.0, 28.0, 24.0, 11.0, 4.0, 5.0, 2.0, 3.0, 7.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00013947486877441406, -0.0001359395682811737, -0.00013240426778793335, -0.000128868967294693, -0.00012533366680145264, -0.00012179836630821228, -0.00011826306581497192, -0.00011472776532173157, -0.00011119246482849121, -0.00010765716433525085, -0.0001041218638420105, -0.00010058656334877014, -9.705126285552979e-05, -9.351596236228943e-05, -8.998066186904907e-05, -8.644536137580872e-05, -8.291006088256836e-05, -7.9374760389328e-05, -7.583945989608765e-05, -7.230415940284729e-05, -6.876885890960693e-05, -6.523355841636658e-05, -6.169825792312622e-05, -5.8162957429885864e-05, -5.462765693664551e-05, -5.109235644340515e-05, -4.7557055950164795e-05, -4.402175545692444e-05, -4.048645496368408e-05, -3.6951154470443726e-05, -3.341585397720337e-05, -2.9880553483963013e-05, -2.6345252990722656e-05, -2.28099524974823e-05, -1.9274652004241943e-05, -1.5739351511001587e-05, -1.220405101776123e-05, -8.668750524520874e-06, -5.133450031280518e-06, -1.5981495380401611e-06, 1.9371509552001953e-06, 5.472451448440552e-06, 9.007751941680908e-06, 1.2543052434921265e-05, 1.607835292816162e-05, 1.9613653421401978e-05, 2.3148953914642334e-05, 2.668425440788269e-05, 3.0219554901123047e-05, 3.37548553943634e-05, 3.729015588760376e-05, 4.0825456380844116e-05, 4.436075687408447e-05, 4.789605736732483e-05, 5.1431357860565186e-05, 5.496665835380554e-05, 5.85019588470459e-05, 6.203725934028625e-05, 6.557255983352661e-05, 6.910786032676697e-05, 7.264316082000732e-05, 7.617846131324768e-05, 7.971376180648804e-05, 8.32490622997284e-05, 8.678436279296875e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 11.0, 13.0, 8.0, 20.0, 23.0, 31.0, 44.0, 61.0, 90.0, 153.0, 242.0, 320.0, 523.0, 847.0, 1319.0, 2174.0, 4067.0, 9764.0, 40935.0, 457630.0, 468388.0, 41964.0, 9858.0, 4159.0, 2290.0, 1298.0, 781.0, 496.0, 318.0, 234.0, 147.0, 90.0, 88.0, 49.0, 33.0, 18.0, 15.0, 12.0, 10.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.226318359375, -0.21946144104003906, -0.21260452270507812, -0.2057476043701172, -0.19889068603515625, -0.1920337677001953, -0.18517684936523438, -0.17831993103027344, -0.1714630126953125, -0.16460609436035156, -0.15774917602539062, -0.1508922576904297, -0.14403533935546875, -0.1371784210205078, -0.13032150268554688, -0.12346458435058594, -0.116607666015625, -0.10975074768066406, -0.10289382934570312, -0.09603691101074219, -0.08917999267578125, -0.08232307434082031, -0.07546615600585938, -0.06860923767089844, -0.0617523193359375, -0.05489540100097656, -0.048038482666015625, -0.04118156433105469, -0.03432464599609375, -0.027467727661132812, -0.020610809326171875, -0.013753890991210938, -0.00689697265625, -4.00543212890625e-05, 0.006816864013671875, 0.013673782348632812, 0.02053070068359375, 0.027387619018554688, 0.034244537353515625, 0.04110145568847656, 0.0479583740234375, 0.05481529235839844, 0.061672210693359375, 0.06852912902832031, 0.07538604736328125, 0.08224296569824219, 0.08909988403320312, 0.09595680236816406, 0.102813720703125, 0.10967063903808594, 0.11652755737304688, 0.12338447570800781, 0.13024139404296875, 0.1370983123779297, 0.14395523071289062, 0.15081214904785156, 0.1576690673828125, 0.16452598571777344, 0.17138290405273438, 0.1782398223876953, 0.18509674072265625, 0.1919536590576172, 0.19881057739257812, 0.20566749572753906, 0.2125244140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 28.0, 40.0, 97.0, 137.0, 153.0, 142.0, 125.0, 93.0, 44.0, 29.0, 14.0, 11.0, 5.0, 6.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07218456268310547, -0.06984519958496094, -0.0675058364868164, -0.06516647338867188, -0.06282711029052734, -0.06048774719238281, -0.05814838409423828, -0.05580902099609375, -0.05346965789794922, -0.05113029479980469, -0.048790931701660156, -0.046451568603515625, -0.044112205505371094, -0.04177284240722656, -0.03943347930908203, -0.0370941162109375, -0.03475475311279297, -0.03241539001464844, -0.030076026916503906, -0.027736663818359375, -0.025397300720214844, -0.023057937622070312, -0.02071857452392578, -0.01837921142578125, -0.01603984832763672, -0.013700485229492188, -0.011361122131347656, -0.009021759033203125, -0.006682395935058594, -0.0043430328369140625, -0.0020036697387695312, 0.000335693359375, 0.0026750564575195312, 0.0050144195556640625, 0.007353782653808594, 0.009693145751953125, 0.012032508850097656, 0.014371871948242188, 0.01671123504638672, 0.01905059814453125, 0.02138996124267578, 0.023729324340820312, 0.026068687438964844, 0.028408050537109375, 0.030747413635253906, 0.03308677673339844, 0.03542613983154297, 0.0377655029296875, 0.04010486602783203, 0.04244422912597656, 0.044783592224121094, 0.047122955322265625, 0.049462318420410156, 0.05180168151855469, 0.05414104461669922, 0.05648040771484375, 0.05881977081298828, 0.06115913391113281, 0.06349849700927734, 0.06583786010742188, 0.0681772232055664, 0.07051658630371094, 0.07285594940185547, 0.0751953125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 13.0, 22.0, 83.0, 142.0, 226.0, 276.0, 142.0, 57.0, 25.0, 11.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8847786784172058, -0.7868735194206238, -0.6889683604240417, -0.5910632610321045, -0.4931580722332001, -0.39525291323661804, -0.2973477840423584, -0.19944262504577637, -0.10153746604919434, -0.0036323145031929016, 0.09427283704280853, 0.19217798113822937, 0.2900831401348114, 0.38798829913139343, 0.4858934283256531, 0.5837985873222351, 0.6817037463188171, 0.7796089053153992, 0.8775140643119812, 0.9754191637039185, 1.0733243227005005, 1.1712294816970825, 1.2691346406936646, 1.3670397996902466, 1.4649449586868286, 1.5628501176834106, 1.6607552766799927, 1.7586604356765747, 1.8565655946731567, 1.9544707536697388, 2.0523757934570312, 2.1502809524536133, 2.2481863498687744, 2.3460915088653564, 2.4439966678619385, 2.5419018268585205, 2.6398069858551025, 2.7377121448516846, 2.8356173038482666, 2.9335224628448486, 3.0314276218414307, 3.1293327808380127, 3.2272379398345947, 3.3251430988311768, 3.423048257827759, 3.520953416824341, 3.618858575820923, 3.716763734817505, 3.814668655395508, 3.91257381439209, 4.010478973388672, 4.108384132385254, 4.206289291381836, 4.304194450378418, 4.402099609375, 4.500004768371582, 4.597909927368164, 4.695815086364746, 4.793720245361328, 4.89162540435791, 4.989530563354492, 5.087435722351074, 5.185340881347656, 5.283246040344238, 5.38115119934082]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 6.0, 13.0, 14.0, 21.0, 15.0, 19.0, 25.0, 33.0, 37.0, 38.0, 45.0, 49.0, 52.0, 46.0, 48.0, 42.0, 61.0, 54.0, 57.0, 46.0, 33.0, 42.0, 25.0, 27.0, 19.0, 27.0, 20.0, 15.0, 17.0, 10.0, 5.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7308099269866943, -0.7049691677093506, -0.6791284084320068, -0.6532876491546631, -0.6274468898773193, -0.6016061305999756, -0.5757653713226318, -0.5499246120452881, -0.5240838527679443, -0.4982430934906006, -0.47240233421325684, -0.4465615749359131, -0.42072081565856934, -0.3948800563812256, -0.36903926730155945, -0.3431985080242157, -0.31735771894454956, -0.2915169596672058, -0.26567620038986206, -0.23983542621135712, -0.21399466693401337, -0.18815390765666962, -0.16231313347816467, -0.13647237420082092, -0.11063161492347717, -0.08479085564613342, -0.058950088918209076, -0.03310932219028473, -0.007268562912940979, 0.01857219636440277, 0.044412970542907715, 0.07025372982025146, 0.09609442949295044, 0.12193518877029419, 0.14777594804763794, 0.17361672222614288, 0.19945748150348663, 0.22529824078083038, 0.2511390149593353, 0.2769797742366791, 0.3028205335140228, 0.3286612927913666, 0.3545020520687103, 0.38034284114837646, 0.4061836004257202, 0.43202435970306396, 0.4578651189804077, 0.48370587825775146, 0.5095466375350952, 0.535387396812439, 0.5612281560897827, 0.5870689153671265, 0.6129096746444702, 0.638750433921814, 0.6645911931991577, 0.6904319524765015, 0.7162727117538452, 0.742113471031189, 0.7679542303085327, 0.7937949895858765, 0.8196357488632202, 0.845476508140564, 0.8713172674179077, 0.8971580266952515, 0.92299884557724]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 14.0, 21.0, 21.0, 23.0, 38.0, 52.0, 53.0, 113.0, 164.0, 297.0, 464.0, 832.0, 1594.0, 3218.0, 6902.0, 18278.0, 69903.0, 481130.0, 379347.0, 57781.0, 15740.0, 6329.0, 2823.0, 1425.0, 780.0, 447.0, 239.0, 158.0, 91.0, 74.0, 46.0, 36.0, 25.0, 16.0, 16.0, 8.0, 15.0, 3.0, 7.0, 4.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0858001708984375, -1.049530029296875, -1.0132598876953125, -0.97698974609375, -0.9407196044921875, -0.904449462890625, -0.8681793212890625, -0.8319091796875, -0.7956390380859375, -0.759368896484375, -0.7230987548828125, -0.68682861328125, -0.6505584716796875, -0.614288330078125, -0.5780181884765625, -0.541748046875, -0.5054779052734375, -0.469207763671875, -0.4329376220703125, -0.39666748046875, -0.3603973388671875, -0.324127197265625, -0.2878570556640625, -0.2515869140625, -0.2153167724609375, -0.179046630859375, -0.1427764892578125, -0.10650634765625, -0.0702362060546875, -0.033966064453125, 0.0023040771484375, 0.03857421875, 0.0748443603515625, 0.111114501953125, 0.1473846435546875, 0.18365478515625, 0.2199249267578125, 0.256195068359375, 0.2924652099609375, 0.3287353515625, 0.3650054931640625, 0.401275634765625, 0.4375457763671875, 0.47381591796875, 0.5100860595703125, 0.546356201171875, 0.5826263427734375, 0.618896484375, 0.6551666259765625, 0.691436767578125, 0.7277069091796875, 0.76397705078125, 0.8002471923828125, 0.836517333984375, 0.8727874755859375, 0.9090576171875, 0.9453277587890625, 0.981597900390625, 1.0178680419921875, 1.05413818359375, 1.0904083251953125, 1.126678466796875, 1.1629486083984375, 1.19921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 2.0, 10.0, 7.0, 10.0, 11.0, 14.0, 16.0, 15.0, 14.0, 21.0, 30.0, 26.0, 35.0, 35.0, 32.0, 44.0, 44.0, 44.0, 48.0, 34.0, 58.0, 49.0, 32.0, 43.0, 37.0, 51.0, 36.0, 29.0, 31.0, 18.0, 27.0, 20.0, 10.0, 16.0, 8.0, 11.0, 5.0, 3.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.325286865234375, -1.28045654296875, -1.235626220703125, -1.1907958984375, -1.145965576171875, -1.10113525390625, -1.056304931640625, -1.011474609375, -0.966644287109375, -0.92181396484375, -0.876983642578125, -0.8321533203125, -0.787322998046875, -0.74249267578125, -0.697662353515625, -0.65283203125, -0.608001708984375, -0.56317138671875, -0.518341064453125, -0.4735107421875, -0.428680419921875, -0.38385009765625, -0.339019775390625, -0.294189453125, -0.249359130859375, -0.20452880859375, -0.159698486328125, -0.1148681640625, -0.070037841796875, -0.02520751953125, 0.019622802734375, 0.064453125, 0.109283447265625, 0.15411376953125, 0.198944091796875, 0.2437744140625, 0.288604736328125, 0.33343505859375, 0.378265380859375, 0.423095703125, 0.467926025390625, 0.51275634765625, 0.557586669921875, 0.6024169921875, 0.647247314453125, 0.69207763671875, 0.736907958984375, 0.78173828125, 0.826568603515625, 0.87139892578125, 0.916229248046875, 0.9610595703125, 1.005889892578125, 1.05072021484375, 1.095550537109375, 1.140380859375, 1.185211181640625, 1.23004150390625, 1.274871826171875, 1.3197021484375, 1.364532470703125, 1.40936279296875, 1.454193115234375, 1.4990234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 6.0, 10.0, 10.0, 10.0, 19.0, 32.0, 34.0, 37.0, 67.0, 112.0, 174.0, 313.0, 1067.0, 7877.0, 491438.0, 537203.0, 8322.0, 1059.0, 298.0, 148.0, 93.0, 60.0, 48.0, 34.0, 22.0, 17.0, 9.0, 10.0, 9.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.007598876953125, -3.88238525390625, -3.757171630859375, -3.6319580078125, -3.506744384765625, -3.38153076171875, -3.256317138671875, -3.131103515625, -3.005889892578125, -2.88067626953125, -2.755462646484375, -2.6302490234375, -2.505035400390625, -2.37982177734375, -2.254608154296875, -2.12939453125, -2.004180908203125, -1.87896728515625, -1.753753662109375, -1.6285400390625, -1.503326416015625, -1.37811279296875, -1.252899169921875, -1.127685546875, -1.002471923828125, -0.87725830078125, -0.752044677734375, -0.6268310546875, -0.501617431640625, -0.37640380859375, -0.251190185546875, -0.1259765625, -0.000762939453125, 0.12445068359375, 0.249664306640625, 0.3748779296875, 0.500091552734375, 0.62530517578125, 0.750518798828125, 0.875732421875, 1.000946044921875, 1.12615966796875, 1.251373291015625, 1.3765869140625, 1.501800537109375, 1.62701416015625, 1.752227783203125, 1.87744140625, 2.002655029296875, 2.12786865234375, 2.253082275390625, 2.3782958984375, 2.503509521484375, 2.62872314453125, 2.753936767578125, 2.879150390625, 3.004364013671875, 3.12957763671875, 3.254791259765625, 3.3800048828125, 3.505218505859375, 3.63043212890625, 3.755645751953125, 3.880859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 13.0, 6.0, 9.0, 12.0, 23.0, 22.0, 28.0, 23.0, 36.0, 45.0, 55.0, 51.0, 52.0, 79.0, 64.0, 59.0, 51.0, 48.0, 66.0, 44.0, 41.0, 36.0, 26.0, 28.0, 19.0, 11.0, 13.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.33026123046875, -2.2542724609375, -2.17828369140625, -2.102294921875, -2.02630615234375, -1.9503173828125, -1.87432861328125, -1.79833984375, -1.72235107421875, -1.6463623046875, -1.57037353515625, -1.494384765625, -1.41839599609375, -1.3424072265625, -1.26641845703125, -1.1904296875, -1.11444091796875, -1.0384521484375, -0.96246337890625, -0.886474609375, -0.81048583984375, -0.7344970703125, -0.65850830078125, -0.58251953125, -0.50653076171875, -0.4305419921875, -0.35455322265625, -0.278564453125, -0.20257568359375, -0.1265869140625, -0.05059814453125, 0.025390625, 0.10137939453125, 0.1773681640625, 0.25335693359375, 0.329345703125, 0.40533447265625, 0.4813232421875, 0.55731201171875, 0.63330078125, 0.70928955078125, 0.7852783203125, 0.86126708984375, 0.937255859375, 1.01324462890625, 1.0892333984375, 1.16522216796875, 1.2412109375, 1.31719970703125, 1.3931884765625, 1.46917724609375, 1.545166015625, 1.62115478515625, 1.6971435546875, 1.77313232421875, 1.84912109375, 1.92510986328125, 2.0010986328125, 2.07708740234375, 2.153076171875, 2.22906494140625, 2.3050537109375, 2.38104248046875, 2.45703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 14.0, 30.0, 40.0, 132.0, 341.0, 1329.0, 7579.0, 138065.0, 864576.0, 31975.0, 3303.0, 707.0, 240.0, 100.0, 34.0, 29.0, 11.0, 18.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.995758056640625, -0.96905517578125, -0.942352294921875, -0.9156494140625, -0.888946533203125, -0.86224365234375, -0.835540771484375, -0.808837890625, -0.782135009765625, -0.75543212890625, -0.728729248046875, -0.7020263671875, -0.675323486328125, -0.64862060546875, -0.621917724609375, -0.59521484375, -0.568511962890625, -0.54180908203125, -0.515106201171875, -0.4884033203125, -0.461700439453125, -0.43499755859375, -0.408294677734375, -0.381591796875, -0.354888916015625, -0.32818603515625, -0.301483154296875, -0.2747802734375, -0.248077392578125, -0.22137451171875, -0.194671630859375, -0.16796875, -0.141265869140625, -0.11456298828125, -0.087860107421875, -0.0611572265625, -0.034454345703125, -0.00775146484375, 0.018951416015625, 0.045654296875, 0.072357177734375, 0.09906005859375, 0.125762939453125, 0.1524658203125, 0.179168701171875, 0.20587158203125, 0.232574462890625, 0.25927734375, 0.285980224609375, 0.31268310546875, 0.339385986328125, 0.3660888671875, 0.392791748046875, 0.41949462890625, 0.446197509765625, 0.472900390625, 0.499603271484375, 0.52630615234375, 0.553009033203125, 0.5797119140625, 0.606414794921875, 0.63311767578125, 0.659820556640625, 0.6865234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 8.0, 8.0, 11.0, 20.0, 30.0, 31.0, 38.0, 70.0, 70.0, 97.0, 107.0, 104.0, 94.0, 65.0, 54.0, 49.0, 30.0, 25.0, 14.0, 8.0, 10.0, 6.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-7.12275505065918e-05, -6.934907287359238e-05, -6.747059524059296e-05, -6.559211760759354e-05, -6.371363997459412e-05, -6.18351623415947e-05, -5.9956684708595276e-05, -5.8078207075595856e-05, -5.6199729442596436e-05, -5.4321251809597015e-05, -5.2442774176597595e-05, -5.0564296543598175e-05, -4.8685818910598755e-05, -4.6807341277599335e-05, -4.4928863644599915e-05, -4.3050386011600494e-05, -4.1171908378601074e-05, -3.9293430745601654e-05, -3.7414953112602234e-05, -3.5536475479602814e-05, -3.3657997846603394e-05, -3.1779520213603973e-05, -2.9901042580604553e-05, -2.8022564947605133e-05, -2.6144087314605713e-05, -2.4265609681606293e-05, -2.2387132048606873e-05, -2.0508654415607452e-05, -1.8630176782608032e-05, -1.6751699149608612e-05, -1.4873221516609192e-05, -1.2994743883609772e-05, -1.1116266250610352e-05, -9.237788617610931e-06, -7.359310984611511e-06, -5.480833351612091e-06, -3.602355718612671e-06, -1.7238780856132507e-06, 1.5459954738616943e-07, 2.0330771803855896e-06, 3.91155481338501e-06, 5.79003244638443e-06, 7.66851007938385e-06, 9.54698771238327e-06, 1.142546534538269e-05, 1.330394297838211e-05, 1.518242061138153e-05, 1.706089824438095e-05, 1.893937587738037e-05, 2.081785351037979e-05, 2.269633114337921e-05, 2.457480877637863e-05, 2.6453286409378052e-05, 2.8331764042377472e-05, 3.0210241675376892e-05, 3.208871930837631e-05, 3.396719694137573e-05, 3.584567457437515e-05, 3.772415220737457e-05, 3.960262984037399e-05, 4.148110747337341e-05, 4.335958510637283e-05, 4.5238062739372253e-05, 4.7116540372371674e-05, 4.8995018005371094e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 21.0, 38.0, 120.0, 344.0, 1764.0, 23831.0, 964719.0, 54392.0, 2540.0, 510.0, 150.0, 45.0, 26.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.435455322265625, -1.39727783203125, -1.359100341796875, -1.3209228515625, -1.282745361328125, -1.24456787109375, -1.206390380859375, -1.168212890625, -1.130035400390625, -1.09185791015625, -1.053680419921875, -1.0155029296875, -0.977325439453125, -0.93914794921875, -0.900970458984375, -0.86279296875, -0.824615478515625, -0.78643798828125, -0.748260498046875, -0.7100830078125, -0.671905517578125, -0.63372802734375, -0.595550537109375, -0.557373046875, -0.519195556640625, -0.48101806640625, -0.442840576171875, -0.4046630859375, -0.366485595703125, -0.32830810546875, -0.290130615234375, -0.251953125, -0.213775634765625, -0.17559814453125, -0.137420654296875, -0.0992431640625, -0.061065673828125, -0.02288818359375, 0.015289306640625, 0.053466796875, 0.091644287109375, 0.12982177734375, 0.167999267578125, 0.2061767578125, 0.244354248046875, 0.28253173828125, 0.320709228515625, 0.35888671875, 0.397064208984375, 0.43524169921875, 0.473419189453125, 0.5115966796875, 0.549774169921875, 0.58795166015625, 0.626129150390625, 0.664306640625, 0.702484130859375, 0.74066162109375, 0.778839111328125, 0.8170166015625, 0.855194091796875, 0.89337158203125, 0.931549072265625, 0.9697265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 15.0, 22.0, 19.0, 21.0, 40.0, 64.0, 83.0, 122.0, 145.0, 137.0, 88.0, 75.0, 45.0, 39.0, 22.0, 24.0, 8.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1723003387451172, -0.16503524780273438, -0.15777015686035156, -0.15050506591796875, -0.14323997497558594, -0.13597488403320312, -0.1287097930908203, -0.1214447021484375, -0.11417961120605469, -0.10691452026367188, -0.09964942932128906, -0.09238433837890625, -0.08511924743652344, -0.07785415649414062, -0.07058906555175781, -0.063323974609375, -0.05605888366699219, -0.048793792724609375, -0.04152870178222656, -0.03426361083984375, -0.026998519897460938, -0.019733428955078125, -0.012468338012695312, -0.0052032470703125, 0.0020618438720703125, 0.009326934814453125, 0.016592025756835938, 0.02385711669921875, 0.031122207641601562, 0.038387298583984375, 0.04565238952636719, 0.05291748046875, 0.06018257141113281, 0.06744766235351562, 0.07471275329589844, 0.08197784423828125, 0.08924293518066406, 0.09650802612304688, 0.10377311706542969, 0.1110382080078125, 0.11830329895019531, 0.12556838989257812, 0.13283348083496094, 0.14009857177734375, 0.14736366271972656, 0.15462875366210938, 0.1618938446044922, 0.169158935546875, 0.1764240264892578, 0.18368911743164062, 0.19095420837402344, 0.19821929931640625, 0.20548439025878906, 0.21274948120117188, 0.2200145721435547, 0.2272796630859375, 0.2345447540283203, 0.24180984497070312, 0.24907493591308594, 0.25634002685546875, 0.26360511779785156, 0.2708702087402344, 0.2781352996826172, 0.285400390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 15.0, 46.0, 99.0, 137.0, 199.0, 224.0, 139.0, 72.0, 29.0, 17.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.860669136047363, -6.704534530639648, -6.548400402069092, -6.392265796661377, -6.23613166809082, -6.0799970626831055, -5.923862934112549, -5.767728328704834, -5.611594200134277, -5.4554595947265625, -5.299325466156006, -5.143190860748291, -4.987056732177734, -4.8309221267700195, -4.674787998199463, -4.518653392791748, -4.362519264221191, -4.206384658813477, -4.05025053024292, -3.894116163253784, -3.7379817962646484, -3.5818474292755127, -3.425713062286377, -3.269578456878662, -3.1134438514709473, -2.9573094844818115, -2.801175117492676, -2.64504075050354, -2.4889063835144043, -2.3327720165252686, -2.176637649536133, -2.020503044128418, -1.8643691539764404, -1.7082347869873047, -1.552100419998169, -1.3959660530090332, -1.2398316860198975, -1.0836973190307617, -0.9275628328323364, -0.7714284658432007, -0.6152940988540649, -0.4591597318649292, -0.30302533507347107, -0.14689093828201294, 0.009243428707122803, 0.16537779569625854, 0.32151222229003906, 0.4776465892791748, 0.6337809562683105, 0.7899153232574463, 0.946049690246582, 1.1021840572357178, 1.2583184242248535, 1.4144527912139893, 1.5705872774124146, 1.7267216444015503, 1.882856011390686, 2.0389904975891113, 2.195124864578247, 2.351259231567383, 2.5073935985565186, 2.6635279655456543, 2.81966233253479, 2.975796699523926, 3.1319310665130615]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 7.0, 7.0, 7.0, 13.0, 23.0, 30.0, 14.0, 26.0, 24.0, 17.0, 39.0, 21.0, 39.0, 40.0, 34.0, 48.0, 36.0, 40.0, 42.0, 56.0, 30.0, 34.0, 33.0, 36.0, 37.0, 27.0, 38.0, 28.0, 27.0, 23.0, 25.0, 28.0, 11.0, 11.0, 5.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.092231273651123, -2.9933876991271973, -2.8945441246032715, -2.7957005500793457, -2.69685697555542, -2.598013162612915, -2.4991695880889893, -2.4003260135650635, -2.3014824390411377, -2.202638864517212, -2.103795289993286, -2.0049517154693604, -1.906108021736145, -1.8072644472122192, -1.708420753479004, -1.6095771789550781, -1.5107336044311523, -1.4118900299072266, -1.3130464553833008, -1.2142027616500854, -1.1153591871261597, -1.0165156126022339, -0.9176719784736633, -0.8188283443450928, -0.719984769821167, -0.6211411952972412, -0.5222975611686707, -0.4234539568424225, -0.3246103525161743, -0.22576674818992615, -0.12692314386367798, -0.028079509735107422, 0.07076406478881836, 0.16960766911506653, 0.2684512734413147, 0.36729487776756287, 0.46613848209381104, 0.5649820566177368, 0.6638256907463074, 0.7626693248748779, 0.8615128993988037, 0.9603564739227295, 1.0592000484466553, 1.1580437421798706, 1.2568873167037964, 1.3557308912277222, 1.4545745849609375, 1.5534181594848633, 1.652261734008789, 1.7511053085327148, 1.8499488830566406, 1.948792576789856, 2.047636032104492, 2.146479845046997, 2.245323419570923, 2.3441669940948486, 2.4430105686187744, 2.5418541431427, 2.640697717666626, 2.7395412921905518, 2.8383851051330566, 2.9372286796569824, 3.036072254180908, 3.134915828704834, 3.2337594032287598]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 6.0, 9.0, 13.0, 23.0, 40.0, 62.0, 85.0, 206.0, 283.0, 504.0, 1175.0, 3283.0, 14560.0, 171838.0, 3674030.0, 302866.0, 18796.0, 3866.0, 1324.0, 575.0, 308.0, 160.0, 97.0, 58.0, 27.0, 27.0, 21.0, 10.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.114715576171875, -2.03802490234375, -1.961334228515625, -1.8846435546875, -1.807952880859375, -1.73126220703125, -1.654571533203125, -1.577880859375, -1.501190185546875, -1.42449951171875, -1.347808837890625, -1.2711181640625, -1.194427490234375, -1.11773681640625, -1.041046142578125, -0.96435546875, -0.887664794921875, -0.81097412109375, -0.734283447265625, -0.6575927734375, -0.580902099609375, -0.50421142578125, -0.427520751953125, -0.350830078125, -0.274139404296875, -0.19744873046875, -0.120758056640625, -0.0440673828125, 0.032623291015625, 0.10931396484375, 0.186004638671875, 0.2626953125, 0.339385986328125, 0.41607666015625, 0.492767333984375, 0.5694580078125, 0.646148681640625, 0.72283935546875, 0.799530029296875, 0.876220703125, 0.952911376953125, 1.02960205078125, 1.106292724609375, 1.1829833984375, 1.259674072265625, 1.33636474609375, 1.413055419921875, 1.48974609375, 1.566436767578125, 1.64312744140625, 1.719818115234375, 1.7965087890625, 1.873199462890625, 1.94989013671875, 2.026580810546875, 2.103271484375, 2.179962158203125, 2.25665283203125, 2.333343505859375, 2.4100341796875, 2.486724853515625, 2.56341552734375, 2.640106201171875, 2.716796875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 9.0, 17.0, 16.0, 22.0, 30.0, 30.0, 28.0, 55.0, 62.0, 42.0, 52.0, 79.0, 62.0, 66.0, 68.0, 63.0, 62.0, 42.0, 46.0, 37.0, 22.0, 23.0, 17.0, 14.0, 5.0, 4.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88427734375, -0.8483810424804688, -0.8124847412109375, -0.7765884399414062, -0.740692138671875, -0.7047958374023438, -0.6688995361328125, -0.6330032348632812, -0.59710693359375, -0.5612106323242188, -0.5253143310546875, -0.48941802978515625, -0.453521728515625, -0.41762542724609375, -0.3817291259765625, -0.34583282470703125, -0.3099365234375, -0.27404022216796875, -0.2381439208984375, -0.20224761962890625, -0.166351318359375, -0.13045501708984375, -0.0945587158203125, -0.05866241455078125, -0.02276611328125, 0.01313018798828125, 0.0490264892578125, 0.08492279052734375, 0.120819091796875, 0.15671539306640625, 0.1926116943359375, 0.22850799560546875, 0.264404296875, 0.30030059814453125, 0.3361968994140625, 0.37209320068359375, 0.407989501953125, 0.44388580322265625, 0.4797821044921875, 0.5156784057617188, 0.55157470703125, 0.5874710083007812, 0.6233673095703125, 0.6592636108398438, 0.695159912109375, 0.7310562133789062, 0.7669525146484375, 0.8028488159179688, 0.8387451171875, 0.8746414184570312, 0.9105377197265625, 0.9464340209960938, 0.982330322265625, 1.0182266235351562, 1.0541229248046875, 1.0900192260742188, 1.12591552734375, 1.1618118286132812, 1.1977081298828125, 1.2336044311523438, 1.269500732421875, 1.3053970336914062, 1.3412933349609375, 1.3771896362304688, 1.4130859375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 1.0, 12.0, 20.0, 36.0, 55.0, 97.0, 179.0, 803.0, 6883.0, 1647608.0, 2529385.0, 8037.0, 736.0, 212.0, 89.0, 45.0, 22.0, 13.0, 11.0, 5.0, 7.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.919677734375, -3.76904296875, -3.618408203125, -3.4677734375, -3.317138671875, -3.16650390625, -3.015869140625, -2.865234375, -2.714599609375, -2.56396484375, -2.413330078125, -2.2626953125, -2.112060546875, -1.96142578125, -1.810791015625, -1.66015625, -1.509521484375, -1.35888671875, -1.208251953125, -1.0576171875, -0.906982421875, -0.75634765625, -0.605712890625, -0.455078125, -0.304443359375, -0.15380859375, -0.003173828125, 0.1474609375, 0.298095703125, 0.44873046875, 0.599365234375, 0.75, 0.900634765625, 1.05126953125, 1.201904296875, 1.3525390625, 1.503173828125, 1.65380859375, 1.804443359375, 1.955078125, 2.105712890625, 2.25634765625, 2.406982421875, 2.5576171875, 2.708251953125, 2.85888671875, 3.009521484375, 3.16015625, 3.310791015625, 3.46142578125, 3.612060546875, 3.7626953125, 3.913330078125, 4.06396484375, 4.214599609375, 4.365234375, 4.515869140625, 4.66650390625, 4.817138671875, 4.9677734375, 5.118408203125, 5.26904296875, 5.419677734375, 5.5703125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 3.0, 10.0, 8.0, 17.0, 18.0, 26.0, 31.0, 48.0, 81.0, 120.0, 237.0, 424.0, 699.0, 790.0, 594.0, 364.0, 207.0, 115.0, 84.0, 51.0, 44.0, 27.0, 18.0, 17.0, 7.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.5712890625, -0.5563926696777344, -0.5414962768554688, -0.5265998840332031, -0.5117034912109375, -0.4968070983886719, -0.48191070556640625, -0.4670143127441406, -0.452117919921875, -0.4372215270996094, -0.42232513427734375, -0.4074287414550781, -0.3925323486328125, -0.3776359558105469, -0.36273956298828125, -0.3478431701660156, -0.33294677734375, -0.3180503845214844, -0.30315399169921875, -0.2882575988769531, -0.2733612060546875, -0.2584648132324219, -0.24356842041015625, -0.22867202758789062, -0.213775634765625, -0.19887924194335938, -0.18398284912109375, -0.16908645629882812, -0.1541900634765625, -0.13929367065429688, -0.12439727783203125, -0.10950088500976562, -0.0946044921875, -0.07970809936523438, -0.06481170654296875, -0.049915313720703125, -0.0350189208984375, -0.020122528076171875, -0.00522613525390625, 0.009670257568359375, 0.024566650390625, 0.039463043212890625, 0.05435943603515625, 0.06925582885742188, 0.0841522216796875, 0.09904861450195312, 0.11394500732421875, 0.12884140014648438, 0.14373779296875, 0.15863418579101562, 0.17353057861328125, 0.18842697143554688, 0.2033233642578125, 0.21821975708007812, 0.23311614990234375, 0.24801254272460938, 0.262908935546875, 0.2778053283691406, 0.29270172119140625, 0.3075981140136719, 0.3224945068359375, 0.3373908996582031, 0.35228729248046875, 0.3671836853027344, 0.382080078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 13.0, 11.0, 15.0, 11.0, 16.0, 30.0, 39.0, 44.0, 51.0, 50.0, 64.0, 70.0, 86.0, 87.0, 78.0, 65.0, 57.0, 57.0, 39.0, 23.0, 27.0, 18.0, 16.0, 12.0, 8.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7531993985176086, -0.7133648991584778, -0.6735304594039917, -0.6336959600448608, -0.59386146068573, -0.5540270209312439, -0.514192521572113, -0.47435805201530457, -0.4345235824584961, -0.3946891129016876, -0.35485464334487915, -0.3150201439857483, -0.2751856744289398, -0.23535120487213135, -0.19551672041416168, -0.15568223595619202, -0.11584776639938354, -0.07601328939199448, -0.03617881238460541, 0.003655664622783661, 0.04349014163017273, 0.0833246111869812, 0.12315909564495087, 0.16299358010292053, 0.202828049659729, 0.24266251921653748, 0.28249698877334595, 0.3223314881324768, 0.3621659576892853, 0.40200042724609375, 0.4418349266052246, 0.4816693961620331, 0.5215038061141968, 0.5613383054733276, 0.6011727452278137, 0.6410072445869446, 0.6808416843414307, 0.7206761837005615, 0.7605106830596924, 0.8003451824188232, 0.8401796221733093, 0.8800141215324402, 0.9198485612869263, 0.9596830606460571, 0.999517560005188, 1.0393519401550293, 1.0791864395141602, 1.119020938873291, 1.1588554382324219, 1.1986899375915527, 1.2385244369506836, 1.278358817100525, 1.3181933164596558, 1.3580278158187866, 1.3978623151779175, 1.4376968145370483, 1.4775311946868896, 1.5173656940460205, 1.5572001934051514, 1.5970345735549927, 1.6368690729141235, 1.6767035722732544, 1.7165380716323853, 1.7563725709915161, 1.796207070350647]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 2.0, 3.0, 5.0, 15.0, 10.0, 11.0, 9.0, 18.0, 11.0, 20.0, 19.0, 23.0, 40.0, 20.0, 29.0, 35.0, 23.0, 48.0, 38.0, 46.0, 45.0, 42.0, 39.0, 50.0, 41.0, 36.0, 31.0, 32.0, 29.0, 36.0, 32.0, 19.0, 21.0, 19.0, 14.0, 17.0, 19.0, 14.0, 6.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8946117758750916, -0.8673585653305054, -0.8401052951812744, -0.8128520846366882, -0.785598874092102, -0.7583456039428711, -0.7310923933982849, -0.7038391828536987, -0.6765859127044678, -0.6493327021598816, -0.6220794320106506, -0.5948262214660645, -0.5675729513168335, -0.5403197407722473, -0.5130665302276611, -0.48581328988075256, -0.458560049533844, -0.4313068091869354, -0.40405356884002686, -0.3768003582954407, -0.3495471179485321, -0.32229387760162354, -0.29504066705703735, -0.2677874267101288, -0.24053418636322021, -0.21328094601631165, -0.18602772057056427, -0.1587744951248169, -0.13152125477790833, -0.10426801443099976, -0.07701478898525238, -0.049761563539505005, -0.02250826358795166, 0.004744969308376312, 0.031998202204704285, 0.05925143510103226, 0.08650466799736023, 0.1137579083442688, 0.14101113379001617, 0.16826435923576355, 0.19551759958267212, 0.2227708399295807, 0.25002408027648926, 0.27727729082107544, 0.304530531167984, 0.3317837715148926, 0.35903698205947876, 0.38629022240638733, 0.4135434627532959, 0.44079670310020447, 0.46804994344711304, 0.4953031539916992, 0.5225564241409302, 0.5498096346855164, 0.5770628452301025, 0.6043161153793335, 0.6315693259239197, 0.6588225364685059, 0.6860758066177368, 0.713329017162323, 0.7405822277069092, 0.7678354978561401, 0.7950887084007263, 0.8223419189453125, 0.8495951890945435]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 1.0, 5.0, 8.0, 10.0, 18.0, 24.0, 41.0, 54.0, 88.0, 172.0, 252.0, 444.0, 836.0, 1428.0, 2640.0, 5145.0, 11186.0, 30852.0, 138093.0, 558766.0, 227559.0, 43285.0, 14196.0, 6203.0, 3209.0, 1792.0, 958.0, 536.0, 316.0, 178.0, 86.0, 54.0, 34.0, 40.0, 17.0, 15.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4580078125, -0.4430580139160156, -0.42810821533203125, -0.4131584167480469, -0.3982086181640625, -0.3832588195800781, -0.36830902099609375, -0.3533592224121094, -0.338409423828125, -0.3234596252441406, -0.30850982666015625, -0.2935600280761719, -0.2786102294921875, -0.2636604309082031, -0.24871063232421875, -0.23376083374023438, -0.21881103515625, -0.20386123657226562, -0.18891143798828125, -0.17396163940429688, -0.1590118408203125, -0.14406204223632812, -0.12911224365234375, -0.11416244506835938, -0.099212646484375, -0.08426284790039062, -0.06931304931640625, -0.054363250732421875, -0.0394134521484375, -0.024463653564453125, -0.00951385498046875, 0.005435943603515625, 0.0203857421875, 0.035335540771484375, 0.05028533935546875, 0.06523513793945312, 0.0801849365234375, 0.09513473510742188, 0.11008453369140625, 0.12503433227539062, 0.139984130859375, 0.15493392944335938, 0.16988372802734375, 0.18483352661132812, 0.1997833251953125, 0.21473312377929688, 0.22968292236328125, 0.24463272094726562, 0.25958251953125, 0.2745323181152344, 0.28948211669921875, 0.3044319152832031, 0.3193817138671875, 0.3343315124511719, 0.34928131103515625, 0.3642311096191406, 0.379180908203125, 0.3941307067871094, 0.40908050537109375, 0.4240303039550781, 0.4389801025390625, 0.4539299011230469, 0.46887969970703125, 0.4838294982910156, 0.498779296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 8.0, 6.0, 6.0, 11.0, 18.0, 18.0, 21.0, 28.0, 33.0, 36.0, 41.0, 49.0, 57.0, 48.0, 74.0, 71.0, 55.0, 65.0, 49.0, 44.0, 34.0, 40.0, 39.0, 33.0, 27.0, 26.0, 20.0, 14.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5531005859375, -0.530517578125, -0.5079345703125, -0.4853515625, -0.4627685546875, -0.440185546875, -0.4176025390625, -0.39501953125, -0.3724365234375, -0.349853515625, -0.3272705078125, -0.3046875, -0.2821044921875, -0.259521484375, -0.2369384765625, -0.21435546875, -0.1917724609375, -0.169189453125, -0.1466064453125, -0.1240234375, -0.1014404296875, -0.078857421875, -0.0562744140625, -0.03369140625, -0.0111083984375, 0.011474609375, 0.0340576171875, 0.056640625, 0.0792236328125, 0.101806640625, 0.1243896484375, 0.14697265625, 0.1695556640625, 0.192138671875, 0.2147216796875, 0.2373046875, 0.2598876953125, 0.282470703125, 0.3050537109375, 0.32763671875, 0.3502197265625, 0.372802734375, 0.3953857421875, 0.41796875, 0.4405517578125, 0.463134765625, 0.4857177734375, 0.50830078125, 0.5308837890625, 0.553466796875, 0.5760498046875, 0.5986328125, 0.6212158203125, 0.643798828125, 0.6663818359375, 0.68896484375, 0.7115478515625, 0.734130859375, 0.7567138671875, 0.779296875, 0.8018798828125, 0.824462890625, 0.8470458984375, 0.86962890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 9.0, 9.0, 7.0, 15.0, 21.0, 31.0, 40.0, 57.0, 109.0, 161.0, 285.0, 581.0, 1234.0, 3270.0, 10392.0, 50176.0, 441380.0, 469138.0, 54495.0, 11063.0, 3347.0, 1384.0, 564.0, 288.0, 190.0, 103.0, 71.0, 50.0, 30.0, 15.0, 14.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48779296875, -0.4715423583984375, -0.455291748046875, -0.4390411376953125, -0.42279052734375, -0.4065399169921875, -0.390289306640625, -0.3740386962890625, -0.3577880859375, -0.3415374755859375, -0.325286865234375, -0.3090362548828125, -0.29278564453125, -0.2765350341796875, -0.260284423828125, -0.2440338134765625, -0.227783203125, -0.2115325927734375, -0.195281982421875, -0.1790313720703125, -0.16278076171875, -0.1465301513671875, -0.130279541015625, -0.1140289306640625, -0.0977783203125, -0.0815277099609375, -0.065277099609375, -0.0490264892578125, -0.03277587890625, -0.0165252685546875, -0.000274658203125, 0.0159759521484375, 0.0322265625, 0.0484771728515625, 0.064727783203125, 0.0809783935546875, 0.09722900390625, 0.1134796142578125, 0.129730224609375, 0.1459808349609375, 0.1622314453125, 0.1784820556640625, 0.194732666015625, 0.2109832763671875, 0.22723388671875, 0.2434844970703125, 0.259735107421875, 0.2759857177734375, 0.292236328125, 0.3084869384765625, 0.324737548828125, 0.3409881591796875, 0.35723876953125, 0.3734893798828125, 0.389739990234375, 0.4059906005859375, 0.4222412109375, 0.4384918212890625, 0.454742431640625, 0.4709930419921875, 0.48724365234375, 0.5034942626953125, 0.519744873046875, 0.5359954833984375, 0.55224609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 2.0, 8.0, 10.0, 10.0, 9.0, 16.0, 15.0, 22.0, 20.0, 26.0, 30.0, 35.0, 38.0, 40.0, 41.0, 39.0, 53.0, 44.0, 43.0, 43.0, 50.0, 43.0, 36.0, 36.0, 30.0, 32.0, 29.0, 24.0, 26.0, 25.0, 19.0, 17.0, 10.0, 10.0, 14.0, 10.0, 7.0, 7.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.2333984375, -1.19427490234375, -1.1551513671875, -1.11602783203125, -1.076904296875, -1.03778076171875, -0.9986572265625, -0.95953369140625, -0.92041015625, -0.88128662109375, -0.8421630859375, -0.80303955078125, -0.763916015625, -0.72479248046875, -0.6856689453125, -0.64654541015625, -0.607421875, -0.56829833984375, -0.5291748046875, -0.49005126953125, -0.450927734375, -0.41180419921875, -0.3726806640625, -0.33355712890625, -0.29443359375, -0.25531005859375, -0.2161865234375, -0.17706298828125, -0.137939453125, -0.09881591796875, -0.0596923828125, -0.02056884765625, 0.0185546875, 0.05767822265625, 0.0968017578125, 0.13592529296875, 0.175048828125, 0.21417236328125, 0.2532958984375, 0.29241943359375, 0.33154296875, 0.37066650390625, 0.4097900390625, 0.44891357421875, 0.488037109375, 0.52716064453125, 0.5662841796875, 0.60540771484375, 0.64453125, 0.68365478515625, 0.7227783203125, 0.76190185546875, 0.801025390625, 0.84014892578125, 0.8792724609375, 0.91839599609375, 0.95751953125, 0.99664306640625, 1.0357666015625, 1.07489013671875, 1.114013671875, 1.15313720703125, 1.1922607421875, 1.23138427734375, 1.2705078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 5.0, 9.0, 8.0, 19.0, 20.0, 35.0, 50.0, 89.0, 105.0, 211.0, 370.0, 594.0, 1125.0, 2038.0, 4236.0, 11244.0, 55994.0, 746600.0, 192875.0, 20569.0, 6407.0, 2718.0, 1325.0, 784.0, 437.0, 243.0, 143.0, 89.0, 66.0, 35.0, 32.0, 20.0, 11.0, 9.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2802734375, -0.2714385986328125, -0.262603759765625, -0.2537689208984375, -0.24493408203125, -0.2360992431640625, -0.227264404296875, -0.2184295654296875, -0.2095947265625, -0.2007598876953125, -0.191925048828125, -0.1830902099609375, -0.17425537109375, -0.1654205322265625, -0.156585693359375, -0.1477508544921875, -0.138916015625, -0.1300811767578125, -0.121246337890625, -0.1124114990234375, -0.10357666015625, -0.0947418212890625, -0.085906982421875, -0.0770721435546875, -0.0682373046875, -0.0594024658203125, -0.050567626953125, -0.0417327880859375, -0.03289794921875, -0.0240631103515625, -0.015228271484375, -0.0063934326171875, 0.00244140625, 0.0112762451171875, 0.020111083984375, 0.0289459228515625, 0.03778076171875, 0.0466156005859375, 0.055450439453125, 0.0642852783203125, 0.0731201171875, 0.0819549560546875, 0.090789794921875, 0.0996246337890625, 0.10845947265625, 0.1172943115234375, 0.126129150390625, 0.1349639892578125, 0.143798828125, 0.1526336669921875, 0.161468505859375, 0.1703033447265625, 0.17913818359375, 0.1879730224609375, 0.196807861328125, 0.2056427001953125, 0.2144775390625, 0.2233123779296875, 0.232147216796875, 0.2409820556640625, 0.24981689453125, 0.2586517333984375, 0.267486572265625, 0.2763214111328125, 0.28515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 1.0, 12.0, 23.0, 26.0, 38.0, 77.0, 193.0, 251.0, 189.0, 93.0, 34.0, 20.0, 15.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0], "bins": [-0.0002696514129638672, -0.0002644127234816551, -0.00025917403399944305, -0.000253935344517231, -0.0002486966550350189, -0.00024345796555280685, -0.0002382192760705948, -0.00023298058658838272, -0.00022774189710617065, -0.0002225032076239586, -0.00021726451814174652, -0.00021202582865953445, -0.0002067871391773224, -0.00020154844969511032, -0.00019630976021289825, -0.0001910710707306862, -0.00018583238124847412, -0.00018059369176626205, -0.00017535500228405, -0.00017011631280183792, -0.00016487762331962585, -0.0001596389338374138, -0.00015440024435520172, -0.00014916155487298965, -0.0001439228653907776, -0.00013868417590856552, -0.00013344548642635345, -0.0001282067969441414, -0.00012296810746192932, -0.00011772941797971725, -0.00011249072849750519, -0.00010725203901529312, -0.00010201334953308105, -9.677466005086899e-05, -9.153597056865692e-05, -8.629728108644485e-05, -8.105859160423279e-05, -7.581990212202072e-05, -7.058121263980865e-05, -6.534252315759659e-05, -6.010383367538452e-05, -5.4865144193172455e-05, -4.962645471096039e-05, -4.438776522874832e-05, -3.9149075746536255e-05, -3.391038626432419e-05, -2.867169678211212e-05, -2.3433007299900055e-05, -1.8194317817687988e-05, -1.2955628335475922e-05, -7.716938853263855e-06, -2.4782493710517883e-06, 2.7604401111602783e-06, 7.999129593372345e-06, 1.3237819075584412e-05, 1.8476508557796478e-05, 2.3715198040008545e-05, 2.895388752222061e-05, 3.419257700443268e-05, 3.9431266486644745e-05, 4.466995596885681e-05, 4.990864545106888e-05, 5.5147334933280945e-05, 6.038602441549301e-05, 6.562471389770508e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 18.0, 20.0, 27.0, 42.0, 72.0, 143.0, 226.0, 466.0, 942.0, 2127.0, 5840.0, 24666.0, 440331.0, 535245.0, 27810.0, 6269.0, 2292.0, 969.0, 457.0, 242.0, 122.0, 75.0, 39.0, 35.0, 24.0, 10.0, 10.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.480712890625, -0.4677314758300781, -0.45475006103515625, -0.4417686462402344, -0.4287872314453125, -0.4158058166503906, -0.40282440185546875, -0.3898429870605469, -0.376861572265625, -0.3638801574707031, -0.35089874267578125, -0.3379173278808594, -0.3249359130859375, -0.3119544982910156, -0.29897308349609375, -0.2859916687011719, -0.27301025390625, -0.2600288391113281, -0.24704742431640625, -0.23406600952148438, -0.2210845947265625, -0.20810317993164062, -0.19512176513671875, -0.18214035034179688, -0.169158935546875, -0.15617752075195312, -0.14319610595703125, -0.13021469116210938, -0.1172332763671875, -0.10425186157226562, -0.09127044677734375, -0.07828903198242188, -0.0653076171875, -0.052326202392578125, -0.03934478759765625, -0.026363372802734375, -0.0133819580078125, -0.000400543212890625, 0.01258087158203125, 0.025562286376953125, 0.038543701171875, 0.051525115966796875, 0.06450653076171875, 0.07748794555664062, 0.0904693603515625, 0.10345077514648438, 0.11643218994140625, 0.12941360473632812, 0.14239501953125, 0.15537643432617188, 0.16835784912109375, 0.18133926391601562, 0.1943206787109375, 0.20730209350585938, 0.22028350830078125, 0.23326492309570312, 0.246246337890625, 0.2592277526855469, 0.27220916748046875, 0.2851905822753906, 0.2981719970703125, 0.3111534118652344, 0.32413482666015625, 0.3371162414550781, 0.35009765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 13.0, 18.0, 20.0, 37.0, 76.0, 143.0, 253.0, 183.0, 85.0, 58.0, 37.0, 19.0, 8.0, 8.0, 7.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0936279296875, -0.08998680114746094, -0.08634567260742188, -0.08270454406738281, -0.07906341552734375, -0.07542228698730469, -0.07178115844726562, -0.06814002990722656, -0.0644989013671875, -0.06085777282714844, -0.057216644287109375, -0.05357551574707031, -0.04993438720703125, -0.04629325866699219, -0.042652130126953125, -0.03901100158691406, -0.035369873046875, -0.03172874450683594, -0.028087615966796875, -0.024446487426757812, -0.02080535888671875, -0.017164230346679688, -0.013523101806640625, -0.009881973266601562, -0.0062408447265625, -0.0025997161865234375, 0.001041412353515625, 0.0046825408935546875, 0.00832366943359375, 0.011964797973632812, 0.015605926513671875, 0.019247055053710938, 0.02288818359375, 0.026529312133789062, 0.030170440673828125, 0.03381156921386719, 0.03745269775390625, 0.04109382629394531, 0.044734954833984375, 0.04837608337402344, 0.0520172119140625, 0.05565834045410156, 0.059299468994140625, 0.06294059753417969, 0.06658172607421875, 0.07022285461425781, 0.07386398315429688, 0.07750511169433594, 0.081146240234375, 0.08478736877441406, 0.08842849731445312, 0.09206962585449219, 0.09571075439453125, 0.09935188293457031, 0.10299301147460938, 0.10663414001464844, 0.1102752685546875, 0.11391639709472656, 0.11755752563476562, 0.12119865417480469, 0.12483978271484375, 0.1284809112548828, 0.13212203979492188, 0.13576316833496094, 0.139404296875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 21.0, 40.0, 44.0, 85.0, 108.0, 137.0, 147.0, 141.0, 86.0, 76.0, 43.0, 36.0, 18.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3893704414367676, -1.347721815109253, -1.3060733079910278, -1.2644246816635132, -1.222776174545288, -1.1811275482177734, -1.1394790410995483, -1.0978304147720337, -1.0561819076538086, -1.014533281326294, -0.9728847742080688, -0.931236207485199, -0.8895876407623291, -0.8479390740394592, -0.8062905073165894, -0.7646418809890747, -0.7229933142662048, -0.681344747543335, -0.6396961808204651, -0.5980476140975952, -0.5563990473747253, -0.5147504806518555, -0.4731018841266632, -0.43145331740379333, -0.38980475068092346, -0.3481561839580536, -0.3065076172351837, -0.26485902070999146, -0.22321046888828278, -0.1815619021654129, -0.13991332054138184, -0.09826475381851196, -0.05661618709564209, -0.014967616647481918, 0.026680953800678253, 0.06832952797412872, 0.1099780946969986, 0.15162666141986847, 0.19327524304389954, 0.2349238097667694, 0.2765723764896393, 0.31822094321250916, 0.35986950993537903, 0.4015181064605713, 0.44316667318344116, 0.48481523990631104, 0.5264638066291809, 0.5681123733520508, 0.6097609400749207, 0.6514095067977905, 0.6930580735206604, 0.7347066402435303, 0.7763552069664001, 0.81800377368927, 0.8596524000167847, 0.9013009071350098, 0.9429495334625244, 0.9845981001853943, 1.0262466669082642, 1.0678952932357788, 1.109543800354004, 1.1511924266815186, 1.1928409337997437, 1.2344895601272583, 1.2761380672454834]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 16.0, 17.0, 16.0, 24.0, 42.0, 21.0, 24.0, 34.0, 50.0, 44.0, 40.0, 57.0, 66.0, 65.0, 47.0, 51.0, 46.0, 45.0, 39.0, 33.0, 35.0, 28.0, 19.0, 21.0, 16.0, 21.0, 11.0, 15.0, 3.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48366406559944153, -0.4644789695739746, -0.4452938735485077, -0.42610877752304077, -0.40692368149757385, -0.38773858547210693, -0.3685535192489624, -0.3493683934211731, -0.33018332719802856, -0.31099823117256165, -0.2918131351470947, -0.2726280391216278, -0.2534429430961609, -0.23425784707069397, -0.21507276594638824, -0.19588766992092133, -0.1767025589942932, -0.1575174629688263, -0.13833236694335938, -0.11914727836847305, -0.09996218234300613, -0.08077708631753922, -0.06159199774265289, -0.042406901717185974, -0.023221805691719055, -0.0040367115288972855, 0.015148382633924484, 0.034333474934101105, 0.053518570959568024, 0.07270366698503494, 0.09188875555992126, 0.11107385158538818, 0.13025891780853271, 0.14944401383399963, 0.16862910985946655, 0.18781420588493347, 0.2069993019104004, 0.2261843979358673, 0.24536947906017303, 0.26455456018447876, 0.28373968601226807, 0.302924782037735, 0.3221098780632019, 0.3412949740886688, 0.36048007011413574, 0.37966516613960266, 0.3988502621650696, 0.4180353283882141, 0.43722042441368103, 0.45640552043914795, 0.47559061646461487, 0.4947757124900818, 0.5139607787132263, 0.5331459045410156, 0.5523309707641602, 0.5715160965919495, 0.590701162815094, 0.6098862290382385, 0.6290713548660278, 0.6482564210891724, 0.6674415469169617, 0.6866266131401062, 0.7058117389678955, 0.72499680519104, 0.7441819310188293]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 1.0, 8.0, 14.0, 13.0, 30.0, 37.0, 48.0, 116.0, 166.0, 325.0, 565.0, 1007.0, 2146.0, 4155.0, 8926.0, 20184.0, 54089.0, 194089.0, 492121.0, 182755.0, 51318.0, 19583.0, 8413.0, 4031.0, 2073.0, 1040.0, 554.0, 323.0, 159.0, 105.0, 63.0, 37.0, 18.0, 11.0, 9.0, 17.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7421417236328125, -0.711822509765625, -0.6815032958984375, -0.65118408203125, -0.6208648681640625, -0.590545654296875, -0.5602264404296875, -0.5299072265625, -0.4995880126953125, -0.469268798828125, -0.4389495849609375, -0.40863037109375, -0.3783111572265625, -0.347991943359375, -0.3176727294921875, -0.287353515625, -0.2570343017578125, -0.226715087890625, -0.1963958740234375, -0.16607666015625, -0.1357574462890625, -0.105438232421875, -0.0751190185546875, -0.0447998046875, -0.0144805908203125, 0.015838623046875, 0.0461578369140625, 0.07647705078125, 0.1067962646484375, 0.137115478515625, 0.1674346923828125, 0.19775390625, 0.2280731201171875, 0.258392333984375, 0.2887115478515625, 0.31903076171875, 0.3493499755859375, 0.379669189453125, 0.4099884033203125, 0.4403076171875, 0.4706268310546875, 0.500946044921875, 0.5312652587890625, 0.56158447265625, 0.5919036865234375, 0.622222900390625, 0.6525421142578125, 0.682861328125, 0.7131805419921875, 0.743499755859375, 0.7738189697265625, 0.80413818359375, 0.8344573974609375, 0.864776611328125, 0.8950958251953125, 0.9254150390625, 0.9557342529296875, 0.986053466796875, 1.0163726806640625, 1.04669189453125, 1.0770111083984375, 1.107330322265625, 1.1376495361328125, 1.16796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 13.0, 13.0, 12.0, 17.0, 24.0, 23.0, 21.0, 23.0, 20.0, 29.0, 43.0, 50.0, 44.0, 42.0, 72.0, 51.0, 56.0, 45.0, 49.0, 46.0, 48.0, 38.0, 29.0, 32.0, 30.0, 17.0, 19.0, 12.0, 20.0, 13.0, 7.0, 7.0, 5.0, 4.0, 7.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2236328125, -1.186126708984375, -1.14862060546875, -1.111114501953125, -1.0736083984375, -1.036102294921875, -0.99859619140625, -0.961090087890625, -0.923583984375, -0.886077880859375, -0.84857177734375, -0.811065673828125, -0.7735595703125, -0.736053466796875, -0.69854736328125, -0.661041259765625, -0.62353515625, -0.586029052734375, -0.54852294921875, -0.511016845703125, -0.4735107421875, -0.436004638671875, -0.39849853515625, -0.360992431640625, -0.323486328125, -0.285980224609375, -0.24847412109375, -0.210968017578125, -0.1734619140625, -0.135955810546875, -0.09844970703125, -0.060943603515625, -0.0234375, 0.014068603515625, 0.05157470703125, 0.089080810546875, 0.1265869140625, 0.164093017578125, 0.20159912109375, 0.239105224609375, 0.276611328125, 0.314117431640625, 0.35162353515625, 0.389129638671875, 0.4266357421875, 0.464141845703125, 0.50164794921875, 0.539154052734375, 0.57666015625, 0.614166259765625, 0.65167236328125, 0.689178466796875, 0.7266845703125, 0.764190673828125, 0.80169677734375, 0.839202880859375, 0.876708984375, 0.914215087890625, 0.95172119140625, 0.989227294921875, 1.0267333984375, 1.064239501953125, 1.10174560546875, 1.139251708984375, 1.1767578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 3.0, 13.0, 16.0, 26.0, 28.0, 34.0, 58.0, 80.0, 145.0, 244.0, 552.0, 1469.0, 5325.0, 25973.0, 223607.0, 684249.0, 88326.0, 13385.0, 3115.0, 956.0, 391.0, 194.0, 114.0, 62.0, 38.0, 38.0, 27.0, 17.0, 15.0, 9.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4196624755859375, -1.365692138671875, -1.3117218017578125, -1.25775146484375, -1.2037811279296875, -1.149810791015625, -1.0958404541015625, -1.0418701171875, -0.9878997802734375, -0.933929443359375, -0.8799591064453125, -0.82598876953125, -0.7720184326171875, -0.718048095703125, -0.6640777587890625, -0.610107421875, -0.5561370849609375, -0.502166748046875, -0.4481964111328125, -0.39422607421875, -0.3402557373046875, -0.286285400390625, -0.2323150634765625, -0.1783447265625, -0.1243743896484375, -0.070404052734375, -0.0164337158203125, 0.03753662109375, 0.0915069580078125, 0.145477294921875, 0.1994476318359375, 0.25341796875, 0.3073883056640625, 0.361358642578125, 0.4153289794921875, 0.46929931640625, 0.5232696533203125, 0.577239990234375, 0.6312103271484375, 0.6851806640625, 0.7391510009765625, 0.793121337890625, 0.8470916748046875, 0.90106201171875, 0.9550323486328125, 1.009002685546875, 1.0629730224609375, 1.116943359375, 1.1709136962890625, 1.224884033203125, 1.2788543701171875, 1.33282470703125, 1.3867950439453125, 1.440765380859375, 1.4947357177734375, 1.5487060546875, 1.6026763916015625, 1.656646728515625, 1.7106170654296875, 1.76458740234375, 1.8185577392578125, 1.872528076171875, 1.9264984130859375, 1.98046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 8.0, 11.0, 15.0, 17.0, 18.0, 27.0, 19.0, 33.0, 30.0, 37.0, 40.0, 47.0, 56.0, 60.0, 56.0, 52.0, 57.0, 64.0, 49.0, 39.0, 43.0, 41.0, 34.0, 23.0, 24.0, 23.0, 7.0, 14.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4384765625, -1.3890533447265625, -1.339630126953125, -1.2902069091796875, -1.24078369140625, -1.1913604736328125, -1.141937255859375, -1.0925140380859375, -1.0430908203125, -0.9936676025390625, -0.944244384765625, -0.8948211669921875, -0.84539794921875, -0.7959747314453125, -0.746551513671875, -0.6971282958984375, -0.647705078125, -0.5982818603515625, -0.548858642578125, -0.4994354248046875, -0.45001220703125, -0.4005889892578125, -0.351165771484375, -0.3017425537109375, -0.2523193359375, -0.2028961181640625, -0.153472900390625, -0.1040496826171875, -0.05462646484375, -0.0052032470703125, 0.044219970703125, 0.0936431884765625, 0.14306640625, 0.1924896240234375, 0.241912841796875, 0.2913360595703125, 0.34075927734375, 0.3901824951171875, 0.439605712890625, 0.4890289306640625, 0.5384521484375, 0.5878753662109375, 0.637298583984375, 0.6867218017578125, 0.73614501953125, 0.7855682373046875, 0.834991455078125, 0.8844146728515625, 0.933837890625, 0.9832611083984375, 1.032684326171875, 1.0821075439453125, 1.13153076171875, 1.1809539794921875, 1.230377197265625, 1.2798004150390625, 1.3292236328125, 1.3786468505859375, 1.428070068359375, 1.4774932861328125, 1.52691650390625, 1.5763397216796875, 1.625762939453125, 1.6751861572265625, 1.724609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 9.0, 12.0, 21.0, 37.0, 61.0, 98.0, 170.0, 500.0, 1598.0, 7657.0, 102769.0, 838603.0, 87691.0, 6880.0, 1488.0, 499.0, 205.0, 100.0, 50.0, 19.0, 17.0, 13.0, 7.0, 6.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.6080398559570312, -0.5866851806640625, -0.5653305053710938, -0.543975830078125, -0.5226211547851562, -0.5012664794921875, -0.47991180419921875, -0.45855712890625, -0.43720245361328125, -0.4158477783203125, -0.39449310302734375, -0.373138427734375, -0.35178375244140625, -0.3304290771484375, -0.30907440185546875, -0.2877197265625, -0.26636505126953125, -0.2450103759765625, -0.22365570068359375, -0.202301025390625, -0.18094635009765625, -0.1595916748046875, -0.13823699951171875, -0.11688232421875, -0.09552764892578125, -0.0741729736328125, -0.05281829833984375, -0.031463623046875, -0.01010894775390625, 0.0112457275390625, 0.03260040283203125, 0.053955078125, 0.07530975341796875, 0.0966644287109375, 0.11801910400390625, 0.139373779296875, 0.16072845458984375, 0.1820831298828125, 0.20343780517578125, 0.22479248046875, 0.24614715576171875, 0.2675018310546875, 0.28885650634765625, 0.310211181640625, 0.33156585693359375, 0.3529205322265625, 0.37427520751953125, 0.3956298828125, 0.41698455810546875, 0.4383392333984375, 0.45969390869140625, 0.481048583984375, 0.5024032592773438, 0.5237579345703125, 0.5451126098632812, 0.56646728515625, 0.5878219604492188, 0.6091766357421875, 0.6305313110351562, 0.651885986328125, 0.6732406616210938, 0.6945953369140625, 0.7159500122070312, 0.7373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 4.0, 9.0, 10.0, 25.0, 29.0, 34.0, 35.0, 45.0, 77.0, 104.0, 150.0, 117.0, 98.0, 68.0, 53.0, 50.0, 27.0, 24.0, 14.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.26716423034668e-05, -8.049327880144119e-05, -7.831491529941559e-05, -7.613655179738998e-05, -7.395818829536438e-05, -7.177982479333878e-05, -6.960146129131317e-05, -6.742309778928757e-05, -6.524473428726196e-05, -6.306637078523636e-05, -6.0888007283210754e-05, -5.870964378118515e-05, -5.6531280279159546e-05, -5.435291677713394e-05, -5.217455327510834e-05, -4.999618977308273e-05, -4.781782627105713e-05, -4.5639462769031525e-05, -4.346109926700592e-05, -4.1282735764980316e-05, -3.910437226295471e-05, -3.692600876092911e-05, -3.4747645258903503e-05, -3.25692817568779e-05, -3.0390918254852295e-05, -2.821255475282669e-05, -2.6034191250801086e-05, -2.3855827748775482e-05, -2.1677464246749878e-05, -1.9499100744724274e-05, -1.732073724269867e-05, -1.5142373740673065e-05, -1.2964010238647461e-05, -1.0785646736621857e-05, -8.607283234596252e-06, -6.428919732570648e-06, -4.250556230545044e-06, -2.0721927285194397e-06, 1.0617077350616455e-07, 2.284534275531769e-06, 4.462897777557373e-06, 6.641261279582977e-06, 8.819624781608582e-06, 1.0997988283634186e-05, 1.317635178565979e-05, 1.5354715287685394e-05, 1.7533078789711e-05, 1.9711442291736603e-05, 2.1889805793762207e-05, 2.406816929578781e-05, 2.6246532797813416e-05, 2.842489629983902e-05, 3.0603259801864624e-05, 3.278162330389023e-05, 3.495998680591583e-05, 3.713835030794144e-05, 3.931671380996704e-05, 4.1495077311992645e-05, 4.367344081401825e-05, 4.5851804316043854e-05, 4.803016781806946e-05, 5.020853132009506e-05, 5.2386894822120667e-05, 5.456525832414627e-05, 5.6743621826171875e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 10.0, 20.0, 30.0, 40.0, 63.0, 130.0, 241.0, 463.0, 972.0, 2390.0, 9552.0, 85803.0, 781000.0, 149287.0, 13299.0, 2963.0, 1115.0, 530.0, 275.0, 137.0, 93.0, 41.0, 30.0, 16.0, 15.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.89892578125, -0.8773155212402344, -0.8557052612304688, -0.8340950012207031, -0.8124847412109375, -0.7908744812011719, -0.7692642211914062, -0.7476539611816406, -0.726043701171875, -0.7044334411621094, -0.6828231811523438, -0.6612129211425781, -0.6396026611328125, -0.6179924011230469, -0.5963821411132812, -0.5747718811035156, -0.55316162109375, -0.5315513610839844, -0.5099411010742188, -0.4883308410644531, -0.4667205810546875, -0.4451103210449219, -0.42350006103515625, -0.4018898010253906, -0.380279541015625, -0.3586692810058594, -0.33705902099609375, -0.3154487609863281, -0.2938385009765625, -0.2722282409667969, -0.25061798095703125, -0.22900772094726562, -0.2073974609375, -0.18578720092773438, -0.16417694091796875, -0.14256668090820312, -0.1209564208984375, -0.09934616088867188, -0.07773590087890625, -0.056125640869140625, -0.034515380859375, -0.012905120849609375, 0.00870513916015625, 0.030315399169921875, 0.0519256591796875, 0.07353591918945312, 0.09514617919921875, 0.11675643920898438, 0.13836669921875, 0.15997695922851562, 0.18158721923828125, 0.20319747924804688, 0.2248077392578125, 0.24641799926757812, 0.26802825927734375, 0.2896385192871094, 0.311248779296875, 0.3328590393066406, 0.35446929931640625, 0.3760795593261719, 0.3976898193359375, 0.4193000793457031, 0.44091033935546875, 0.4625205993652344, 0.484130859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 7.0, 6.0, 7.0, 17.0, 21.0, 26.0, 31.0, 45.0, 62.0, 83.0, 108.0, 121.0, 115.0, 89.0, 75.0, 42.0, 33.0, 28.0, 22.0, 20.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.218017578125, -0.21059799194335938, -0.20317840576171875, -0.19575881958007812, -0.1883392333984375, -0.18091964721679688, -0.17350006103515625, -0.16608047485351562, -0.158660888671875, -0.15124130249023438, -0.14382171630859375, -0.13640213012695312, -0.1289825439453125, -0.12156295776367188, -0.11414337158203125, -0.10672378540039062, -0.09930419921875, -0.09188461303710938, -0.08446502685546875, -0.07704544067382812, -0.0696258544921875, -0.062206268310546875, -0.05478668212890625, -0.047367095947265625, -0.039947509765625, -0.032527923583984375, -0.02510833740234375, -0.017688751220703125, -0.0102691650390625, -0.002849578857421875, 0.00457000732421875, 0.011989593505859375, 0.0194091796875, 0.026828765869140625, 0.03424835205078125, 0.041667938232421875, 0.0490875244140625, 0.056507110595703125, 0.06392669677734375, 0.07134628295898438, 0.078765869140625, 0.08618545532226562, 0.09360504150390625, 0.10102462768554688, 0.1084442138671875, 0.11586380004882812, 0.12328338623046875, 0.13070297241210938, 0.13812255859375, 0.14554214477539062, 0.15296173095703125, 0.16038131713867188, 0.1678009033203125, 0.17522048950195312, 0.18264007568359375, 0.19005966186523438, 0.197479248046875, 0.20489883422851562, 0.21231842041015625, 0.21973800659179688, 0.2271575927734375, 0.23457717895507812, 0.24199676513671875, 0.24941635131835938, 0.2568359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 13.0, 85.0, 305.0, 397.0, 169.0, 40.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.147091031074524, -0.8759806156158447, -0.6048701405525208, -0.3337596654891968, -0.06264925003051758, 0.20846116542816162, 0.47957170009613037, 0.7506821155548096, 1.0217925310134888, 1.292902946472168, 1.5640134811401367, 1.835123896598816, 2.106234312057495, 2.3773446083068848, 2.6484551429748535, 2.9195656776428223, 3.190676212310791, 3.4617867469787598, 3.7328970432281494, 4.004007339477539, 4.275117874145508, 4.546228408813477, 4.817338943481445, 5.088449478149414, 5.359559535980225, 5.630670070648193, 5.901780605316162, 6.172890663146973, 6.444001197814941, 6.71511173248291, 6.986222267150879, 7.257332801818848, 7.528443336486816, 7.799553871154785, 8.070664405822754, 8.341774940490723, 8.612885475158691, 8.883995056152344, 9.155105590820312, 9.426216125488281, 9.69732666015625, 9.968437194824219, 10.239547729492188, 10.510658264160156, 10.781768798828125, 11.052879333496094, 11.323989868164062, 11.595099449157715, 11.8662109375, 12.137321472167969, 12.408432006835938, 12.679542541503906, 12.950653076171875, 13.221763610839844, 13.492874145507812, 13.763983726501465, 14.035094261169434, 14.306204795837402, 14.577315330505371, 14.84842586517334, 15.119536399841309, 15.390645980834961, 15.66175651550293, 15.932867050170898, 16.203977584838867]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 11.0, 8.0, 17.0, 11.0, 8.0, 21.0, 24.0, 26.0, 14.0, 20.0, 24.0, 38.0, 40.0, 38.0, 40.0, 41.0, 37.0, 43.0, 57.0, 44.0, 44.0, 47.0, 42.0, 45.0, 32.0, 26.0, 32.0, 25.0, 22.0, 21.0, 21.0, 17.0, 6.0, 5.0, 9.0, 5.0, 4.0, 9.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-2.36063551902771, -2.2927160263061523, -2.2247965335845947, -2.156876802444458, -2.0889573097229004, -2.0210378170013428, -1.9531183242797852, -1.885198712348938, -1.8172791004180908, -1.7493596076965332, -1.681439995765686, -1.6135205030441284, -1.5456008911132812, -1.4776813983917236, -1.409761905670166, -1.3418422937393188, -1.2739228010177612, -1.2060033082962036, -1.1380836963653564, -1.0701642036437988, -1.0022445917129517, -0.934325098991394, -0.8664055466651917, -0.7984859943389893, -0.7305664420127869, -0.6626468896865845, -0.5947273373603821, -0.5268077850341797, -0.4588882625102997, -0.3909687101840973, -0.3230491876602173, -0.2551296353340149, -0.18721020221710205, -0.11929065734148026, -0.05137111246585846, 0.01654842495918274, 0.08446797728538513, 0.15238752961158752, 0.22030705213546753, 0.2882266044616699, 0.3561461567878723, 0.4240657091140747, 0.4919852614402771, 0.5599048137664795, 0.6278243064880371, 0.6957439184188843, 0.7636634111404419, 0.8315829634666443, 0.8995025157928467, 0.9674220681190491, 1.0353416204452515, 1.103261113166809, 1.1711807250976562, 1.2391002178192139, 1.3070197105407715, 1.3749393224716187, 1.4428589344024658, 1.5107784271240234, 1.5786980390548706, 1.6466175317764282, 1.7145371437072754, 1.782456636428833, 1.8503761291503906, 1.9182957410812378, 1.9862152338027954]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 10.0, 15.0, 18.0, 18.0, 30.0, 32.0, 43.0, 47.0, 71.0, 87.0, 203.0, 357.0, 753.0, 1832.0, 6102.0, 29859.0, 500099.0, 3462296.0, 167823.0, 17588.0, 4251.0, 1402.0, 579.0, 242.0, 142.0, 92.0, 65.0, 35.0, 49.0, 28.0, 18.0, 13.0, 18.0, 12.0, 9.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6669921875, -1.610198974609375, -1.55340576171875, -1.496612548828125, -1.4398193359375, -1.383026123046875, -1.32623291015625, -1.269439697265625, -1.212646484375, -1.155853271484375, -1.09906005859375, -1.042266845703125, -0.9854736328125, -0.928680419921875, -0.87188720703125, -0.815093994140625, -0.75830078125, -0.701507568359375, -0.64471435546875, -0.587921142578125, -0.5311279296875, -0.474334716796875, -0.41754150390625, -0.360748291015625, -0.303955078125, -0.247161865234375, -0.19036865234375, -0.133575439453125, -0.0767822265625, -0.019989013671875, 0.03680419921875, 0.093597412109375, 0.150390625, 0.207183837890625, 0.26397705078125, 0.320770263671875, 0.3775634765625, 0.434356689453125, 0.49114990234375, 0.547943115234375, 0.604736328125, 0.661529541015625, 0.71832275390625, 0.775115966796875, 0.8319091796875, 0.888702392578125, 0.94549560546875, 1.002288818359375, 1.05908203125, 1.115875244140625, 1.17266845703125, 1.229461669921875, 1.2862548828125, 1.343048095703125, 1.39984130859375, 1.456634521484375, 1.513427734375, 1.570220947265625, 1.62701416015625, 1.683807373046875, 1.7406005859375, 1.797393798828125, 1.85418701171875, 1.910980224609375, 1.9677734375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 12.0, 9.0, 14.0, 17.0, 16.0, 27.0, 35.0, 32.0, 37.0, 38.0, 54.0, 63.0, 73.0, 66.0, 61.0, 59.0, 58.0, 51.0, 57.0, 55.0, 39.0, 25.0, 29.0, 19.0, 13.0, 8.0, 8.0, 11.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77294921875, -0.7472076416015625, -0.721466064453125, -0.6957244873046875, -0.66998291015625, -0.6442413330078125, -0.618499755859375, -0.5927581787109375, -0.5670166015625, -0.5412750244140625, -0.515533447265625, -0.4897918701171875, -0.46405029296875, -0.4383087158203125, -0.412567138671875, -0.3868255615234375, -0.361083984375, -0.3353424072265625, -0.309600830078125, -0.2838592529296875, -0.25811767578125, -0.2323760986328125, -0.206634521484375, -0.1808929443359375, -0.1551513671875, -0.1294097900390625, -0.103668212890625, -0.0779266357421875, -0.05218505859375, -0.0264434814453125, -0.000701904296875, 0.0250396728515625, 0.05078125, 0.0765228271484375, 0.102264404296875, 0.1280059814453125, 0.15374755859375, 0.1794891357421875, 0.205230712890625, 0.2309722900390625, 0.2567138671875, 0.2824554443359375, 0.308197021484375, 0.3339385986328125, 0.35968017578125, 0.3854217529296875, 0.411163330078125, 0.4369049072265625, 0.462646484375, 0.4883880615234375, 0.514129638671875, 0.5398712158203125, 0.56561279296875, 0.5913543701171875, 0.617095947265625, 0.6428375244140625, 0.6685791015625, 0.6943206787109375, 0.720062255859375, 0.7458038330078125, 0.77154541015625, 0.7972869873046875, 0.823028564453125, 0.8487701416015625, 0.87451171875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 12.0, 33.0, 38.0, 77.0, 239.0, 1206.0, 12812.0, 4027504.0, 148444.0, 3056.0, 519.0, 155.0, 74.0, 34.0, 26.0, 11.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.65625, -4.5140380859375, -4.371826171875, -4.2296142578125, -4.08740234375, -3.9451904296875, -3.802978515625, -3.6607666015625, -3.5185546875, -3.3763427734375, -3.234130859375, -3.0919189453125, -2.94970703125, -2.8074951171875, -2.665283203125, -2.5230712890625, -2.380859375, -2.2386474609375, -2.096435546875, -1.9542236328125, -1.81201171875, -1.6697998046875, -1.527587890625, -1.3853759765625, -1.2431640625, -1.1009521484375, -0.958740234375, -0.8165283203125, -0.67431640625, -0.5321044921875, -0.389892578125, -0.2476806640625, -0.10546875, 0.0367431640625, 0.178955078125, 0.3211669921875, 0.46337890625, 0.6055908203125, 0.747802734375, 0.8900146484375, 1.0322265625, 1.1744384765625, 1.316650390625, 1.4588623046875, 1.60107421875, 1.7432861328125, 1.885498046875, 2.0277099609375, 2.169921875, 2.3121337890625, 2.454345703125, 2.5965576171875, 2.73876953125, 2.8809814453125, 3.023193359375, 3.1654052734375, 3.3076171875, 3.4498291015625, 3.592041015625, 3.7342529296875, 3.87646484375, 4.0186767578125, 4.160888671875, 4.3031005859375, 4.4453125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 9.0, 17.0, 16.0, 58.0, 71.0, 189.0, 391.0, 887.0, 1154.0, 683.0, 291.0, 148.0, 75.0, 34.0, 15.0, 13.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.662017822265625, -0.64093017578125, -0.619842529296875, -0.5987548828125, -0.577667236328125, -0.55657958984375, -0.535491943359375, -0.514404296875, -0.493316650390625, -0.47222900390625, -0.451141357421875, -0.4300537109375, -0.408966064453125, -0.38787841796875, -0.366790771484375, -0.345703125, -0.324615478515625, -0.30352783203125, -0.282440185546875, -0.2613525390625, -0.240264892578125, -0.21917724609375, -0.198089599609375, -0.177001953125, -0.155914306640625, -0.13482666015625, -0.113739013671875, -0.0926513671875, -0.071563720703125, -0.05047607421875, -0.029388427734375, -0.00830078125, 0.012786865234375, 0.03387451171875, 0.054962158203125, 0.0760498046875, 0.097137451171875, 0.11822509765625, 0.139312744140625, 0.160400390625, 0.181488037109375, 0.20257568359375, 0.223663330078125, 0.2447509765625, 0.265838623046875, 0.28692626953125, 0.308013916015625, 0.3291015625, 0.350189208984375, 0.37127685546875, 0.392364501953125, 0.4134521484375, 0.434539794921875, 0.45562744140625, 0.476715087890625, 0.497802734375, 0.518890380859375, 0.53997802734375, 0.561065673828125, 0.5821533203125, 0.603240966796875, 0.62432861328125, 0.645416259765625, 0.66650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 11.0, 9.0, 14.0, 12.0, 28.0, 25.0, 45.0, 42.0, 59.0, 64.0, 88.0, 70.0, 85.0, 78.0, 71.0, 57.0, 49.0, 49.0, 29.0, 31.0, 27.0, 20.0, 13.0, 4.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8160516619682312, -0.7804990410804749, -0.7449464797973633, -0.7093938589096069, -0.6738412380218506, -0.6382886171340942, -0.6027359962463379, -0.5671834349632263, -0.53163081407547, -0.4960781931877136, -0.46052560210227966, -0.4249730110168457, -0.38942039012908936, -0.353867769241333, -0.31831517815589905, -0.2827625870704651, -0.24720996618270874, -0.2116573601961136, -0.17610475420951843, -0.14055214822292328, -0.10499954223632812, -0.06944693624973297, -0.03389433026313782, 0.0016582757234573364, 0.03721088171005249, 0.07276348769664764, 0.1083160936832428, 0.14386869966983795, 0.1794213056564331, 0.21497391164302826, 0.2505265176296234, 0.2860791087150574, 0.3216317892074585, 0.35718441009521484, 0.3927370011806488, 0.42828959226608276, 0.4638422131538391, 0.49939483404159546, 0.534947395324707, 0.5705000162124634, 0.6060526371002197, 0.6416052579879761, 0.6771578788757324, 0.712710440158844, 0.7482630610466003, 0.7838156819343567, 0.8193682432174683, 0.8549208641052246, 0.890473484992981, 0.9260261058807373, 0.9615787267684937, 0.9971312880516052, 1.0326838493347168, 1.0682364702224731, 1.1037890911102295, 1.1393417119979858, 1.1748943328857422, 1.2104469537734985, 1.2459995746612549, 1.2815521955490112, 1.3171048164367676, 1.3526573181152344, 1.3882099390029907, 1.423762559890747, 1.4593151807785034]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 0.0, 6.0, 4.0, 9.0, 10.0, 11.0, 11.0, 9.0, 21.0, 13.0, 28.0, 28.0, 34.0, 20.0, 30.0, 36.0, 40.0, 39.0, 47.0, 48.0, 41.0, 48.0, 39.0, 42.0, 41.0, 40.0, 20.0, 46.0, 39.0, 31.0, 26.0, 17.0, 17.0, 19.0, 16.0, 12.0, 10.0, 7.0, 8.0, 8.0, 13.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7138119339942932, -0.6913244128227234, -0.6688368916511536, -0.6463493704795837, -0.6238618493080139, -0.6013742685317993, -0.5788867473602295, -0.5563992261886597, -0.5339117050170898, -0.51142418384552, -0.4889366626739502, -0.46644914150238037, -0.44396159052848816, -0.42147406935691833, -0.3989865481853485, -0.3764989972114563, -0.35401150584220886, -0.33152398467063904, -0.3090364634990692, -0.286548912525177, -0.2640613913536072, -0.24157387018203735, -0.21908634901046753, -0.1965988129377365, -0.1741112917661667, -0.15162377059459686, -0.12913623452186584, -0.10664871335029602, -0.0841611847281456, -0.06167365610599518, -0.039186134934425354, -0.016698598861694336, 0.005788922309875488, 0.02827644906938076, 0.05076397582888603, 0.07325150072574615, 0.09573902934789658, 0.118226557970047, 0.14071407914161682, 0.16320161521434784, 0.18568913638591766, 0.2081766575574875, 0.2306641936302185, 0.25315171480178833, 0.27563923597335815, 0.298126757144928, 0.3206142783164978, 0.34310182929039, 0.36558935046195984, 0.38807687163352966, 0.4105643928050995, 0.4330519437789917, 0.4555394649505615, 0.47802698612213135, 0.5005145072937012, 0.523002028465271, 0.5454895496368408, 0.5679770708084106, 0.5904645919799805, 0.6129521131515503, 0.6354396343231201, 0.6579271554946899, 0.6804146766662598, 0.7029022574424744, 0.7253897786140442]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 11.0, 7.0, 17.0, 24.0, 30.0, 59.0, 78.0, 103.0, 168.0, 264.0, 482.0, 837.0, 1622.0, 3367.0, 6837.0, 15929.0, 46704.0, 227837.0, 524705.0, 158859.0, 35306.0, 13138.0, 6109.0, 2812.0, 1366.0, 761.0, 404.0, 235.0, 138.0, 102.0, 73.0, 44.0, 27.0, 21.0, 17.0, 11.0, 12.0, 8.0, 6.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30908203125, -0.2992362976074219, -0.28939056396484375, -0.2795448303222656, -0.2696990966796875, -0.2598533630371094, -0.25000762939453125, -0.24016189575195312, -0.230316162109375, -0.22047042846679688, -0.21062469482421875, -0.20077896118164062, -0.1909332275390625, -0.18108749389648438, -0.17124176025390625, -0.16139602661132812, -0.15155029296875, -0.14170455932617188, -0.13185882568359375, -0.12201309204101562, -0.1121673583984375, -0.10232162475585938, -0.09247589111328125, -0.08263015747070312, -0.072784423828125, -0.06293869018554688, -0.05309295654296875, -0.043247222900390625, -0.0334014892578125, -0.023555755615234375, -0.01371002197265625, -0.003864288330078125, 0.0059814453125, 0.015827178955078125, 0.02567291259765625, 0.035518646240234375, 0.0453643798828125, 0.055210113525390625, 0.06505584716796875, 0.07490158081054688, 0.084747314453125, 0.09459304809570312, 0.10443878173828125, 0.11428451538085938, 0.1241302490234375, 0.13397598266601562, 0.14382171630859375, 0.15366744995117188, 0.16351318359375, 0.17335891723632812, 0.18320465087890625, 0.19305038452148438, 0.2028961181640625, 0.21274185180664062, 0.22258758544921875, 0.23243331909179688, 0.242279052734375, 0.2521247863769531, 0.26197052001953125, 0.2718162536621094, 0.2816619873046875, 0.2915077209472656, 0.30135345458984375, 0.3111991882324219, 0.321044921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 6.0, 6.0, 10.0, 12.0, 9.0, 14.0, 22.0, 19.0, 23.0, 28.0, 24.0, 24.0, 37.0, 43.0, 39.0, 47.0, 51.0, 46.0, 58.0, 34.0, 29.0, 37.0, 40.0, 44.0, 37.0, 37.0, 29.0, 23.0, 29.0, 18.0, 19.0, 13.0, 10.0, 14.0, 14.0, 11.0, 6.0, 3.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46728515625, -0.4530029296875, -0.438720703125, -0.4244384765625, -0.41015625, -0.3958740234375, -0.381591796875, -0.3673095703125, -0.35302734375, -0.3387451171875, -0.324462890625, -0.3101806640625, -0.2958984375, -0.2816162109375, -0.267333984375, -0.2530517578125, -0.23876953125, -0.2244873046875, -0.210205078125, -0.1959228515625, -0.181640625, -0.1673583984375, -0.153076171875, -0.1387939453125, -0.12451171875, -0.1102294921875, -0.095947265625, -0.0816650390625, -0.0673828125, -0.0531005859375, -0.038818359375, -0.0245361328125, -0.01025390625, 0.0040283203125, 0.018310546875, 0.0325927734375, 0.046875, 0.0611572265625, 0.075439453125, 0.0897216796875, 0.10400390625, 0.1182861328125, 0.132568359375, 0.1468505859375, 0.1611328125, 0.1754150390625, 0.189697265625, 0.2039794921875, 0.21826171875, 0.2325439453125, 0.246826171875, 0.2611083984375, 0.275390625, 0.2896728515625, 0.303955078125, 0.3182373046875, 0.33251953125, 0.3468017578125, 0.361083984375, 0.3753662109375, 0.3896484375, 0.4039306640625, 0.418212890625, 0.4324951171875, 0.44677734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 10.0, 6.0, 5.0, 5.0, 14.0, 18.0, 20.0, 24.0, 41.0, 76.0, 113.0, 199.0, 289.0, 550.0, 1122.0, 2157.0, 5282.0, 12858.0, 41048.0, 205817.0, 547552.0, 174288.0, 35756.0, 11935.0, 4796.0, 2155.0, 1051.0, 542.0, 278.0, 172.0, 108.0, 72.0, 59.0, 41.0, 26.0, 18.0, 7.0, 16.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.315673828125, -0.30651092529296875, -0.2973480224609375, -0.28818511962890625, -0.279022216796875, -0.26985931396484375, -0.2606964111328125, -0.25153350830078125, -0.24237060546875, -0.23320770263671875, -0.2240447998046875, -0.21488189697265625, -0.205718994140625, -0.19655609130859375, -0.1873931884765625, -0.17823028564453125, -0.1690673828125, -0.15990447998046875, -0.1507415771484375, -0.14157867431640625, -0.132415771484375, -0.12325286865234375, -0.1140899658203125, -0.10492706298828125, -0.09576416015625, -0.08660125732421875, -0.0774383544921875, -0.06827545166015625, -0.059112548828125, -0.04994964599609375, -0.0407867431640625, -0.03162384033203125, -0.0224609375, -0.01329803466796875, -0.0041351318359375, 0.00502777099609375, 0.014190673828125, 0.02335357666015625, 0.0325164794921875, 0.04167938232421875, 0.05084228515625, 0.06000518798828125, 0.0691680908203125, 0.07833099365234375, 0.087493896484375, 0.09665679931640625, 0.1058197021484375, 0.11498260498046875, 0.1241455078125, 0.13330841064453125, 0.1424713134765625, 0.15163421630859375, 0.160797119140625, 0.16996002197265625, 0.1791229248046875, 0.18828582763671875, 0.19744873046875, 0.20661163330078125, 0.2157745361328125, 0.22493743896484375, 0.234100341796875, 0.24326324462890625, 0.2524261474609375, 0.26158905029296875, 0.270751953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 12.0, 8.0, 10.0, 10.0, 14.0, 17.0, 18.0, 18.0, 33.0, 28.0, 31.0, 37.0, 34.0, 39.0, 48.0, 47.0, 50.0, 43.0, 56.0, 39.0, 32.0, 35.0, 34.0, 39.0, 29.0, 45.0, 24.0, 30.0, 16.0, 27.0, 15.0, 12.0, 13.0, 5.0, 11.0, 4.0, 4.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2568359375, -1.2203826904296875, -1.183929443359375, -1.1474761962890625, -1.11102294921875, -1.0745697021484375, -1.038116455078125, -1.0016632080078125, -0.9652099609375, -0.9287567138671875, -0.892303466796875, -0.8558502197265625, -0.81939697265625, -0.7829437255859375, -0.746490478515625, -0.7100372314453125, -0.673583984375, -0.6371307373046875, -0.600677490234375, -0.5642242431640625, -0.52777099609375, -0.4913177490234375, -0.454864501953125, -0.4184112548828125, -0.3819580078125, -0.3455047607421875, -0.309051513671875, -0.2725982666015625, -0.23614501953125, -0.1996917724609375, -0.163238525390625, -0.1267852783203125, -0.09033203125, -0.0538787841796875, -0.017425537109375, 0.0190277099609375, 0.05548095703125, 0.0919342041015625, 0.128387451171875, 0.1648406982421875, 0.2012939453125, 0.2377471923828125, 0.274200439453125, 0.3106536865234375, 0.34710693359375, 0.3835601806640625, 0.420013427734375, 0.4564666748046875, 0.492919921875, 0.5293731689453125, 0.565826416015625, 0.6022796630859375, 0.63873291015625, 0.6751861572265625, 0.711639404296875, 0.7480926513671875, 0.7845458984375, 0.8209991455078125, 0.857452392578125, 0.8939056396484375, 0.93035888671875, 0.9668121337890625, 1.003265380859375, 1.0397186279296875, 1.076171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 7.0, 3.0, 10.0, 23.0, 26.0, 37.0, 64.0, 108.0, 224.0, 398.0, 870.0, 1987.0, 4950.0, 14403.0, 87489.0, 843410.0, 72809.0, 13554.0, 4586.0, 1836.0, 841.0, 419.0, 204.0, 113.0, 71.0, 31.0, 30.0, 13.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243896484375, -0.23532867431640625, -0.2267608642578125, -0.21819305419921875, -0.209625244140625, -0.20105743408203125, -0.1924896240234375, -0.18392181396484375, -0.17535400390625, -0.16678619384765625, -0.1582183837890625, -0.14965057373046875, -0.141082763671875, -0.13251495361328125, -0.1239471435546875, -0.11537933349609375, -0.1068115234375, -0.09824371337890625, -0.0896759033203125, -0.08110809326171875, -0.072540283203125, -0.06397247314453125, -0.0554046630859375, -0.04683685302734375, -0.03826904296875, -0.02970123291015625, -0.0211334228515625, -0.01256561279296875, -0.003997802734375, 0.00457000732421875, 0.0131378173828125, 0.02170562744140625, 0.0302734375, 0.03884124755859375, 0.0474090576171875, 0.05597686767578125, 0.064544677734375, 0.07311248779296875, 0.0816802978515625, 0.09024810791015625, 0.09881591796875, 0.10738372802734375, 0.1159515380859375, 0.12451934814453125, 0.133087158203125, 0.14165496826171875, 0.1502227783203125, 0.15879058837890625, 0.1673583984375, 0.17592620849609375, 0.1844940185546875, 0.19306182861328125, 0.201629638671875, 0.21019744873046875, 0.2187652587890625, 0.22733306884765625, 0.23590087890625, 0.24446868896484375, 0.2530364990234375, 0.26160430908203125, 0.270172119140625, 0.27873992919921875, 0.2873077392578125, 0.29587554931640625, 0.304443359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 5.0, 13.0, 11.0, 19.0, 62.0, 173.0, 302.0, 223.0, 98.0, 29.0, 18.0, 6.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019288063049316406, -0.00018747150897979736, -0.00018206238746643066, -0.00017665326595306396, -0.00017124414443969727, -0.00016583502292633057, -0.00016042590141296387, -0.00015501677989959717, -0.00014960765838623047, -0.00014419853687286377, -0.00013878941535949707, -0.00013338029384613037, -0.00012797117233276367, -0.00012256205081939697, -0.00011715292930603027, -0.00011174380779266357, -0.00010633468627929688, -0.00010092556476593018, -9.551644325256348e-05, -9.010732173919678e-05, -8.469820022583008e-05, -7.928907871246338e-05, -7.387995719909668e-05, -6.847083568572998e-05, -6.306171417236328e-05, -5.765259265899658e-05, -5.224347114562988e-05, -4.6834349632263184e-05, -4.1425228118896484e-05, -3.6016106605529785e-05, -3.0606985092163086e-05, -2.5197863578796387e-05, -1.9788742065429688e-05, -1.4379620552062988e-05, -8.970499038696289e-06, -3.56137752532959e-06, 1.8477439880371094e-06, 7.256865501403809e-06, 1.2665987014770508e-05, 1.8075108528137207e-05, 2.3484230041503906e-05, 2.8893351554870605e-05, 3.4302473068237305e-05, 3.9711594581604004e-05, 4.51207160949707e-05, 5.05298376083374e-05, 5.59389591217041e-05, 6.13480806350708e-05, 6.67572021484375e-05, 7.21663236618042e-05, 7.75754451751709e-05, 8.29845666885376e-05, 8.83936882019043e-05, 9.3802809715271e-05, 9.92119312286377e-05, 0.0001046210527420044, 0.0001100301742553711, 0.00011543929576873779, 0.00012084841728210449, 0.0001262575387954712, 0.0001316666603088379, 0.0001370757818222046, 0.0001424849033355713, 0.000147894024848938, 0.0001533031463623047]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 11.0, 11.0, 18.0, 20.0, 24.0, 41.0, 62.0, 82.0, 126.0, 189.0, 298.0, 419.0, 728.0, 1172.0, 2043.0, 3635.0, 6796.0, 14941.0, 43000.0, 202651.0, 525661.0, 177839.0, 39208.0, 14016.0, 6695.0, 3480.0, 1977.0, 1197.0, 725.0, 483.0, 288.0, 218.0, 133.0, 110.0, 76.0, 52.0, 29.0, 31.0, 19.0, 13.0, 8.0, 3.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.150634765625, -0.1461334228515625, -0.141632080078125, -0.1371307373046875, -0.13262939453125, -0.1281280517578125, -0.123626708984375, -0.1191253662109375, -0.1146240234375, -0.1101226806640625, -0.105621337890625, -0.1011199951171875, -0.09661865234375, -0.0921173095703125, -0.087615966796875, -0.0831146240234375, -0.07861328125, -0.0741119384765625, -0.069610595703125, -0.0651092529296875, -0.06060791015625, -0.0561065673828125, -0.051605224609375, -0.0471038818359375, -0.0426025390625, -0.0381011962890625, -0.033599853515625, -0.0290985107421875, -0.02459716796875, -0.0200958251953125, -0.015594482421875, -0.0110931396484375, -0.006591796875, -0.0020904541015625, 0.002410888671875, 0.0069122314453125, 0.01141357421875, 0.0159149169921875, 0.020416259765625, 0.0249176025390625, 0.0294189453125, 0.0339202880859375, 0.038421630859375, 0.0429229736328125, 0.04742431640625, 0.0519256591796875, 0.056427001953125, 0.0609283447265625, 0.0654296875, 0.0699310302734375, 0.074432373046875, 0.0789337158203125, 0.08343505859375, 0.0879364013671875, 0.092437744140625, 0.0969390869140625, 0.1014404296875, 0.1059417724609375, 0.110443115234375, 0.1149444580078125, 0.11944580078125, 0.1239471435546875, 0.128448486328125, 0.1329498291015625, 0.137451171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 9.0, 21.0, 10.0, 25.0, 42.0, 66.0, 107.0, 124.0, 164.0, 157.0, 94.0, 53.0, 31.0, 21.0, 12.0, 5.0, 6.0, 8.0, 7.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0618896484375, -0.06003093719482422, -0.05817222595214844, -0.056313514709472656, -0.054454803466796875, -0.052596092224121094, -0.05073738098144531, -0.04887866973876953, -0.04701995849609375, -0.04516124725341797, -0.04330253601074219, -0.041443824768066406, -0.039585113525390625, -0.037726402282714844, -0.03586769104003906, -0.03400897979736328, -0.0321502685546875, -0.03029155731201172, -0.028432846069335938, -0.026574134826660156, -0.024715423583984375, -0.022856712341308594, -0.020998001098632812, -0.01913928985595703, -0.01728057861328125, -0.015421867370605469, -0.013563156127929688, -0.011704444885253906, -0.009845733642578125, -0.007987022399902344, -0.0061283111572265625, -0.004269599914550781, -0.002410888671875, -0.0005521774291992188, 0.0013065338134765625, 0.0031652450561523438, 0.005023956298828125, 0.006882667541503906, 0.008741378784179688, 0.010600090026855469, 0.01245880126953125, 0.014317512512207031, 0.016176223754882812, 0.018034934997558594, 0.019893646240234375, 0.021752357482910156, 0.023611068725585938, 0.02546977996826172, 0.0273284912109375, 0.02918720245361328, 0.031045913696289062, 0.032904624938964844, 0.034763336181640625, 0.036622047424316406, 0.03848075866699219, 0.04033946990966797, 0.04219818115234375, 0.04405689239501953, 0.04591560363769531, 0.047774314880371094, 0.049633026123046875, 0.051491737365722656, 0.05335044860839844, 0.05520915985107422, 0.05706787109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 2.0, 7.0, 15.0, 16.0, 16.0, 26.0, 21.0, 37.0, 53.0, 47.0, 51.0, 63.0, 63.0, 71.0, 72.0, 73.0, 54.0, 50.0, 65.0, 37.0, 38.0, 29.0, 19.0, 18.0, 13.0, 10.0, 7.0, 8.0, 5.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5058618783950806, -0.4864986836910248, -0.4671354591846466, -0.4477722644805908, -0.42840903997421265, -0.40904584527015686, -0.3896826505661011, -0.3703194260597229, -0.3509562313556671, -0.33159303665161133, -0.31222981214523315, -0.29286661744117737, -0.2735034227371216, -0.2541401982307434, -0.23477700352668762, -0.21541379392147064, -0.19605058431625366, -0.17668737471103668, -0.1573241651058197, -0.13796097040176392, -0.11859776079654694, -0.09923455119132996, -0.07987134903669357, -0.06050814688205719, -0.04114493727684021, -0.02178173139691353, -0.002418525516986847, 0.016944680362939835, 0.036307886242866516, 0.055671095848083496, 0.07503429800271988, 0.09439750015735626, 0.11376076936721802, 0.133123978972435, 0.15248718857765198, 0.17185038328170776, 0.19121359288692474, 0.21057680249214172, 0.2299399971961975, 0.2493032068014145, 0.26866641640663147, 0.28802961111068726, 0.30739283561706543, 0.3267560303211212, 0.346119225025177, 0.3654824495315552, 0.38484564423561096, 0.40420883893966675, 0.4235720634460449, 0.4429352581501007, 0.4622984826564789, 0.48166167736053467, 0.5010249018669128, 0.520388126373291, 0.5397512912750244, 0.5591145157814026, 0.5784777402877808, 0.5978409647941589, 0.6172041296958923, 0.6365673542022705, 0.6559305787086487, 0.6752938032150269, 0.6946569681167603, 0.7140201926231384, 0.7333833575248718]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 2.0, 5.0, 3.0, 7.0, 15.0, 12.0, 14.0, 24.0, 20.0, 23.0, 32.0, 28.0, 33.0, 38.0, 32.0, 37.0, 48.0, 39.0, 45.0, 44.0, 45.0, 48.0, 38.0, 46.0, 31.0, 31.0, 28.0, 36.0, 28.0, 28.0, 20.0, 18.0, 18.0, 6.0, 15.0, 11.0, 8.0, 10.0, 6.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4304371476173401, -0.4162605404853821, -0.4020839333534241, -0.38790732622146606, -0.37373071908950806, -0.35955411195755005, -0.34537750482559204, -0.33120086789131165, -0.31702426075935364, -0.30284765362739563, -0.2886710464954376, -0.2744944393634796, -0.2603178322315216, -0.2461412101984024, -0.2319646030664444, -0.2177879810333252, -0.20361138880252838, -0.18943478167057037, -0.17525817453861237, -0.16108155250549316, -0.14690494537353516, -0.13272833824157715, -0.11855173110961914, -0.10437511652708054, -0.09019850939512253, -0.07602190226316452, -0.061845287680625916, -0.04766868054866791, -0.0334920696914196, -0.019315458834171295, -0.005138851702213287, 0.009037762880325317, 0.023214370012283325, 0.03739098086953163, 0.05156759172677994, 0.06574419885873795, 0.07992081344127655, 0.09409742057323456, 0.10827402770519257, 0.12245064228773117, 0.13662725687026978, 0.15080386400222778, 0.1649804711341858, 0.1791570782661438, 0.193333700299263, 0.207510307431221, 0.22168691456317902, 0.23586353659629822, 0.25004011392593384, 0.26421672105789185, 0.27839332818984985, 0.29256993532180786, 0.30674654245376587, 0.3209231495857239, 0.3350997567176819, 0.3492763936519623, 0.3634530007839203, 0.3776296079158783, 0.3918062150478363, 0.4059828221797943, 0.4201594293117523, 0.4343360662460327, 0.4485126733779907, 0.46268928050994873, 0.47686588764190674]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 10.0, 13.0, 19.0, 35.0, 54.0, 93.0, 193.0, 329.0, 741.0, 1991.0, 5861.0, 19612.0, 73324.0, 276918.0, 455969.0, 155857.0, 40203.0, 11267.0, 3547.0, 1340.0, 591.0, 276.0, 126.0, 62.0, 47.0, 28.0, 23.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662109375, -1.32855224609375, -1.2908935546875, -1.25323486328125, -1.215576171875, -1.17791748046875, -1.1402587890625, -1.10260009765625, -1.06494140625, -1.02728271484375, -0.9896240234375, -0.95196533203125, -0.914306640625, -0.87664794921875, -0.8389892578125, -0.80133056640625, -0.763671875, -0.72601318359375, -0.6883544921875, -0.65069580078125, -0.613037109375, -0.57537841796875, -0.5377197265625, -0.50006103515625, -0.46240234375, -0.42474365234375, -0.3870849609375, -0.34942626953125, -0.311767578125, -0.27410888671875, -0.2364501953125, -0.19879150390625, -0.1611328125, -0.12347412109375, -0.0858154296875, -0.04815673828125, -0.010498046875, 0.02716064453125, 0.0648193359375, 0.10247802734375, 0.14013671875, 0.17779541015625, 0.2154541015625, 0.25311279296875, 0.290771484375, 0.32843017578125, 0.3660888671875, 0.40374755859375, 0.44140625, 0.47906494140625, 0.5167236328125, 0.55438232421875, 0.592041015625, 0.62969970703125, 0.6673583984375, 0.70501708984375, 0.74267578125, 0.78033447265625, 0.8179931640625, 0.85565185546875, 0.893310546875, 0.93096923828125, 0.9686279296875, 1.00628662109375, 1.0439453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 7.0, 6.0, 7.0, 10.0, 11.0, 11.0, 26.0, 26.0, 36.0, 39.0, 37.0, 47.0, 51.0, 63.0, 68.0, 67.0, 68.0, 53.0, 56.0, 49.0, 38.0, 47.0, 44.0, 28.0, 26.0, 18.0, 17.0, 11.0, 10.0, 9.0, 10.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.34375, -1.3082122802734375, -1.272674560546875, -1.2371368408203125, -1.20159912109375, -1.1660614013671875, -1.130523681640625, -1.0949859619140625, -1.0594482421875, -1.0239105224609375, -0.988372802734375, -0.9528350830078125, -0.91729736328125, -0.8817596435546875, -0.846221923828125, -0.8106842041015625, -0.775146484375, -0.7396087646484375, -0.704071044921875, -0.6685333251953125, -0.63299560546875, -0.5974578857421875, -0.561920166015625, -0.5263824462890625, -0.4908447265625, -0.4553070068359375, -0.419769287109375, -0.3842315673828125, -0.34869384765625, -0.3131561279296875, -0.277618408203125, -0.2420806884765625, -0.20654296875, -0.1710052490234375, -0.135467529296875, -0.0999298095703125, -0.06439208984375, -0.0288543701171875, 0.006683349609375, 0.0422210693359375, 0.0777587890625, 0.1132965087890625, 0.148834228515625, 0.1843719482421875, 0.21990966796875, 0.2554473876953125, 0.290985107421875, 0.3265228271484375, 0.362060546875, 0.3975982666015625, 0.433135986328125, 0.4686737060546875, 0.50421142578125, 0.5397491455078125, 0.575286865234375, 0.6108245849609375, 0.6463623046875, 0.6819000244140625, 0.717437744140625, 0.7529754638671875, 0.78851318359375, 0.8240509033203125, 0.859588623046875, 0.8951263427734375, 0.9306640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 9.0, 13.0, 17.0, 29.0, 33.0, 50.0, 84.0, 130.0, 239.0, 426.0, 813.0, 1653.0, 3452.0, 8423.0, 21435.0, 60366.0, 181545.0, 405256.0, 238635.0, 79240.0, 27628.0, 10574.0, 4354.0, 1960.0, 983.0, 507.0, 296.0, 147.0, 83.0, 53.0, 30.0, 18.0, 14.0, 18.0, 15.0, 6.0, 8.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9873046875, -0.9539794921875, -0.920654296875, -0.8873291015625, -0.85400390625, -0.8206787109375, -0.787353515625, -0.7540283203125, -0.720703125, -0.6873779296875, -0.654052734375, -0.6207275390625, -0.58740234375, -0.5540771484375, -0.520751953125, -0.4874267578125, -0.4541015625, -0.4207763671875, -0.387451171875, -0.3541259765625, -0.32080078125, -0.2874755859375, -0.254150390625, -0.2208251953125, -0.1875, -0.1541748046875, -0.120849609375, -0.0875244140625, -0.05419921875, -0.0208740234375, 0.012451171875, 0.0457763671875, 0.0791015625, 0.1124267578125, 0.145751953125, 0.1790771484375, 0.21240234375, 0.2457275390625, 0.279052734375, 0.3123779296875, 0.345703125, 0.3790283203125, 0.412353515625, 0.4456787109375, 0.47900390625, 0.5123291015625, 0.545654296875, 0.5789794921875, 0.6123046875, 0.6456298828125, 0.678955078125, 0.7122802734375, 0.74560546875, 0.7789306640625, 0.812255859375, 0.8455810546875, 0.87890625, 0.9122314453125, 0.945556640625, 0.9788818359375, 1.01220703125, 1.0455322265625, 1.078857421875, 1.1121826171875, 1.1455078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 3.0, 10.0, 16.0, 15.0, 17.0, 21.0, 41.0, 34.0, 52.0, 43.0, 68.0, 58.0, 57.0, 49.0, 67.0, 64.0, 65.0, 64.0, 42.0, 38.0, 32.0, 30.0, 22.0, 26.0, 15.0, 11.0, 13.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.4735870361328125, -1.431549072265625, -1.3895111083984375, -1.34747314453125, -1.3054351806640625, -1.263397216796875, -1.2213592529296875, -1.1793212890625, -1.1372833251953125, -1.095245361328125, -1.0532073974609375, -1.01116943359375, -0.9691314697265625, -0.927093505859375, -0.8850555419921875, -0.843017578125, -0.8009796142578125, -0.758941650390625, -0.7169036865234375, -0.67486572265625, -0.6328277587890625, -0.590789794921875, -0.5487518310546875, -0.5067138671875, -0.4646759033203125, -0.422637939453125, -0.3805999755859375, -0.33856201171875, -0.2965240478515625, -0.254486083984375, -0.2124481201171875, -0.17041015625, -0.1283721923828125, -0.086334228515625, -0.0442962646484375, -0.00225830078125, 0.0397796630859375, 0.081817626953125, 0.1238555908203125, 0.1658935546875, 0.2079315185546875, 0.249969482421875, 0.2920074462890625, 0.33404541015625, 0.3760833740234375, 0.418121337890625, 0.4601593017578125, 0.502197265625, 0.5442352294921875, 0.586273193359375, 0.6283111572265625, 0.67034912109375, 0.7123870849609375, 0.754425048828125, 0.7964630126953125, 0.8385009765625, 0.8805389404296875, 0.922576904296875, 0.9646148681640625, 1.00665283203125, 1.0486907958984375, 1.090728759765625, 1.1327667236328125, 1.1748046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 12.0, 9.0, 20.0, 35.0, 28.0, 39.0, 42.0, 67.0, 84.0, 112.0, 147.0, 207.0, 289.0, 377.0, 505.0, 753.0, 1024.0, 1615.0, 2596.0, 4708.0, 9138.0, 20455.0, 52948.0, 150848.0, 405495.0, 246065.0, 89222.0, 32338.0, 13223.0, 6291.0, 3409.0, 2041.0, 1280.0, 824.0, 602.0, 426.0, 302.0, 232.0, 158.0, 138.0, 122.0, 89.0, 54.0, 51.0, 38.0, 30.0, 15.0, 16.0, 8.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2003173828125, -0.19400787353515625, -0.1876983642578125, -0.18138885498046875, -0.175079345703125, -0.16876983642578125, -0.1624603271484375, -0.15615081787109375, -0.14984130859375, -0.14353179931640625, -0.1372222900390625, -0.13091278076171875, -0.124603271484375, -0.11829376220703125, -0.1119842529296875, -0.10567474365234375, -0.099365234375, -0.09305572509765625, -0.0867462158203125, -0.08043670654296875, -0.074127197265625, -0.06781768798828125, -0.0615081787109375, -0.05519866943359375, -0.04888916015625, -0.04257965087890625, -0.0362701416015625, -0.02996063232421875, -0.023651123046875, -0.01734161376953125, -0.0110321044921875, -0.00472259521484375, 0.0015869140625, 0.00789642333984375, 0.0142059326171875, 0.02051544189453125, 0.026824951171875, 0.03313446044921875, 0.0394439697265625, 0.04575347900390625, 0.05206298828125, 0.05837249755859375, 0.0646820068359375, 0.07099151611328125, 0.077301025390625, 0.08361053466796875, 0.0899200439453125, 0.09622955322265625, 0.1025390625, 0.10884857177734375, 0.1151580810546875, 0.12146759033203125, 0.127777099609375, 0.13408660888671875, 0.1403961181640625, 0.14670562744140625, 0.15301513671875, 0.15932464599609375, 0.1656341552734375, 0.17194366455078125, 0.178253173828125, 0.18456268310546875, 0.1908721923828125, 0.19718170166015625, 0.2034912109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 5.0, 14.0, 16.0, 28.0, 24.0, 44.0, 59.0, 93.0, 97.0, 166.0, 124.0, 96.0, 73.0, 48.0, 30.0, 19.0, 21.0, 14.0, 7.0, 9.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32133674621582e-05, -4.1241757571697235e-05, -3.927014768123627e-05, -3.72985377907753e-05, -3.532692790031433e-05, -3.335531800985336e-05, -3.1383708119392395e-05, -2.9412098228931427e-05, -2.744048833847046e-05, -2.546887844800949e-05, -2.3497268557548523e-05, -2.1525658667087555e-05, -1.9554048776626587e-05, -1.758243888616562e-05, -1.561082899570465e-05, -1.3639219105243683e-05, -1.1667609214782715e-05, -9.695999324321747e-06, -7.724389433860779e-06, -5.752779543399811e-06, -3.7811696529388428e-06, -1.8095597624778748e-06, 1.6205012798309326e-07, 2.1336600184440613e-06, 4.105269908905029e-06, 6.076879799365997e-06, 8.048489689826965e-06, 1.0020099580287933e-05, 1.1991709470748901e-05, 1.396331936120987e-05, 1.5934929251670837e-05, 1.7906539142131805e-05, 1.9878149032592773e-05, 2.184975892305374e-05, 2.382136881351471e-05, 2.5792978703975677e-05, 2.7764588594436646e-05, 2.9736198484897614e-05, 3.170780837535858e-05, 3.367941826581955e-05, 3.565102815628052e-05, 3.7622638046741486e-05, 3.9594247937202454e-05, 4.156585782766342e-05, 4.353746771812439e-05, 4.550907760858536e-05, 4.7480687499046326e-05, 4.9452297389507294e-05, 5.142390727996826e-05, 5.339551717042923e-05, 5.53671270608902e-05, 5.7338736951351166e-05, 5.9310346841812134e-05, 6.12819567322731e-05, 6.325356662273407e-05, 6.522517651319504e-05, 6.7196786403656e-05, 6.916839629411697e-05, 7.114000618457794e-05, 7.311161607503891e-05, 7.508322596549988e-05, 7.705483585596085e-05, 7.902644574642181e-05, 8.099805563688278e-05, 8.296966552734375e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 9.0, 8.0, 10.0, 18.0, 25.0, 17.0, 28.0, 15.0, 29.0, 47.0, 49.0, 96.0, 119.0, 164.0, 225.0, 313.0, 442.0, 674.0, 1118.0, 2275.0, 4746.0, 13596.0, 60559.0, 385565.0, 485750.0, 67216.0, 14662.0, 5009.0, 2180.0, 1178.0, 746.0, 494.0, 319.0, 196.0, 159.0, 102.0, 85.0, 70.0, 45.0, 43.0, 33.0, 23.0, 31.0, 13.0, 15.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.411376953125, -0.3985328674316406, -0.38568878173828125, -0.3728446960449219, -0.3600006103515625, -0.3471565246582031, -0.33431243896484375, -0.3214683532714844, -0.308624267578125, -0.2957801818847656, -0.28293609619140625, -0.2700920104980469, -0.2572479248046875, -0.24440383911132812, -0.23155975341796875, -0.21871566772460938, -0.20587158203125, -0.19302749633789062, -0.18018341064453125, -0.16733932495117188, -0.1544952392578125, -0.14165115356445312, -0.12880706787109375, -0.11596298217773438, -0.103118896484375, -0.09027481079101562, -0.07743072509765625, -0.06458663940429688, -0.0517425537109375, -0.038898468017578125, -0.02605438232421875, -0.013210296630859375, -0.0003662109375, 0.012477874755859375, 0.02532196044921875, 0.038166046142578125, 0.0510101318359375, 0.06385421752929688, 0.07669830322265625, 0.08954238891601562, 0.102386474609375, 0.11523056030273438, 0.12807464599609375, 0.14091873168945312, 0.1537628173828125, 0.16660690307617188, 0.17945098876953125, 0.19229507446289062, 0.20513916015625, 0.21798324584960938, 0.23082733154296875, 0.24367141723632812, 0.2565155029296875, 0.2693595886230469, 0.28220367431640625, 0.2950477600097656, 0.307891845703125, 0.3207359313964844, 0.33358001708984375, 0.3464241027832031, 0.3592681884765625, 0.3721122741699219, 0.38495635986328125, 0.3978004455566406, 0.41064453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 11.0, 7.0, 13.0, 19.0, 29.0, 57.0, 107.0, 161.0, 268.0, 152.0, 89.0, 35.0, 19.0, 19.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4190025329589844, -0.40709686279296875, -0.3951911926269531, -0.3832855224609375, -0.3713798522949219, -0.35947418212890625, -0.3475685119628906, -0.335662841796875, -0.3237571716308594, -0.31185150146484375, -0.2999458312988281, -0.2880401611328125, -0.2761344909667969, -0.26422882080078125, -0.2523231506347656, -0.24041748046875, -0.22851181030273438, -0.21660614013671875, -0.20470046997070312, -0.1927947998046875, -0.18088912963867188, -0.16898345947265625, -0.15707778930664062, -0.145172119140625, -0.13326644897460938, -0.12136077880859375, -0.10945510864257812, -0.0975494384765625, -0.08564376831054688, -0.07373809814453125, -0.061832427978515625, -0.0499267578125, -0.038021087646484375, -0.02611541748046875, -0.014209747314453125, -0.0023040771484375, 0.009601593017578125, 0.02150726318359375, 0.033412933349609375, 0.045318603515625, 0.057224273681640625, 0.06912994384765625, 0.08103561401367188, 0.0929412841796875, 0.10484695434570312, 0.11675262451171875, 0.12865829467773438, 0.14056396484375, 0.15246963500976562, 0.16437530517578125, 0.17628097534179688, 0.1881866455078125, 0.20009231567382812, 0.21199798583984375, 0.22390365600585938, 0.235809326171875, 0.24771499633789062, 0.25962066650390625, 0.2715263366699219, 0.2834320068359375, 0.2953376770019531, 0.30724334716796875, 0.3191490173339844, 0.3310546875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 26.0, 75.0, 146.0, 233.0, 224.0, 159.0, 76.0, 29.0, 14.0, 8.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4147908687591553, -2.273193359375, -2.1315956115722656, -1.9899981021881104, -1.848400592803955, -1.7068029642105103, -1.5652053356170654, -1.4236078262329102, -1.2820101976394653, -1.1404125690460205, -0.9988150596618652, -0.8572174310684204, -0.7156198620796204, -0.5740222930908203, -0.4324246644973755, -0.29082709550857544, -0.1492295265197754, -0.007631942629814148, 0.1339656412601471, 0.27556324005126953, 0.4171608090400696, 0.5587583780288696, 0.7003560066223145, 0.8419535756111145, 0.9835511445999146, 1.1251487731933594, 1.2667462825775146, 1.4083439111709595, 1.5499415397644043, 1.6915390491485596, 1.8331366777420044, 1.9747343063354492, 2.1163320541381836, 2.257929563522339, 2.3995273113250732, 2.5411248207092285, 2.682722330093384, 2.824319839477539, 2.9659175872802734, 3.1075150966644287, 3.249112606048584, 3.3907101154327393, 3.5323078632354736, 3.673905372619629, 3.815502882003784, 3.9571003913879395, 4.098698139190674, 4.240295886993408, 4.381893157958984, 4.523490905761719, 4.665088176727295, 4.806685924530029, 4.948283672332764, 5.08988094329834, 5.231478691101074, 5.373076438903809, 5.514674186706543, 5.656271934509277, 5.7978692054748535, 5.939466953277588, 6.081064701080322, 6.222661972045898, 6.364259719848633, 6.505857467651367, 6.647454738616943]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 10.0, 6.0, 10.0, 20.0, 13.0, 13.0, 18.0, 26.0, 28.0, 30.0, 24.0, 31.0, 28.0, 32.0, 38.0, 38.0, 44.0, 33.0, 31.0, 20.0, 33.0, 28.0, 32.0, 36.0, 31.0, 29.0, 29.0, 21.0, 22.0, 29.0, 31.0, 25.0, 21.0, 21.0, 14.0, 9.0, 11.0, 13.0, 16.0, 11.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.3897453546524048, -1.3478212356567383, -1.3058971166610718, -1.2639729976654053, -1.2220488786697388, -1.1801247596740723, -1.1382007598876953, -1.0962765216827393, -1.0543525218963623, -1.0124284029006958, -0.9705042839050293, -0.9285801649093628, -0.8866560459136963, -0.8447319269180298, -0.8028078675270081, -0.7608837485313416, -0.7189595699310303, -0.6770354509353638, -0.6351113319396973, -0.5931872129440308, -0.5512630939483643, -0.5093389749526978, -0.467414915561676, -0.4254907965660095, -0.383566677570343, -0.3416425585746765, -0.29971843957901, -0.2577943503856659, -0.2158702313899994, -0.17394611239433289, -0.13202202320098877, -0.09009790420532227, -0.04817378520965576, -0.006249673664569855, 0.03567443788051605, 0.07759854197502136, 0.11952266097068787, 0.16144677996635437, 0.2033708691596985, 0.245294988155365, 0.2872191071510315, 0.329143226146698, 0.3710673451423645, 0.4129914343357086, 0.4549155533313751, 0.4968396723270416, 0.5387637615203857, 0.5806878805160522, 0.6226119995117188, 0.6645361185073853, 0.7064602375030518, 0.7483843564987183, 0.7903084754943848, 0.8322325944900513, 0.874156653881073, 0.9160807728767395, 0.958004891872406, 0.9999290108680725, 1.0418530702590942, 1.0837771892547607, 1.1257013082504272, 1.1676254272460938, 1.2095495462417603, 1.2514736652374268, 1.2933977842330933]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 2.0, 2.0, 4.0, 6.0, 4.0, 11.0, 11.0, 19.0, 23.0, 27.0, 39.0, 59.0, 74.0, 95.0, 123.0, 177.0, 247.0, 323.0, 458.0, 667.0, 903.0, 1227.0, 1625.0, 2239.0, 3015.0, 3997.0, 1020211.0, 3917.0, 2925.0, 2200.0, 1604.0, 1170.0, 842.0, 624.0, 453.0, 338.0, 252.0, 188.0, 127.0, 96.0, 59.0, 52.0, 47.0, 33.0, 28.0, 15.0, 11.0, 6.0, 5.0, 9.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.337107539176941, -1.2932158708572388, -1.249324083328247, -1.205432415008545, -1.1615407466888428, -1.117648959159851, -1.073757290840149, -1.0298655033111572, -0.9859738349914551, -0.9420821070671082, -0.8981903791427612, -0.8542987108230591, -0.8104069828987122, -0.7665152549743652, -0.7226235866546631, -0.6787318587303162, -0.6348401308059692, -0.5909484028816223, -0.5470566749572754, -0.5031650066375732, -0.4592732787132263, -0.4153815507888794, -0.37148985266685486, -0.3275981545448303, -0.2837064266204834, -0.23981471359729767, -0.19592300057411194, -0.1520312875509262, -0.10813957452774048, -0.06424786150455475, -0.02035614848136902, 0.023535549640655518, 0.06742739677429199, 0.11131910979747772, 0.15521082282066345, 0.19910253584384918, 0.2429942488670349, 0.28688597679138184, 0.33077767491340637, 0.3746693730354309, 0.41856110095977783, 0.46245282888412476, 0.5063445568084717, 0.5502362251281738, 0.5941279530525208, 0.6380196809768677, 0.6819113492965698, 0.7258030772209167, 0.7696948051452637, 0.8135865330696106, 0.8574782609939575, 0.9013699293136597, 0.9452616572380066, 0.9891533851623535, 1.0330450534820557, 1.0769367218017578, 1.1208285093307495, 1.1647201776504517, 1.2086119651794434, 1.2525036334991455, 1.2963953018188477, 1.3402870893478394, 1.3841787576675415, 1.4280705451965332, 1.4719622135162354]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 27.0, 58.0, 110.0, 261.0, 1269.0, 51465392.0, 2554.0, 350.0, 150.0, 78.0, 36.0, 14.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.8051528930664, -101.13446807861328, -96.46379089355469, -91.79310607910156, -87.12242889404297, -82.45174407958984, -77.78106689453125, -73.11038208007812, -68.439697265625, -63.76901626586914, -59.09833526611328, -54.427650451660156, -49.75697326660156, -45.08628845214844, -40.41560745239258, -35.74492645263672, -31.074249267578125, -26.403568267822266, -21.732887268066406, -17.062204360961914, -12.391523361206055, -7.720842361450195, -3.050159454345703, 1.6205215454101562, 6.291202545166016, 10.961883544921875, 15.63256549835205, 20.303247451782227, 24.973928451538086, 29.644609451293945, 34.31529235839844, 38.9859733581543, 43.656646728515625, 48.327327728271484, 52.998008728027344, 57.66869354248047, 62.33937072753906, 67.01005554199219, 71.68074035644531, 76.3514175415039, 81.0220947265625, 85.69277954101562, 90.36345672607422, 95.03414154052734, 99.70481872558594, 104.37550354003906, 109.04618835449219, 113.71686553955078, 118.3875503540039, 123.05823516845703, 127.72891235351562, 132.39959716796875, 137.07028198242188, 141.74095153808594, 146.41163635253906, 151.0823211669922, 155.7530059814453, 160.42369079589844, 165.09437561035156, 169.76504516601562, 174.43572998046875, 179.10641479492188, 183.777099609375, 188.44778442382812, 193.1184539794922]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 12.0, 20.0, 25.0, 54.0, 64.0, 108.0, 176.0, 263.0, 427.0, 822.0, 1369.0, 2597.0, 5120.0, 10124.0, 20557.0, 43281.0, 93949.0, 205776.0, 421725.0, 1253393.0, 3287776.0, 488509.0, 243153.0, 111917.0, 51361.0, 24105.0, 11703.0, 5882.0, 2954.0, 1694.0, 939.0, 570.0, 362.0, 208.0, 129.0, 104.0, 66.0, 31.0, 38.0, 19.0, 11.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.8515625, -2.75360107421875, -2.6556396484375, -2.55767822265625, -2.459716796875, -2.36175537109375, -2.2637939453125, -2.16583251953125, -2.06787109375, -1.96990966796875, -1.8719482421875, -1.77398681640625, -1.676025390625, -1.57806396484375, -1.4801025390625, -1.38214111328125, -1.2841796875, -1.18621826171875, -1.0882568359375, -0.99029541015625, -0.892333984375, -0.79437255859375, -0.6964111328125, -0.59844970703125, -0.50048828125, -0.40252685546875, -0.3045654296875, -0.20660400390625, -0.108642578125, -0.01068115234375, 0.0872802734375, 0.18524169921875, 0.283203125, 0.38116455078125, 0.4791259765625, 0.57708740234375, 0.675048828125, 0.77301025390625, 0.8709716796875, 0.96893310546875, 1.06689453125, 1.16485595703125, 1.2628173828125, 1.36077880859375, 1.458740234375, 1.55670166015625, 1.6546630859375, 1.75262451171875, 1.8505859375, 1.94854736328125, 2.0465087890625, 2.14447021484375, 2.242431640625, 2.34039306640625, 2.4383544921875, 2.53631591796875, 2.63427734375, 2.73223876953125, 2.8302001953125, 2.92816162109375, 3.026123046875, 3.12408447265625, 3.2220458984375, 3.32000732421875, 3.41796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 2.0, 6.0, 9.0, 5.0, 3.0, 5.0, 18.0, 17.0, 19.0, 23.0, 23.0, 25.0, 18.0, 13.0, 30.0, 31.0, 40.0, 36.0, 43.0, 52.0, 139.0, 748.0, 232.0, 54.0, 39.0, 38.0, 38.0, 40.0, 36.0, 33.0, 25.0, 20.0, 22.0, 21.0, 23.0, 20.0, 14.0, 17.0, 7.0, 10.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -15.0029296875, -14.529296875, -14.0556640625, -13.58203125, -13.1083984375, -12.634765625, -12.1611328125, -11.6875, -11.2138671875, -10.740234375, -10.2666015625, -9.79296875, -9.3193359375, -8.845703125, -8.3720703125, -7.8984375, -7.4248046875, -6.951171875, -6.4775390625, -6.00390625, -5.5302734375, -5.056640625, -4.5830078125, -4.109375, -3.6357421875, -3.162109375, -2.6884765625, -2.21484375, -1.7412109375, -1.267578125, -0.7939453125, -0.3203125, 0.1533203125, 0.626953125, 1.1005859375, 1.57421875, 2.0478515625, 2.521484375, 2.9951171875, 3.46875, 3.9423828125, 4.416015625, 4.8896484375, 5.36328125, 5.8369140625, 6.310546875, 6.7841796875, 7.2578125, 7.7314453125, 8.205078125, 8.6787109375, 9.15234375, 9.6259765625, 10.099609375, 10.5732421875, 11.046875, 11.5205078125, 11.994140625, 12.4677734375, 12.94140625, 13.4150390625, 13.888671875, 14.3623046875, 14.8359375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 16.0, 20.0, 33.0, 48.0, 85.0, 138.0, 189.0, 294.0, 505.0, 671.0, 989.0, 1508.0, 2292.0, 3457.0, 5317.0, 8070.0, 12797.0, 20478.0, 32867.0, 53277.0, 84689.0, 133572.0, 200293.0, 282401.0, 369415.0, 2648586.0, 1297886.0, 349646.0, 265361.0, 185249.0, 122352.0, 77627.0, 48739.0, 30204.0, 18674.0, 11808.0, 7629.0, 4955.0, 3154.0, 2076.0, 1385.0, 897.0, 583.0, 423.0, 289.0, 185.0, 118.0, 80.0, 43.0, 28.0, 27.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.439453125, -1.3943328857421875, -1.349212646484375, -1.3040924072265625, -1.25897216796875, -1.2138519287109375, -1.168731689453125, -1.1236114501953125, -1.0784912109375, -1.0333709716796875, -0.988250732421875, -0.9431304931640625, -0.89801025390625, -0.8528900146484375, -0.807769775390625, -0.7626495361328125, -0.717529296875, -0.6724090576171875, -0.627288818359375, -0.5821685791015625, -0.53704833984375, -0.4919281005859375, -0.446807861328125, -0.4016876220703125, -0.3565673828125, -0.3114471435546875, -0.266326904296875, -0.2212066650390625, -0.17608642578125, -0.1309661865234375, -0.085845947265625, -0.0407257080078125, 0.00439453125, 0.0495147705078125, 0.094635009765625, 0.1397552490234375, 0.18487548828125, 0.2299957275390625, 0.275115966796875, 0.3202362060546875, 0.3653564453125, 0.4104766845703125, 0.455596923828125, 0.5007171630859375, 0.54583740234375, 0.5909576416015625, 0.636077880859375, 0.6811981201171875, 0.726318359375, 0.7714385986328125, 0.816558837890625, 0.8616790771484375, 0.90679931640625, 0.9519195556640625, 0.997039794921875, 1.0421600341796875, 1.0872802734375, 1.1324005126953125, 1.177520751953125, 1.2226409912109375, 1.26776123046875, 1.3128814697265625, 1.358001708984375, 1.4031219482421875, 1.4482421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 13.0, 10.0, 18.0, 15.0, 22.0, 9.0, 20.0, 23.0, 26.0, 32.0, 31.0, 25.0, 31.0, 43.0, 46.0, 35.0, 92.0, 798.0, 263.0, 57.0, 34.0, 34.0, 37.0, 38.0, 35.0, 29.0, 26.0, 28.0, 24.0, 23.0, 17.0, 17.0, 7.0, 8.0, 7.0, 12.0, 6.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.515625, -15.0418701171875, -14.568115234375, -14.0943603515625, -13.62060546875, -13.1468505859375, -12.673095703125, -12.1993408203125, -11.7255859375, -11.2518310546875, -10.778076171875, -10.3043212890625, -9.83056640625, -9.3568115234375, -8.883056640625, -8.4093017578125, -7.935546875, -7.4617919921875, -6.988037109375, -6.5142822265625, -6.04052734375, -5.5667724609375, -5.093017578125, -4.6192626953125, -4.1455078125, -3.6717529296875, -3.197998046875, -2.7242431640625, -2.25048828125, -1.7767333984375, -1.302978515625, -0.8292236328125, -0.35546875, 0.1182861328125, 0.592041015625, 1.0657958984375, 1.53955078125, 2.0133056640625, 2.487060546875, 2.9608154296875, 3.4345703125, 3.9083251953125, 4.382080078125, 4.8558349609375, 5.32958984375, 5.8033447265625, 6.277099609375, 6.7508544921875, 7.224609375, 7.6983642578125, 8.172119140625, 8.6458740234375, 9.11962890625, 9.5933837890625, 10.067138671875, 10.5408935546875, 11.0146484375, 11.4884033203125, 11.962158203125, 12.4359130859375, 12.90966796875, 13.3834228515625, 13.857177734375, 14.3309326171875, 14.8046875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 5.0, 22.0, 26.0, 21.0, 47.0, 70.0, 108.0, 126.0, 177.0, 254.0, 347.0, 514.0, 783.0, 1342.0, 2153.0, 4113.0, 7969.0, 18154.0, 42879.0, 102544.0, 592500.0, 5302602.0, 121922.0, 50947.0, 21347.0, 9429.0, 4442.0, 2467.0, 1345.0, 875.0, 519.0, 414.0, 315.0, 184.0, 152.0, 88.0, 64.0, 43.0, 28.0, 17.0, 17.0, 5.0, 12.0, 12.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.58984375, -6.3907470703125, -6.191650390625, -5.9925537109375, -5.79345703125, -5.5943603515625, -5.395263671875, -5.1961669921875, -4.9970703125, -4.7979736328125, -4.598876953125, -4.3997802734375, -4.20068359375, -4.0015869140625, -3.802490234375, -3.6033935546875, -3.404296875, -3.2052001953125, -3.006103515625, -2.8070068359375, -2.60791015625, -2.4088134765625, -2.209716796875, -2.0106201171875, -1.8115234375, -1.6124267578125, -1.413330078125, -1.2142333984375, -1.01513671875, -0.8160400390625, -0.616943359375, -0.4178466796875, -0.21875, -0.0196533203125, 0.179443359375, 0.3785400390625, 0.57763671875, 0.7767333984375, 0.975830078125, 1.1749267578125, 1.3740234375, 1.5731201171875, 1.772216796875, 1.9713134765625, 2.17041015625, 2.3695068359375, 2.568603515625, 2.7677001953125, 2.966796875, 3.1658935546875, 3.364990234375, 3.5640869140625, 3.76318359375, 3.9622802734375, 4.161376953125, 4.3604736328125, 4.5595703125, 4.7586669921875, 4.957763671875, 5.1568603515625, 5.35595703125, 5.5550537109375, 5.754150390625, 5.9532470703125, 6.15234375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 8.0, 7.0, 8.0, 7.0, 9.0, 21.0, 10.0, 13.0, 25.0, 21.0, 25.0, 30.0, 30.0, 39.0, 31.0, 33.0, 30.0, 26.0, 38.0, 50.0, 377.0, 702.0, 37.0, 46.0, 43.0, 34.0, 33.0, 32.0, 31.0, 21.0, 18.0, 25.0, 24.0, 22.0, 14.0, 18.0, 20.0, 15.0, 9.0, 10.0, 8.0, 6.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.8359375, -13.3450927734375, -12.854248046875, -12.3634033203125, -11.87255859375, -11.3817138671875, -10.890869140625, -10.4000244140625, -9.9091796875, -9.4183349609375, -8.927490234375, -8.4366455078125, -7.94580078125, -7.4549560546875, -6.964111328125, -6.4732666015625, -5.982421875, -5.4915771484375, -5.000732421875, -4.5098876953125, -4.01904296875, -3.5281982421875, -3.037353515625, -2.5465087890625, -2.0556640625, -1.5648193359375, -1.073974609375, -0.5831298828125, -0.09228515625, 0.3985595703125, 0.889404296875, 1.3802490234375, 1.87109375, 2.3619384765625, 2.852783203125, 3.3436279296875, 3.83447265625, 4.3253173828125, 4.816162109375, 5.3070068359375, 5.7978515625, 6.2886962890625, 6.779541015625, 7.2703857421875, 7.76123046875, 8.2520751953125, 8.742919921875, 9.2337646484375, 9.724609375, 10.2154541015625, 10.706298828125, 11.1971435546875, 11.68798828125, 12.1788330078125, 12.669677734375, 13.1605224609375, 13.6513671875, 14.1422119140625, 14.633056640625, 15.1239013671875, 15.61474609375, 16.1055908203125, 16.596435546875, 17.0872802734375, 17.578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 6.0, 11.0, 13.0, 13.0, 31.0, 58.0, 88.0, 158.0, 218.0, 140.0, 82.0, 58.0, 39.0, 22.0, 20.0, 8.0, 6.0, 6.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.68365478515625, -59.89925765991211, -58.11486053466797, -56.33045959472656, -54.54606246948242, -52.76166534423828, -50.977264404296875, -49.192867279052734, -47.408470153808594, -45.62407302856445, -43.83967590332031, -42.055274963378906, -40.270877838134766, -38.486480712890625, -36.70207977294922, -34.91768264770508, -33.13328552246094, -31.348888397216797, -29.564489364624023, -27.78009033203125, -25.99569320678711, -24.21129608154297, -22.426897048950195, -20.642498016357422, -18.85810089111328, -17.07370376586914, -15.289304733276367, -13.50490665435791, -11.720508575439453, -9.936110496520996, -8.151712417602539, -6.367314338684082, -4.582912445068359, -2.7985143661499023, -1.0141162872314453, 0.7702817916870117, 2.5546798706054688, 4.339077949523926, 6.123476028442383, 7.90787410736084, 9.692272186279297, 11.476670265197754, 13.261068344116211, 15.045466423034668, 16.829864501953125, 18.614261627197266, 20.39866065979004, 22.183059692382812, 23.967456817626953, 25.751853942871094, 27.536252975463867, 29.32065200805664, 31.10504913330078, 32.88944625854492, 34.67384338378906, 36.45824432373047, 38.24264144897461, 40.02703857421875, 41.811439514160156, 43.5958366394043, 45.38023376464844, 47.16463088989258, 48.94902801513672, 50.733428955078125, 52.517826080322266]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 0.0, 8.0, 6.0, 7.0, 15.0, 12.0, 17.0, 20.0, 30.0, 32.0, 36.0, 34.0, 51.0, 76.0, 77.0, 74.0, 77.0, 73.0, 60.0, 49.0, 41.0, 39.0, 29.0, 23.0, 23.0, 18.0, 12.0, 9.0, 12.0, 10.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.64680480957031, -83.25886535644531, -80.87093353271484, -78.48299407958984, -76.09506225585938, -73.70712280273438, -71.31918334960938, -68.9312515258789, -66.5433120727539, -64.1553726196289, -61.76744079589844, -59.37950134277344, -56.9915657043457, -54.60363006591797, -52.215694427490234, -49.8277587890625, -47.439823150634766, -45.05188751220703, -42.6639518737793, -40.27601623535156, -37.88807678222656, -35.50014114379883, -33.112205505371094, -30.724267959594727, -28.336332321166992, -25.948396682739258, -23.56045913696289, -21.172523498535156, -18.784587860107422, -16.396650314331055, -14.00871467590332, -11.620777130126953, -9.232841491699219, -6.844904899597168, -4.456968784332275, -2.069032669067383, 0.31890392303466797, 2.7068405151367188, 5.094776153564453, 7.48271369934082, 9.870649337768555, 12.258585929870605, 14.646522521972656, 17.03445816040039, 19.422393798828125, 21.810331344604492, 24.198266983032227, 26.586204528808594, 28.974140167236328, 31.362075805664062, 33.7500114440918, 36.13794708251953, 38.52588653564453, 40.913822174072266, 43.3017578125, 45.689697265625, 48.07762908935547, 50.4655647277832, 52.85350036621094, 55.24143981933594, 57.62937545776367, 60.017311096191406, 62.40524673461914, 64.79318237304688, 67.18112182617188]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 7.0, 17.0, 16.0, 32.0, 41.0, 47.0, 89.0, 118.0, 189.0, 246.0, 413.0, 653.0, 1171.0, 2036.0, 3972.0, 8919.0, 26837.0, 248810.0, 3830979.0, 45262.0, 12930.0, 5232.0, 2609.0, 1410.0, 819.0, 492.0, 305.0, 183.0, 132.0, 96.0, 62.0, 46.0, 24.0, 21.0, 12.0, 10.0, 11.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.58349609375, -0.5653610229492188, -0.5472259521484375, -0.5290908813476562, -0.510955810546875, -0.49282073974609375, -0.4746856689453125, -0.45655059814453125, -0.43841552734375, -0.42028045654296875, -0.4021453857421875, -0.38401031494140625, -0.365875244140625, -0.34774017333984375, -0.3296051025390625, -0.31147003173828125, -0.2933349609375, -0.27519989013671875, -0.2570648193359375, -0.23892974853515625, -0.220794677734375, -0.20265960693359375, -0.1845245361328125, -0.16638946533203125, -0.14825439453125, -0.13011932373046875, -0.1119842529296875, -0.09384918212890625, -0.075714111328125, -0.05757904052734375, -0.0394439697265625, -0.02130889892578125, -0.003173828125, 0.01496124267578125, 0.0330963134765625, 0.05123138427734375, 0.069366455078125, 0.08750152587890625, 0.1056365966796875, 0.12377166748046875, 0.14190673828125, 0.16004180908203125, 0.1781768798828125, 0.19631195068359375, 0.214447021484375, 0.23258209228515625, 0.2507171630859375, 0.26885223388671875, 0.2869873046875, 0.30512237548828125, 0.3232574462890625, 0.34139251708984375, 0.359527587890625, 0.37766265869140625, 0.3957977294921875, 0.41393280029296875, 0.43206787109375, 0.45020294189453125, 0.4683380126953125, 0.48647308349609375, 0.504608154296875, 0.5227432250976562, 0.5408782958984375, 0.5590133666992188, 0.5771484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 4.0, 8.0, 15.0, 16.0, 13.0, 9.0, 35.0, 57.0, 226.0, 400.0, 55.0, 35.0, 17.0, 18.0, 9.0, 9.0, 8.0, 9.0, 9.0, 9.0, 5.0, 2.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2154541015625, -0.2093048095703125, -0.203155517578125, -0.1970062255859375, -0.19085693359375, -0.1847076416015625, -0.178558349609375, -0.1724090576171875, -0.166259765625, -0.1601104736328125, -0.153961181640625, -0.1478118896484375, -0.14166259765625, -0.1355133056640625, -0.129364013671875, -0.1232147216796875, -0.1170654296875, -0.1109161376953125, -0.104766845703125, -0.0986175537109375, -0.09246826171875, -0.0863189697265625, -0.080169677734375, -0.0740203857421875, -0.06787109375, -0.0617218017578125, -0.055572509765625, -0.0494232177734375, -0.04327392578125, -0.0371246337890625, -0.030975341796875, -0.0248260498046875, -0.0186767578125, -0.0125274658203125, -0.006378173828125, -0.0002288818359375, 0.00592041015625, 0.0120697021484375, 0.018218994140625, 0.0243682861328125, 0.030517578125, 0.0366668701171875, 0.042816162109375, 0.0489654541015625, 0.05511474609375, 0.0612640380859375, 0.067413330078125, 0.0735626220703125, 0.0797119140625, 0.0858612060546875, 0.092010498046875, 0.0981597900390625, 0.10430908203125, 0.1104583740234375, 0.116607666015625, 0.1227569580078125, 0.12890625, 0.1350555419921875, 0.141204833984375, 0.1473541259765625, 0.15350341796875, 0.1596527099609375, 0.165802001953125, 0.1719512939453125, 0.1781005859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 15.0, 13.0, 22.0, 33.0, 49.0, 54.0, 116.0, 175.0, 254.0, 548.0, 1455.0, 4820.0, 24097.0, 257515.0, 3700963.0, 178135.0, 19547.0, 4129.0, 1327.0, 489.0, 230.0, 128.0, 63.0, 36.0, 18.0, 12.0, 9.0, 14.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.951171875, -0.9297676086425781, -0.9083633422851562, -0.8869590759277344, -0.8655548095703125, -0.8441505432128906, -0.8227462768554688, -0.8013420104980469, -0.779937744140625, -0.7585334777832031, -0.7371292114257812, -0.7157249450683594, -0.6943206787109375, -0.6729164123535156, -0.6515121459960938, -0.6301078796386719, -0.60870361328125, -0.5872993469238281, -0.5658950805664062, -0.5444908142089844, -0.5230865478515625, -0.5016822814941406, -0.48027801513671875, -0.4588737487792969, -0.437469482421875, -0.4160652160644531, -0.39466094970703125, -0.3732566833496094, -0.3518524169921875, -0.3304481506347656, -0.30904388427734375, -0.2876396179199219, -0.2662353515625, -0.24483108520507812, -0.22342681884765625, -0.20202255249023438, -0.1806182861328125, -0.15921401977539062, -0.13780975341796875, -0.11640548706054688, -0.095001220703125, -0.07359695434570312, -0.05219268798828125, -0.030788421630859375, -0.0093841552734375, 0.012020111083984375, 0.03342437744140625, 0.054828643798828125, 0.07623291015625, 0.09763717651367188, 0.11904144287109375, 0.14044570922851562, 0.1618499755859375, 0.18325424194335938, 0.20465850830078125, 0.22606277465820312, 0.247467041015625, 0.2688713073730469, 0.29027557373046875, 0.3116798400878906, 0.3330841064453125, 0.3544883728027344, 0.37589263916015625, 0.3972969055175781, 0.418701171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 13.0, 17.0, 30.0, 38.0, 68.0, 127.0, 200.0, 453.0, 1611.0, 821.0, 277.0, 161.0, 90.0, 51.0, 27.0, 30.0, 12.0, 10.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.373291015625, -0.3649444580078125, -0.356597900390625, -0.3482513427734375, -0.33990478515625, -0.3315582275390625, -0.323211669921875, -0.3148651123046875, -0.3065185546875, -0.2981719970703125, -0.289825439453125, -0.2814788818359375, -0.27313232421875, -0.2647857666015625, -0.256439208984375, -0.2480926513671875, -0.23974609375, -0.2313995361328125, -0.223052978515625, -0.2147064208984375, -0.20635986328125, -0.1980133056640625, -0.189666748046875, -0.1813201904296875, -0.1729736328125, -0.1646270751953125, -0.156280517578125, -0.1479339599609375, -0.13958740234375, -0.1312408447265625, -0.122894287109375, -0.1145477294921875, -0.106201171875, -0.0978546142578125, -0.089508056640625, -0.0811614990234375, -0.07281494140625, -0.0644683837890625, -0.056121826171875, -0.0477752685546875, -0.0394287109375, -0.0310821533203125, -0.022735595703125, -0.0143890380859375, -0.00604248046875, 0.0023040771484375, 0.010650634765625, 0.0189971923828125, 0.02734375, 0.0356903076171875, 0.044036865234375, 0.0523834228515625, 0.06072998046875, 0.0690765380859375, 0.077423095703125, 0.0857696533203125, 0.0941162109375, 0.1024627685546875, 0.110809326171875, 0.1191558837890625, 0.12750244140625, 0.1358489990234375, 0.144195556640625, 0.1525421142578125, 0.160888671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 9.0, 16.0, 21.0, 39.0, 84.0, 150.0, 188.0, 194.0, 128.0, 76.0, 44.0, 22.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2163350582122803, -1.1814018487930298, -1.1464686393737793, -1.1115355491638184, -1.0766023397445679, -1.0416691303253174, -1.006735920906067, -0.9718027114868164, -0.9368695616722107, -0.9019363522529602, -0.8670032024383545, -0.832069993019104, -0.7971367835998535, -0.7622036337852478, -0.7272704243659973, -0.6923372745513916, -0.6574040651321411, -0.6224708557128906, -0.5875377058982849, -0.5526044964790344, -0.5176713466644287, -0.4827381372451782, -0.44780492782592773, -0.41287174820899963, -0.37793856859207153, -0.34300538897514343, -0.30807220935821533, -0.27313899993896484, -0.23820582032203674, -0.20327264070510864, -0.16833944618701935, -0.13340625166893005, -0.09847307205200195, -0.06353988498449326, -0.028606697916984558, 0.006326489150524139, 0.04125967621803284, 0.07619285583496094, 0.11112605035305023, 0.14605924487113953, 0.18099242448806763, 0.21592560410499573, 0.25085878372192383, 0.2857919931411743, 0.3207251727581024, 0.3556583523750305, 0.390591561794281, 0.4255247414112091, 0.4604579210281372, 0.4953911006450653, 0.5303242802619934, 0.5652574896812439, 0.6001906394958496, 0.6351238489151001, 0.6700570583343506, 0.7049902677536011, 0.7399234175682068, 0.7748566269874573, 0.809789776802063, 0.8447229862213135, 0.879656195640564, 0.9145893454551697, 0.9495225548744202, 0.9844557046890259, 1.0193889141082764]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 2.0, 7.0, 7.0, 12.0, 24.0, 27.0, 27.0, 40.0, 51.0, 56.0, 60.0, 57.0, 75.0, 98.0, 52.0, 70.0, 71.0, 55.0, 45.0, 39.0, 20.0, 27.0, 17.0, 7.0, 7.0, 9.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0234506130218506, -0.9917458295822144, -0.9600411057472229, -0.9283363819122314, -0.8966315984725952, -0.864926815032959, -0.8332220911979675, -0.8015173673629761, -0.7698125839233398, -0.7381078004837036, -0.7064030766487122, -0.6746983528137207, -0.6429935693740845, -0.6112887859344482, -0.5795840620994568, -0.5478793382644653, -0.5161745548248291, -0.48446980118751526, -0.4527650475502014, -0.4210602939128876, -0.38935554027557373, -0.3576507866382599, -0.32594603300094604, -0.2942412793636322, -0.26253652572631836, -0.23083177208900452, -0.19912701845169067, -0.16742226481437683, -0.135717511177063, -0.10401275753974915, -0.0723080039024353, -0.04060325026512146, -0.008898496627807617, 0.022806257009506226, 0.05451101064682007, 0.08621576428413391, 0.11792051792144775, 0.1496252715587616, 0.18133002519607544, 0.21303477883338928, 0.24473953247070312, 0.27644428610801697, 0.3081490397453308, 0.33985379338264465, 0.3715585470199585, 0.40326330065727234, 0.4349680542945862, 0.4666728079319, 0.49837756156921387, 0.5300823450088501, 0.5617870688438416, 0.593491792678833, 0.6251965761184692, 0.6569013595581055, 0.6886060833930969, 0.7203108072280884, 0.7520155906677246, 0.7837203741073608, 0.8154250979423523, 0.8471298217773438, 0.87883460521698, 0.9105393886566162, 0.9422441124916077, 0.9739488363265991, 1.0056536197662354]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 2.0, 7.0, 13.0, 16.0, 31.0, 42.0, 41.0, 53.0, 96.0, 127.0, 211.0, 282.0, 462.0, 633.0, 1105.0, 1877.0, 3091.0, 5487.0, 10215.0, 20484.0, 50510.0, 736139.0, 149948.0, 33495.0, 15239.0, 7894.0, 4351.0, 2504.0, 1444.0, 944.0, 598.0, 397.0, 259.0, 154.0, 112.0, 81.0, 57.0, 35.0, 39.0, 16.0, 20.0, 11.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.69384765625, -0.672027587890625, -0.65020751953125, -0.628387451171875, -0.6065673828125, -0.584747314453125, -0.56292724609375, -0.541107177734375, -0.519287109375, -0.497467041015625, -0.47564697265625, -0.453826904296875, -0.4320068359375, -0.410186767578125, -0.38836669921875, -0.366546630859375, -0.3447265625, -0.322906494140625, -0.30108642578125, -0.279266357421875, -0.2574462890625, -0.235626220703125, -0.21380615234375, -0.191986083984375, -0.170166015625, -0.148345947265625, -0.12652587890625, -0.104705810546875, -0.0828857421875, -0.061065673828125, -0.03924560546875, -0.017425537109375, 0.00439453125, 0.026214599609375, 0.04803466796875, 0.069854736328125, 0.0916748046875, 0.113494873046875, 0.13531494140625, 0.157135009765625, 0.178955078125, 0.200775146484375, 0.22259521484375, 0.244415283203125, 0.2662353515625, 0.288055419921875, 0.30987548828125, 0.331695556640625, 0.353515625, 0.375335693359375, 0.39715576171875, 0.418975830078125, 0.4407958984375, 0.462615966796875, 0.48443603515625, 0.506256103515625, 0.528076171875, 0.549896240234375, 0.57171630859375, 0.593536376953125, 0.6153564453125, 0.637176513671875, 0.65899658203125, 0.680816650390625, 0.70263671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 12.0, 14.0, 13.0, 11.0, 18.0, 18.0, 63.0, 173.0, 421.0, 82.0, 35.0, 22.0, 20.0, 9.0, 9.0, 14.0, 7.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.21295547485351562, -0.20691680908203125, -0.20087814331054688, -0.1948394775390625, -0.18880081176757812, -0.18276214599609375, -0.17672348022460938, -0.170684814453125, -0.16464614868164062, -0.15860748291015625, -0.15256881713867188, -0.1465301513671875, -0.14049148559570312, -0.13445281982421875, -0.12841415405273438, -0.12237548828125, -0.11633682250976562, -0.11029815673828125, -0.10425949096679688, -0.0982208251953125, -0.09218215942382812, -0.08614349365234375, -0.08010482788085938, -0.074066162109375, -0.06802749633789062, -0.06198883056640625, -0.055950164794921875, -0.0499114990234375, -0.043872833251953125, -0.03783416748046875, -0.031795501708984375, -0.0257568359375, -0.019718170166015625, -0.01367950439453125, -0.007640838623046875, -0.0016021728515625, 0.004436492919921875, 0.01047515869140625, 0.016513824462890625, 0.022552490234375, 0.028591156005859375, 0.03462982177734375, 0.040668487548828125, 0.0467071533203125, 0.052745819091796875, 0.05878448486328125, 0.06482315063476562, 0.07086181640625, 0.07690048217773438, 0.08293914794921875, 0.08897781372070312, 0.0950164794921875, 0.10105514526367188, 0.10709381103515625, 0.11313247680664062, 0.119171142578125, 0.12520980834960938, 0.13124847412109375, 0.13728713989257812, 0.1433258056640625, 0.14936447143554688, 0.15540313720703125, 0.16144180297851562, 0.16748046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 0.0, 17.0, 13.0, 21.0, 31.0, 47.0, 76.0, 113.0, 193.0, 352.0, 596.0, 1109.0, 2333.0, 5241.0, 13594.0, 42111.0, 166167.0, 521425.0, 215569.0, 52032.0, 16358.0, 5931.0, 2539.0, 1237.0, 577.0, 320.0, 193.0, 120.0, 74.0, 62.0, 28.0, 10.0, 20.0, 14.0, 10.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.426605224609375, -0.41351318359375, -0.400421142578125, -0.3873291015625, -0.374237060546875, -0.36114501953125, -0.348052978515625, -0.3349609375, -0.321868896484375, -0.30877685546875, -0.295684814453125, -0.2825927734375, -0.269500732421875, -0.25640869140625, -0.243316650390625, -0.230224609375, -0.217132568359375, -0.20404052734375, -0.190948486328125, -0.1778564453125, -0.164764404296875, -0.15167236328125, -0.138580322265625, -0.12548828125, -0.112396240234375, -0.09930419921875, -0.086212158203125, -0.0731201171875, -0.060028076171875, -0.04693603515625, -0.033843994140625, -0.020751953125, -0.007659912109375, 0.00543212890625, 0.018524169921875, 0.0316162109375, 0.044708251953125, 0.05780029296875, 0.070892333984375, 0.083984375, 0.097076416015625, 0.11016845703125, 0.123260498046875, 0.1363525390625, 0.149444580078125, 0.16253662109375, 0.175628662109375, 0.188720703125, 0.201812744140625, 0.21490478515625, 0.227996826171875, 0.2410888671875, 0.254180908203125, 0.26727294921875, 0.280364990234375, 0.29345703125, 0.306549072265625, 0.31964111328125, 0.332733154296875, 0.3458251953125, 0.358917236328125, 0.37200927734375, 0.385101318359375, 0.398193359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 3.0, 3.0, 6.0, 2.0, 10.0, 8.0, 8.0, 11.0, 15.0, 23.0, 24.0, 32.0, 33.0, 26.0, 58.0, 44.0, 33.0, 48.0, 48.0, 60.0, 73.0, 50.0, 50.0, 46.0, 57.0, 46.0, 31.0, 38.0, 28.0, 25.0, 17.0, 18.0, 11.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68505859375, -0.6649093627929688, -0.6447601318359375, -0.6246109008789062, -0.604461669921875, -0.5843124389648438, -0.5641632080078125, -0.5440139770507812, -0.52386474609375, -0.5037155151367188, -0.4835662841796875, -0.46341705322265625, -0.443267822265625, -0.42311859130859375, -0.4029693603515625, -0.38282012939453125, -0.3626708984375, -0.34252166748046875, -0.3223724365234375, -0.30222320556640625, -0.282073974609375, -0.26192474365234375, -0.2417755126953125, -0.22162628173828125, -0.20147705078125, -0.18132781982421875, -0.1611785888671875, -0.14102935791015625, -0.120880126953125, -0.10073089599609375, -0.0805816650390625, -0.06043243408203125, -0.040283203125, -0.02013397216796875, 1.52587890625e-05, 0.02016448974609375, 0.040313720703125, 0.06046295166015625, 0.0806121826171875, 0.10076141357421875, 0.12091064453125, 0.14105987548828125, 0.1612091064453125, 0.18135833740234375, 0.201507568359375, 0.22165679931640625, 0.2418060302734375, 0.26195526123046875, 0.2821044921875, 0.30225372314453125, 0.3224029541015625, 0.34255218505859375, 0.362701416015625, 0.38285064697265625, 0.4029998779296875, 0.42314910888671875, 0.44329833984375, 0.46344757080078125, 0.4835968017578125, 0.5037460327148438, 0.523895263671875, 0.5440444946289062, 0.5641937255859375, 0.5843429565429688, 0.6044921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 15.0, 13.0, 13.0, 21.0, 31.0, 48.0, 71.0, 114.0, 220.0, 367.0, 806.0, 1914.0, 5718.0, 25112.0, 399374.0, 572242.0, 31736.0, 6562.0, 2202.0, 930.0, 438.0, 234.0, 143.0, 71.0, 51.0, 40.0, 27.0, 16.0, 4.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.456787109375, -0.4392585754394531, -0.42173004150390625, -0.4042015075683594, -0.3866729736328125, -0.3691444396972656, -0.35161590576171875, -0.3340873718261719, -0.316558837890625, -0.2990303039550781, -0.28150177001953125, -0.2639732360839844, -0.2464447021484375, -0.22891616821289062, -0.21138763427734375, -0.19385910034179688, -0.17633056640625, -0.15880203247070312, -0.14127349853515625, -0.12374496459960938, -0.1062164306640625, -0.08868789672851562, -0.07115936279296875, -0.053630828857421875, -0.036102294921875, -0.018573760986328125, -0.00104522705078125, 0.016483306884765625, 0.0340118408203125, 0.051540374755859375, 0.06906890869140625, 0.08659744262695312, 0.1041259765625, 0.12165451049804688, 0.13918304443359375, 0.15671157836914062, 0.1742401123046875, 0.19176864624023438, 0.20929718017578125, 0.22682571411132812, 0.244354248046875, 0.2618827819824219, 0.27941131591796875, 0.2969398498535156, 0.3144683837890625, 0.3319969177246094, 0.34952545166015625, 0.3670539855957031, 0.38458251953125, 0.4021110534667969, 0.41963958740234375, 0.4371681213378906, 0.4546966552734375, 0.4722251892089844, 0.48975372314453125, 0.5072822570800781, 0.524810791015625, 0.5423393249511719, 0.5598678588867188, 0.5773963928222656, 0.5949249267578125, 0.6124534606933594, 0.6299819946289062, 0.6475105285644531, 0.6650390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 0.0, 6.0, 2.0, 9.0, 19.0, 18.0, 19.0, 31.0, 45.0, 57.0, 80.0, 83.0, 95.0, 100.0, 111.0, 89.0, 59.0, 55.0, 29.0, 36.0, 14.0, 11.0, 6.0, 4.0, 4.0, 7.0, 2.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.1975250244140625e-05, -5.074404180049896e-05, -4.95128333568573e-05, -4.828162491321564e-05, -4.7050416469573975e-05, -4.581920802593231e-05, -4.458799958229065e-05, -4.335679113864899e-05, -4.2125582695007324e-05, -4.089437425136566e-05, -3.9663165807724e-05, -3.8431957364082336e-05, -3.7200748920440674e-05, -3.596954047679901e-05, -3.473833203315735e-05, -3.3507123589515686e-05, -3.2275915145874023e-05, -3.104470670223236e-05, -2.9813498258590698e-05, -2.8582289814949036e-05, -2.7351081371307373e-05, -2.611987292766571e-05, -2.4888664484024048e-05, -2.3657456040382385e-05, -2.2426247596740723e-05, -2.119503915309906e-05, -1.9963830709457397e-05, -1.8732622265815735e-05, -1.7501413822174072e-05, -1.627020537853241e-05, -1.5038996934890747e-05, -1.3807788491249084e-05, -1.2576580047607422e-05, -1.134537160396576e-05, -1.0114163160324097e-05, -8.882954716682434e-06, -7.651746273040771e-06, -6.420537829399109e-06, -5.189329385757446e-06, -3.958120942115784e-06, -2.726912498474121e-06, -1.4957040548324585e-06, -2.644956111907959e-07, 9.667128324508667e-07, 2.1979212760925293e-06, 3.429129719734192e-06, 4.6603381633758545e-06, 5.891546607017517e-06, 7.12275505065918e-06, 8.353963494300842e-06, 9.585171937942505e-06, 1.0816380381584167e-05, 1.204758882522583e-05, 1.3278797268867493e-05, 1.4510005712509155e-05, 1.5741214156150818e-05, 1.697242259979248e-05, 1.8203631043434143e-05, 1.9434839487075806e-05, 2.0666047930717468e-05, 2.189725637435913e-05, 2.3128464818000793e-05, 2.4359673261642456e-05, 2.559088170528412e-05, 2.682209014892578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 11.0, 7.0, 10.0, 7.0, 13.0, 18.0, 29.0, 42.0, 51.0, 78.0, 112.0, 179.0, 273.0, 433.0, 795.0, 1427.0, 2859.0, 6625.0, 18532.0, 72610.0, 429843.0, 413340.0, 70414.0, 18050.0, 6412.0, 2911.0, 1423.0, 796.0, 444.0, 281.0, 153.0, 112.0, 80.0, 61.0, 33.0, 25.0, 16.0, 13.0, 9.0, 6.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2603721618652344, -0.25072479248046875, -0.24107742309570312, -0.2314300537109375, -0.22178268432617188, -0.21213531494140625, -0.20248794555664062, -0.192840576171875, -0.18319320678710938, -0.17354583740234375, -0.16389846801757812, -0.1542510986328125, -0.14460372924804688, -0.13495635986328125, -0.12530899047851562, -0.11566162109375, -0.10601425170898438, -0.09636688232421875, -0.08671951293945312, -0.0770721435546875, -0.06742477416992188, -0.05777740478515625, -0.048130035400390625, -0.038482666015625, -0.028835296630859375, -0.01918792724609375, -0.009540557861328125, 0.0001068115234375, 0.009754180908203125, 0.01940155029296875, 0.029048919677734375, 0.0386962890625, 0.048343658447265625, 0.05799102783203125, 0.06763839721679688, 0.0772857666015625, 0.08693313598632812, 0.09658050537109375, 0.10622787475585938, 0.115875244140625, 0.12552261352539062, 0.13516998291015625, 0.14481735229492188, 0.1544647216796875, 0.16411209106445312, 0.17375946044921875, 0.18340682983398438, 0.19305419921875, 0.20270156860351562, 0.21234893798828125, 0.22199630737304688, 0.2316436767578125, 0.24129104614257812, 0.25093841552734375, 0.2605857849121094, 0.270233154296875, 0.2798805236816406, 0.28952789306640625, 0.2991752624511719, 0.3088226318359375, 0.3184700012207031, 0.32811737060546875, 0.3377647399902344, 0.347412109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 12.0, 11.0, 13.0, 18.0, 36.0, 27.0, 42.0, 49.0, 66.0, 65.0, 95.0, 83.0, 84.0, 81.0, 60.0, 58.0, 45.0, 32.0, 30.0, 26.0, 16.0, 13.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311767578125, -0.30086517333984375, -0.2899627685546875, -0.27906036376953125, -0.268157958984375, -0.25725555419921875, -0.2463531494140625, -0.23545074462890625, -0.22454833984375, -0.21364593505859375, -0.2027435302734375, -0.19184112548828125, -0.180938720703125, -0.17003631591796875, -0.1591339111328125, -0.14823150634765625, -0.1373291015625, -0.12642669677734375, -0.1155242919921875, -0.10462188720703125, -0.093719482421875, -0.08281707763671875, -0.0719146728515625, -0.06101226806640625, -0.05010986328125, -0.03920745849609375, -0.0283050537109375, -0.01740264892578125, -0.006500244140625, 0.00440216064453125, 0.0153045654296875, 0.02620697021484375, 0.037109375, 0.04801177978515625, 0.0589141845703125, 0.06981658935546875, 0.080718994140625, 0.09162139892578125, 0.1025238037109375, 0.11342620849609375, 0.12432861328125, 0.13523101806640625, 0.1461334228515625, 0.15703582763671875, 0.167938232421875, 0.17884063720703125, 0.1897430419921875, 0.20064544677734375, 0.2115478515625, 0.22245025634765625, 0.2333526611328125, 0.24425506591796875, 0.255157470703125, 0.26605987548828125, 0.2769622802734375, 0.28786468505859375, 0.29876708984375, 0.30966949462890625, 0.3205718994140625, 0.33147430419921875, 0.342376708984375, 0.35327911376953125, 0.3641815185546875, 0.37508392333984375, 0.385986328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 8.0, 19.0, 58.0, 182.0, 414.0, 200.0, 65.0, 22.0, 11.0, 8.0, 7.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.223868370056152, -6.961328983306885, -6.698789596557617, -6.43625020980835, -6.173710823059082, -5.911170959472656, -5.648631572723389, -5.386092185974121, -5.1235527992248535, -4.861013412475586, -4.598474025726318, -4.335934638977051, -4.073394775390625, -3.8108556270599365, -3.54831600189209, -3.2857766151428223, -3.0232372283935547, -2.760697841644287, -2.4981584548950195, -2.235618829727173, -1.9730794429779053, -1.7105400562286377, -1.4480005502700806, -1.1854610443115234, -0.9229216575622559, -0.6603822112083435, -0.39784276485443115, -0.1353033185005188, 0.12723612785339355, 0.38977551460266113, 0.6523150205612183, 0.9148545265197754, 1.1773948669433594, 1.439934253692627, 1.702473759651184, 1.9650132656097412, 2.227552652359009, 2.4900920391082764, 2.752631664276123, 3.0151710510253906, 3.277710437774658, 3.540249824523926, 3.8027892112731934, 4.065328598022461, 4.327868461608887, 4.590407371520996, 4.852947235107422, 5.1154866218566895, 5.378026008605957, 5.640565395355225, 5.903104782104492, 6.16564416885376, 6.428183555603027, 6.690723419189453, 6.953262805938721, 7.215802192687988, 7.478341579437256, 7.740880966186523, 8.00342082977295, 8.265959739685059, 8.528499603271484, 8.791038513183594, 9.05357837677002, 9.316118240356445, 9.578657150268555]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 10.0, 12.0, 13.0, 54.0, 88.0, 120.0, 139.0, 170.0, 139.0, 85.0, 55.0, 26.0, 19.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.11131763458252, -9.751787185668945, -9.392256736755371, -9.032726287841797, -8.673195838928223, -8.313665390014648, -7.954134464263916, -7.594604015350342, -7.235073566436768, -6.875543117523193, -6.516012668609619, -6.156481742858887, -5.7969512939453125, -5.437420845031738, -5.077890396118164, -4.71835994720459, -4.358829498291016, -3.9992990493774414, -3.639768600463867, -3.280237913131714, -2.9207074642181396, -2.5611770153045654, -2.201646327972412, -1.842115879058838, -1.4825854301452637, -1.1230549812316895, -0.7635244131088257, -0.4039938449859619, -0.044463396072387695, 0.3150670528411865, 0.6745977401733398, 1.034128189086914, 1.3936576843261719, 1.753188133239746, 2.1127185821533203, 2.4722492694854736, 2.831779718399048, 3.191310167312622, 3.5508408546447754, 3.9103713035583496, 4.269901752471924, 4.629432201385498, 4.988962650299072, 5.348493576049805, 5.708024024963379, 6.067554473876953, 6.427084922790527, 6.786615371704102, 7.146145820617676, 7.50567626953125, 7.865206718444824, 8.224737167358398, 8.584267616271973, 8.943798065185547, 9.303329467773438, 9.662858963012695, 10.022390365600586, 10.38192081451416, 10.741451263427734, 11.100981712341309, 11.460512161254883, 11.820042610168457, 12.179573059082031, 12.539104461669922, 12.89863395690918]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 3.0, 11.0, 10.0, 16.0, 22.0, 25.0, 41.0, 55.0, 64.0, 77.0, 133.0, 197.0, 301.0, 465.0, 711.0, 1300.0, 2188.0, 4475.0, 10444.0, 36566.0, 3268706.0, 813673.0, 34569.0, 10365.0, 4560.0, 2159.0, 1206.0, 716.0, 424.0, 259.0, 191.0, 103.0, 75.0, 48.0, 41.0, 26.0, 13.0, 14.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.484375, -1.441925048828125, -1.39947509765625, -1.357025146484375, -1.3145751953125, -1.272125244140625, -1.22967529296875, -1.187225341796875, -1.144775390625, -1.102325439453125, -1.05987548828125, -1.017425537109375, -0.9749755859375, -0.932525634765625, -0.89007568359375, -0.847625732421875, -0.80517578125, -0.762725830078125, -0.72027587890625, -0.677825927734375, -0.6353759765625, -0.592926025390625, -0.55047607421875, -0.508026123046875, -0.465576171875, -0.423126220703125, -0.38067626953125, -0.338226318359375, -0.2957763671875, -0.253326416015625, -0.21087646484375, -0.168426513671875, -0.1259765625, -0.083526611328125, -0.04107666015625, 0.001373291015625, 0.0438232421875, 0.086273193359375, 0.12872314453125, 0.171173095703125, 0.213623046875, 0.256072998046875, 0.29852294921875, 0.340972900390625, 0.3834228515625, 0.425872802734375, 0.46832275390625, 0.510772705078125, 0.55322265625, 0.595672607421875, 0.63812255859375, 0.680572509765625, 0.7230224609375, 0.765472412109375, 0.80792236328125, 0.850372314453125, 0.892822265625, 0.935272216796875, 0.97772216796875, 1.020172119140625, 1.0626220703125, 1.105072021484375, 1.14752197265625, 1.189971923828125, 1.232421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 6.0, 3.0, 5.0, 1.0, 10.0, 7.0, 8.0, 9.0, 12.0, 9.0, 14.0, 21.0, 53.0, 113.0, 238.0, 217.0, 94.0, 47.0, 30.0, 18.0, 13.0, 12.0, 6.0, 8.0, 8.0, 7.0, 7.0, 5.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0], "bins": [-0.2020263671875, -0.19721221923828125, -0.1923980712890625, -0.18758392333984375, -0.182769775390625, -0.17795562744140625, -0.1731414794921875, -0.16832733154296875, -0.16351318359375, -0.15869903564453125, -0.1538848876953125, -0.14907073974609375, -0.144256591796875, -0.13944244384765625, -0.1346282958984375, -0.12981414794921875, -0.125, -0.12018585205078125, -0.1153717041015625, -0.11055755615234375, -0.105743408203125, -0.10092926025390625, -0.0961151123046875, -0.09130096435546875, -0.08648681640625, -0.08167266845703125, -0.0768585205078125, -0.07204437255859375, -0.067230224609375, -0.06241607666015625, -0.0576019287109375, -0.05278778076171875, -0.0479736328125, -0.04315948486328125, -0.0383453369140625, -0.03353118896484375, -0.028717041015625, -0.02390289306640625, -0.0190887451171875, -0.01427459716796875, -0.00946044921875, -0.00464630126953125, 0.0001678466796875, 0.00498199462890625, 0.009796142578125, 0.01461029052734375, 0.0194244384765625, 0.02423858642578125, 0.029052734375, 0.03386688232421875, 0.0386810302734375, 0.04349517822265625, 0.048309326171875, 0.05312347412109375, 0.0579376220703125, 0.06275177001953125, 0.06756591796875, 0.07238006591796875, 0.0771942138671875, 0.08200836181640625, 0.086822509765625, 0.09163665771484375, 0.0964508056640625, 0.10126495361328125, 0.1060791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 3.0, 14.0, 29.0, 21.0, 28.0, 42.0, 93.0, 122.0, 217.0, 411.0, 908.0, 2100.0, 5423.0, 16109.0, 63627.0, 716175.0, 3241315.0, 110829.0, 23818.0, 7634.0, 2857.0, 1206.0, 567.0, 274.0, 154.0, 80.0, 69.0, 46.0, 29.0, 17.0, 17.0, 4.0, 10.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.0105361938476562, -0.9800567626953125, -0.9495773315429688, -0.919097900390625, -0.8886184692382812, -0.8581390380859375, -0.8276596069335938, -0.79718017578125, -0.7667007446289062, -0.7362213134765625, -0.7057418823242188, -0.675262451171875, -0.6447830200195312, -0.6143035888671875, -0.5838241577148438, -0.5533447265625, -0.5228652954101562, -0.4923858642578125, -0.46190643310546875, -0.431427001953125, -0.40094757080078125, -0.3704681396484375, -0.33998870849609375, -0.30950927734375, -0.27902984619140625, -0.2485504150390625, -0.21807098388671875, -0.187591552734375, -0.15711212158203125, -0.1266326904296875, -0.09615325927734375, -0.065673828125, -0.03519439697265625, -0.0047149658203125, 0.02576446533203125, 0.056243896484375, 0.08672332763671875, 0.1172027587890625, 0.14768218994140625, 0.17816162109375, 0.20864105224609375, 0.2391204833984375, 0.26959991455078125, 0.300079345703125, 0.33055877685546875, 0.3610382080078125, 0.39151763916015625, 0.4219970703125, 0.45247650146484375, 0.4829559326171875, 0.5134353637695312, 0.543914794921875, 0.5743942260742188, 0.6048736572265625, 0.6353530883789062, 0.66583251953125, 0.6963119506835938, 0.7267913818359375, 0.7572708129882812, 0.787750244140625, 0.8182296752929688, 0.8487091064453125, 0.8791885375976562, 0.90966796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 20.0, 6.0, 22.0, 17.0, 33.0, 46.0, 64.0, 102.0, 214.0, 403.0, 1733.0, 648.0, 272.0, 161.0, 96.0, 61.0, 26.0, 20.0, 21.0, 13.0, 14.0, 6.0, 12.0, 8.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18655014038085938, -0.18132781982421875, -0.17610549926757812, -0.1708831787109375, -0.16566085815429688, -0.16043853759765625, -0.15521621704101562, -0.149993896484375, -0.14477157592773438, -0.13954925537109375, -0.13432693481445312, -0.1291046142578125, -0.12388229370117188, -0.11865997314453125, -0.11343765258789062, -0.10821533203125, -0.10299301147460938, -0.09777069091796875, -0.09254837036132812, -0.0873260498046875, -0.08210372924804688, -0.07688140869140625, -0.07165908813476562, -0.066436767578125, -0.061214447021484375, -0.05599212646484375, -0.050769805908203125, -0.0455474853515625, -0.040325164794921875, -0.03510284423828125, -0.029880523681640625, -0.024658203125, -0.019435882568359375, -0.01421356201171875, -0.008991241455078125, -0.0037689208984375, 0.001453399658203125, 0.00667572021484375, 0.011898040771484375, 0.017120361328125, 0.022342681884765625, 0.02756500244140625, 0.032787322998046875, 0.0380096435546875, 0.043231964111328125, 0.04845428466796875, 0.053676605224609375, 0.05889892578125, 0.06412124633789062, 0.06934356689453125, 0.07456588745117188, 0.0797882080078125, 0.08501052856445312, 0.09023284912109375, 0.09545516967773438, 0.100677490234375, 0.10589981079101562, 0.11112213134765625, 0.11634445190429688, 0.1215667724609375, 0.12678909301757812, 0.13201141357421875, 0.13723373413085938, 0.1424560546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 28.0, 233.0, 603.0, 115.0, 16.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5814886689186096, -0.4715144634246826, -0.3615402579307556, -0.251566082239151, -0.141591876745224, -0.031617701053619385, 0.07835650444030762, 0.18833070993423462, 0.2983049154281616, 0.4082791209220886, 0.5182533264160156, 0.6282274723052979, 0.7382017374038696, 0.8481758832931519, 0.9581500887870789, 1.0681242942810059, 1.178098440170288, 1.2880725860595703, 1.398046851158142, 1.5080209970474243, 1.617995262145996, 1.7279694080352783, 1.8379435539245605, 1.9479178190231323, 2.057892084121704, 2.1678662300109863, 2.2778403759002686, 2.38781476020813, 2.497788906097412, 2.6077630519866943, 2.7177371978759766, 2.827711582183838, 2.93768572807312, 3.0476598739624023, 3.1576340198516846, 3.267608404159546, 3.377582550048828, 3.4875566959381104, 3.5975308418273926, 3.707505226135254, 3.817479372024536, 3.9274535179138184, 4.03742790222168, 4.147401809692383, 4.257376194000244, 4.3673505783081055, 4.477324485778809, 4.58729887008667, 4.697272777557373, 4.807247161865234, 4.9172210693359375, 5.027195453643799, 5.137169361114502, 5.247143745422363, 5.357118129730225, 5.467092037200928, 5.577066421508789, 5.68704080581665, 5.7970147132873535, 5.906989097595215, 6.016963005065918, 6.126937389373779, 6.236911773681641, 6.346885681152344, 6.456860065460205]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 9.0, 15.0, 22.0, 18.0, 26.0, 35.0, 35.0, 41.0, 37.0, 44.0, 41.0, 35.0, 55.0, 59.0, 54.0, 38.0, 50.0, 48.0, 46.0, 38.0, 40.0, 25.0, 23.0, 23.0, 19.0, 16.0, 16.0, 7.0, 14.0, 6.0, 7.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.554146945476532, -0.535702109336853, -0.5172573328018188, -0.4988125264644623, -0.4803677201271057, -0.46192288398742676, -0.4434780776500702, -0.4250332713127136, -0.40658846497535706, -0.3881436586380005, -0.3696988523006439, -0.35125404596328735, -0.3328092098236084, -0.3143644332885742, -0.29591959714889526, -0.2774747908115387, -0.25902998447418213, -0.24058517813682556, -0.222140371799469, -0.20369555056095123, -0.18525074422359467, -0.1668059378862381, -0.14836111664772034, -0.12991631031036377, -0.1114715039730072, -0.09302669763565063, -0.07458188384771347, -0.056137073785066605, -0.03769226372241974, -0.01924745738506317, -0.0008026435971260071, 0.017642170190811157, 0.03608691692352295, 0.054531726986169815, 0.07297653704881668, 0.09142135083675385, 0.10986615717411041, 0.12831096351146698, 0.14675578474998474, 0.1652005910873413, 0.18364539742469788, 0.20209020376205444, 0.220535010099411, 0.23897983133792877, 0.25742465257644653, 0.2758694291114807, 0.29431426525115967, 0.31275907158851624, 0.3312038779258728, 0.34964868426322937, 0.36809349060058594, 0.3865382969379425, 0.4049831032752991, 0.423427939414978, 0.4418727457523346, 0.46031755208969116, 0.47876235842704773, 0.4972071647644043, 0.5156520009040833, 0.5340967774391174, 0.5525416135787964, 0.5709863901138306, 0.5894312262535095, 0.6078760623931885, 0.6263208389282227]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 12.0, 16.0, 21.0, 29.0, 52.0, 71.0, 95.0, 145.0, 209.0, 309.0, 555.0, 921.0, 1653.0, 3139.0, 6320.0, 14083.0, 38994.0, 301546.0, 593820.0, 53513.0, 17197.0, 7513.0, 3627.0, 1901.0, 1079.0, 595.0, 329.0, 264.0, 146.0, 133.0, 69.0, 54.0, 36.0, 28.0, 18.0, 12.0, 9.0, 11.0, 5.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.969268798828125, -0.94000244140625, -0.910736083984375, -0.8814697265625, -0.852203369140625, -0.82293701171875, -0.793670654296875, -0.764404296875, -0.735137939453125, -0.70587158203125, -0.676605224609375, -0.6473388671875, -0.618072509765625, -0.58880615234375, -0.559539794921875, -0.5302734375, -0.501007080078125, -0.47174072265625, -0.442474365234375, -0.4132080078125, -0.383941650390625, -0.35467529296875, -0.325408935546875, -0.296142578125, -0.266876220703125, -0.23760986328125, -0.208343505859375, -0.1790771484375, -0.149810791015625, -0.12054443359375, -0.091278076171875, -0.06201171875, -0.032745361328125, -0.00347900390625, 0.025787353515625, 0.0550537109375, 0.084320068359375, 0.11358642578125, 0.142852783203125, 0.172119140625, 0.201385498046875, 0.23065185546875, 0.259918212890625, 0.2891845703125, 0.318450927734375, 0.34771728515625, 0.376983642578125, 0.40625, 0.435516357421875, 0.46478271484375, 0.494049072265625, 0.5233154296875, 0.552581787109375, 0.58184814453125, 0.611114501953125, 0.640380859375, 0.669647216796875, 0.69891357421875, 0.728179931640625, 0.7574462890625, 0.786712646484375, 0.81597900390625, 0.845245361328125, 0.87451171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 10.0, 4.0, 5.0, 10.0, 14.0, 2.0, 9.0, 14.0, 24.0, 53.0, 139.0, 227.0, 199.0, 105.0, 58.0, 31.0, 15.0, 10.0, 16.0, 8.0, 7.0, 8.0, 8.0, 6.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.2130126953125, -0.20794296264648438, -0.20287322998046875, -0.19780349731445312, -0.1927337646484375, -0.18766403198242188, -0.18259429931640625, -0.17752456665039062, -0.172454833984375, -0.16738510131835938, -0.16231536865234375, -0.15724563598632812, -0.1521759033203125, -0.14710617065429688, -0.14203643798828125, -0.13696670532226562, -0.13189697265625, -0.12682723999023438, -0.12175750732421875, -0.11668777465820312, -0.1116180419921875, -0.10654830932617188, -0.10147857666015625, -0.09640884399414062, -0.091339111328125, -0.08626937866210938, -0.08119964599609375, -0.07612991333007812, -0.0710601806640625, -0.06599044799804688, -0.06092071533203125, -0.055850982666015625, -0.05078125, -0.045711517333984375, -0.04064178466796875, -0.035572052001953125, -0.0305023193359375, -0.025432586669921875, -0.02036285400390625, -0.015293121337890625, -0.010223388671875, -0.005153656005859375, -8.392333984375e-05, 0.004985809326171875, 0.0100555419921875, 0.015125274658203125, 0.02019500732421875, 0.025264739990234375, 0.03033447265625, 0.035404205322265625, 0.04047393798828125, 0.045543670654296875, 0.0506134033203125, 0.055683135986328125, 0.06075286865234375, 0.06582260131835938, 0.070892333984375, 0.07596206665039062, 0.08103179931640625, 0.08610153198242188, 0.0911712646484375, 0.09624099731445312, 0.10131072998046875, 0.10638046264648438, 0.1114501953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 9.0, 9.0, 19.0, 23.0, 33.0, 48.0, 61.0, 111.0, 145.0, 252.0, 434.0, 806.0, 1532.0, 3414.0, 9057.0, 28660.0, 122185.0, 522956.0, 278904.0, 54672.0, 14792.0, 5309.0, 2339.0, 1163.0, 620.0, 344.0, 231.0, 134.0, 77.0, 58.0, 42.0, 27.0, 18.0, 18.0, 11.0, 6.0, 5.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.497344970703125, -0.48004150390625, -0.462738037109375, -0.4454345703125, -0.428131103515625, -0.41082763671875, -0.393524169921875, -0.376220703125, -0.358917236328125, -0.34161376953125, -0.324310302734375, -0.3070068359375, -0.289703369140625, -0.27239990234375, -0.255096435546875, -0.23779296875, -0.220489501953125, -0.20318603515625, -0.185882568359375, -0.1685791015625, -0.151275634765625, -0.13397216796875, -0.116668701171875, -0.099365234375, -0.082061767578125, -0.06475830078125, -0.047454833984375, -0.0301513671875, -0.012847900390625, 0.00445556640625, 0.021759033203125, 0.0390625, 0.056365966796875, 0.07366943359375, 0.090972900390625, 0.1082763671875, 0.125579833984375, 0.14288330078125, 0.160186767578125, 0.177490234375, 0.194793701171875, 0.21209716796875, 0.229400634765625, 0.2467041015625, 0.264007568359375, 0.28131103515625, 0.298614501953125, 0.31591796875, 0.333221435546875, 0.35052490234375, 0.367828369140625, 0.3851318359375, 0.402435302734375, 0.41973876953125, 0.437042236328125, 0.454345703125, 0.471649169921875, 0.48895263671875, 0.506256103515625, 0.5235595703125, 0.540863037109375, 0.55816650390625, 0.575469970703125, 0.5927734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 12.0, 13.0, 21.0, 19.0, 21.0, 23.0, 27.0, 51.0, 50.0, 53.0, 59.0, 44.0, 64.0, 53.0, 55.0, 61.0, 51.0, 55.0, 42.0, 48.0, 35.0, 31.0, 19.0, 11.0, 20.0, 14.0, 11.0, 4.0, 7.0, 4.0, 2.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4451332092285156, -0.42957305908203125, -0.4140129089355469, -0.3984527587890625, -0.3828926086425781, -0.36733245849609375, -0.3517723083496094, -0.336212158203125, -0.3206520080566406, -0.30509185791015625, -0.2895317077636719, -0.2739715576171875, -0.2584114074707031, -0.24285125732421875, -0.22729110717773438, -0.21173095703125, -0.19617080688476562, -0.18061065673828125, -0.16505050659179688, -0.1494903564453125, -0.13393020629882812, -0.11837005615234375, -0.10280990600585938, -0.087249755859375, -0.07168960571289062, -0.05612945556640625, -0.040569305419921875, -0.0250091552734375, -0.009449005126953125, 0.00611114501953125, 0.021671295166015625, 0.0372314453125, 0.052791595458984375, 0.06835174560546875, 0.08391189575195312, 0.0994720458984375, 0.11503219604492188, 0.13059234619140625, 0.14615249633789062, 0.161712646484375, 0.17727279663085938, 0.19283294677734375, 0.20839309692382812, 0.2239532470703125, 0.23951339721679688, 0.25507354736328125, 0.2706336975097656, 0.28619384765625, 0.3017539978027344, 0.31731414794921875, 0.3328742980957031, 0.3484344482421875, 0.3639945983886719, 0.37955474853515625, 0.3951148986816406, 0.410675048828125, 0.4262351989746094, 0.44179534912109375, 0.4573554992675781, 0.4729156494140625, 0.4884757995605469, 0.5040359497070312, 0.5195960998535156, 0.53515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 12.0, 28.0, 32.0, 41.0, 83.0, 149.0, 306.0, 680.0, 1994.0, 8325.0, 84035.0, 874951.0, 67499.0, 7308.0, 1777.0, 640.0, 310.0, 162.0, 64.0, 46.0, 32.0, 17.0, 11.0, 8.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.02423095703125, -0.9869384765625, -0.94964599609375, -0.912353515625, -0.87506103515625, -0.8377685546875, -0.80047607421875, -0.76318359375, -0.72589111328125, -0.6885986328125, -0.65130615234375, -0.614013671875, -0.57672119140625, -0.5394287109375, -0.50213623046875, -0.46484375, -0.42755126953125, -0.3902587890625, -0.35296630859375, -0.315673828125, -0.27838134765625, -0.2410888671875, -0.20379638671875, -0.16650390625, -0.12921142578125, -0.0919189453125, -0.05462646484375, -0.017333984375, 0.01995849609375, 0.0572509765625, 0.09454345703125, 0.1318359375, 0.16912841796875, 0.2064208984375, 0.24371337890625, 0.281005859375, 0.31829833984375, 0.3555908203125, 0.39288330078125, 0.43017578125, 0.46746826171875, 0.5047607421875, 0.54205322265625, 0.579345703125, 0.61663818359375, 0.6539306640625, 0.69122314453125, 0.728515625, 0.76580810546875, 0.8031005859375, 0.84039306640625, 0.877685546875, 0.91497802734375, 0.9522705078125, 0.98956298828125, 1.02685546875, 1.06414794921875, 1.1014404296875, 1.13873291015625, 1.176025390625, 1.21331787109375, 1.2506103515625, 1.28790283203125, 1.3251953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 9.0, 7.0, 7.0, 13.0, 12.0, 21.0, 29.0, 30.0, 51.0, 59.0, 68.0, 93.0, 101.0, 98.0, 87.0, 56.0, 56.0, 37.0, 38.0, 26.0, 26.0, 11.0, 10.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.14984130859375e-05, -4.992075264453888e-05, -4.834309220314026e-05, -4.676543176174164e-05, -4.518777132034302e-05, -4.36101108789444e-05, -4.2032450437545776e-05, -4.0454789996147156e-05, -3.8877129554748535e-05, -3.7299469113349915e-05, -3.5721808671951294e-05, -3.414414823055267e-05, -3.256648778915405e-05, -3.098882734775543e-05, -2.941116690635681e-05, -2.783350646495819e-05, -2.625584602355957e-05, -2.467818558216095e-05, -2.310052514076233e-05, -2.152286469936371e-05, -1.9945204257965088e-05, -1.8367543816566467e-05, -1.6789883375167847e-05, -1.5212222933769226e-05, -1.3634562492370605e-05, -1.2056902050971985e-05, -1.0479241609573364e-05, -8.901581168174744e-06, -7.323920726776123e-06, -5.7462602853775024e-06, -4.168599843978882e-06, -2.5909394025802612e-06, -1.0132789611816406e-06, 5.6438148021698e-07, 2.1420419216156006e-06, 3.719702363014221e-06, 5.297362804412842e-06, 6.875023245811462e-06, 8.452683687210083e-06, 1.0030344128608704e-05, 1.1608004570007324e-05, 1.3185665011405945e-05, 1.4763325452804565e-05, 1.6340985894203186e-05, 1.7918646335601807e-05, 1.9496306777000427e-05, 2.1073967218399048e-05, 2.265162765979767e-05, 2.422928810119629e-05, 2.580694854259491e-05, 2.738460898399353e-05, 2.896226942539215e-05, 3.053992986679077e-05, 3.211759030818939e-05, 3.369525074958801e-05, 3.527291119098663e-05, 3.6850571632385254e-05, 3.8428232073783875e-05, 4.0005892515182495e-05, 4.1583552956581116e-05, 4.3161213397979736e-05, 4.473887383937836e-05, 4.631653428077698e-05, 4.78941947221756e-05, 4.947185516357422e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 18.0, 11.0, 12.0, 21.0, 35.0, 65.0, 90.0, 144.0, 243.0, 481.0, 1101.0, 2826.0, 10350.0, 75963.0, 721957.0, 207634.0, 19929.0, 4572.0, 1516.0, 714.0, 345.0, 177.0, 127.0, 74.0, 34.0, 27.0, 17.0, 19.0, 9.0, 6.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.9921875, -0.9671859741210938, -0.9421844482421875, -0.9171829223632812, -0.892181396484375, -0.8671798706054688, -0.8421783447265625, -0.8171768188476562, -0.79217529296875, -0.7671737670898438, -0.7421722412109375, -0.7171707153320312, -0.692169189453125, -0.6671676635742188, -0.6421661376953125, -0.6171646118164062, -0.5921630859375, -0.5671615600585938, -0.5421600341796875, -0.5171585083007812, -0.492156982421875, -0.46715545654296875, -0.4421539306640625, -0.41715240478515625, -0.39215087890625, -0.36714935302734375, -0.3421478271484375, -0.31714630126953125, -0.292144775390625, -0.26714324951171875, -0.2421417236328125, -0.21714019775390625, -0.192138671875, -0.16713714599609375, -0.1421356201171875, -0.11713409423828125, -0.092132568359375, -0.06713104248046875, -0.0421295166015625, -0.01712799072265625, 0.00787353515625, 0.03287506103515625, 0.0578765869140625, 0.08287811279296875, 0.107879638671875, 0.13288116455078125, 0.1578826904296875, 0.18288421630859375, 0.2078857421875, 0.23288726806640625, 0.2578887939453125, 0.28289031982421875, 0.307891845703125, 0.33289337158203125, 0.3578948974609375, 0.38289642333984375, 0.40789794921875, 0.43289947509765625, 0.4579010009765625, 0.48290252685546875, 0.507904052734375, 0.5329055786132812, 0.5579071044921875, 0.5829086303710938, 0.60791015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 18.0, 25.0, 35.0, 54.0, 75.0, 111.0, 144.0, 145.0, 140.0, 98.0, 42.0, 36.0, 21.0, 17.0, 8.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.763671875, -0.7455101013183594, -0.7273483276367188, -0.7091865539550781, -0.6910247802734375, -0.6728630065917969, -0.6547012329101562, -0.6365394592285156, -0.618377685546875, -0.6002159118652344, -0.5820541381835938, -0.5638923645019531, -0.5457305908203125, -0.5275688171386719, -0.5094070434570312, -0.4912452697753906, -0.47308349609375, -0.4549217224121094, -0.43675994873046875, -0.4185981750488281, -0.4004364013671875, -0.3822746276855469, -0.36411285400390625, -0.3459510803222656, -0.327789306640625, -0.3096275329589844, -0.29146575927734375, -0.2733039855957031, -0.2551422119140625, -0.23698043823242188, -0.21881866455078125, -0.20065689086914062, -0.1824951171875, -0.16433334350585938, -0.14617156982421875, -0.12800979614257812, -0.1098480224609375, -0.09168624877929688, -0.07352447509765625, -0.055362701416015625, -0.037200927734375, -0.019039154052734375, -0.00087738037109375, 0.017284393310546875, 0.0354461669921875, 0.053607940673828125, 0.07176971435546875, 0.08993148803710938, 0.10809326171875, 0.12625503540039062, 0.14441680908203125, 0.16257858276367188, 0.1807403564453125, 0.19890213012695312, 0.21706390380859375, 0.23522567749023438, 0.253387451171875, 0.2715492248535156, 0.28971099853515625, 0.3078727722167969, 0.3260345458984375, 0.3441963195800781, 0.36235809326171875, 0.3805198669433594, 0.398681640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 15.0, 210.0, 748.0, 31.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.574602127075195, -4.807217597961426, -4.039833068847656, -3.272449016571045, -2.5050644874572754, -1.7376799583435059, -0.9702959060668945, -0.202911376953125, 0.5644731521606445, 1.3318575620651245, 2.0992419719696045, 2.866626262664795, 3.6340107917785645, 4.401395320892334, 5.168779373168945, 5.936163902282715, 6.703548431396484, 7.470932960510254, 8.238317489624023, 9.005701065063477, 9.773086547851562, 10.540470123291016, 11.307854652404785, 12.075239181518555, 12.842623710632324, 13.610008239746094, 14.377392768859863, 15.144777297973633, 15.912160873413086, 16.679546356201172, 17.446929931640625, 18.214313507080078, 18.981700897216797, 19.74908447265625, 20.516469955444336, 21.28385353088379, 22.051239013671875, 22.818622589111328, 23.58600616455078, 24.353391647338867, 25.120777130126953, 25.888160705566406, 26.655546188354492, 27.422929763793945, 28.19031524658203, 28.957698822021484, 29.725082397460938, 30.492467880249023, 31.259851455688477, 32.02723693847656, 32.794620513916016, 33.56200408935547, 34.32938766479492, 35.09677505493164, 35.864158630371094, 36.63154220581055, 37.39892578125, 38.16630935668945, 38.933692932128906, 39.701080322265625, 40.46846389770508, 41.23584747314453, 42.003231048583984, 42.77061462402344, 43.538002014160156]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 10.0, 19.0, 32.0, 26.0, 48.0, 58.0, 57.0, 67.0, 74.0, 68.0, 65.0, 65.0, 73.0, 63.0, 43.0, 35.0, 37.0, 29.0, 24.0, 9.0, 12.0, 8.0, 5.0, 3.0, 6.0, 1.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6703221797943115, -3.5402841567993164, -3.4102461338043213, -3.280208110809326, -3.15017032623291, -3.020132303237915, -2.89009428024292, -2.760056257247925, -2.6300182342529297, -2.4999802112579346, -2.3699421882629395, -2.2399044036865234, -2.1098663806915283, -1.9798283576965332, -1.849790334701538, -1.719752311706543, -1.589714527130127, -1.4596765041351318, -1.3296386003494263, -1.1996005773544312, -1.0695626735687256, -0.9395246505737305, -0.8094866275787354, -0.679448664188385, -0.5494107007980347, -0.4193727374076843, -0.2893347442150116, -0.15929675102233887, -0.029258787631988525, 0.10077917575836182, 0.23081719875335693, 0.3608551621437073, 0.4908933639526367, 0.6209313273429871, 0.7509692907333374, 0.8810073137283325, 1.011045217514038, 1.1410832405090332, 1.2711212635040283, 1.4011592864990234, 1.531197190284729, 1.6612352132797241, 1.7912731170654297, 1.9213111400604248, 2.05134916305542, 2.181386947631836, 2.31142520904541, 2.441462993621826, 2.5715010166168213, 2.7015390396118164, 2.8315770626068115, 2.9616150856018066, 3.0916528701782227, 3.2216908931732178, 3.351728916168213, 3.481766939163208, 3.611804962158203, 3.7418429851531982, 3.8718810081481934, 4.001918792724609, 4.131957054138184, 4.2619948387146, 4.392032623291016, 4.52207088470459, 4.652108669281006]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 7.0, 9.0, 10.0, 9.0, 15.0, 26.0, 28.0, 26.0, 33.0, 32.0, 41.0, 55.0, 66.0, 137.0, 190.0, 226.0, 354.0, 547.0, 882.0, 1463.0, 2459.0, 4959.0, 12510.0, 55475.0, 3820861.0, 249372.0, 26423.0, 8451.0, 3812.0, 2111.0, 1400.0, 858.0, 498.0, 274.0, 208.0, 125.0, 88.0, 60.0, 51.0, 50.0, 27.0, 17.0, 12.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.9970703125, -1.9468536376953125, -1.896636962890625, -1.8464202880859375, -1.79620361328125, -1.7459869384765625, -1.695770263671875, -1.6455535888671875, -1.5953369140625, -1.5451202392578125, -1.494903564453125, -1.4446868896484375, -1.39447021484375, -1.3442535400390625, -1.294036865234375, -1.2438201904296875, -1.193603515625, -1.1433868408203125, -1.093170166015625, -1.0429534912109375, -0.99273681640625, -0.9425201416015625, -0.892303466796875, -0.8420867919921875, -0.7918701171875, -0.7416534423828125, -0.691436767578125, -0.6412200927734375, -0.59100341796875, -0.5407867431640625, -0.490570068359375, -0.4403533935546875, -0.39013671875, -0.3399200439453125, -0.289703369140625, -0.2394866943359375, -0.18927001953125, -0.1390533447265625, -0.088836669921875, -0.0386199951171875, 0.0115966796875, 0.0618133544921875, 0.112030029296875, 0.1622467041015625, 0.21246337890625, 0.2626800537109375, 0.312896728515625, 0.3631134033203125, 0.413330078125, 0.4635467529296875, 0.513763427734375, 0.5639801025390625, 0.61419677734375, 0.6644134521484375, 0.714630126953125, 0.7648468017578125, 0.8150634765625, 0.8652801513671875, 0.915496826171875, 0.9657135009765625, 1.01593017578125, 1.0661468505859375, 1.116363525390625, 1.1665802001953125, 1.216796875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 9.0, 4.0, 11.0, 20.0, 17.0, 29.0, 82.0, 124.0, 183.0, 171.0, 106.0, 65.0, 49.0, 29.0, 20.0, 13.0, 11.0, 7.0, 10.0, 8.0, 9.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.2142333984375, -0.20914936065673828, -0.20406532287597656, -0.19898128509521484, -0.19389724731445312, -0.1888132095336914, -0.1837291717529297, -0.17864513397216797, -0.17356109619140625, -0.16847705841064453, -0.1633930206298828, -0.1583089828491211, -0.15322494506835938, -0.14814090728759766, -0.14305686950683594, -0.13797283172607422, -0.1328887939453125, -0.12780475616455078, -0.12272071838378906, -0.11763668060302734, -0.11255264282226562, -0.1074686050415039, -0.10238456726074219, -0.09730052947998047, -0.09221649169921875, -0.08713245391845703, -0.08204841613769531, -0.0769643783569336, -0.07188034057617188, -0.06679630279541016, -0.06171226501464844, -0.05662822723388672, -0.051544189453125, -0.04646015167236328, -0.04137611389160156, -0.036292076110839844, -0.031208038330078125, -0.026124000549316406, -0.021039962768554688, -0.01595592498779297, -0.01087188720703125, -0.005787849426269531, -0.0007038116455078125, 0.004380226135253906, 0.009464263916015625, 0.014548301696777344, 0.019632339477539062, 0.02471637725830078, 0.0298004150390625, 0.03488445281982422, 0.03996849060058594, 0.045052528381347656, 0.050136566162109375, 0.055220603942871094, 0.06030464172363281, 0.06538867950439453, 0.07047271728515625, 0.07555675506591797, 0.08064079284667969, 0.0857248306274414, 0.09080886840820312, 0.09589290618896484, 0.10097694396972656, 0.10606098175048828, 0.11114501953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 10.0, 4.0, 7.0, 7.0, 6.0, 24.0, 25.0, 45.0, 71.0, 100.0, 163.0, 296.0, 562.0, 1427.0, 3786.0, 12578.0, 59928.0, 3165402.0, 890309.0, 43909.0, 10113.0, 3104.0, 1189.0, 533.0, 277.0, 139.0, 96.0, 60.0, 35.0, 29.0, 15.0, 7.0, 8.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5302734375, -1.48077392578125, -1.4312744140625, -1.38177490234375, -1.332275390625, -1.28277587890625, -1.2332763671875, -1.18377685546875, -1.13427734375, -1.08477783203125, -1.0352783203125, -0.98577880859375, -0.936279296875, -0.88677978515625, -0.8372802734375, -0.78778076171875, -0.73828125, -0.68878173828125, -0.6392822265625, -0.58978271484375, -0.540283203125, -0.49078369140625, -0.4412841796875, -0.39178466796875, -0.34228515625, -0.29278564453125, -0.2432861328125, -0.19378662109375, -0.144287109375, -0.09478759765625, -0.0452880859375, 0.00421142578125, 0.0537109375, 0.10321044921875, 0.1527099609375, 0.20220947265625, 0.251708984375, 0.30120849609375, 0.3507080078125, 0.40020751953125, 0.44970703125, 0.49920654296875, 0.5487060546875, 0.59820556640625, 0.647705078125, 0.69720458984375, 0.7467041015625, 0.79620361328125, 0.845703125, 0.89520263671875, 0.9447021484375, 0.99420166015625, 1.043701171875, 1.09320068359375, 1.1427001953125, 1.19219970703125, 1.24169921875, 1.29119873046875, 1.3406982421875, 1.39019775390625, 1.439697265625, 1.48919677734375, 1.5386962890625, 1.58819580078125, 1.6376953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 5.0, 9.0, 9.0, 13.0, 25.0, 27.0, 30.0, 65.0, 92.0, 204.0, 617.0, 1999.0, 502.0, 206.0, 84.0, 52.0, 35.0, 21.0, 17.0, 12.0, 8.0, 5.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.270751953125, -0.26288604736328125, -0.2550201416015625, -0.24715423583984375, -0.239288330078125, -0.23142242431640625, -0.2235565185546875, -0.21569061279296875, -0.20782470703125, -0.19995880126953125, -0.1920928955078125, -0.18422698974609375, -0.176361083984375, -0.16849517822265625, -0.1606292724609375, -0.15276336669921875, -0.1448974609375, -0.13703155517578125, -0.1291656494140625, -0.12129974365234375, -0.113433837890625, -0.10556793212890625, -0.0977020263671875, -0.08983612060546875, -0.08197021484375, -0.07410430908203125, -0.0662384033203125, -0.05837249755859375, -0.050506591796875, -0.04264068603515625, -0.0347747802734375, -0.02690887451171875, -0.01904296875, -0.01117706298828125, -0.0033111572265625, 0.00455474853515625, 0.012420654296875, 0.02028656005859375, 0.0281524658203125, 0.03601837158203125, 0.04388427734375, 0.05175018310546875, 0.0596160888671875, 0.06748199462890625, 0.075347900390625, 0.08321380615234375, 0.0910797119140625, 0.09894561767578125, 0.1068115234375, 0.11467742919921875, 0.1225433349609375, 0.13040924072265625, 0.138275146484375, 0.14614105224609375, 0.1540069580078125, 0.16187286376953125, 0.16973876953125, 0.17760467529296875, 0.1854705810546875, 0.19333648681640625, 0.201202392578125, 0.20906829833984375, 0.2169342041015625, 0.22480010986328125, 0.232666015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 14.0, 39.0, 79.0, 148.0, 246.0, 236.0, 131.0, 51.0, 22.0, 9.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9244107604026794, -0.8663935661315918, -0.8083763718605042, -0.7503591775894165, -0.6923420429229736, -0.634324848651886, -0.5763076543807983, -0.5182905197143555, -0.46027329564094543, -0.4022561013698578, -0.34423893690109253, -0.2862217426300049, -0.22820456326007843, -0.17018738389015198, -0.11217018961906433, -0.05415302515029907, 0.0038641691207885742, 0.061881352216005325, 0.11989853531122208, 0.17791572213172913, 0.23593290150165558, 0.29395008087158203, 0.3519672751426697, 0.40998443961143494, 0.4680016338825226, 0.5260187983512878, 0.5840359926223755, 0.6420531868934631, 0.7000703811645508, 0.7580875158309937, 0.8161047697067261, 0.874121904373169, 0.9321390390396118, 0.9901562333106995, 1.048173427581787, 1.10619056224823, 1.1642078161239624, 1.2222249507904053, 1.2802422046661377, 1.3382593393325806, 1.3962764739990234, 1.4542936086654663, 1.5123108625411987, 1.5703279972076416, 1.628345251083374, 1.686362385749817, 1.7443795204162598, 1.8023967742919922, 1.8604140281677246, 1.9184311628341675, 1.9764484167099, 2.0344655513763428, 2.092482805252075, 2.1504998207092285, 2.208517074584961, 2.2665343284606934, 2.3245513439178467, 2.382568597793579, 2.4405856132507324, 2.498602867126465, 2.5566201210021973, 2.6146373748779297, 2.672654390335083, 2.7306716442108154, 2.788688898086548]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 8.0, 7.0, 10.0, 13.0, 16.0, 22.0, 25.0, 30.0, 30.0, 27.0, 30.0, 32.0, 41.0, 40.0, 40.0, 49.0, 50.0, 44.0, 49.0, 44.0, 45.0, 41.0, 37.0, 35.0, 34.0, 26.0, 24.0, 19.0, 18.0, 12.0, 9.0, 17.0, 17.0, 8.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.8186424970626831, -0.7963040471076965, -0.77396559715271, -0.7516271471977234, -0.7292886972427368, -0.7069501876831055, -0.6846117377281189, -0.6622732877731323, -0.6399348378181458, -0.6175963878631592, -0.5952579379081726, -0.572919487953186, -0.5505809783935547, -0.5282425284385681, -0.5059040784835815, -0.48356562852859497, -0.4612271785736084, -0.4388887286186218, -0.41655027866363525, -0.3942117989063263, -0.3718733489513397, -0.34953489899635315, -0.3271964192390442, -0.3048579692840576, -0.28251951932907104, -0.2601810693740845, -0.2378426045179367, -0.21550413966178894, -0.19316568970680237, -0.1708272397518158, -0.14848877489566803, -0.12615031003952026, -0.10381191968917847, -0.0814734622836113, -0.05913500487804413, -0.03679654747247696, -0.01445809006690979, 0.00788036733865738, 0.03021882474422455, 0.052557289600372314, 0.07489573955535889, 0.09723419696092606, 0.11957265436649323, 0.141911119222641, 0.16424956917762756, 0.18658801913261414, 0.2089264839887619, 0.23126494884490967, 0.25360339879989624, 0.2759418487548828, 0.2982802987098694, 0.32061877846717834, 0.3429572284221649, 0.3652956783771515, 0.38763415813446045, 0.409972608089447, 0.4323110580444336, 0.45464950799942017, 0.47698795795440674, 0.4993264377117157, 0.5216648578643799, 0.5440033674240112, 0.5663418173789978, 0.5886802673339844, 0.611018717288971]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 2.0, 5.0, 6.0, 10.0, 27.0, 30.0, 46.0, 69.0, 80.0, 135.0, 200.0, 313.0, 467.0, 831.0, 1390.0, 2656.0, 5957.0, 15658.0, 58828.0, 481615.0, 402615.0, 51594.0, 14465.0, 5559.0, 2563.0, 1333.0, 739.0, 459.0, 268.0, 184.0, 132.0, 74.0, 67.0, 45.0, 33.0, 24.0, 14.0, 12.0, 11.0, 13.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1913909912109375, -1.155242919921875, -1.1190948486328125, -1.08294677734375, -1.0467987060546875, -1.010650634765625, -0.9745025634765625, -0.9383544921875, -0.9022064208984375, -0.866058349609375, -0.8299102783203125, -0.79376220703125, -0.7576141357421875, -0.721466064453125, -0.6853179931640625, -0.649169921875, -0.6130218505859375, -0.576873779296875, -0.5407257080078125, -0.50457763671875, -0.4684295654296875, -0.432281494140625, -0.3961334228515625, -0.3599853515625, -0.3238372802734375, -0.287689208984375, -0.2515411376953125, -0.21539306640625, -0.1792449951171875, -0.143096923828125, -0.1069488525390625, -0.07080078125, -0.0346527099609375, 0.001495361328125, 0.0376434326171875, 0.07379150390625, 0.1099395751953125, 0.146087646484375, 0.1822357177734375, 0.2183837890625, 0.2545318603515625, 0.290679931640625, 0.3268280029296875, 0.36297607421875, 0.3991241455078125, 0.435272216796875, 0.4714202880859375, 0.507568359375, 0.5437164306640625, 0.579864501953125, 0.6160125732421875, 0.65216064453125, 0.6883087158203125, 0.724456787109375, 0.7606048583984375, 0.7967529296875, 0.8329010009765625, 0.869049072265625, 0.9051971435546875, 0.94134521484375, 0.9774932861328125, 1.013641357421875, 1.0497894287109375, 1.0859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 4.0, 18.0, 11.0, 16.0, 22.0, 41.0, 77.0, 128.0, 149.0, 164.0, 113.0, 75.0, 40.0, 47.0, 25.0, 15.0, 14.0, 8.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2042236328125, -0.19926929473876953, -0.19431495666503906, -0.1893606185913086, -0.18440628051757812, -0.17945194244384766, -0.1744976043701172, -0.16954326629638672, -0.16458892822265625, -0.15963459014892578, -0.1546802520751953, -0.14972591400146484, -0.14477157592773438, -0.1398172378540039, -0.13486289978027344, -0.12990856170654297, -0.1249542236328125, -0.11999988555908203, -0.11504554748535156, -0.1100912094116211, -0.10513687133789062, -0.10018253326416016, -0.09522819519042969, -0.09027385711669922, -0.08531951904296875, -0.08036518096923828, -0.07541084289550781, -0.07045650482177734, -0.06550216674804688, -0.060547828674316406, -0.05559349060058594, -0.05063915252685547, -0.045684814453125, -0.04073047637939453, -0.03577613830566406, -0.030821800231933594, -0.025867462158203125, -0.020913124084472656, -0.015958786010742188, -0.011004447937011719, -0.00605010986328125, -0.0010957717895507812, 0.0038585662841796875, 0.008812904357910156, 0.013767242431640625, 0.018721580505371094, 0.023675918579101562, 0.02863025665283203, 0.0335845947265625, 0.03853893280029297, 0.04349327087402344, 0.048447608947753906, 0.053401947021484375, 0.058356285095214844, 0.06331062316894531, 0.06826496124267578, 0.07321929931640625, 0.07817363739013672, 0.08312797546386719, 0.08808231353759766, 0.09303665161132812, 0.0979909896850586, 0.10294532775878906, 0.10789966583251953, 0.11285400390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 7.0, 6.0, 16.0, 13.0, 25.0, 55.0, 59.0, 74.0, 130.0, 234.0, 382.0, 731.0, 1547.0, 3998.0, 13614.0, 63587.0, 444459.0, 435429.0, 62844.0, 13794.0, 4192.0, 1590.0, 689.0, 384.0, 222.0, 131.0, 100.0, 59.0, 39.0, 35.0, 21.0, 20.0, 14.0, 5.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1123046875, -1.076416015625, -1.04052734375, -1.004638671875, -0.96875, -0.932861328125, -0.89697265625, -0.861083984375, -0.8251953125, -0.789306640625, -0.75341796875, -0.717529296875, -0.681640625, -0.645751953125, -0.60986328125, -0.573974609375, -0.5380859375, -0.502197265625, -0.46630859375, -0.430419921875, -0.39453125, -0.358642578125, -0.32275390625, -0.286865234375, -0.2509765625, -0.215087890625, -0.17919921875, -0.143310546875, -0.107421875, -0.071533203125, -0.03564453125, 0.000244140625, 0.0361328125, 0.072021484375, 0.10791015625, 0.143798828125, 0.1796875, 0.215576171875, 0.25146484375, 0.287353515625, 0.3232421875, 0.359130859375, 0.39501953125, 0.430908203125, 0.466796875, 0.502685546875, 0.53857421875, 0.574462890625, 0.6103515625, 0.646240234375, 0.68212890625, 0.718017578125, 0.75390625, 0.789794921875, 0.82568359375, 0.861572265625, 0.8974609375, 0.933349609375, 0.96923828125, 1.005126953125, 1.041015625, 1.076904296875, 1.11279296875, 1.148681640625, 1.1845703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 5.0, 3.0, 2.0, 7.0, 7.0, 12.0, 18.0, 13.0, 20.0, 25.0, 30.0, 29.0, 34.0, 35.0, 39.0, 43.0, 43.0, 45.0, 55.0, 42.0, 63.0, 49.0, 41.0, 63.0, 38.0, 32.0, 26.0, 23.0, 30.0, 22.0, 14.0, 17.0, 20.0, 6.0, 5.0, 9.0, 10.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4591255187988281, -0.44290924072265625, -0.4266929626464844, -0.4104766845703125, -0.3942604064941406, -0.37804412841796875, -0.3618278503417969, -0.345611572265625, -0.3293952941894531, -0.31317901611328125, -0.2969627380371094, -0.2807464599609375, -0.2645301818847656, -0.24831390380859375, -0.23209762573242188, -0.21588134765625, -0.19966506958007812, -0.18344879150390625, -0.16723251342773438, -0.1510162353515625, -0.13479995727539062, -0.11858367919921875, -0.10236740112304688, -0.086151123046875, -0.06993484497070312, -0.05371856689453125, -0.037502288818359375, -0.0212860107421875, -0.005069732666015625, 0.01114654541015625, 0.027362823486328125, 0.0435791015625, 0.059795379638671875, 0.07601165771484375, 0.09222793579101562, 0.1084442138671875, 0.12466049194335938, 0.14087677001953125, 0.15709304809570312, 0.173309326171875, 0.18952560424804688, 0.20574188232421875, 0.22195816040039062, 0.2381744384765625, 0.2543907165527344, 0.27060699462890625, 0.2868232727050781, 0.30303955078125, 0.3192558288574219, 0.33547210693359375, 0.3516883850097656, 0.3679046630859375, 0.3841209411621094, 0.40033721923828125, 0.4165534973144531, 0.432769775390625, 0.4489860534667969, 0.46520233154296875, 0.4814186096191406, 0.4976348876953125, 0.5138511657714844, 0.5300674438476562, 0.5462837219238281, 0.5625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 3.0, 10.0, 23.0, 16.0, 27.0, 38.0, 60.0, 102.0, 143.0, 263.0, 451.0, 762.0, 1376.0, 2855.0, 7066.0, 22469.0, 111515.0, 661893.0, 191981.0, 30958.0, 9078.0, 3554.0, 1696.0, 888.0, 516.0, 291.0, 184.0, 110.0, 68.0, 44.0, 37.0, 24.0, 24.0, 8.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5888442993164062, -0.5639190673828125, -0.5389938354492188, -0.514068603515625, -0.48914337158203125, -0.4642181396484375, -0.43929290771484375, -0.41436767578125, -0.38944244384765625, -0.3645172119140625, -0.33959197998046875, -0.314666748046875, -0.28974151611328125, -0.2648162841796875, -0.23989105224609375, -0.2149658203125, -0.19004058837890625, -0.1651153564453125, -0.14019012451171875, -0.115264892578125, -0.09033966064453125, -0.0654144287109375, -0.04048919677734375, -0.01556396484375, 0.00936126708984375, 0.0342864990234375, 0.05921173095703125, 0.084136962890625, 0.10906219482421875, 0.1339874267578125, 0.15891265869140625, 0.183837890625, 0.20876312255859375, 0.2336883544921875, 0.25861358642578125, 0.283538818359375, 0.30846405029296875, 0.3333892822265625, 0.35831451416015625, 0.38323974609375, 0.40816497802734375, 0.4330902099609375, 0.45801544189453125, 0.482940673828125, 0.5078659057617188, 0.5327911376953125, 0.5577163696289062, 0.5826416015625, 0.6075668334960938, 0.6324920654296875, 0.6574172973632812, 0.682342529296875, 0.7072677612304688, 0.7321929931640625, 0.7571182250976562, 0.78204345703125, 0.8069686889648438, 0.8318939208984375, 0.8568191528320312, 0.881744384765625, 0.9066696166992188, 0.9315948486328125, 0.9565200805664062, 0.9814453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 13.0, 10.0, 19.0, 36.0, 42.0, 62.0, 118.0, 179.0, 178.0, 125.0, 89.0, 35.0, 28.0, 21.0, 14.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001709461212158203, -0.0001652352511882782, -0.00015952438116073608, -0.00015381351113319397, -0.00014810264110565186, -0.00014239177107810974, -0.00013668090105056763, -0.0001309700310230255, -0.0001252591609954834, -0.00011954829096794128, -0.00011383742094039917, -0.00010812655091285706, -0.00010241568088531494, -9.670481085777283e-05, -9.099394083023071e-05, -8.52830708026886e-05, -7.957220077514648e-05, -7.386133074760437e-05, -6.815046072006226e-05, -6.243959069252014e-05, -5.672872066497803e-05, -5.101785063743591e-05, -4.53069806098938e-05, -3.9596110582351685e-05, -3.388524055480957e-05, -2.8174370527267456e-05, -2.2463500499725342e-05, -1.6752630472183228e-05, -1.1041760444641113e-05, -5.330890417098999e-06, 3.7997961044311523e-07, 6.0908496379852295e-06, 1.1801719665527344e-05, 1.7512589693069458e-05, 2.3223459720611572e-05, 2.8934329748153687e-05, 3.46451997756958e-05, 4.0356069803237915e-05, 4.606693983078003e-05, 5.1777809858322144e-05, 5.748867988586426e-05, 6.319954991340637e-05, 6.891041994094849e-05, 7.46212899684906e-05, 8.033215999603271e-05, 8.604303002357483e-05, 9.175390005111694e-05, 9.746477007865906e-05, 0.00010317564010620117, 0.00010888651013374329, 0.0001145973801612854, 0.00012030825018882751, 0.00012601912021636963, 0.00013172999024391174, 0.00013744086027145386, 0.00014315173029899597, 0.00014886260032653809, 0.0001545734703540802, 0.00016028434038162231, 0.00016599521040916443, 0.00017170608043670654, 0.00017741695046424866, 0.00018312782049179077, 0.00018883869051933289, 0.000194549560546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 6.0, 13.0, 17.0, 32.0, 32.0, 57.0, 97.0, 131.0, 224.0, 428.0, 904.0, 2309.0, 6745.0, 29169.0, 329171.0, 616195.0, 48211.0, 9402.0, 2976.0, 1185.0, 547.0, 251.0, 155.0, 88.0, 53.0, 38.0, 26.0, 25.0, 8.0, 12.0, 5.0, 5.0, 5.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.999176025390625, -0.96807861328125, -0.936981201171875, -0.9058837890625, -0.874786376953125, -0.84368896484375, -0.812591552734375, -0.781494140625, -0.750396728515625, -0.71929931640625, -0.688201904296875, -0.6571044921875, -0.626007080078125, -0.59490966796875, -0.563812255859375, -0.53271484375, -0.501617431640625, -0.47052001953125, -0.439422607421875, -0.4083251953125, -0.377227783203125, -0.34613037109375, -0.315032958984375, -0.283935546875, -0.252838134765625, -0.22174072265625, -0.190643310546875, -0.1595458984375, -0.128448486328125, -0.09735107421875, -0.066253662109375, -0.03515625, -0.004058837890625, 0.02703857421875, 0.058135986328125, 0.0892333984375, 0.120330810546875, 0.15142822265625, 0.182525634765625, 0.213623046875, 0.244720458984375, 0.27581787109375, 0.306915283203125, 0.3380126953125, 0.369110107421875, 0.40020751953125, 0.431304931640625, 0.46240234375, 0.493499755859375, 0.52459716796875, 0.555694580078125, 0.5867919921875, 0.617889404296875, 0.64898681640625, 0.680084228515625, 0.711181640625, 0.742279052734375, 0.77337646484375, 0.804473876953125, 0.8355712890625, 0.866668701171875, 0.89776611328125, 0.928863525390625, 0.9599609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 3.0, 6.0, 9.0, 6.0, 8.0, 18.0, 20.0, 28.0, 32.0, 33.0, 57.0, 75.0, 80.0, 99.0, 116.0, 94.0, 69.0, 51.0, 38.0, 34.0, 26.0, 12.0, 17.0, 9.0, 5.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.396240234375, -0.38422393798828125, -0.3722076416015625, -0.36019134521484375, -0.348175048828125, -0.33615875244140625, -0.3241424560546875, -0.31212615966796875, -0.30010986328125, -0.28809356689453125, -0.2760772705078125, -0.26406097412109375, -0.252044677734375, -0.24002838134765625, -0.2280120849609375, -0.21599578857421875, -0.2039794921875, -0.19196319580078125, -0.1799468994140625, -0.16793060302734375, -0.155914306640625, -0.14389801025390625, -0.1318817138671875, -0.11986541748046875, -0.10784912109375, -0.09583282470703125, -0.0838165283203125, -0.07180023193359375, -0.059783935546875, -0.04776763916015625, -0.0357513427734375, -0.02373504638671875, -0.01171875, 0.00029754638671875, 0.0123138427734375, 0.02433013916015625, 0.036346435546875, 0.04836273193359375, 0.0603790283203125, 0.07239532470703125, 0.08441162109375, 0.09642791748046875, 0.1084442138671875, 0.12046051025390625, 0.132476806640625, 0.14449310302734375, 0.1565093994140625, 0.16852569580078125, 0.1805419921875, 0.19255828857421875, 0.2045745849609375, 0.21659088134765625, 0.228607177734375, 0.24062347412109375, 0.2526397705078125, 0.26465606689453125, 0.27667236328125, 0.28868865966796875, 0.3007049560546875, 0.31272125244140625, 0.324737548828125, 0.33675384521484375, 0.3487701416015625, 0.36078643798828125, 0.372802734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 32.0, 216.0, 501.0, 194.0, 37.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9745192527771, -6.416813850402832, -5.8591084480285645, -5.301403045654297, -4.743697643280029, -4.185992240905762, -3.628286838531494, -3.0705814361572266, -2.512876033782959, -1.9551706314086914, -1.3974652290344238, -0.8397598266601562, -0.28205442428588867, 0.2756509780883789, 0.8333563804626465, 1.391061782836914, 1.9487671852111816, 2.506472587585449, 3.064177989959717, 3.6218833923339844, 4.179588794708252, 4.7372941970825195, 5.294999599456787, 5.852705001831055, 6.410410404205322, 6.96811580657959, 7.525821208953857, 8.083526611328125, 8.641231536865234, 9.19893741607666, 9.756643295288086, 10.314348220825195, 10.872053146362305, 11.429758071899414, 11.98746395111084, 12.545169830322266, 13.102874755859375, 13.660579681396484, 14.21828556060791, 14.775991439819336, 15.333696365356445, 15.891401290893555, 16.449108123779297, 17.006813049316406, 17.564517974853516, 18.122222900390625, 18.679927825927734, 19.237634658813477, 19.795339584350586, 20.353044509887695, 20.910751342773438, 21.468456268310547, 22.026161193847656, 22.583866119384766, 23.141571044921875, 23.699277877807617, 24.256982803344727, 24.814687728881836, 25.372394561767578, 25.930099487304688, 26.487804412841797, 27.045509338378906, 27.603214263916016, 28.160921096801758, 28.718626022338867]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 4.0, 14.0, 7.0, 20.0, 21.0, 17.0, 18.0, 25.0, 33.0, 38.0, 41.0, 35.0, 50.0, 50.0, 38.0, 48.0, 45.0, 47.0, 43.0, 50.0, 49.0, 50.0, 40.0, 37.0, 37.0, 25.0, 20.0, 15.0, 14.0, 12.0, 6.0, 10.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2408905029296875, -4.113312244415283, -3.985734224319458, -3.858156204223633, -3.7305779457092285, -3.6029999256134033, -3.475421905517578, -3.347843647003174, -3.2202653884887695, -3.0926873683929443, -2.96510910987854, -2.837531089782715, -2.7099528312683105, -2.5823748111724854, -2.45479679107666, -2.327218532562256, -2.1996405124664307, -2.0720624923706055, -1.9444842338562012, -1.816906213760376, -1.6893279552459717, -1.5617499351501465, -1.4341717958450317, -1.306593656539917, -1.1790155172348022, -1.0514373779296875, -0.9238592386245728, -0.7962811589241028, -0.668703019618988, -0.5411248803138733, -0.4135468006134033, -0.2859686613082886, -0.15839052200317383, -0.030812397599220276, 0.09676572680473328, 0.22434383630752563, 0.3519219756126404, 0.4795001149177551, 0.6070781946182251, 0.7346563339233398, 0.8622344732284546, 0.9898126125335693, 1.117390751838684, 1.2449688911437988, 1.372546911239624, 1.5001251697540283, 1.6277031898498535, 1.7552813291549683, 1.882859468460083, 2.010437488555908, 2.1380157470703125, 2.2655937671661377, 2.393172025680542, 2.520750045776367, 2.6483283042907715, 2.7759063243865967, 2.903484344482422, 3.031062364578247, 3.1586406230926514, 3.2862186431884766, 3.413796901702881, 3.541374921798706, 3.6689529418945312, 3.7965312004089355, 3.92410945892334]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 8.0, 15.0, 17.0, 42.0, 33.0, 35.0, 82.0, 136.0, 208.0, 512.0, 1227.0, 3907.0, 22854.0, 4005289.0, 147746.0, 8543.0, 2010.0, 856.0, 343.0, 153.0, 97.0, 61.0, 42.0, 21.0, 10.0, 9.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.68359375, -3.5860595703125, -3.488525390625, -3.3909912109375, -3.29345703125, -3.1959228515625, -3.098388671875, -3.0008544921875, -2.9033203125, -2.8057861328125, -2.708251953125, -2.6107177734375, -2.51318359375, -2.4156494140625, -2.318115234375, -2.2205810546875, -2.123046875, -2.0255126953125, -1.927978515625, -1.8304443359375, -1.73291015625, -1.6353759765625, -1.537841796875, -1.4403076171875, -1.3427734375, -1.2452392578125, -1.147705078125, -1.0501708984375, -0.95263671875, -0.8551025390625, -0.757568359375, -0.6600341796875, -0.5625, -0.4649658203125, -0.367431640625, -0.2698974609375, -0.17236328125, -0.0748291015625, 0.022705078125, 0.1202392578125, 0.2177734375, 0.3153076171875, 0.412841796875, 0.5103759765625, 0.60791015625, 0.7054443359375, 0.802978515625, 0.9005126953125, 0.998046875, 1.0955810546875, 1.193115234375, 1.2906494140625, 1.38818359375, 1.4857177734375, 1.583251953125, 1.6807861328125, 1.7783203125, 1.8758544921875, 1.973388671875, 2.0709228515625, 2.16845703125, 2.2659912109375, 2.363525390625, 2.4610595703125, 2.55859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 5.0, 13.0, 19.0, 23.0, 28.0, 57.0, 68.0, 71.0, 98.0, 138.0, 129.0, 85.0, 103.0, 47.0, 30.0, 20.0, 15.0, 10.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2117919921875, -0.20616912841796875, -0.2005462646484375, -0.19492340087890625, -0.189300537109375, -0.18367767333984375, -0.1780548095703125, -0.17243194580078125, -0.16680908203125, -0.16118621826171875, -0.1555633544921875, -0.14994049072265625, -0.144317626953125, -0.13869476318359375, -0.1330718994140625, -0.12744903564453125, -0.121826171875, -0.11620330810546875, -0.1105804443359375, -0.10495758056640625, -0.099334716796875, -0.09371185302734375, -0.0880889892578125, -0.08246612548828125, -0.07684326171875, -0.07122039794921875, -0.0655975341796875, -0.05997467041015625, -0.054351806640625, -0.04872894287109375, -0.0431060791015625, -0.03748321533203125, -0.0318603515625, -0.02623748779296875, -0.0206146240234375, -0.01499176025390625, -0.009368896484375, -0.00374603271484375, 0.0018768310546875, 0.00749969482421875, 0.01312255859375, 0.01874542236328125, 0.0243682861328125, 0.02999114990234375, 0.035614013671875, 0.04123687744140625, 0.0468597412109375, 0.05248260498046875, 0.05810546875, 0.06372833251953125, 0.0693511962890625, 0.07497406005859375, 0.080596923828125, 0.08621978759765625, 0.0918426513671875, 0.09746551513671875, 0.10308837890625, 0.10871124267578125, 0.1143341064453125, 0.11995697021484375, 0.125579833984375, 0.13120269775390625, 0.1368255615234375, 0.14244842529296875, 0.1480712890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 16.0, 21.0, 38.0, 37.0, 72.0, 125.0, 190.0, 339.0, 667.0, 1634.0, 5814.0, 59440.0, 4004501.0, 109727.0, 7981.0, 2021.0, 775.0, 376.0, 180.0, 118.0, 54.0, 49.0, 32.0, 15.0, 15.0, 7.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.71600341796875, -2.6351318359375, -2.55426025390625, -2.473388671875, -2.39251708984375, -2.3116455078125, -2.23077392578125, -2.14990234375, -2.06903076171875, -1.9881591796875, -1.90728759765625, -1.826416015625, -1.74554443359375, -1.6646728515625, -1.58380126953125, -1.5029296875, -1.42205810546875, -1.3411865234375, -1.26031494140625, -1.179443359375, -1.09857177734375, -1.0177001953125, -0.93682861328125, -0.85595703125, -0.77508544921875, -0.6942138671875, -0.61334228515625, -0.532470703125, -0.45159912109375, -0.3707275390625, -0.28985595703125, -0.208984375, -0.12811279296875, -0.0472412109375, 0.03363037109375, 0.114501953125, 0.19537353515625, 0.2762451171875, 0.35711669921875, 0.43798828125, 0.51885986328125, 0.5997314453125, 0.68060302734375, 0.761474609375, 0.84234619140625, 0.9232177734375, 1.00408935546875, 1.0849609375, 1.16583251953125, 1.2467041015625, 1.32757568359375, 1.408447265625, 1.48931884765625, 1.5701904296875, 1.65106201171875, 1.73193359375, 1.81280517578125, 1.8936767578125, 1.97454833984375, 2.055419921875, 2.13629150390625, 2.2171630859375, 2.29803466796875, 2.37890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 23.0, 36.0, 63.0, 205.0, 685.0, 2433.0, 363.0, 112.0, 51.0, 37.0, 17.0, 12.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.6018753051757812, -0.5865631103515625, -0.5712509155273438, -0.555938720703125, -0.5406265258789062, -0.5253143310546875, -0.5100021362304688, -0.49468994140625, -0.47937774658203125, -0.4640655517578125, -0.44875335693359375, -0.433441162109375, -0.41812896728515625, -0.4028167724609375, -0.38750457763671875, -0.3721923828125, -0.35688018798828125, -0.3415679931640625, -0.32625579833984375, -0.310943603515625, -0.29563140869140625, -0.2803192138671875, -0.26500701904296875, -0.24969482421875, -0.23438262939453125, -0.2190704345703125, -0.20375823974609375, -0.188446044921875, -0.17313385009765625, -0.1578216552734375, -0.14250946044921875, -0.127197265625, -0.11188507080078125, -0.0965728759765625, -0.08126068115234375, -0.065948486328125, -0.05063629150390625, -0.0353240966796875, -0.02001190185546875, -0.00469970703125, 0.01061248779296875, 0.0259246826171875, 0.04123687744140625, 0.056549072265625, 0.07186126708984375, 0.0871734619140625, 0.10248565673828125, 0.1177978515625, 0.13311004638671875, 0.1484222412109375, 0.16373443603515625, 0.179046630859375, 0.19435882568359375, 0.2096710205078125, 0.22498321533203125, 0.24029541015625, 0.25560760498046875, 0.2709197998046875, 0.28623199462890625, 0.301544189453125, 0.31685638427734375, 0.3321685791015625, 0.34748077392578125, 0.36279296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 14.0, 30.0, 68.0, 156.0, 261.0, 262.0, 134.0, 45.0, 22.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.760923385620117, -4.67113733291626, -4.5813517570495605, -4.491565704345703, -4.401780128479004, -4.3119940757751465, -4.222208023071289, -4.13242244720459, -4.042636394500732, -3.952850580215454, -3.863064765930176, -3.7732787132263184, -3.68349289894104, -3.5937070846557617, -3.5039210319519043, -3.414135217666626, -3.3243494033813477, -3.2345635890960693, -3.144777774810791, -3.0549917221069336, -2.9652059078216553, -2.875420093536377, -2.7856340408325195, -2.695848226547241, -2.606062412261963, -2.5162765979766846, -2.4264907836914062, -2.336704730987549, -2.2469189167022705, -2.157133102416992, -2.0673470497131348, -1.9775612354278564, -1.8877754211425781, -1.7979896068572998, -1.708203673362732, -1.618417739868164, -1.5286319255828857, -1.4388461112976074, -1.3490601778030396, -1.2592742443084717, -1.1694884300231934, -1.079702615737915, -0.9899166822433472, -0.9001308083534241, -0.810344934463501, -0.7205590605735779, -0.6307731866836548, -0.5409873127937317, -0.45120149850845337, -0.3614156246185303, -0.2716297507286072, -0.18184387683868408, -0.09205800294876099, -0.0022721290588378906, 0.0875137448310852, 0.1772996187210083, 0.2670854926109314, 0.3568713665008545, 0.4466572403907776, 0.5364431142807007, 0.6262289881706238, 0.7160148620605469, 0.80580073595047, 0.8955866098403931, 0.9853724837303162]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 5.0, 19.0, 14.0, 14.0, 14.0, 18.0, 18.0, 12.0, 12.0, 23.0, 24.0, 26.0, 28.0, 39.0, 25.0, 44.0, 43.0, 34.0, 33.0, 42.0, 34.0, 37.0, 48.0, 30.0, 37.0, 33.0, 45.0, 28.0, 23.0, 35.0, 23.0, 16.0, 20.0, 19.0, 12.0, 14.0, 7.0, 7.0, 6.0, 4.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.8310531973838806, -0.8046375513076782, -0.7782219052314758, -0.7518062591552734, -0.7253905534744263, -0.6989749073982239, -0.6725592613220215, -0.6461436152458191, -0.6197279691696167, -0.5933123230934143, -0.5668966770172119, -0.5404809713363647, -0.5140653252601624, -0.48764967918395996, -0.46123403310775757, -0.4348183870315552, -0.408402681350708, -0.3819870352745056, -0.35557135939598083, -0.32915571331977844, -0.30274003744125366, -0.27632439136505127, -0.24990874528884888, -0.2234930843114853, -0.1970774233341217, -0.17066176235675812, -0.14424610137939453, -0.11783045530319214, -0.09141479432582855, -0.06499913334846497, -0.03858348727226257, -0.012167826294898987, 0.014247775077819824, 0.04066343232989311, 0.0670790895819664, 0.09349474310874939, 0.11991040408611298, 0.14632606506347656, 0.17274171113967896, 0.19915737211704254, 0.22557303309440613, 0.2519886791706085, 0.2784043550491333, 0.3048200011253357, 0.3312356472015381, 0.35765132308006287, 0.38406696915626526, 0.41048264503479004, 0.43689829111099243, 0.4633139371871948, 0.4897296130657196, 0.5161452293395996, 0.5425609350204468, 0.5689765810966492, 0.5953922271728516, 0.621807873249054, 0.6482235193252563, 0.6746391654014587, 0.7010548114776611, 0.7274705171585083, 0.7538861632347107, 0.7803018093109131, 0.8067174553871155, 0.8331331014633179, 0.859548807144165]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 15.0, 11.0, 22.0, 25.0, 34.0, 53.0, 83.0, 141.0, 215.0, 345.0, 707.0, 1253.0, 2676.0, 6903.0, 22063.0, 111078.0, 584945.0, 257539.0, 41660.0, 10938.0, 3947.0, 1777.0, 909.0, 452.0, 277.0, 156.0, 114.0, 67.0, 52.0, 29.0, 23.0, 6.0, 8.0, 3.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2294921875, -1.195068359375, -1.16064453125, -1.126220703125, -1.091796875, -1.057373046875, -1.02294921875, -0.988525390625, -0.9541015625, -0.919677734375, -0.88525390625, -0.850830078125, -0.81640625, -0.781982421875, -0.74755859375, -0.713134765625, -0.6787109375, -0.644287109375, -0.60986328125, -0.575439453125, -0.541015625, -0.506591796875, -0.47216796875, -0.437744140625, -0.4033203125, -0.368896484375, -0.33447265625, -0.300048828125, -0.265625, -0.231201171875, -0.19677734375, -0.162353515625, -0.1279296875, -0.093505859375, -0.05908203125, -0.024658203125, 0.009765625, 0.044189453125, 0.07861328125, 0.113037109375, 0.1474609375, 0.181884765625, 0.21630859375, 0.250732421875, 0.28515625, 0.319580078125, 0.35400390625, 0.388427734375, 0.4228515625, 0.457275390625, 0.49169921875, 0.526123046875, 0.560546875, 0.594970703125, 0.62939453125, 0.663818359375, 0.6982421875, 0.732666015625, 0.76708984375, 0.801513671875, 0.8359375, 0.870361328125, 0.90478515625, 0.939208984375, 0.9736328125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 12.0, 18.0, 28.0, 19.0, 46.0, 73.0, 90.0, 94.0, 122.0, 101.0, 95.0, 93.0, 59.0, 39.0, 30.0, 26.0, 13.0, 10.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2322998046875, -0.22647857666015625, -0.2206573486328125, -0.21483612060546875, -0.209014892578125, -0.20319366455078125, -0.1973724365234375, -0.19155120849609375, -0.18572998046875, -0.17990875244140625, -0.1740875244140625, -0.16826629638671875, -0.162445068359375, -0.15662384033203125, -0.1508026123046875, -0.14498138427734375, -0.13916015625, -0.13333892822265625, -0.1275177001953125, -0.12169647216796875, -0.115875244140625, -0.11005401611328125, -0.1042327880859375, -0.09841156005859375, -0.09259033203125, -0.08676910400390625, -0.0809478759765625, -0.07512664794921875, -0.069305419921875, -0.06348419189453125, -0.0576629638671875, -0.05184173583984375, -0.0460205078125, -0.04019927978515625, -0.0343780517578125, -0.02855682373046875, -0.022735595703125, -0.01691436767578125, -0.0110931396484375, -0.00527191162109375, 0.00054931640625, 0.00637054443359375, 0.0121917724609375, 0.01801300048828125, 0.023834228515625, 0.02965545654296875, 0.0354766845703125, 0.04129791259765625, 0.047119140625, 0.05294036865234375, 0.0587615966796875, 0.06458282470703125, 0.070404052734375, 0.07622528076171875, 0.0820465087890625, 0.08786773681640625, 0.09368896484375, 0.09951019287109375, 0.1053314208984375, 0.11115264892578125, 0.116973876953125, 0.12279510498046875, 0.1286163330078125, 0.13443756103515625, 0.1402587890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 2.0, 5.0, 15.0, 18.0, 25.0, 32.0, 47.0, 67.0, 101.0, 180.0, 252.0, 514.0, 1057.0, 2209.0, 5659.0, 18661.0, 81819.0, 434875.0, 400696.0, 75087.0, 17425.0, 5476.0, 2020.0, 974.0, 552.0, 286.0, 169.0, 108.0, 54.0, 59.0, 36.0, 13.0, 17.0, 12.0, 9.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.16796875, -1.1363754272460938, -1.1047821044921875, -1.0731887817382812, -1.041595458984375, -1.0100021362304688, -0.9784088134765625, -0.9468154907226562, -0.91522216796875, -0.8836288452148438, -0.8520355224609375, -0.8204421997070312, -0.788848876953125, -0.7572555541992188, -0.7256622314453125, -0.6940689086914062, -0.6624755859375, -0.6308822631835938, -0.5992889404296875, -0.5676956176757812, -0.536102294921875, -0.5045089721679688, -0.4729156494140625, -0.44132232666015625, -0.40972900390625, -0.37813568115234375, -0.3465423583984375, -0.31494903564453125, -0.283355712890625, -0.25176239013671875, -0.2201690673828125, -0.18857574462890625, -0.156982421875, -0.12538909912109375, -0.0937957763671875, -0.06220245361328125, -0.030609130859375, 0.00098419189453125, 0.0325775146484375, 0.06417083740234375, 0.09576416015625, 0.12735748291015625, 0.1589508056640625, 0.19054412841796875, 0.222137451171875, 0.25373077392578125, 0.2853240966796875, 0.31691741943359375, 0.3485107421875, 0.38010406494140625, 0.4116973876953125, 0.44329071044921875, 0.474884033203125, 0.5064773559570312, 0.5380706787109375, 0.5696640014648438, 0.60125732421875, 0.6328506469726562, 0.6644439697265625, 0.6960372924804688, 0.727630615234375, 0.7592239379882812, 0.7908172607421875, 0.8224105834960938, 0.85400390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 4.0, 13.0, 7.0, 13.0, 5.0, 17.0, 18.0, 35.0, 20.0, 30.0, 31.0, 44.0, 34.0, 48.0, 33.0, 57.0, 45.0, 50.0, 57.0, 43.0, 49.0, 51.0, 34.0, 33.0, 27.0, 21.0, 22.0, 29.0, 28.0, 12.0, 16.0, 12.0, 15.0, 12.0, 4.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66259765625, -0.643707275390625, -0.62481689453125, -0.605926513671875, -0.5870361328125, -0.568145751953125, -0.54925537109375, -0.530364990234375, -0.511474609375, -0.492584228515625, -0.47369384765625, -0.454803466796875, -0.4359130859375, -0.417022705078125, -0.39813232421875, -0.379241943359375, -0.3603515625, -0.341461181640625, -0.32257080078125, -0.303680419921875, -0.2847900390625, -0.265899658203125, -0.24700927734375, -0.228118896484375, -0.209228515625, -0.190338134765625, -0.17144775390625, -0.152557373046875, -0.1336669921875, -0.114776611328125, -0.09588623046875, -0.076995849609375, -0.05810546875, -0.039215087890625, -0.02032470703125, -0.001434326171875, 0.0174560546875, 0.036346435546875, 0.05523681640625, 0.074127197265625, 0.093017578125, 0.111907958984375, 0.13079833984375, 0.149688720703125, 0.1685791015625, 0.187469482421875, 0.20635986328125, 0.225250244140625, 0.244140625, 0.263031005859375, 0.28192138671875, 0.300811767578125, 0.3197021484375, 0.338592529296875, 0.35748291015625, 0.376373291015625, 0.395263671875, 0.414154052734375, 0.43304443359375, 0.451934814453125, 0.4708251953125, 0.489715576171875, 0.50860595703125, 0.527496337890625, 0.54638671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 3.0, 9.0, 9.0, 16.0, 14.0, 28.0, 46.0, 63.0, 97.0, 142.0, 214.0, 368.0, 598.0, 1038.0, 1815.0, 3314.0, 6361.0, 12478.0, 26918.0, 66094.0, 200443.0, 432530.0, 183270.0, 61578.0, 25568.0, 11928.0, 6111.0, 3294.0, 1658.0, 986.0, 576.0, 383.0, 179.0, 153.0, 90.0, 53.0, 29.0, 26.0, 24.0, 16.0, 12.0, 5.0, 3.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.35135650634765625, -0.3394317626953125, -0.32750701904296875, -0.315582275390625, -0.30365753173828125, -0.2917327880859375, -0.27980804443359375, -0.26788330078125, -0.25595855712890625, -0.2440338134765625, -0.23210906982421875, -0.220184326171875, -0.20825958251953125, -0.1963348388671875, -0.18441009521484375, -0.1724853515625, -0.16056060791015625, -0.1486358642578125, -0.13671112060546875, -0.124786376953125, -0.11286163330078125, -0.1009368896484375, -0.08901214599609375, -0.07708740234375, -0.06516265869140625, -0.0532379150390625, -0.04131317138671875, -0.029388427734375, -0.01746368408203125, -0.0055389404296875, 0.00638580322265625, 0.018310546875, 0.03023529052734375, 0.0421600341796875, 0.05408477783203125, 0.066009521484375, 0.07793426513671875, 0.0898590087890625, 0.10178375244140625, 0.11370849609375, 0.12563323974609375, 0.1375579833984375, 0.14948272705078125, 0.161407470703125, 0.17333221435546875, 0.1852569580078125, 0.19718170166015625, 0.2091064453125, 0.22103118896484375, 0.2329559326171875, 0.24488067626953125, 0.256805419921875, 0.26873016357421875, 0.2806549072265625, 0.29257965087890625, 0.30450439453125, 0.31642913818359375, 0.3283538818359375, 0.34027862548828125, 0.352203369140625, 0.36412811279296875, 0.3760528564453125, 0.38797760009765625, 0.39990234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 4.0, 6.0, 7.0, 5.0, 8.0, 11.0, 9.0, 23.0, 22.0, 29.0, 54.0, 45.0, 76.0, 123.0, 133.0, 129.0, 79.0, 60.0, 42.0, 42.0, 20.0, 14.0, 11.0, 9.0, 6.0, 5.0, 9.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.268522262573242e-05, -8.920673280954361e-05, -8.57282429933548e-05, -8.224975317716599e-05, -7.877126336097717e-05, -7.529277354478836e-05, -7.181428372859955e-05, -6.833579391241074e-05, -6.485730409622192e-05, -6.137881428003311e-05, -5.79003244638443e-05, -5.442183464765549e-05, -5.0943344831466675e-05, -4.746485501527786e-05, -4.398636519908905e-05, -4.050787538290024e-05, -3.7029385566711426e-05, -3.3550895750522614e-05, -3.00724059343338e-05, -2.659391611814499e-05, -2.3115426301956177e-05, -1.9636936485767365e-05, -1.6158446669578552e-05, -1.267995685338974e-05, -9.201467037200928e-06, -5.7229772210121155e-06, -2.2444874048233032e-06, 1.234002411365509e-06, 4.712492227554321e-06, 8.190982043743134e-06, 1.1669471859931946e-05, 1.5147961676120758e-05, 1.862645149230957e-05, 2.2104941308498383e-05, 2.5583431124687195e-05, 2.9061920940876007e-05, 3.254041075706482e-05, 3.601890057325363e-05, 3.9497390389442444e-05, 4.2975880205631256e-05, 4.645437002182007e-05, 4.993285983800888e-05, 5.341134965419769e-05, 5.6889839470386505e-05, 6.036832928657532e-05, 6.384681910276413e-05, 6.732530891895294e-05, 7.080379873514175e-05, 7.428228855133057e-05, 7.776077836751938e-05, 8.123926818370819e-05, 8.4717757999897e-05, 8.819624781608582e-05, 9.167473763227463e-05, 9.515322744846344e-05, 9.863171726465225e-05, 0.00010211020708084106, 0.00010558869689702988, 0.00010906718671321869, 0.0001125456765294075, 0.00011602416634559631, 0.00011950265616178513, 0.00012298114597797394, 0.00012645963579416275, 0.00012993812561035156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 12.0, 7.0, 16.0, 23.0, 40.0, 43.0, 74.0, 105.0, 169.0, 342.0, 543.0, 1113.0, 2483.0, 6639.0, 20407.0, 83903.0, 525256.0, 328151.0, 55480.0, 14707.0, 4891.0, 2010.0, 889.0, 506.0, 255.0, 151.0, 107.0, 65.0, 53.0, 31.0, 23.0, 11.0, 11.0, 9.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57421875, -0.5536117553710938, -0.5330047607421875, -0.5123977661132812, -0.491790771484375, -0.47118377685546875, -0.4505767822265625, -0.42996978759765625, -0.40936279296875, -0.38875579833984375, -0.3681488037109375, -0.34754180908203125, -0.326934814453125, -0.30632781982421875, -0.2857208251953125, -0.26511383056640625, -0.2445068359375, -0.22389984130859375, -0.2032928466796875, -0.18268585205078125, -0.162078857421875, -0.14147186279296875, -0.1208648681640625, -0.10025787353515625, -0.07965087890625, -0.05904388427734375, -0.0384368896484375, -0.01782989501953125, 0.002777099609375, 0.02338409423828125, 0.0439910888671875, 0.06459808349609375, 0.085205078125, 0.10581207275390625, 0.1264190673828125, 0.14702606201171875, 0.167633056640625, 0.18824005126953125, 0.2088470458984375, 0.22945404052734375, 0.25006103515625, 0.27066802978515625, 0.2912750244140625, 0.31188201904296875, 0.332489013671875, 0.35309600830078125, 0.3737030029296875, 0.39430999755859375, 0.4149169921875, 0.43552398681640625, 0.4561309814453125, 0.47673797607421875, 0.497344970703125, 0.5179519653320312, 0.5385589599609375, 0.5591659545898438, 0.57977294921875, 0.6003799438476562, 0.6209869384765625, 0.6415939331054688, 0.662200927734375, 0.6828079223632812, 0.7034149169921875, 0.7240219116210938, 0.74462890625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 9.0, 8.0, 13.0, 27.0, 28.0, 28.0, 29.0, 34.0, 49.0, 78.0, 113.0, 115.0, 104.0, 78.0, 62.0, 47.0, 36.0, 22.0, 21.0, 20.0, 11.0, 15.0, 16.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409912109375, -0.39658355712890625, -0.3832550048828125, -0.36992645263671875, -0.356597900390625, -0.34326934814453125, -0.3299407958984375, -0.31661224365234375, -0.30328369140625, -0.28995513916015625, -0.2766265869140625, -0.26329803466796875, -0.249969482421875, -0.23664093017578125, -0.2233123779296875, -0.20998382568359375, -0.1966552734375, -0.18332672119140625, -0.1699981689453125, -0.15666961669921875, -0.143341064453125, -0.13001251220703125, -0.1166839599609375, -0.10335540771484375, -0.09002685546875, -0.07669830322265625, -0.0633697509765625, -0.05004119873046875, -0.036712646484375, -0.02338409423828125, -0.0100555419921875, 0.00327301025390625, 0.0166015625, 0.02993011474609375, 0.0432586669921875, 0.05658721923828125, 0.069915771484375, 0.08324432373046875, 0.0965728759765625, 0.10990142822265625, 0.12322998046875, 0.13655853271484375, 0.1498870849609375, 0.16321563720703125, 0.176544189453125, 0.18987274169921875, 0.2032012939453125, 0.21652984619140625, 0.2298583984375, 0.24318695068359375, 0.2565155029296875, 0.26984405517578125, 0.283172607421875, 0.29650115966796875, 0.3098297119140625, 0.32315826416015625, 0.33648681640625, 0.34981536865234375, 0.3631439208984375, 0.37647247314453125, 0.389801025390625, 0.40312957763671875, 0.4164581298828125, 0.42978668212890625, 0.443115234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 38.0, 149.0, 456.0, 280.0, 56.0, 21.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.624573230743408, -7.0685577392578125, -6.512542724609375, -5.956527233123779, -5.400511741638184, -4.844496726989746, -4.28848123550415, -3.732465982437134, -3.176450729370117, -2.6204354763031006, -2.064420223236084, -1.5084047317504883, -0.9523894786834717, -0.3963742256164551, 0.15964126586914062, 0.7156565189361572, 1.2716717720031738, 1.8276870250701904, 2.383702278137207, 2.9397177696228027, 3.4957330226898193, 4.051748275756836, 4.607763767242432, 5.163779258728027, 5.719794273376465, 6.2758097648620605, 6.831824779510498, 7.387840270996094, 7.943855285644531, 8.499870300292969, 9.055886268615723, 9.61190128326416, 10.167917251586914, 10.723932266235352, 11.279948234558105, 11.835963249206543, 12.39197826385498, 12.947994232177734, 13.504009246826172, 14.06002426147461, 14.616039276123047, 15.172054290771484, 15.728070259094238, 16.28408432006836, 16.84010124206543, 17.396116256713867, 17.952131271362305, 18.508146286010742, 19.064163208007812, 19.62017822265625, 20.176193237304688, 20.732208251953125, 21.288225173950195, 21.844240188598633, 22.40025520324707, 22.956270217895508, 23.512285232543945, 24.068300247192383, 24.62431526184082, 25.18033218383789, 25.736347198486328, 26.292362213134766, 26.848377227783203, 27.40439224243164, 27.960407257080078]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 1.0, 3.0, 5.0, 5.0, 12.0, 16.0, 13.0, 13.0, 18.0, 17.0, 17.0, 19.0, 29.0, 38.0, 29.0, 55.0, 44.0, 43.0, 56.0, 42.0, 40.0, 48.0, 56.0, 40.0, 24.0, 35.0, 19.0, 38.0, 19.0, 34.0, 19.0, 16.0, 24.0, 26.0, 5.0, 15.0, 9.0, 10.0, 8.0, 7.0, 11.0, 5.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.583444833755493, -3.4666872024536133, -3.3499298095703125, -3.2331724166870117, -3.116414785385132, -2.999657154083252, -2.882899761199951, -2.7661423683166504, -2.6493847370147705, -2.5326271057128906, -2.41586971282959, -2.299112319946289, -2.182354688644409, -2.0655970573425293, -1.9488396644592285, -1.8320821523666382, -1.7153246402740479, -1.5985671281814575, -1.4818096160888672, -1.3650521039962769, -1.2482945919036865, -1.1315370798110962, -1.0147795677185059, -0.8980220556259155, -0.7812645435333252, -0.6645070314407349, -0.5477495193481445, -0.4309920072555542, -0.31423449516296387, -0.19747698307037354, -0.0807194709777832, 0.03603804111480713, 0.15279555320739746, 0.2695530652999878, 0.3863105773925781, 0.5030680894851685, 0.6198256015777588, 0.7365831136703491, 0.8533406257629395, 0.9700981378555298, 1.0868556499481201, 1.2036131620407104, 1.3203706741333008, 1.4371281862258911, 1.5538856983184814, 1.6706432104110718, 1.787400722503662, 1.9041582345962524, 2.0209157466888428, 2.1376733779907227, 2.2544307708740234, 2.371188163757324, 2.487945795059204, 2.604703426361084, 2.7214608192443848, 2.8382182121276855, 2.9549758434295654, 3.0717334747314453, 3.188490867614746, 3.305248260498047, 3.4220058917999268, 3.5387635231018066, 3.6555209159851074, 3.772278308868408, 3.889035940170288]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 7.0, 9.0, 13.0, 10.0, 20.0, 29.0, 38.0, 38.0, 57.0, 90.0, 135.0, 210.0, 360.0, 616.0, 1186.0, 2436.0, 5312.0, 15073.0, 67936.0, 3413831.0, 621218.0, 44931.0, 11600.0, 4525.0, 2017.0, 1061.0, 610.0, 315.0, 187.0, 113.0, 72.0, 57.0, 38.0, 36.0, 21.0, 17.0, 14.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.2341537475585938, -1.1987762451171875, -1.1633987426757812, -1.128021240234375, -1.0926437377929688, -1.0572662353515625, -1.0218887329101562, -0.98651123046875, -0.9511337280273438, -0.9157562255859375, -0.8803787231445312, -0.845001220703125, -0.8096237182617188, -0.7742462158203125, -0.7388687133789062, -0.7034912109375, -0.6681137084960938, -0.6327362060546875, -0.5973587036132812, -0.561981201171875, -0.5266036987304688, -0.4912261962890625, -0.45584869384765625, -0.42047119140625, -0.38509368896484375, -0.3497161865234375, -0.31433868408203125, -0.278961181640625, -0.24358367919921875, -0.2082061767578125, -0.17282867431640625, -0.137451171875, -0.10207366943359375, -0.0666961669921875, -0.03131866455078125, 0.004058837890625, 0.03943634033203125, 0.0748138427734375, 0.11019134521484375, 0.14556884765625, 0.18094635009765625, 0.2163238525390625, 0.25170135498046875, 0.287078857421875, 0.32245635986328125, 0.3578338623046875, 0.39321136474609375, 0.4285888671875, 0.46396636962890625, 0.4993438720703125, 0.5347213745117188, 0.570098876953125, 0.6054763793945312, 0.6408538818359375, 0.6762313842773438, 0.71160888671875, 0.7469863891601562, 0.7823638916015625, 0.8177413940429688, 0.853118896484375, 0.8884963989257812, 0.9238739013671875, 0.9592514038085938, 0.99462890625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 9.0, 6.0, 7.0, 10.0, 16.0, 15.0, 41.0, 55.0, 69.0, 81.0, 74.0, 81.0, 87.0, 76.0, 91.0, 62.0, 66.0, 33.0, 27.0, 25.0, 18.0, 24.0, 5.0, 8.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.215087890625, -0.20949363708496094, -0.20389938354492188, -0.1983051300048828, -0.19271087646484375, -0.1871166229248047, -0.18152236938476562, -0.17592811584472656, -0.1703338623046875, -0.16473960876464844, -0.15914535522460938, -0.1535511016845703, -0.14795684814453125, -0.1423625946044922, -0.13676834106445312, -0.13117408752441406, -0.125579833984375, -0.11998558044433594, -0.11439132690429688, -0.10879707336425781, -0.10320281982421875, -0.09760856628417969, -0.09201431274414062, -0.08642005920410156, -0.0808258056640625, -0.07523155212402344, -0.06963729858398438, -0.06404304504394531, -0.05844879150390625, -0.05285453796386719, -0.047260284423828125, -0.04166603088378906, -0.03607177734375, -0.030477523803710938, -0.024883270263671875, -0.019289016723632812, -0.01369476318359375, -0.008100509643554688, -0.002506256103515625, 0.0030879974365234375, 0.0086822509765625, 0.014276504516601562, 0.019870758056640625, 0.025465011596679688, 0.03105926513671875, 0.03665351867675781, 0.042247772216796875, 0.04784202575683594, 0.053436279296875, 0.05903053283691406, 0.06462478637695312, 0.07021903991699219, 0.07581329345703125, 0.08140754699707031, 0.08700180053710938, 0.09259605407714844, 0.0981903076171875, 0.10378456115722656, 0.10937881469726562, 0.11497306823730469, 0.12056732177734375, 0.1261615753173828, 0.13175582885742188, 0.13735008239746094, 0.1429443359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 7.0, 5.0, 7.0, 17.0, 32.0, 39.0, 49.0, 78.0, 157.0, 216.0, 364.0, 689.0, 1367.0, 3520.0, 12802.0, 84750.0, 3712540.0, 341002.0, 26364.0, 5973.0, 2076.0, 930.0, 527.0, 274.0, 187.0, 118.0, 74.0, 40.0, 23.0, 17.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4580078125, -1.410552978515625, -1.36309814453125, -1.315643310546875, -1.2681884765625, -1.220733642578125, -1.17327880859375, -1.125823974609375, -1.078369140625, -1.030914306640625, -0.98345947265625, -0.936004638671875, -0.8885498046875, -0.841094970703125, -0.79364013671875, -0.746185302734375, -0.69873046875, -0.651275634765625, -0.60382080078125, -0.556365966796875, -0.5089111328125, -0.461456298828125, -0.41400146484375, -0.366546630859375, -0.319091796875, -0.271636962890625, -0.22418212890625, -0.176727294921875, -0.1292724609375, -0.081817626953125, -0.03436279296875, 0.013092041015625, 0.060546875, 0.108001708984375, 0.15545654296875, 0.202911376953125, 0.2503662109375, 0.297821044921875, 0.34527587890625, 0.392730712890625, 0.440185546875, 0.487640380859375, 0.53509521484375, 0.582550048828125, 0.6300048828125, 0.677459716796875, 0.72491455078125, 0.772369384765625, 0.81982421875, 0.867279052734375, 0.91473388671875, 0.962188720703125, 1.0096435546875, 1.057098388671875, 1.10455322265625, 1.152008056640625, 1.199462890625, 1.246917724609375, 1.29437255859375, 1.341827392578125, 1.3892822265625, 1.436737060546875, 1.48419189453125, 1.531646728515625, 1.5791015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 7.0, 13.0, 25.0, 25.0, 57.0, 99.0, 222.0, 886.0, 2000.0, 364.0, 151.0, 74.0, 47.0, 28.0, 16.0, 10.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.439697265625, -0.42787933349609375, -0.4160614013671875, -0.40424346923828125, -0.392425537109375, -0.38060760498046875, -0.3687896728515625, -0.35697174072265625, -0.34515380859375, -0.33333587646484375, -0.3215179443359375, -0.30970001220703125, -0.297882080078125, -0.28606414794921875, -0.2742462158203125, -0.26242828369140625, -0.2506103515625, -0.23879241943359375, -0.2269744873046875, -0.21515655517578125, -0.203338623046875, -0.19152069091796875, -0.1797027587890625, -0.16788482666015625, -0.15606689453125, -0.14424896240234375, -0.1324310302734375, -0.12061309814453125, -0.108795166015625, -0.09697723388671875, -0.0851593017578125, -0.07334136962890625, -0.0615234375, -0.04970550537109375, -0.0378875732421875, -0.02606964111328125, -0.014251708984375, -0.00243377685546875, 0.0093841552734375, 0.02120208740234375, 0.03302001953125, 0.04483795166015625, 0.0566558837890625, 0.06847381591796875, 0.080291748046875, 0.09210968017578125, 0.1039276123046875, 0.11574554443359375, 0.1275634765625, 0.13938140869140625, 0.1511993408203125, 0.16301727294921875, 0.174835205078125, 0.18665313720703125, 0.1984710693359375, 0.21028900146484375, 0.22210693359375, 0.23392486572265625, 0.2457427978515625, 0.25756072998046875, 0.269378662109375, 0.28119659423828125, 0.2930145263671875, 0.30483245849609375, 0.316650390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 14.0, 51.0, 122.0, 201.0, 289.0, 179.0, 76.0, 40.0, 14.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1438109874725342, -1.0422513484954834, -0.9406917095184326, -0.8391321301460266, -0.7375724911689758, -0.636012852191925, -0.534453272819519, -0.43289363384246826, -0.3313339948654175, -0.2297743707895279, -0.1282147467136383, -0.026655137538909912, 0.07490450143814087, 0.17646414041519165, 0.27802371978759766, 0.37958335876464844, 0.4811429977416992, 0.58270263671875, 0.6842622756958008, 0.7858218550682068, 0.8873814940452576, 0.9889411330223083, 1.0905007123947144, 1.1920603513717651, 1.293619990348816, 1.3951796293258667, 1.4967392683029175, 1.5982987880706787, 1.6998584270477295, 1.8014180660247803, 1.902977705001831, 2.004537343978882, 2.1060967445373535, 2.2076563835144043, 2.309216022491455, 2.410775661468506, 2.5123353004455566, 2.6138949394226074, 2.715454578399658, 2.817014217376709, 2.9185738563537598, 3.0201334953308105, 3.1216931343078613, 3.223252773284912, 3.324812412261963, 3.4263720512390137, 3.5279316902160645, 3.6294913291931152, 3.731050729751587, 3.8326103687286377, 3.9341700077056885, 4.03572940826416, 4.137289047241211, 4.238848686218262, 4.3404083251953125, 4.441967964172363, 4.543527603149414, 4.645087242126465, 4.746646881103516, 4.848206520080566, 4.949766159057617, 5.051325798034668, 5.152885437011719, 5.2544450759887695, 5.35600471496582]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 4.0, 11.0, 17.0, 16.0, 17.0, 11.0, 21.0, 32.0, 19.0, 33.0, 36.0, 26.0, 38.0, 34.0, 40.0, 60.0, 49.0, 61.0, 39.0, 41.0, 36.0, 44.0, 39.0, 45.0, 37.0, 38.0, 15.0, 26.0, 13.0, 16.0, 14.0, 13.0, 11.0, 12.0, 4.0, 11.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.207890272140503, -1.174928069114685, -1.1419657468795776, -1.1090035438537598, -1.0760412216186523, -1.0430790185928345, -1.010116696357727, -0.9771544933319092, -0.9441922307014465, -0.9112299680709839, -0.8782677054405212, -0.8453054428100586, -0.8123432397842407, -0.7793809175491333, -0.7464187145233154, -0.7134564518928528, -0.6804941892623901, -0.6475319266319275, -0.6145696640014648, -0.5816074013710022, -0.5486451387405396, -0.5156829357147217, -0.48272067308425903, -0.4497584104537964, -0.41679614782333374, -0.3838338851928711, -0.35087162256240845, -0.3179093897342682, -0.28494712710380554, -0.2519848644733429, -0.21902261674404144, -0.18606036901474, -0.15309804677963257, -0.12013579159975052, -0.08717353641986847, -0.05421128123998642, -0.02124902606010437, 0.011713236570358276, 0.04467548429965973, 0.07763773202896118, 0.11059999465942383, 0.14356225728988647, 0.17652450501918793, 0.20948675274848938, 0.24244901537895203, 0.2754112780094147, 0.30837351083755493, 0.3413357734680176, 0.3742980360984802, 0.40726029872894287, 0.4402225613594055, 0.4731847941875458, 0.506147027015686, 0.5391093492507935, 0.5720715522766113, 0.605033814907074, 0.6379960775375366, 0.6709583401679993, 0.7039206027984619, 0.7368828654289246, 0.7698451280593872, 0.8028073310852051, 0.8357695937156677, 0.8687318563461304, 0.901694118976593]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 16.0, 14.0, 20.0, 24.0, 43.0, 50.0, 68.0, 97.0, 163.0, 235.0, 467.0, 821.0, 1355.0, 2641.0, 5365.0, 12731.0, 34358.0, 105190.0, 342801.0, 365230.0, 114426.0, 36741.0, 13587.0, 5868.0, 2690.0, 1388.0, 825.0, 473.0, 295.0, 177.0, 123.0, 70.0, 58.0, 35.0, 31.0, 19.0, 13.0, 11.0, 14.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.637939453125, -0.61669921875, -0.595458984375, -0.57421875, -0.552978515625, -0.53173828125, -0.510498046875, -0.4892578125, -0.468017578125, -0.44677734375, -0.425537109375, -0.404296875, -0.383056640625, -0.36181640625, -0.340576171875, -0.3193359375, -0.298095703125, -0.27685546875, -0.255615234375, -0.234375, -0.213134765625, -0.19189453125, -0.170654296875, -0.1494140625, -0.128173828125, -0.10693359375, -0.085693359375, -0.064453125, -0.043212890625, -0.02197265625, -0.000732421875, 0.0205078125, 0.041748046875, 0.06298828125, 0.084228515625, 0.10546875, 0.126708984375, 0.14794921875, 0.169189453125, 0.1904296875, 0.211669921875, 0.23291015625, 0.254150390625, 0.275390625, 0.296630859375, 0.31787109375, 0.339111328125, 0.3603515625, 0.381591796875, 0.40283203125, 0.424072265625, 0.4453125, 0.466552734375, 0.48779296875, 0.509033203125, 0.5302734375, 0.551513671875, 0.57275390625, 0.593994140625, 0.615234375, 0.636474609375, 0.65771484375, 0.678955078125, 0.7001953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 5.0, 18.0, 17.0, 42.0, 46.0, 51.0, 52.0, 74.0, 63.0, 98.0, 87.0, 69.0, 77.0, 75.0, 44.0, 51.0, 28.0, 26.0, 13.0, 13.0, 13.0, 5.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23095703125, -0.22507095336914062, -0.21918487548828125, -0.21329879760742188, -0.2074127197265625, -0.20152664184570312, -0.19564056396484375, -0.18975448608398438, -0.183868408203125, -0.17798233032226562, -0.17209625244140625, -0.16621017456054688, -0.1603240966796875, -0.15443801879882812, -0.14855194091796875, -0.14266586303710938, -0.13677978515625, -0.13089370727539062, -0.12500762939453125, -0.11912155151367188, -0.1132354736328125, -0.10734939575195312, -0.10146331787109375, -0.09557723999023438, -0.089691162109375, -0.08380508422851562, -0.07791900634765625, -0.07203292846679688, -0.0661468505859375, -0.060260772705078125, -0.05437469482421875, -0.048488616943359375, -0.0426025390625, -0.036716461181640625, -0.03083038330078125, -0.024944305419921875, -0.0190582275390625, -0.013172149658203125, -0.00728607177734375, -0.001399993896484375, 0.004486083984375, 0.010372161865234375, 0.01625823974609375, 0.022144317626953125, 0.0280303955078125, 0.033916473388671875, 0.03980255126953125, 0.045688629150390625, 0.05157470703125, 0.057460784912109375, 0.06334686279296875, 0.06923294067382812, 0.0751190185546875, 0.08100509643554688, 0.08689117431640625, 0.09277725219726562, 0.098663330078125, 0.10454940795898438, 0.11043548583984375, 0.11632156372070312, 0.1222076416015625, 0.12809371948242188, 0.13397979736328125, 0.13986587524414062, 0.145751953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 10.0, 17.0, 25.0, 18.0, 36.0, 39.0, 69.0, 91.0, 106.0, 150.0, 254.0, 379.0, 563.0, 987.0, 1699.0, 3181.0, 6688.0, 15311.0, 42116.0, 139596.0, 404543.0, 294302.0, 87820.0, 28218.0, 11078.0, 4952.0, 2527.0, 1386.0, 816.0, 480.0, 323.0, 215.0, 148.0, 102.0, 77.0, 54.0, 42.0, 31.0, 23.0, 16.0, 16.0, 12.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.689453125, -0.6684417724609375, -0.647430419921875, -0.6264190673828125, -0.60540771484375, -0.5843963623046875, -0.563385009765625, -0.5423736572265625, -0.5213623046875, -0.5003509521484375, -0.479339599609375, -0.4583282470703125, -0.43731689453125, -0.4163055419921875, -0.395294189453125, -0.3742828369140625, -0.353271484375, -0.3322601318359375, -0.311248779296875, -0.2902374267578125, -0.26922607421875, -0.2482147216796875, -0.227203369140625, -0.2061920166015625, -0.1851806640625, -0.1641693115234375, -0.143157958984375, -0.1221466064453125, -0.10113525390625, -0.0801239013671875, -0.059112548828125, -0.0381011962890625, -0.01708984375, 0.0039215087890625, 0.024932861328125, 0.0459442138671875, 0.06695556640625, 0.0879669189453125, 0.108978271484375, 0.1299896240234375, 0.1510009765625, 0.1720123291015625, 0.193023681640625, 0.2140350341796875, 0.23504638671875, 0.2560577392578125, 0.277069091796875, 0.2980804443359375, 0.319091796875, 0.3401031494140625, 0.361114501953125, 0.3821258544921875, 0.40313720703125, 0.4241485595703125, 0.445159912109375, 0.4661712646484375, 0.4871826171875, 0.5081939697265625, 0.529205322265625, 0.5502166748046875, 0.57122802734375, 0.5922393798828125, 0.613250732421875, 0.6342620849609375, 0.6552734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 7.0, 7.0, 12.0, 13.0, 21.0, 11.0, 27.0, 24.0, 31.0, 37.0, 34.0, 44.0, 59.0, 39.0, 61.0, 49.0, 59.0, 52.0, 57.0, 55.0, 45.0, 34.0, 41.0, 41.0, 29.0, 21.0, 19.0, 10.0, 12.0, 14.0, 7.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6552581787109375, -0.631805419921875, -0.6083526611328125, -0.58489990234375, -0.5614471435546875, -0.537994384765625, -0.5145416259765625, -0.4910888671875, -0.4676361083984375, -0.444183349609375, -0.4207305908203125, -0.39727783203125, -0.3738250732421875, -0.350372314453125, -0.3269195556640625, -0.303466796875, -0.2800140380859375, -0.256561279296875, -0.2331085205078125, -0.20965576171875, -0.1862030029296875, -0.162750244140625, -0.1392974853515625, -0.1158447265625, -0.0923919677734375, -0.068939208984375, -0.0454864501953125, -0.02203369140625, 0.0014190673828125, 0.024871826171875, 0.0483245849609375, 0.07177734375, 0.0952301025390625, 0.118682861328125, 0.1421356201171875, 0.16558837890625, 0.1890411376953125, 0.212493896484375, 0.2359466552734375, 0.2593994140625, 0.2828521728515625, 0.306304931640625, 0.3297576904296875, 0.35321044921875, 0.3766632080078125, 0.400115966796875, 0.4235687255859375, 0.447021484375, 0.4704742431640625, 0.493927001953125, 0.5173797607421875, 0.54083251953125, 0.5642852783203125, 0.587738037109375, 0.6111907958984375, 0.6346435546875, 0.6580963134765625, 0.681549072265625, 0.7050018310546875, 0.72845458984375, 0.7519073486328125, 0.775360107421875, 0.7988128662109375, 0.822265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 5.0, 7.0, 11.0, 22.0, 26.0, 49.0, 71.0, 105.0, 182.0, 272.0, 494.0, 794.0, 1529.0, 2857.0, 5908.0, 13557.0, 36028.0, 117621.0, 461782.0, 291979.0, 71850.0, 24046.0, 9744.0, 4512.0, 2190.0, 1219.0, 651.0, 405.0, 232.0, 138.0, 85.0, 53.0, 40.0, 29.0, 24.0, 11.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.448974609375, -0.4364356994628906, -0.42389678955078125, -0.4113578796386719, -0.3988189697265625, -0.3862800598144531, -0.37374114990234375, -0.3612022399902344, -0.348663330078125, -0.3361244201660156, -0.32358551025390625, -0.3110466003417969, -0.2985076904296875, -0.2859687805175781, -0.27342987060546875, -0.2608909606933594, -0.24835205078125, -0.23581314086914062, -0.22327423095703125, -0.21073532104492188, -0.1981964111328125, -0.18565750122070312, -0.17311859130859375, -0.16057968139648438, -0.148040771484375, -0.13550186157226562, -0.12296295166015625, -0.11042404174804688, -0.0978851318359375, -0.08534622192382812, -0.07280731201171875, -0.060268402099609375, -0.0477294921875, -0.035190582275390625, -0.02265167236328125, -0.010112762451171875, 0.0024261474609375, 0.014965057373046875, 0.02750396728515625, 0.040042877197265625, 0.052581787109375, 0.06512069702148438, 0.07765960693359375, 0.09019851684570312, 0.1027374267578125, 0.11527633666992188, 0.12781524658203125, 0.14035415649414062, 0.15289306640625, 0.16543197631835938, 0.17797088623046875, 0.19050979614257812, 0.2030487060546875, 0.21558761596679688, 0.22812652587890625, 0.24066543579101562, 0.253204345703125, 0.2657432556152344, 0.27828216552734375, 0.2908210754394531, 0.3033599853515625, 0.3158988952636719, 0.32843780517578125, 0.3409767150878906, 0.353515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 10.0, 3.0, 3.0, 9.0, 9.0, 11.0, 12.0, 22.0, 26.0, 39.0, 45.0, 37.0, 64.0, 119.0, 135.0, 112.0, 76.0, 62.0, 42.0, 42.0, 29.0, 18.0, 21.0, 14.0, 12.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010460615158081055, -0.00010137539356946945, -9.814463555812836e-05, -9.491387754678726e-05, -9.168311953544617e-05, -8.845236152410507e-05, -8.522160351276398e-05, -8.199084550142288e-05, -7.876008749008179e-05, -7.552932947874069e-05, -7.22985714673996e-05, -6.90678134560585e-05, -6.583705544471741e-05, -6.260629743337631e-05, -5.937553942203522e-05, -5.614478141069412e-05, -5.291402339935303e-05, -4.968326538801193e-05, -4.645250737667084e-05, -4.322174936532974e-05, -3.999099135398865e-05, -3.676023334264755e-05, -3.352947533130646e-05, -3.0298717319965363e-05, -2.7067959308624268e-05, -2.3837201297283173e-05, -2.0606443285942078e-05, -1.7375685274600983e-05, -1.4144927263259888e-05, -1.0914169251918793e-05, -7.683411240577698e-06, -4.452653229236603e-06, -1.2218952178955078e-06, 2.008862793445587e-06, 5.239620804786682e-06, 8.470378816127777e-06, 1.1701136827468872e-05, 1.4931894838809967e-05, 1.8162652850151062e-05, 2.1393410861492157e-05, 2.4624168872833252e-05, 2.7854926884174347e-05, 3.108568489551544e-05, 3.431644290685654e-05, 3.754720091819763e-05, 4.077795892953873e-05, 4.400871694087982e-05, 4.723947495222092e-05, 5.047023296356201e-05, 5.370099097490311e-05, 5.69317489862442e-05, 6.01625069975853e-05, 6.339326500892639e-05, 6.662402302026749e-05, 6.985478103160858e-05, 7.308553904294968e-05, 7.631629705429077e-05, 7.954705506563187e-05, 8.277781307697296e-05, 8.600857108831406e-05, 8.923932909965515e-05, 9.247008711099625e-05, 9.570084512233734e-05, 9.893160313367844e-05, 0.00010216236114501953]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 10.0, 11.0, 14.0, 32.0, 29.0, 37.0, 44.0, 88.0, 112.0, 205.0, 290.0, 507.0, 823.0, 1537.0, 2831.0, 5810.0, 13788.0, 37416.0, 131352.0, 510647.0, 246104.0, 59736.0, 20336.0, 8300.0, 3777.0, 1959.0, 1109.0, 606.0, 344.0, 235.0, 129.0, 118.0, 57.0, 38.0, 31.0, 28.0, 25.0, 9.0, 7.0, 8.0, 5.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.446044921875, -0.4335517883300781, -0.42105865478515625, -0.4085655212402344, -0.3960723876953125, -0.3835792541503906, -0.37108612060546875, -0.3585929870605469, -0.346099853515625, -0.3336067199707031, -0.32111358642578125, -0.3086204528808594, -0.2961273193359375, -0.2836341857910156, -0.27114105224609375, -0.2586479187011719, -0.24615478515625, -0.23366165161132812, -0.22116851806640625, -0.20867538452148438, -0.1961822509765625, -0.18368911743164062, -0.17119598388671875, -0.15870285034179688, -0.146209716796875, -0.13371658325195312, -0.12122344970703125, -0.10873031616210938, -0.0962371826171875, -0.08374404907226562, -0.07125091552734375, -0.058757781982421875, -0.0462646484375, -0.033771514892578125, -0.02127838134765625, -0.008785247802734375, 0.0037078857421875, 0.016201019287109375, 0.02869415283203125, 0.041187286376953125, 0.053680419921875, 0.06617355346679688, 0.07866668701171875, 0.09115982055664062, 0.1036529541015625, 0.11614608764648438, 0.12863922119140625, 0.14113235473632812, 0.15362548828125, 0.16611862182617188, 0.17861175537109375, 0.19110488891601562, 0.2035980224609375, 0.21609115600585938, 0.22858428955078125, 0.24107742309570312, 0.253570556640625, 0.2660636901855469, 0.27855682373046875, 0.2910499572753906, 0.3035430908203125, 0.3160362243652344, 0.32852935791015625, 0.3410224914550781, 0.353515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 8.0, 8.0, 8.0, 10.0, 21.0, 19.0, 35.0, 25.0, 26.0, 60.0, 71.0, 64.0, 81.0, 81.0, 98.0, 73.0, 61.0, 44.0, 39.0, 32.0, 28.0, 9.0, 21.0, 10.0, 17.0, 11.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.3227424621582031, -0.31247711181640625, -0.3022117614746094, -0.2919464111328125, -0.2816810607910156, -0.27141571044921875, -0.2611503601074219, -0.250885009765625, -0.24061965942382812, -0.23035430908203125, -0.22008895874023438, -0.2098236083984375, -0.19955825805664062, -0.18929290771484375, -0.17902755737304688, -0.16876220703125, -0.15849685668945312, -0.14823150634765625, -0.13796615600585938, -0.1277008056640625, -0.11743545532226562, -0.10717010498046875, -0.09690475463867188, -0.086639404296875, -0.07637405395507812, -0.06610870361328125, -0.055843353271484375, -0.0455780029296875, -0.035312652587890625, -0.02504730224609375, -0.014781951904296875, -0.0045166015625, 0.005748748779296875, 0.01601409912109375, 0.026279449462890625, 0.0365447998046875, 0.046810150146484375, 0.05707550048828125, 0.06734085083007812, 0.077606201171875, 0.08787155151367188, 0.09813690185546875, 0.10840225219726562, 0.1186676025390625, 0.12893295288085938, 0.13919830322265625, 0.14946365356445312, 0.15972900390625, 0.16999435424804688, 0.18025970458984375, 0.19052505493164062, 0.2007904052734375, 0.21105575561523438, 0.22132110595703125, 0.23158645629882812, 0.241851806640625, 0.2521171569824219, 0.26238250732421875, 0.2726478576660156, 0.2829132080078125, 0.2931785583496094, 0.30344390869140625, 0.3137092590332031, 0.323974609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 14.0, 38.0, 61.0, 133.0, 227.0, 238.0, 155.0, 67.0, 33.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.835903644561768, -4.568309307098389, -4.30071496963501, -4.033120632171631, -3.765526294708252, -3.497931957244873, -3.230337381362915, -2.962743043899536, -2.6951487064361572, -2.4275543689727783, -2.1599600315093994, -1.892365574836731, -1.624771237373352, -1.3571768999099731, -1.0895824432373047, -0.8219881057739258, -0.5543937683105469, -0.2867994010448456, -0.019205033779144287, 0.2483893632888794, 0.5159837007522583, 0.7835780382156372, 1.0511724948883057, 1.3187668323516846, 1.5863611698150635, 1.8539555072784424, 2.1215498447418213, 2.3891444206237793, 2.656738758087158, 2.924333095550537, 3.191927433013916, 3.459521770477295, 3.727116584777832, 3.994710922241211, 4.26230525970459, 4.529899597167969, 4.797493934631348, 5.065088272094727, 5.3326826095581055, 5.600276947021484, 5.867871284484863, 6.135465621948242, 6.403059959411621, 6.670654296875, 6.938248634338379, 7.205842971801758, 7.473437309265137, 7.741031646728516, 8.008626937866211, 8.27622127532959, 8.543815612792969, 8.811409950256348, 9.079004287719727, 9.346598625183105, 9.614192962646484, 9.881787300109863, 10.149381637573242, 10.416975975036621, 10.6845703125, 10.952164649963379, 11.219758987426758, 11.487353324890137, 11.754947662353516, 12.022541999816895, 12.290136337280273]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 4.0, 4.0, 3.0, 7.0, 10.0, 17.0, 17.0, 13.0, 17.0, 18.0, 20.0, 25.0, 22.0, 25.0, 31.0, 37.0, 33.0, 34.0, 25.0, 37.0, 46.0, 54.0, 38.0, 36.0, 37.0, 42.0, 25.0, 40.0, 42.0, 27.0, 24.0, 17.0, 33.0, 24.0, 20.0, 22.0, 12.0, 7.0, 11.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.295414924621582, -3.195422410964966, -3.0954298973083496, -2.9954371452331543, -2.895444631576538, -2.795452117919922, -2.6954596042633057, -2.5954670906066895, -2.4954745769500732, -2.395482063293457, -2.295489549636841, -2.1954970359802246, -2.0955042839050293, -1.995511770248413, -1.8955192565917969, -1.7955267429351807, -1.695534110069275, -1.5955415964126587, -1.495548963546753, -1.3955564498901367, -1.2955639362335205, -1.1955714225769043, -1.0955787897109985, -0.9955862760543823, -0.8955937027931213, -0.7956011295318604, -0.6956086158752441, -0.5956160426139832, -0.49562349915504456, -0.39563095569610596, -0.29563838243484497, -0.19564586877822876, -0.09565329551696777, 0.004339255392551422, 0.10433180630207062, 0.2043243646621704, 0.304316908121109, 0.4043094515800476, 0.5043020248413086, 0.6042945384979248, 0.7042871117591858, 0.8042796850204468, 0.904272198677063, 1.0042648315429688, 1.104257345199585, 1.2042498588562012, 1.3042423725128174, 1.4042348861694336, 1.5042275190353394, 1.6042200326919556, 1.7042126655578613, 1.8042051792144775, 1.9041976928710938, 2.00419020652771, 2.104182720184326, 2.2041754722595215, 2.3041679859161377, 2.404160499572754, 2.50415301322937, 2.6041455268859863, 2.7041382789611816, 2.804130792617798, 2.904123306274414, 3.0041158199310303, 3.1041083335876465]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 13.0, 15.0, 15.0, 28.0, 47.0, 76.0, 108.0, 158.0, 254.0, 478.0, 762.0, 1510.0, 3206.0, 7652.0, 22640.0, 105835.0, 3653736.0, 334423.0, 41630.0, 12270.0, 4719.0, 2055.0, 1030.0, 616.0, 332.0, 231.0, 123.0, 77.0, 70.0, 51.0, 32.0, 18.0, 17.0, 12.0, 5.0, 4.0, 1.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87158203125, -0.8412399291992188, -0.8108978271484375, -0.7805557250976562, -0.750213623046875, -0.7198715209960938, -0.6895294189453125, -0.6591873168945312, -0.62884521484375, -0.5985031127929688, -0.5681610107421875, -0.5378189086914062, -0.507476806640625, -0.47713470458984375, -0.4467926025390625, -0.41645050048828125, -0.3861083984375, -0.35576629638671875, -0.3254241943359375, -0.29508209228515625, -0.264739990234375, -0.23439788818359375, -0.2040557861328125, -0.17371368408203125, -0.14337158203125, -0.11302947998046875, -0.0826873779296875, -0.05234527587890625, -0.022003173828125, 0.00833892822265625, 0.0386810302734375, 0.06902313232421875, 0.099365234375, 0.12970733642578125, 0.1600494384765625, 0.19039154052734375, 0.220733642578125, 0.25107574462890625, 0.2814178466796875, 0.31175994873046875, 0.34210205078125, 0.37244415283203125, 0.4027862548828125, 0.43312835693359375, 0.463470458984375, 0.49381256103515625, 0.5241546630859375, 0.5544967651367188, 0.5848388671875, 0.6151809692382812, 0.6455230712890625, 0.6758651733398438, 0.706207275390625, 0.7365493774414062, 0.7668914794921875, 0.7972335815429688, 0.82757568359375, 0.8579177856445312, 0.8882598876953125, 0.9186019897460938, 0.948944091796875, 0.9792861938476562, 1.0096282958984375, 1.0399703979492188, 1.0703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 6.0, 12.0, 21.0, 22.0, 28.0, 40.0, 52.0, 42.0, 60.0, 72.0, 88.0, 76.0, 76.0, 74.0, 57.0, 58.0, 41.0, 53.0, 27.0, 27.0, 17.0, 14.0, 9.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2291259765625, -0.22335243225097656, -0.21757888793945312, -0.2118053436279297, -0.20603179931640625, -0.2002582550048828, -0.19448471069335938, -0.18871116638183594, -0.1829376220703125, -0.17716407775878906, -0.17139053344726562, -0.1656169891357422, -0.15984344482421875, -0.1540699005126953, -0.14829635620117188, -0.14252281188964844, -0.136749267578125, -0.13097572326660156, -0.12520217895507812, -0.11942863464355469, -0.11365509033203125, -0.10788154602050781, -0.10210800170898438, -0.09633445739746094, -0.0905609130859375, -0.08478736877441406, -0.07901382446289062, -0.07324028015136719, -0.06746673583984375, -0.06169319152832031, -0.055919647216796875, -0.05014610290527344, -0.04437255859375, -0.03859901428222656, -0.032825469970703125, -0.027051925659179688, -0.02127838134765625, -0.015504837036132812, -0.009731292724609375, -0.0039577484130859375, 0.0018157958984375, 0.0075893402099609375, 0.013362884521484375, 0.019136428833007812, 0.02490997314453125, 0.030683517456054688, 0.036457061767578125, 0.04223060607910156, 0.048004150390625, 0.05377769470214844, 0.059551239013671875, 0.06532478332519531, 0.07109832763671875, 0.07687187194824219, 0.08264541625976562, 0.08841896057128906, 0.0941925048828125, 0.09996604919433594, 0.10573959350585938, 0.11151313781738281, 0.11728668212890625, 0.12306022644042969, 0.12883377075195312, 0.13460731506347656, 0.140380859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 10.0, 11.0, 12.0, 18.0, 30.0, 33.0, 47.0, 43.0, 72.0, 148.0, 391.0, 2298.0, 65039.0, 4108024.0, 16341.0, 1217.0, 282.0, 90.0, 46.0, 26.0, 28.0, 23.0, 16.0, 18.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.83197021484375, -4.6912841796875, -4.55059814453125, -4.409912109375, -4.26922607421875, -4.1285400390625, -3.98785400390625, -3.84716796875, -3.70648193359375, -3.5657958984375, -3.42510986328125, -3.284423828125, -3.14373779296875, -3.0030517578125, -2.86236572265625, -2.7216796875, -2.58099365234375, -2.4403076171875, -2.29962158203125, -2.158935546875, -2.01824951171875, -1.8775634765625, -1.73687744140625, -1.59619140625, -1.45550537109375, -1.3148193359375, -1.17413330078125, -1.033447265625, -0.89276123046875, -0.7520751953125, -0.61138916015625, -0.470703125, -0.33001708984375, -0.1893310546875, -0.04864501953125, 0.092041015625, 0.23272705078125, 0.3734130859375, 0.51409912109375, 0.65478515625, 0.79547119140625, 0.9361572265625, 1.07684326171875, 1.217529296875, 1.35821533203125, 1.4989013671875, 1.63958740234375, 1.7802734375, 1.92095947265625, 2.0616455078125, 2.20233154296875, 2.343017578125, 2.48370361328125, 2.6243896484375, 2.76507568359375, 2.90576171875, 3.04644775390625, 3.1871337890625, 3.32781982421875, 3.468505859375, 3.60919189453125, 3.7498779296875, 3.89056396484375, 4.03125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 20.0, 41.0, 89.0, 292.0, 2806.0, 588.0, 132.0, 52.0, 21.0, 12.0, 10.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.330078125, -1.3043479919433594, -1.2786178588867188, -1.2528877258300781, -1.2271575927734375, -1.2014274597167969, -1.1756973266601562, -1.1499671936035156, -1.124237060546875, -1.0985069274902344, -1.0727767944335938, -1.0470466613769531, -1.0213165283203125, -0.9955863952636719, -0.9698562622070312, -0.9441261291503906, -0.91839599609375, -0.8926658630371094, -0.8669357299804688, -0.8412055969238281, -0.8154754638671875, -0.7897453308105469, -0.7640151977539062, -0.7382850646972656, -0.712554931640625, -0.6868247985839844, -0.6610946655273438, -0.6353645324707031, -0.6096343994140625, -0.5839042663574219, -0.5581741333007812, -0.5324440002441406, -0.5067138671875, -0.4809837341308594, -0.45525360107421875, -0.4295234680175781, -0.4037933349609375, -0.3780632019042969, -0.35233306884765625, -0.3266029357910156, -0.300872802734375, -0.2751426696777344, -0.24941253662109375, -0.22368240356445312, -0.1979522705078125, -0.17222213745117188, -0.14649200439453125, -0.12076187133789062, -0.09503173828125, -0.06930160522460938, -0.04357147216796875, -0.017841339111328125, 0.0078887939453125, 0.033618927001953125, 0.05934906005859375, 0.08507919311523438, 0.110809326171875, 0.13653945922851562, 0.16226959228515625, 0.18799972534179688, 0.2137298583984375, 0.23945999145507812, 0.26519012451171875, 0.2909202575683594, 0.316650390625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 13.0, 23.0, 34.0, 57.0, 91.0, 147.0, 160.0, 163.0, 133.0, 72.0, 40.0, 20.0, 13.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5754852294921875, -2.4946649074554443, -2.413844585418701, -2.333024263381958, -2.252203941345215, -2.1713833808898926, -2.0905630588531494, -2.0097427368164062, -1.928922414779663, -1.84810209274292, -1.7672817707061768, -1.686461329460144, -1.6056410074234009, -1.5248206853866577, -1.444000244140625, -1.3631799221038818, -1.2823596000671387, -1.2015392780303955, -1.1207189559936523, -1.0398985147476196, -0.9590781927108765, -0.8782578706741333, -0.7974374890327454, -0.7166171073913574, -0.6357967853546143, -0.5549764633178711, -0.47415608167648315, -0.3933357298374176, -0.31251537799835205, -0.2316950261592865, -0.15087467432022095, -0.07005429267883301, 0.010766029357910156, 0.09158638119697571, 0.17240673303604126, 0.2532270848751068, 0.33404743671417236, 0.4148677885532379, 0.49568814039230347, 0.5765085220336914, 0.6573288440704346, 0.7381491661071777, 0.8189695477485657, 0.8997899293899536, 0.9806102514266968, 1.06143057346344, 1.1422510147094727, 1.2230713367462158, 1.303891658782959, 1.3847119808197021, 1.4655323028564453, 1.546352744102478, 1.6271730661392212, 1.7079933881759644, 1.788813829421997, 1.8696341514587402, 1.9504544734954834, 2.0312747955322266, 2.1120951175689697, 2.192915439605713, 2.273736000061035, 2.3545563220977783, 2.4353766441345215, 2.5161969661712646, 2.597017288208008]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 9.0, 10.0, 7.0, 14.0, 16.0, 14.0, 13.0, 17.0, 22.0, 28.0, 31.0, 31.0, 39.0, 31.0, 34.0, 43.0, 39.0, 36.0, 39.0, 47.0, 45.0, 43.0, 41.0, 36.0, 32.0, 29.0, 28.0, 20.0, 30.0, 27.0, 17.0, 23.0, 19.0, 18.0, 8.0, 6.0, 4.0, 8.0, 10.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.158376932144165, -1.120100736618042, -1.081824541091919, -1.043548345565796, -1.0052721500396729, -0.9669959545135498, -0.9287197589874268, -0.8904435634613037, -0.8521673679351807, -0.8138911724090576, -0.7756149768829346, -0.7373387813568115, -0.6990625858306885, -0.6607863903045654, -0.6225101947784424, -0.5842339992523193, -0.5459578633308411, -0.507681667804718, -0.46940547227859497, -0.4311292767524719, -0.3928530812263489, -0.35457688570022583, -0.31630071997642517, -0.2780245244503021, -0.23974832892417908, -0.20147213339805603, -0.16319593787193298, -0.12491975724697113, -0.08664356172084808, -0.04836736619472504, -0.010091185569763184, 0.028185009956359863, 0.06646120548248291, 0.10473740100860596, 0.143013596534729, 0.18128977715969086, 0.2195659726858139, 0.25784218311309814, 0.2961183488368988, 0.33439454436302185, 0.3726707398891449, 0.41094693541526794, 0.449223130941391, 0.48749929666519165, 0.5257754921913147, 0.5640516877174377, 0.6023278832435608, 0.6406040787696838, 0.6788802742958069, 0.7171564698219299, 0.755432665348053, 0.793708860874176, 0.8319850564002991, 0.8702612519264221, 0.9085373878479004, 0.9468135833740234, 0.9850897789001465, 1.0233659744262695, 1.0616421699523926, 1.0999183654785156, 1.1381945610046387, 1.1764707565307617, 1.2147469520568848, 1.2530231475830078, 1.2912993431091309]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 17.0, 15.0, 30.0, 30.0, 51.0, 67.0, 107.0, 177.0, 289.0, 494.0, 817.0, 1535.0, 2814.0, 5678.0, 11862.0, 28772.0, 75905.0, 219843.0, 399187.0, 188645.0, 65360.0, 25065.0, 10756.0, 5084.0, 2582.0, 1395.0, 778.0, 423.0, 287.0, 165.0, 98.0, 60.0, 49.0, 30.0, 18.0, 19.0, 9.0, 10.0, 4.0, 6.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62890625, -0.6088943481445312, -0.5888824462890625, -0.5688705444335938, -0.548858642578125, -0.5288467407226562, -0.5088348388671875, -0.48882293701171875, -0.46881103515625, -0.44879913330078125, -0.4287872314453125, -0.40877532958984375, -0.388763427734375, -0.36875152587890625, -0.3487396240234375, -0.32872772216796875, -0.3087158203125, -0.28870391845703125, -0.2686920166015625, -0.24868011474609375, -0.228668212890625, -0.20865631103515625, -0.1886444091796875, -0.16863250732421875, -0.14862060546875, -0.12860870361328125, -0.1085968017578125, -0.08858489990234375, -0.068572998046875, -0.04856109619140625, -0.0285491943359375, -0.00853729248046875, 0.011474609375, 0.03148651123046875, 0.0514984130859375, 0.07151031494140625, 0.091522216796875, 0.11153411865234375, 0.1315460205078125, 0.15155792236328125, 0.17156982421875, 0.19158172607421875, 0.2115936279296875, 0.23160552978515625, 0.251617431640625, 0.27162933349609375, 0.2916412353515625, 0.31165313720703125, 0.3316650390625, 0.35167694091796875, 0.3716888427734375, 0.39170074462890625, 0.411712646484375, 0.43172454833984375, 0.4517364501953125, 0.47174835205078125, 0.49176025390625, 0.5117721557617188, 0.5317840576171875, 0.5517959594726562, 0.571807861328125, 0.5918197631835938, 0.6118316650390625, 0.6318435668945312, 0.65185546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 19.0, 13.0, 29.0, 24.0, 37.0, 47.0, 48.0, 43.0, 67.0, 79.0, 82.0, 76.0, 63.0, 56.0, 54.0, 42.0, 45.0, 43.0, 25.0, 28.0, 17.0, 17.0, 14.0, 5.0, 7.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2423095703125, -0.2362804412841797, -0.23025131225585938, -0.22422218322753906, -0.21819305419921875, -0.21216392517089844, -0.20613479614257812, -0.2001056671142578, -0.1940765380859375, -0.1880474090576172, -0.18201828002929688, -0.17598915100097656, -0.16996002197265625, -0.16393089294433594, -0.15790176391601562, -0.1518726348876953, -0.145843505859375, -0.1398143768310547, -0.13378524780273438, -0.12775611877441406, -0.12172698974609375, -0.11569786071777344, -0.10966873168945312, -0.10363960266113281, -0.0976104736328125, -0.09158134460449219, -0.08555221557617188, -0.07952308654785156, -0.07349395751953125, -0.06746482849121094, -0.061435699462890625, -0.05540657043457031, -0.04937744140625, -0.04334831237792969, -0.037319183349609375, -0.03129005432128906, -0.02526092529296875, -0.019231796264648438, -0.013202667236328125, -0.0071735382080078125, -0.0011444091796875, 0.0048847198486328125, 0.010913848876953125, 0.016942977905273438, 0.02297210693359375, 0.029001235961914062, 0.035030364990234375, 0.04105949401855469, 0.047088623046875, 0.05311775207519531, 0.059146881103515625, 0.06517601013183594, 0.07120513916015625, 0.07723426818847656, 0.08326339721679688, 0.08929252624511719, 0.0953216552734375, 0.10135078430175781, 0.10737991333007812, 0.11340904235839844, 0.11943817138671875, 0.12546730041503906, 0.13149642944335938, 0.1375255584716797, 0.1435546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 14.0, 15.0, 18.0, 15.0, 31.0, 46.0, 57.0, 92.0, 140.0, 191.0, 248.0, 433.0, 703.0, 1281.0, 2628.0, 5610.0, 14663.0, 45420.0, 190898.0, 544394.0, 174514.0, 42491.0, 13679.0, 5455.0, 2378.0, 1209.0, 682.0, 416.0, 278.0, 151.0, 94.0, 87.0, 48.0, 47.0, 30.0, 23.0, 19.0, 13.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9213333129882812, -0.8929595947265625, -0.8645858764648438, -0.836212158203125, -0.8078384399414062, -0.7794647216796875, -0.7510910034179688, -0.72271728515625, -0.6943435668945312, -0.6659698486328125, -0.6375961303710938, -0.609222412109375, -0.5808486938476562, -0.5524749755859375, -0.5241012573242188, -0.4957275390625, -0.46735382080078125, -0.4389801025390625, -0.41060638427734375, -0.382232666015625, -0.35385894775390625, -0.3254852294921875, -0.29711151123046875, -0.26873779296875, -0.24036407470703125, -0.2119903564453125, -0.18361663818359375, -0.155242919921875, -0.12686920166015625, -0.0984954833984375, -0.07012176513671875, -0.041748046875, -0.01337432861328125, 0.0149993896484375, 0.04337310791015625, 0.071746826171875, 0.10012054443359375, 0.1284942626953125, 0.15686798095703125, 0.18524169921875, 0.21361541748046875, 0.2419891357421875, 0.27036285400390625, 0.298736572265625, 0.32711029052734375, 0.3554840087890625, 0.38385772705078125, 0.4122314453125, 0.44060516357421875, 0.4689788818359375, 0.49735260009765625, 0.525726318359375, 0.5541000366210938, 0.5824737548828125, 0.6108474731445312, 0.63922119140625, 0.6675949096679688, 0.6959686279296875, 0.7243423461914062, 0.752716064453125, 0.7810897827148438, 0.8094635009765625, 0.8378372192382812, 0.8662109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 8.0, 10.0, 5.0, 4.0, 8.0, 9.0, 14.0, 19.0, 18.0, 16.0, 30.0, 33.0, 26.0, 28.0, 29.0, 44.0, 55.0, 40.0, 41.0, 62.0, 40.0, 42.0, 55.0, 47.0, 45.0, 44.0, 20.0, 31.0, 28.0, 27.0, 21.0, 25.0, 18.0, 8.0, 9.0, 10.0, 10.0, 6.0, 7.0, 3.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.630859375, -0.60809326171875, -0.5853271484375, -0.56256103515625, -0.539794921875, -0.51702880859375, -0.4942626953125, -0.47149658203125, -0.44873046875, -0.42596435546875, -0.4031982421875, -0.38043212890625, -0.357666015625, -0.33489990234375, -0.3121337890625, -0.28936767578125, -0.2666015625, -0.24383544921875, -0.2210693359375, -0.19830322265625, -0.175537109375, -0.15277099609375, -0.1300048828125, -0.10723876953125, -0.08447265625, -0.06170654296875, -0.0389404296875, -0.01617431640625, 0.006591796875, 0.02935791015625, 0.0521240234375, 0.07489013671875, 0.09765625, 0.12042236328125, 0.1431884765625, 0.16595458984375, 0.188720703125, 0.21148681640625, 0.2342529296875, 0.25701904296875, 0.27978515625, 0.30255126953125, 0.3253173828125, 0.34808349609375, 0.370849609375, 0.39361572265625, 0.4163818359375, 0.43914794921875, 0.4619140625, 0.48468017578125, 0.5074462890625, 0.53021240234375, 0.552978515625, 0.57574462890625, 0.5985107421875, 0.62127685546875, 0.64404296875, 0.66680908203125, 0.6895751953125, 0.71234130859375, 0.735107421875, 0.75787353515625, 0.7806396484375, 0.80340576171875, 0.826171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 13.0, 7.0, 14.0, 26.0, 35.0, 42.0, 44.0, 83.0, 131.0, 143.0, 257.0, 360.0, 670.0, 1037.0, 1851.0, 3811.0, 9765.0, 41904.0, 458137.0, 468931.0, 42764.0, 9904.0, 3846.0, 1849.0, 1094.0, 617.0, 389.0, 238.0, 176.0, 110.0, 86.0, 59.0, 51.0, 26.0, 20.0, 14.0, 11.0, 11.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.833984375, -0.8087158203125, -0.783447265625, -0.7581787109375, -0.73291015625, -0.7076416015625, -0.682373046875, -0.6571044921875, -0.6318359375, -0.6065673828125, -0.581298828125, -0.5560302734375, -0.53076171875, -0.5054931640625, -0.480224609375, -0.4549560546875, -0.4296875, -0.4044189453125, -0.379150390625, -0.3538818359375, -0.32861328125, -0.3033447265625, -0.278076171875, -0.2528076171875, -0.2275390625, -0.2022705078125, -0.177001953125, -0.1517333984375, -0.12646484375, -0.1011962890625, -0.075927734375, -0.0506591796875, -0.025390625, -0.0001220703125, 0.025146484375, 0.0504150390625, 0.07568359375, 0.1009521484375, 0.126220703125, 0.1514892578125, 0.1767578125, 0.2020263671875, 0.227294921875, 0.2525634765625, 0.27783203125, 0.3031005859375, 0.328369140625, 0.3536376953125, 0.37890625, 0.4041748046875, 0.429443359375, 0.4547119140625, 0.47998046875, 0.5052490234375, 0.530517578125, 0.5557861328125, 0.5810546875, 0.6063232421875, 0.631591796875, 0.6568603515625, 0.68212890625, 0.7073974609375, 0.732666015625, 0.7579345703125, 0.783203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 3.0, 2.0, 9.0, 22.0, 27.0, 59.0, 97.0, 173.0, 249.0, 157.0, 65.0, 54.0, 29.0, 12.0, 10.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002579689025878906, -0.00025023892521858215, -0.00024250894784927368, -0.0002347789704799652, -0.00022704899311065674, -0.00021931901574134827, -0.0002115890383720398, -0.00020385906100273132, -0.00019612908363342285, -0.00018839910626411438, -0.0001806691288948059, -0.00017293915152549744, -0.00016520917415618896, -0.0001574791967868805, -0.00014974921941757202, -0.00014201924204826355, -0.00013428926467895508, -0.0001265592873096466, -0.00011882930994033813, -0.00011109933257102966, -0.00010336935520172119, -9.563937783241272e-05, -8.790940046310425e-05, -8.017942309379578e-05, -7.24494457244873e-05, -6.471946835517883e-05, -5.698949098587036e-05, -4.925951361656189e-05, -4.152953624725342e-05, -3.3799558877944946e-05, -2.6069581508636475e-05, -1.8339604139328003e-05, -1.0609626770019531e-05, -2.8796494007110596e-06, 4.850327968597412e-06, 1.2580305337905884e-05, 2.0310282707214355e-05, 2.8040260076522827e-05, 3.57702374458313e-05, 4.350021481513977e-05, 5.123019218444824e-05, 5.8960169553756714e-05, 6.669014692306519e-05, 7.442012429237366e-05, 8.215010166168213e-05, 8.98800790309906e-05, 9.761005640029907e-05, 0.00010534003376960754, 0.00011307001113891602, 0.00012079998850822449, 0.00012852996587753296, 0.00013625994324684143, 0.0001439899206161499, 0.00015171989798545837, 0.00015944987535476685, 0.00016717985272407532, 0.0001749098300933838, 0.00018263980746269226, 0.00019036978483200073, 0.0001980997622013092, 0.00020582973957061768, 0.00021355971693992615, 0.00022128969430923462, 0.0002290196716785431, 0.00023674964904785156]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 13.0, 16.0, 19.0, 40.0, 61.0, 86.0, 209.0, 378.0, 819.0, 1814.0, 5177.0, 26508.0, 551266.0, 431857.0, 22258.0, 4625.0, 1725.0, 763.0, 400.0, 201.0, 105.0, 74.0, 40.0, 23.0, 20.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9188003540039062, -0.8859405517578125, -0.8530807495117188, -0.820220947265625, -0.7873611450195312, -0.7545013427734375, -0.7216415405273438, -0.68878173828125, -0.6559219360351562, -0.6230621337890625, -0.5902023315429688, -0.557342529296875, -0.5244827270507812, -0.4916229248046875, -0.45876312255859375, -0.4259033203125, -0.39304351806640625, -0.3601837158203125, -0.32732391357421875, -0.294464111328125, -0.26160430908203125, -0.2287445068359375, -0.19588470458984375, -0.16302490234375, -0.13016510009765625, -0.0973052978515625, -0.06444549560546875, -0.031585693359375, 0.00127410888671875, 0.0341339111328125, 0.06699371337890625, 0.099853515625, 0.13271331787109375, 0.1655731201171875, 0.19843292236328125, 0.231292724609375, 0.26415252685546875, 0.2970123291015625, 0.32987213134765625, 0.36273193359375, 0.39559173583984375, 0.4284515380859375, 0.46131134033203125, 0.494171142578125, 0.5270309448242188, 0.5598907470703125, 0.5927505493164062, 0.6256103515625, 0.6584701538085938, 0.6913299560546875, 0.7241897583007812, 0.757049560546875, 0.7899093627929688, 0.8227691650390625, 0.8556289672851562, 0.88848876953125, 0.9213485717773438, 0.9542083740234375, 0.9870681762695312, 1.019927978515625, 1.0527877807617188, 1.0856475830078125, 1.1185073852539062, 1.1513671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 15.0, 27.0, 42.0, 62.0, 88.0, 125.0, 177.0, 144.0, 110.0, 71.0, 47.0, 26.0, 16.0, 13.0, 6.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.5940170288085938, -0.5718231201171875, -0.5496292114257812, -0.527435302734375, -0.5052413940429688, -0.4830474853515625, -0.46085357666015625, -0.43865966796875, -0.41646575927734375, -0.3942718505859375, -0.37207794189453125, -0.349884033203125, -0.32769012451171875, -0.3054962158203125, -0.28330230712890625, -0.2611083984375, -0.23891448974609375, -0.2167205810546875, -0.19452667236328125, -0.172332763671875, -0.15013885498046875, -0.1279449462890625, -0.10575103759765625, -0.08355712890625, -0.06136322021484375, -0.0391693115234375, -0.01697540283203125, 0.005218505859375, 0.02741241455078125, 0.0496063232421875, 0.07180023193359375, 0.093994140625, 0.11618804931640625, 0.1383819580078125, 0.16057586669921875, 0.182769775390625, 0.20496368408203125, 0.2271575927734375, 0.24935150146484375, 0.27154541015625, 0.29373931884765625, 0.3159332275390625, 0.33812713623046875, 0.360321044921875, 0.38251495361328125, 0.4047088623046875, 0.42690277099609375, 0.4490966796875, 0.47129058837890625, 0.4934844970703125, 0.5156784057617188, 0.537872314453125, 0.5600662231445312, 0.5822601318359375, 0.6044540405273438, 0.62664794921875, 0.6488418579101562, 0.6710357666015625, 0.6932296752929688, 0.715423583984375, 0.7376174926757812, 0.7598114013671875, 0.7820053100585938, 0.80419921875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 5.0, 19.0, 49.0, 104.0, 142.0, 179.0, 184.0, 141.0, 86.0, 39.0, 26.0, 11.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.862367153167725, -5.583313465118408, -5.304259777069092, -5.025206089019775, -4.746151924133301, -4.467098236083984, -4.188044548034668, -3.9089908599853516, -3.629937171936035, -3.3508834838867188, -3.0718297958374023, -2.792775869369507, -2.5137221813201904, -2.234668493270874, -1.955614686012268, -1.676560878753662, -1.3975071907043457, -1.1184535026550293, -0.8393996953964233, -0.5603459477424622, -0.281292200088501, -0.0022385120391845703, 0.2768152952194214, 0.5558691024780273, 0.8349227905273438, 1.1139764785766602, 1.3930302858352661, 1.672084093093872, 1.9511377811431885, 2.230191469192505, 2.5092453956604004, 2.788299083709717, 3.0673532485961914, 3.346406936645508, 3.625460624694824, 3.9045145511627197, 4.183568000793457, 4.462621688842773, 4.741675853729248, 5.0207295417785645, 5.299783229827881, 5.578836917877197, 5.857890605926514, 6.13694429397583, 6.415998458862305, 6.695052146911621, 6.9741058349609375, 7.253159523010254, 7.53221321105957, 7.811266899108887, 8.090320587158203, 8.36937427520752, 8.648427963256836, 8.927481651306152, 9.206535339355469, 9.485589981079102, 9.764642715454102, 10.043696403503418, 10.322750091552734, 10.60180377960205, 10.880857467651367, 11.159911155700684, 11.43896484375, 11.718019485473633, 11.99707317352295]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 10.0, 12.0, 25.0, 11.0, 31.0, 24.0, 27.0, 23.0, 34.0, 59.0, 48.0, 52.0, 56.0, 52.0, 59.0, 68.0, 69.0, 48.0, 42.0, 40.0, 34.0, 33.0, 33.0, 19.0, 12.0, 19.0, 23.0, 13.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76754093170166, -4.615830898284912, -4.464120864868164, -4.312410831451416, -4.160700798034668, -4.00899076461792, -3.8572804927825928, -3.7055704593658447, -3.5538604259490967, -3.4021503925323486, -3.2504403591156006, -3.0987303256988525, -2.9470200538635254, -2.7953100204467773, -2.6435999870300293, -2.4918899536132812, -2.340179920196533, -2.188469886779785, -2.036759853363037, -1.8850497007369995, -1.7333396673202515, -1.5816296339035034, -1.4299194812774658, -1.2782094478607178, -1.1264994144439697, -0.9747893810272217, -0.8230792880058289, -0.671369194984436, -0.519659161567688, -0.36794912815093994, -0.21623903512954712, -0.0645289421081543, 0.08718109130859375, 0.23889115452766418, 0.3906012177467346, 0.5423113107681274, 0.6940213441848755, 0.8457313776016235, 0.9974414706230164, 1.1491515636444092, 1.3008615970611572, 1.4525716304779053, 1.6042816638946533, 1.755991816520691, 1.907701849937439, 2.0594120025634766, 2.2111220359802246, 2.3628320693969727, 2.5145421028137207, 2.6662521362304688, 2.817962169647217, 2.969672203063965, 3.121382236480713, 3.273092269897461, 3.424802541732788, 3.576512575149536, 3.728222608566284, 3.8799326419830322, 4.031642913818359, 4.183352947235107, 4.3350629806518555, 4.4867730140686035, 4.638483047485352, 4.7901930809021, 4.941903114318848]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 12.0, 14.0, 28.0, 44.0, 63.0, 66.0, 125.0, 201.0, 292.0, 496.0, 768.0, 1314.0, 2275.0, 4478.0, 9658.0, 24736.0, 85555.0, 1156909.0, 2755287.0, 102271.0, 27747.0, 10666.0, 4957.0, 2512.0, 1416.0, 822.0, 518.0, 374.0, 227.0, 136.0, 93.0, 55.0, 51.0, 27.0, 14.0, 20.0, 10.0, 11.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.8722076416015625, -0.845001220703125, -0.8177947998046875, -0.79058837890625, -0.7633819580078125, -0.736175537109375, -0.7089691162109375, -0.6817626953125, -0.6545562744140625, -0.627349853515625, -0.6001434326171875, -0.57293701171875, -0.5457305908203125, -0.518524169921875, -0.4913177490234375, -0.464111328125, -0.4369049072265625, -0.409698486328125, -0.3824920654296875, -0.35528564453125, -0.3280792236328125, -0.300872802734375, -0.2736663818359375, -0.2464599609375, -0.2192535400390625, -0.192047119140625, -0.1648406982421875, -0.13763427734375, -0.1104278564453125, -0.083221435546875, -0.0560150146484375, -0.02880859375, -0.0016021728515625, 0.025604248046875, 0.0528106689453125, 0.08001708984375, 0.1072235107421875, 0.134429931640625, 0.1616363525390625, 0.1888427734375, 0.2160491943359375, 0.243255615234375, 0.2704620361328125, 0.29766845703125, 0.3248748779296875, 0.352081298828125, 0.3792877197265625, 0.406494140625, 0.4337005615234375, 0.460906982421875, 0.4881134033203125, 0.51531982421875, 0.5425262451171875, 0.569732666015625, 0.5969390869140625, 0.6241455078125, 0.6513519287109375, 0.678558349609375, 0.7057647705078125, 0.73297119140625, 0.7601776123046875, 0.787384033203125, 0.8145904541015625, 0.841796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 22.0, 23.0, 36.0, 42.0, 50.0, 52.0, 55.0, 83.0, 81.0, 70.0, 74.0, 51.0, 54.0, 64.0, 52.0, 44.0, 35.0, 18.0, 16.0, 14.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2218017578125, -0.21537399291992188, -0.20894622802734375, -0.20251846313476562, -0.1960906982421875, -0.18966293334960938, -0.18323516845703125, -0.17680740356445312, -0.170379638671875, -0.16395187377929688, -0.15752410888671875, -0.15109634399414062, -0.1446685791015625, -0.13824081420898438, -0.13181304931640625, -0.12538528442382812, -0.11895751953125, -0.11252975463867188, -0.10610198974609375, -0.09967422485351562, -0.0932464599609375, -0.08681869506835938, -0.08039093017578125, -0.07396316528320312, -0.067535400390625, -0.061107635498046875, -0.05467987060546875, -0.048252105712890625, -0.0418243408203125, -0.035396575927734375, -0.02896881103515625, -0.022541046142578125, -0.01611328125, -0.009685516357421875, -0.00325775146484375, 0.003170013427734375, 0.0095977783203125, 0.016025543212890625, 0.02245330810546875, 0.028881072998046875, 0.035308837890625, 0.041736602783203125, 0.04816436767578125, 0.054592132568359375, 0.0610198974609375, 0.06744766235351562, 0.07387542724609375, 0.08030319213867188, 0.08673095703125, 0.09315872192382812, 0.09958648681640625, 0.10601425170898438, 0.1124420166015625, 0.11886978149414062, 0.12529754638671875, 0.13172531127929688, 0.138153076171875, 0.14458084106445312, 0.15100860595703125, 0.15743637084960938, 0.1638641357421875, 0.17029190063476562, 0.17671966552734375, 0.18314743041992188, 0.1895751953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 23.0, 35.0, 52.0, 80.0, 112.0, 215.0, 405.0, 839.0, 1738.0, 4737.0, 15644.0, 73878.0, 1233714.0, 2738269.0, 94468.0, 19827.0, 5884.0, 2137.0, 966.0, 494.0, 269.0, 179.0, 104.0, 75.0, 35.0, 26.0, 17.0, 12.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4189453125, -1.377288818359375, -1.33563232421875, -1.293975830078125, -1.2523193359375, -1.210662841796875, -1.16900634765625, -1.127349853515625, -1.085693359375, -1.044036865234375, -1.00238037109375, -0.960723876953125, -0.9190673828125, -0.877410888671875, -0.83575439453125, -0.794097900390625, -0.75244140625, -0.710784912109375, -0.66912841796875, -0.627471923828125, -0.5858154296875, -0.544158935546875, -0.50250244140625, -0.460845947265625, -0.419189453125, -0.377532958984375, -0.33587646484375, -0.294219970703125, -0.2525634765625, -0.210906982421875, -0.16925048828125, -0.127593994140625, -0.0859375, -0.044281005859375, -0.00262451171875, 0.039031982421875, 0.0806884765625, 0.122344970703125, 0.16400146484375, 0.205657958984375, 0.247314453125, 0.288970947265625, 0.33062744140625, 0.372283935546875, 0.4139404296875, 0.455596923828125, 0.49725341796875, 0.538909912109375, 0.58056640625, 0.622222900390625, 0.66387939453125, 0.705535888671875, 0.7471923828125, 0.788848876953125, 0.83050537109375, 0.872161865234375, 0.913818359375, 0.955474853515625, 0.99713134765625, 1.038787841796875, 1.0804443359375, 1.122100830078125, 1.16375732421875, 1.205413818359375, 1.2470703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 15.0, 18.0, 13.0, 34.0, 52.0, 78.0, 132.0, 234.0, 526.0, 1658.0, 640.0, 248.0, 136.0, 79.0, 65.0, 28.0, 23.0, 13.0, 13.0, 16.0, 13.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33544921875, -0.31990814208984375, -0.3043670654296875, -0.28882598876953125, -0.273284912109375, -0.25774383544921875, -0.2422027587890625, -0.22666168212890625, -0.21112060546875, -0.19557952880859375, -0.1800384521484375, -0.16449737548828125, -0.148956298828125, -0.13341522216796875, -0.1178741455078125, -0.10233306884765625, -0.0867919921875, -0.07125091552734375, -0.0557098388671875, -0.04016876220703125, -0.024627685546875, -0.00908660888671875, 0.0064544677734375, 0.02199554443359375, 0.03753662109375, 0.05307769775390625, 0.0686187744140625, 0.08415985107421875, 0.099700927734375, 0.11524200439453125, 0.1307830810546875, 0.14632415771484375, 0.161865234375, 0.17740631103515625, 0.1929473876953125, 0.20848846435546875, 0.224029541015625, 0.23957061767578125, 0.2551116943359375, 0.27065277099609375, 0.28619384765625, 0.30173492431640625, 0.3172760009765625, 0.33281707763671875, 0.348358154296875, 0.36389923095703125, 0.3794403076171875, 0.39498138427734375, 0.4105224609375, 0.42606353759765625, 0.4416046142578125, 0.45714569091796875, 0.472686767578125, 0.48822784423828125, 0.5037689208984375, 0.5193099975585938, 0.53485107421875, 0.5503921508789062, 0.5659332275390625, 0.5814743041992188, 0.597015380859375, 0.6125564575195312, 0.6280975341796875, 0.6436386108398438, 0.6591796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 8.0, 29.0, 69.0, 121.0, 165.0, 195.0, 196.0, 98.0, 59.0, 26.0, 17.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.035954236984253, -1.893150806427002, -1.750347375869751, -1.6075438261032104, -1.4647403955459595, -1.3219369649887085, -1.179133415222168, -1.036329984664917, -0.893526554107666, -0.750723123550415, -0.6079196333885193, -0.4651161730289459, -0.32231271266937256, -0.17950928211212158, -0.03670579195022583, 0.10609769821166992, 0.2489011287689209, 0.39170458912849426, 0.5345080494880676, 0.6773115396499634, 0.8201149702072144, 0.9629184007644653, 1.1057219505310059, 1.2485253810882568, 1.3913288116455078, 1.5341322422027588, 1.6769356727600098, 1.8197392225265503, 1.9625426530838013, 2.105346202850342, 2.2481496334075928, 2.3909530639648438, 2.533756732940674, 2.676560163497925, 2.819363594055176, 2.9621670246124268, 3.1049704551696777, 3.247774124145508, 3.390577554702759, 3.5333809852600098, 3.6761844158172607, 3.8189878463745117, 3.9617912769317627, 4.104594707489014, 4.247398376464844, 4.390201568603516, 4.533005237579346, 4.675808906555176, 4.818612098693848, 4.961415767669678, 5.10421895980835, 5.24702262878418, 5.389825820922852, 5.532629489898682, 5.6754326820373535, 5.818236351013184, 5.9610395431518555, 6.1038432121276855, 6.246646404266357, 6.3894500732421875, 6.532253265380859, 6.6750569343566895, 6.817860126495361, 6.960663795471191, 7.1034674644470215]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 8.0, 9.0, 10.0, 12.0, 15.0, 23.0, 25.0, 22.0, 27.0, 30.0, 25.0, 34.0, 38.0, 45.0, 44.0, 42.0, 43.0, 43.0, 45.0, 48.0, 38.0, 46.0, 38.0, 35.0, 36.0, 27.0, 26.0, 23.0, 17.0, 17.0, 21.0, 16.0, 12.0, 15.0, 9.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5491994619369507, -1.5008944272994995, -1.4525893926620483, -1.4042844772338867, -1.3559794425964355, -1.3076744079589844, -1.2593693733215332, -1.211064338684082, -1.1627593040466309, -1.1144542694091797, -1.0661492347717285, -1.0178442001342773, -0.969539225101471, -0.9212342500686646, -0.8729292154312134, -0.8246241807937622, -0.7763192057609558, -0.7280141711235046, -0.6797091960906982, -0.6314041614532471, -0.5830991268157959, -0.5347940921783447, -0.48648911714553833, -0.43818408250808716, -0.3898790776729584, -0.3415740728378296, -0.2932690382003784, -0.24496403336524963, -0.19665901362895966, -0.14835399389266968, -0.1000489890575409, -0.05174395442008972, -0.0034389495849609375, 0.04486606642603874, 0.09317108243703842, 0.1414760947227478, 0.18978111445903778, 0.23808613419532776, 0.28639113903045654, 0.3346961736679077, 0.3830011785030365, 0.4313061833381653, 0.47961121797561646, 0.5279161930084229, 0.576221227645874, 0.6245262622833252, 0.6728312969207764, 0.7211363315582275, 0.7694413065910339, 0.8177463412284851, 0.8660513162612915, 0.9143563508987427, 0.9626613855361938, 1.010966420173645, 1.0592713356018066, 1.1075763702392578, 1.155881404876709, 1.2041864395141602, 1.2524914741516113, 1.3007965087890625, 1.3491014242172241, 1.3974064588546753, 1.4457114934921265, 1.4940165281295776, 1.5423215627670288]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 20.0, 26.0, 29.0, 64.0, 76.0, 144.0, 211.0, 377.0, 641.0, 1172.0, 2262.0, 4792.0, 10979.0, 28613.0, 86305.0, 333465.0, 413374.0, 107149.0, 34582.0, 12951.0, 5607.0, 2557.0, 1328.0, 714.0, 410.0, 233.0, 165.0, 93.0, 63.0, 42.0, 31.0, 14.0, 11.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9560546875, -0.9271621704101562, -0.8982696533203125, -0.8693771362304688, -0.840484619140625, -0.8115921020507812, -0.7826995849609375, -0.7538070678710938, -0.72491455078125, -0.6960220336914062, -0.6671295166015625, -0.6382369995117188, -0.609344482421875, -0.5804519653320312, -0.5515594482421875, -0.5226669311523438, -0.4937744140625, -0.46488189697265625, -0.4359893798828125, -0.40709686279296875, -0.378204345703125, -0.34931182861328125, -0.3204193115234375, -0.29152679443359375, -0.26263427734375, -0.23374176025390625, -0.2048492431640625, -0.17595672607421875, -0.147064208984375, -0.11817169189453125, -0.0892791748046875, -0.06038665771484375, -0.031494140625, -0.00260162353515625, 0.0262908935546875, 0.05518341064453125, 0.084075927734375, 0.11296844482421875, 0.1418609619140625, 0.17075347900390625, 0.19964599609375, 0.22853851318359375, 0.2574310302734375, 0.28632354736328125, 0.315216064453125, 0.34410858154296875, 0.3730010986328125, 0.40189361572265625, 0.4307861328125, 0.45967864990234375, 0.4885711669921875, 0.5174636840820312, 0.546356201171875, 0.5752487182617188, 0.6041412353515625, 0.6330337524414062, 0.66192626953125, 0.6908187866210938, 0.7197113037109375, 0.7486038208007812, 0.777496337890625, 0.8063888549804688, 0.8352813720703125, 0.8641738891601562, 0.89306640625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 12.0, 14.0, 17.0, 21.0, 22.0, 42.0, 51.0, 64.0, 65.0, 73.0, 70.0, 67.0, 69.0, 67.0, 54.0, 58.0, 44.0, 49.0, 39.0, 27.0, 20.0, 12.0, 15.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.239990234375, -0.2336254119873047, -0.22726058959960938, -0.22089576721191406, -0.21453094482421875, -0.20816612243652344, -0.20180130004882812, -0.1954364776611328, -0.1890716552734375, -0.1827068328857422, -0.17634201049804688, -0.16997718811035156, -0.16361236572265625, -0.15724754333496094, -0.15088272094726562, -0.1445178985595703, -0.138153076171875, -0.1317882537841797, -0.12542343139648438, -0.11905860900878906, -0.11269378662109375, -0.10632896423339844, -0.09996414184570312, -0.09359931945800781, -0.0872344970703125, -0.08086967468261719, -0.07450485229492188, -0.06814002990722656, -0.06177520751953125, -0.05541038513183594, -0.049045562744140625, -0.04268074035644531, -0.03631591796875, -0.029951095581054688, -0.023586273193359375, -0.017221450805664062, -0.01085662841796875, -0.0044918060302734375, 0.001873016357421875, 0.008237838745117188, 0.0146026611328125, 0.020967483520507812, 0.027332305908203125, 0.03369712829589844, 0.04006195068359375, 0.04642677307128906, 0.052791595458984375, 0.05915641784667969, 0.065521240234375, 0.07188606262207031, 0.07825088500976562, 0.08461570739746094, 0.09098052978515625, 0.09734535217285156, 0.10371017456054688, 0.11007499694824219, 0.1164398193359375, 0.12280464172363281, 0.12916946411132812, 0.13553428649902344, 0.14189910888671875, 0.14826393127441406, 0.15462875366210938, 0.1609935760498047, 0.1673583984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 14.0, 2.0, 18.0, 8.0, 30.0, 39.0, 41.0, 56.0, 91.0, 137.0, 214.0, 318.0, 511.0, 846.0, 1550.0, 2865.0, 5931.0, 14448.0, 39441.0, 125840.0, 448118.0, 284525.0, 77821.0, 25812.0, 10005.0, 4438.0, 2198.0, 1234.0, 732.0, 441.0, 264.0, 168.0, 121.0, 86.0, 49.0, 38.0, 19.0, 19.0, 15.0, 6.0, 12.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.70068359375, -0.6771697998046875, -0.653656005859375, -0.6301422119140625, -0.60662841796875, -0.5831146240234375, -0.559600830078125, -0.5360870361328125, -0.5125732421875, -0.4890594482421875, -0.465545654296875, -0.4420318603515625, -0.41851806640625, -0.3950042724609375, -0.371490478515625, -0.3479766845703125, -0.324462890625, -0.3009490966796875, -0.277435302734375, -0.2539215087890625, -0.23040771484375, -0.2068939208984375, -0.183380126953125, -0.1598663330078125, -0.1363525390625, -0.1128387451171875, -0.089324951171875, -0.0658111572265625, -0.04229736328125, -0.0187835693359375, 0.004730224609375, 0.0282440185546875, 0.0517578125, 0.0752716064453125, 0.098785400390625, 0.1222991943359375, 0.14581298828125, 0.1693267822265625, 0.192840576171875, 0.2163543701171875, 0.2398681640625, 0.2633819580078125, 0.286895751953125, 0.3104095458984375, 0.33392333984375, 0.3574371337890625, 0.380950927734375, 0.4044647216796875, 0.427978515625, 0.4514923095703125, 0.475006103515625, 0.4985198974609375, 0.52203369140625, 0.5455474853515625, 0.569061279296875, 0.5925750732421875, 0.6160888671875, 0.6396026611328125, 0.663116455078125, 0.6866302490234375, 0.71014404296875, 0.7336578369140625, 0.757171630859375, 0.7806854248046875, 0.80419921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 10.0, 20.0, 18.0, 19.0, 22.0, 39.0, 36.0, 50.0, 49.0, 75.0, 48.0, 66.0, 61.0, 64.0, 49.0, 58.0, 53.0, 45.0, 47.0, 44.0, 35.0, 20.0, 19.0, 9.0, 12.0, 2.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.0431289672851562, -1.0139923095703125, -0.9848556518554688, -0.955718994140625, -0.9265823364257812, -0.8974456787109375, -0.8683090209960938, -0.83917236328125, -0.8100357055664062, -0.7808990478515625, -0.7517623901367188, -0.722625732421875, -0.6934890747070312, -0.6643524169921875, -0.6352157592773438, -0.6060791015625, -0.5769424438476562, -0.5478057861328125, -0.5186691284179688, -0.489532470703125, -0.46039581298828125, -0.4312591552734375, -0.40212249755859375, -0.37298583984375, -0.34384918212890625, -0.3147125244140625, -0.28557586669921875, -0.256439208984375, -0.22730255126953125, -0.1981658935546875, -0.16902923583984375, -0.139892578125, -0.11075592041015625, -0.0816192626953125, -0.05248260498046875, -0.023345947265625, 0.00579071044921875, 0.0349273681640625, 0.06406402587890625, 0.09320068359375, 0.12233734130859375, 0.1514739990234375, 0.18061065673828125, 0.209747314453125, 0.23888397216796875, 0.2680206298828125, 0.29715728759765625, 0.3262939453125, 0.35543060302734375, 0.3845672607421875, 0.41370391845703125, 0.442840576171875, 0.47197723388671875, 0.5011138916015625, 0.5302505493164062, 0.55938720703125, 0.5885238647460938, 0.6176605224609375, 0.6467971801757812, 0.675933837890625, 0.7050704956054688, 0.7342071533203125, 0.7633438110351562, 0.79248046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 9.0, 10.0, 14.0, 19.0, 32.0, 42.0, 77.0, 88.0, 172.0, 266.0, 421.0, 863.0, 1535.0, 3430.0, 8758.0, 39639.0, 780998.0, 184756.0, 17000.0, 5387.0, 2314.0, 1144.0, 621.0, 360.0, 212.0, 132.0, 72.0, 55.0, 33.0, 27.0, 19.0, 12.0, 6.0, 14.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.423828125, -1.3759918212890625, -1.328155517578125, -1.2803192138671875, -1.23248291015625, -1.1846466064453125, -1.136810302734375, -1.0889739990234375, -1.0411376953125, -0.9933013916015625, -0.945465087890625, -0.8976287841796875, -0.84979248046875, -0.8019561767578125, -0.754119873046875, -0.7062835693359375, -0.658447265625, -0.6106109619140625, -0.562774658203125, -0.5149383544921875, -0.46710205078125, -0.4192657470703125, -0.371429443359375, -0.3235931396484375, -0.2757568359375, -0.2279205322265625, -0.180084228515625, -0.1322479248046875, -0.08441162109375, -0.0365753173828125, 0.011260986328125, 0.0590972900390625, 0.10693359375, 0.1547698974609375, 0.202606201171875, 0.2504425048828125, 0.29827880859375, 0.3461151123046875, 0.393951416015625, 0.4417877197265625, 0.4896240234375, 0.5374603271484375, 0.585296630859375, 0.6331329345703125, 0.68096923828125, 0.7288055419921875, 0.776641845703125, 0.8244781494140625, 0.872314453125, 0.9201507568359375, 0.967987060546875, 1.0158233642578125, 1.06365966796875, 1.1114959716796875, 1.159332275390625, 1.2071685791015625, 1.2550048828125, 1.3028411865234375, 1.350677490234375, 1.3985137939453125, 1.44635009765625, 1.4941864013671875, 1.542022705078125, 1.5898590087890625, 1.6376953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 12.0, 8.0, 33.0, 131.0, 437.0, 235.0, 78.0, 34.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008025169372558594, -0.0007833391427993774, -0.0007641613483428955, -0.0007449835538864136, -0.0007258057594299316, -0.0007066279649734497, -0.0006874501705169678, -0.0006682723760604858, -0.0006490945816040039, -0.000629916787147522, -0.00061073899269104, -0.0005915611982345581, -0.0005723834037780762, -0.0005532056093215942, -0.0005340278148651123, -0.0005148500204086304, -0.0004956722259521484, -0.0004764944314956665, -0.00045731663703918457, -0.00043813884258270264, -0.0004189610481262207, -0.00039978325366973877, -0.00038060545921325684, -0.0003614276647567749, -0.00034224987030029297, -0.00032307207584381104, -0.0003038942813873291, -0.00028471648693084717, -0.00026553869247436523, -0.0002463608980178833, -0.00022718310356140137, -0.00020800530910491943, -0.0001888275146484375, -0.00016964972019195557, -0.00015047192573547363, -0.0001312941312789917, -0.00011211633682250977, -9.293854236602783e-05, -7.37607479095459e-05, -5.4582953453063965e-05, -3.540515899658203e-05, -1.6227364540100098e-05, 2.950429916381836e-06, 2.212822437286377e-05, 4.13060188293457e-05, 6.048381328582764e-05, 7.966160774230957e-05, 9.88394021987915e-05, 0.00011801719665527344, 0.00013719499111175537, 0.0001563727855682373, 0.00017555058002471924, 0.00019472837448120117, 0.0002139061689376831, 0.00023308396339416504, 0.00025226175785064697, 0.0002714395523071289, 0.00029061734676361084, 0.0003097951412200928, 0.0003289729356765747, 0.00034815073013305664, 0.0003673285245895386, 0.0003865063190460205, 0.00040568411350250244, 0.0004248619079589844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 13.0, 17.0, 26.0, 30.0, 49.0, 81.0, 112.0, 178.0, 273.0, 460.0, 773.0, 1285.0, 2392.0, 4839.0, 12641.0, 64619.0, 789217.0, 140869.0, 17895.0, 6169.0, 2902.0, 1491.0, 846.0, 457.0, 322.0, 176.0, 114.0, 89.0, 55.0, 38.0, 19.0, 23.0, 11.0, 10.0, 7.0, 6.0, 7.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1259765625, -1.0892333984375, -1.052490234375, -1.0157470703125, -0.97900390625, -0.9422607421875, -0.905517578125, -0.8687744140625, -0.83203125, -0.7952880859375, -0.758544921875, -0.7218017578125, -0.68505859375, -0.6483154296875, -0.611572265625, -0.5748291015625, -0.5380859375, -0.5013427734375, -0.464599609375, -0.4278564453125, -0.39111328125, -0.3543701171875, -0.317626953125, -0.2808837890625, -0.244140625, -0.2073974609375, -0.170654296875, -0.1339111328125, -0.09716796875, -0.0604248046875, -0.023681640625, 0.0130615234375, 0.0498046875, 0.0865478515625, 0.123291015625, 0.1600341796875, 0.19677734375, 0.2335205078125, 0.270263671875, 0.3070068359375, 0.34375, 0.3804931640625, 0.417236328125, 0.4539794921875, 0.49072265625, 0.5274658203125, 0.564208984375, 0.6009521484375, 0.6376953125, 0.6744384765625, 0.711181640625, 0.7479248046875, 0.78466796875, 0.8214111328125, 0.858154296875, 0.8948974609375, 0.931640625, 0.9683837890625, 1.005126953125, 1.0418701171875, 1.07861328125, 1.1153564453125, 1.152099609375, 1.1888427734375, 1.2255859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 17.0, 17.0, 41.0, 72.0, 153.0, 225.0, 180.0, 124.0, 51.0, 26.0, 12.0, 8.0, 9.0, 9.0, 10.0, 4.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.999755859375, -0.96826171875, -0.936767578125, -0.9052734375, -0.873779296875, -0.84228515625, -0.810791015625, -0.779296875, -0.747802734375, -0.71630859375, -0.684814453125, -0.6533203125, -0.621826171875, -0.59033203125, -0.558837890625, -0.52734375, -0.495849609375, -0.46435546875, -0.432861328125, -0.4013671875, -0.369873046875, -0.33837890625, -0.306884765625, -0.275390625, -0.243896484375, -0.21240234375, -0.180908203125, -0.1494140625, -0.117919921875, -0.08642578125, -0.054931640625, -0.0234375, 0.008056640625, 0.03955078125, 0.071044921875, 0.1025390625, 0.134033203125, 0.16552734375, 0.197021484375, 0.228515625, 0.260009765625, 0.29150390625, 0.322998046875, 0.3544921875, 0.385986328125, 0.41748046875, 0.448974609375, 0.48046875, 0.511962890625, 0.54345703125, 0.574951171875, 0.6064453125, 0.637939453125, 0.66943359375, 0.700927734375, 0.732421875, 0.763916015625, 0.79541015625, 0.826904296875, 0.8583984375, 0.889892578125, 0.92138671875, 0.952880859375, 0.984375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 14.0, 23.0, 30.0, 56.0, 102.0, 121.0, 144.0, 141.0, 136.0, 105.0, 61.0, 29.0, 11.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.653658866882324, -11.390778541564941, -11.127899169921875, -10.865018844604492, -10.60213851928711, -10.339259147644043, -10.07637882232666, -9.813499450683594, -9.550619125366211, -9.287738800048828, -9.024859428405762, -8.761979103088379, -8.499099731445312, -8.23621940612793, -7.973339080810547, -7.710459232330322, -7.447579383850098, -7.184699535369873, -6.921819686889648, -6.658939361572266, -6.396059513092041, -6.133179664611816, -5.870299339294434, -5.607419490814209, -5.344539642333984, -5.08165979385376, -4.818779945373535, -4.555899620056152, -4.293019771575928, -4.030139923095703, -3.7672598361968994, -3.5043797492980957, -3.2415008544921875, -2.978621006011963, -2.715740919113159, -2.4528608322143555, -2.189980983734131, -1.9271010160446167, -1.6642210483551025, -1.4013410806655884, -1.1384611129760742, -0.8755811452865601, -0.6127011775970459, -0.34982120990753174, -0.08694124221801758, 0.17593872547149658, 0.43881869316101074, 0.7016986608505249, 0.9645786285400391, 1.2274585962295532, 1.4903385639190674, 1.7532185316085815, 2.0160984992980957, 2.2789783477783203, 2.541858434677124, 2.8047385215759277, 3.0676183700561523, 3.330498218536377, 3.5933783054351807, 3.8562583923339844, 4.119138240814209, 4.382018089294434, 4.644898414611816, 4.907778263092041, 5.170658111572266]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 6.0, 12.0, 11.0, 19.0, 19.0, 21.0, 18.0, 28.0, 26.0, 34.0, 33.0, 43.0, 30.0, 45.0, 41.0, 50.0, 40.0, 52.0, 48.0, 38.0, 37.0, 46.0, 36.0, 38.0, 24.0, 20.0, 35.0, 24.0, 16.0, 19.0, 18.0, 11.0, 5.0, 11.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.762953996658325, -3.6356422901153564, -3.508330821990967, -3.381019115447998, -3.2537076473236084, -3.1263959407806396, -2.99908447265625, -2.8717727661132812, -2.7444610595703125, -2.6171493530273438, -2.489837884902954, -2.3625261783599854, -2.2352147102355957, -2.107903003692627, -1.9805914163589478, -1.8532798290252686, -1.725968360900879, -1.5986567735671997, -1.4713451862335205, -1.3440334796905518, -1.216722011566162, -1.0894103050231934, -0.9620987176895142, -0.834787130355835, -0.7074755430221558, -0.5801639556884766, -0.452852338552475, -0.3255407214164734, -0.1982291340827942, -0.07091754674911499, 0.056394100189208984, 0.18370568752288818, 0.3110175132751465, 0.4383291006088257, 0.5656406879425049, 0.6929523348808289, 0.8202639222145081, 0.9475755095481873, 1.0748871564865112, 1.2021987438201904, 1.3295103311538696, 1.4568219184875488, 1.584133505821228, 1.7114450931549072, 1.838756799697876, 1.9660682678222656, 2.0933799743652344, 2.220691680908203, 2.3480031490325928, 2.4753148555755615, 2.602626323699951, 2.72993803024292, 2.8572494983673096, 2.9845612049102783, 3.111872673034668, 3.2391843795776367, 3.3664960861206055, 3.493807792663574, 3.621119260787964, 3.7484309673309326, 3.8757424354553223, 4.003054141998291, 4.13036584854126, 4.25767707824707, 4.384988784790039]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 10.0, 10.0, 19.0, 19.0, 34.0, 32.0, 46.0, 62.0, 104.0, 164.0, 242.0, 374.0, 570.0, 1094.0, 1921.0, 3793.0, 8188.0, 20406.0, 63026.0, 364160.0, 3484318.0, 176502.0, 41465.0, 14750.0, 6118.0, 2910.0, 1543.0, 901.0, 521.0, 325.0, 209.0, 109.0, 95.0, 69.0, 47.0, 31.0, 30.0, 19.0, 16.0, 9.0, 2.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.7800521850585938, -0.7534637451171875, -0.7268753051757812, -0.700286865234375, -0.6736984252929688, -0.6471099853515625, -0.6205215454101562, -0.59393310546875, -0.5673446655273438, -0.5407562255859375, -0.5141677856445312, -0.487579345703125, -0.46099090576171875, -0.4344024658203125, -0.40781402587890625, -0.3812255859375, -0.35463714599609375, -0.3280487060546875, -0.30146026611328125, -0.274871826171875, -0.24828338623046875, -0.2216949462890625, -0.19510650634765625, -0.16851806640625, -0.14192962646484375, -0.1153411865234375, -0.08875274658203125, -0.062164306640625, -0.03557586669921875, -0.0089874267578125, 0.01760101318359375, 0.044189453125, 0.07077789306640625, 0.0973663330078125, 0.12395477294921875, 0.150543212890625, 0.17713165283203125, 0.2037200927734375, 0.23030853271484375, 0.25689697265625, 0.28348541259765625, 0.3100738525390625, 0.33666229248046875, 0.363250732421875, 0.38983917236328125, 0.4164276123046875, 0.44301605224609375, 0.4696044921875, 0.49619293212890625, 0.5227813720703125, 0.5493698120117188, 0.575958251953125, 0.6025466918945312, 0.6291351318359375, 0.6557235717773438, 0.68231201171875, 0.7089004516601562, 0.7354888916015625, 0.7620773315429688, 0.788665771484375, 0.8152542114257812, 0.8418426513671875, 0.8684310913085938, 0.89501953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 10.0, 8.0, 11.0, 18.0, 12.0, 23.0, 32.0, 45.0, 43.0, 56.0, 55.0, 55.0, 65.0, 73.0, 62.0, 58.0, 47.0, 69.0, 49.0, 40.0, 36.0, 27.0, 26.0, 13.0, 20.0, 12.0, 8.0, 2.0, 7.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21630859375, -0.2101287841796875, -0.203948974609375, -0.1977691650390625, -0.19158935546875, -0.1854095458984375, -0.179229736328125, -0.1730499267578125, -0.1668701171875, -0.1606903076171875, -0.154510498046875, -0.1483306884765625, -0.14215087890625, -0.1359710693359375, -0.129791259765625, -0.1236114501953125, -0.117431640625, -0.1112518310546875, -0.105072021484375, -0.0988922119140625, -0.09271240234375, -0.0865325927734375, -0.080352783203125, -0.0741729736328125, -0.0679931640625, -0.0618133544921875, -0.055633544921875, -0.0494537353515625, -0.04327392578125, -0.0370941162109375, -0.030914306640625, -0.0247344970703125, -0.0185546875, -0.0123748779296875, -0.006195068359375, -1.52587890625e-05, 0.00616455078125, 0.0123443603515625, 0.018524169921875, 0.0247039794921875, 0.0308837890625, 0.0370635986328125, 0.043243408203125, 0.0494232177734375, 0.05560302734375, 0.0617828369140625, 0.067962646484375, 0.0741424560546875, 0.080322265625, 0.0865020751953125, 0.092681884765625, 0.0988616943359375, 0.10504150390625, 0.1112213134765625, 0.117401123046875, 0.1235809326171875, 0.1297607421875, 0.1359405517578125, 0.142120361328125, 0.1483001708984375, 0.15447998046875, 0.1606597900390625, 0.166839599609375, 0.1730194091796875, 0.17919921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 2.0, 16.0, 15.0, 10.0, 17.0, 21.0, 26.0, 38.0, 45.0, 69.0, 99.0, 143.0, 343.0, 854.0, 3054.0, 15672.0, 224259.0, 3878808.0, 59874.0, 7804.0, 1923.0, 563.0, 237.0, 121.0, 76.0, 46.0, 22.0, 27.0, 14.0, 19.0, 10.0, 10.0, 8.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.613494873046875, -2.51409912109375, -2.414703369140625, -2.3153076171875, -2.215911865234375, -2.11651611328125, -2.017120361328125, -1.917724609375, -1.818328857421875, -1.71893310546875, -1.619537353515625, -1.5201416015625, -1.420745849609375, -1.32135009765625, -1.221954345703125, -1.12255859375, -1.023162841796875, -0.92376708984375, -0.824371337890625, -0.7249755859375, -0.625579833984375, -0.52618408203125, -0.426788330078125, -0.327392578125, -0.227996826171875, -0.12860107421875, -0.029205322265625, 0.0701904296875, 0.169586181640625, 0.26898193359375, 0.368377685546875, 0.4677734375, 0.567169189453125, 0.66656494140625, 0.765960693359375, 0.8653564453125, 0.964752197265625, 1.06414794921875, 1.163543701171875, 1.262939453125, 1.362335205078125, 1.46173095703125, 1.561126708984375, 1.6605224609375, 1.759918212890625, 1.85931396484375, 1.958709716796875, 2.05810546875, 2.157501220703125, 2.25689697265625, 2.356292724609375, 2.4556884765625, 2.555084228515625, 2.65447998046875, 2.753875732421875, 2.853271484375, 2.952667236328125, 3.05206298828125, 3.151458740234375, 3.2508544921875, 3.350250244140625, 3.44964599609375, 3.549041748046875, 3.6484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 14.0, 25.0, 39.0, 79.0, 204.0, 996.0, 2210.0, 268.0, 103.0, 56.0, 34.0, 10.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.7568359375, -1.7217903137207031, -1.6867446899414062, -1.6516990661621094, -1.6166534423828125, -1.5816078186035156, -1.5465621948242188, -1.5115165710449219, -1.476470947265625, -1.4414253234863281, -1.4063796997070312, -1.3713340759277344, -1.3362884521484375, -1.3012428283691406, -1.2661972045898438, -1.2311515808105469, -1.19610595703125, -1.1610603332519531, -1.1260147094726562, -1.0909690856933594, -1.0559234619140625, -1.0208778381347656, -0.9858322143554688, -0.9507865905761719, -0.915740966796875, -0.8806953430175781, -0.8456497192382812, -0.8106040954589844, -0.7755584716796875, -0.7405128479003906, -0.7054672241210938, -0.6704216003417969, -0.6353759765625, -0.6003303527832031, -0.5652847290039062, -0.5302391052246094, -0.4951934814453125, -0.4601478576660156, -0.42510223388671875, -0.3900566101074219, -0.355010986328125, -0.3199653625488281, -0.28491973876953125, -0.24987411499023438, -0.2148284912109375, -0.17978286743164062, -0.14473724365234375, -0.10969161987304688, -0.07464599609375, -0.039600372314453125, -0.00455474853515625, 0.030490875244140625, 0.0655364990234375, 0.10058212280273438, 0.13562774658203125, 0.17067337036132812, 0.205718994140625, 0.24076461791992188, 0.27581024169921875, 0.3108558654785156, 0.3459014892578125, 0.3809471130371094, 0.41599273681640625, 0.4510383605957031, 0.486083984375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 2.0, 7.0, 5.0, 18.0, 19.0, 28.0, 40.0, 59.0, 77.0, 81.0, 102.0, 114.0, 102.0, 80.0, 65.0, 50.0, 49.0, 25.0, 19.0, 12.0, 9.0, 5.0, 3.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5542678833007812, -2.4611923694610596, -2.368116617202759, -2.275041103363037, -2.1819653511047363, -2.0888898372650146, -1.995814323425293, -1.9027386903762817, -1.8096630573272705, -1.7165874242782593, -1.623511791229248, -1.5304362773895264, -1.4373606443405151, -1.344285011291504, -1.2512094974517822, -1.158133864402771, -1.0650582313537598, -0.9719825983047485, -0.8789070248603821, -0.7858314514160156, -0.6927558183670044, -0.5996801853179932, -0.5066046118736267, -0.41352903842926025, -0.320453405380249, -0.22737780213356018, -0.13430219888687134, -0.041226595640182495, 0.05184900760650635, 0.1449246108531952, 0.23800021409988403, 0.3310757875442505, 0.4241514205932617, 0.517227053642273, 0.6103026270866394, 0.7033782005310059, 0.7964538335800171, 0.8895294666290283, 0.9826050400733948, 1.0756806135177612, 1.1687562465667725, 1.2618318796157837, 1.354907512664795, 1.4479830265045166, 1.5410586595535278, 1.634134292602539, 1.7272098064422607, 1.820285439491272, 1.9133610725402832, 2.006436586380005, 2.0995123386383057, 2.1925878524780273, 2.285663604736328, 2.37873911857605, 2.4718146324157715, 2.5648903846740723, 2.657965898513794, 2.7510414123535156, 2.8441171646118164, 2.937192678451538, 3.0302681922912598, 3.1233439445495605, 3.2164194583892822, 3.309494972229004, 3.4025707244873047]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 6.0, 7.0, 9.0, 8.0, 8.0, 12.0, 16.0, 15.0, 22.0, 27.0, 32.0, 27.0, 33.0, 42.0, 41.0, 43.0, 40.0, 41.0, 37.0, 41.0, 43.0, 27.0, 34.0, 43.0, 38.0, 40.0, 30.0, 30.0, 27.0, 28.0, 27.0, 20.0, 21.0, 15.0, 15.0, 11.0, 5.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.9604204893112183, -1.898557424545288, -1.836694359779358, -1.7748312950134277, -1.712968349456787, -1.651105284690857, -1.5892422199249268, -1.5273791551589966, -1.4655160903930664, -1.4036530256271362, -1.341789960861206, -1.2799270153045654, -1.2180639505386353, -1.156200885772705, -1.094337821006775, -1.0324747562408447, -0.9706118106842041, -0.9087487459182739, -0.8468857407569885, -0.7850226759910583, -0.723159670829773, -0.6612966060638428, -0.5994335412979126, -0.5375704765319824, -0.475707471370697, -0.41384443640708923, -0.35198140144348145, -0.29011833667755127, -0.22825530171394348, -0.1663922667503357, -0.10452920198440552, -0.04266616702079773, 0.01919698715209961, 0.081060029566288, 0.14292307198047638, 0.20478612184524536, 0.26664915680885315, 0.32851219177246094, 0.3903752565383911, 0.4522382915019989, 0.5141013264656067, 0.5759643912315369, 0.6378273963928223, 0.6996904611587524, 0.7615535259246826, 0.823416531085968, 0.8852795958518982, 0.9471426010131836, 1.0090056657791138, 1.070868730545044, 1.1327317953109741, 1.1945948600769043, 1.256457805633545, 1.318320870399475, 1.3801839351654053, 1.4420469999313354, 1.5039100646972656, 1.5657731294631958, 1.627636194229126, 1.6894991397857666, 1.7513622045516968, 1.813225269317627, 1.8750883340835571, 1.9369513988494873, 1.998814344406128]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 13.0, 13.0, 21.0, 24.0, 39.0, 57.0, 70.0, 114.0, 159.0, 190.0, 292.0, 455.0, 659.0, 1014.0, 1530.0, 2412.0, 3952.0, 6436.0, 10849.0, 19083.0, 35095.0, 66047.0, 132460.0, 274475.0, 244819.0, 114991.0, 58531.0, 31695.0, 17204.0, 9925.0, 5884.0, 3476.0, 2255.0, 1398.0, 880.0, 616.0, 429.0, 279.0, 190.0, 150.0, 110.0, 62.0, 57.0, 35.0, 29.0, 15.0, 15.0, 10.0, 12.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.68212890625, -0.6613998413085938, -0.6406707763671875, -0.6199417114257812, -0.599212646484375, -0.5784835815429688, -0.5577545166015625, -0.5370254516601562, -0.51629638671875, -0.49556732177734375, -0.4748382568359375, -0.45410919189453125, -0.433380126953125, -0.41265106201171875, -0.3919219970703125, -0.37119293212890625, -0.3504638671875, -0.32973480224609375, -0.3090057373046875, -0.28827667236328125, -0.267547607421875, -0.24681854248046875, -0.2260894775390625, -0.20536041259765625, -0.18463134765625, -0.16390228271484375, -0.1431732177734375, -0.12244415283203125, -0.101715087890625, -0.08098602294921875, -0.0602569580078125, -0.03952789306640625, -0.018798828125, 0.00193023681640625, 0.0226593017578125, 0.04338836669921875, 0.064117431640625, 0.08484649658203125, 0.1055755615234375, 0.12630462646484375, 0.14703369140625, 0.16776275634765625, 0.1884918212890625, 0.20922088623046875, 0.229949951171875, 0.25067901611328125, 0.2714080810546875, 0.29213714599609375, 0.3128662109375, 0.33359527587890625, 0.3543243408203125, 0.37505340576171875, 0.395782470703125, 0.41651153564453125, 0.4372406005859375, 0.45796966552734375, 0.47869873046875, 0.49942779541015625, 0.5201568603515625, 0.5408859252929688, 0.561614990234375, 0.5823440551757812, 0.6030731201171875, 0.6238021850585938, 0.64453125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 10.0, 9.0, 18.0, 19.0, 31.0, 31.0, 27.0, 17.0, 49.0, 44.0, 37.0, 55.0, 57.0, 45.0, 62.0, 48.0, 43.0, 51.0, 50.0, 32.0, 34.0, 40.0, 23.0, 34.0, 18.0, 21.0, 17.0, 20.0, 8.0, 11.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2049560546875, -0.19884681701660156, -0.19273757934570312, -0.1866283416748047, -0.18051910400390625, -0.1744098663330078, -0.16830062866210938, -0.16219139099121094, -0.1560821533203125, -0.14997291564941406, -0.14386367797851562, -0.1377544403076172, -0.13164520263671875, -0.1255359649658203, -0.11942672729492188, -0.11331748962402344, -0.107208251953125, -0.10109901428222656, -0.09498977661132812, -0.08888053894042969, -0.08277130126953125, -0.07666206359863281, -0.07055282592773438, -0.06444358825683594, -0.0583343505859375, -0.05222511291503906, -0.046115875244140625, -0.04000663757324219, -0.03389739990234375, -0.027788162231445312, -0.021678924560546875, -0.015569686889648438, -0.00946044921875, -0.0033512115478515625, 0.002758026123046875, 0.008867263793945312, 0.01497650146484375, 0.021085739135742188, 0.027194976806640625, 0.03330421447753906, 0.0394134521484375, 0.04552268981933594, 0.051631927490234375, 0.05774116516113281, 0.06385040283203125, 0.06995964050292969, 0.07606887817382812, 0.08217811584472656, 0.088287353515625, 0.09439659118652344, 0.10050582885742188, 0.10661506652832031, 0.11272430419921875, 0.11883354187011719, 0.12494277954101562, 0.13105201721191406, 0.1371612548828125, 0.14327049255371094, 0.14937973022460938, 0.1554889678955078, 0.16159820556640625, 0.1677074432373047, 0.17381668090820312, 0.17992591857910156, 0.18603515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 8.0, 9.0, 10.0, 18.0, 22.0, 44.0, 38.0, 58.0, 74.0, 91.0, 94.0, 153.0, 228.0, 342.0, 516.0, 895.0, 1605.0, 3245.0, 7018.0, 18041.0, 58285.0, 271584.0, 527299.0, 108700.0, 29592.0, 10671.0, 4560.0, 2227.0, 1091.0, 650.0, 394.0, 256.0, 200.0, 114.0, 87.0, 61.0, 56.0, 43.0, 38.0, 24.0, 22.0, 18.0, 9.0, 11.0, 8.0, 8.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2275390625, -1.1855316162109375, -1.143524169921875, -1.1015167236328125, -1.05950927734375, -1.0175018310546875, -0.975494384765625, -0.9334869384765625, -0.8914794921875, -0.8494720458984375, -0.807464599609375, -0.7654571533203125, -0.72344970703125, -0.6814422607421875, -0.639434814453125, -0.5974273681640625, -0.555419921875, -0.5134124755859375, -0.471405029296875, -0.4293975830078125, -0.38739013671875, -0.3453826904296875, -0.303375244140625, -0.2613677978515625, -0.2193603515625, -0.1773529052734375, -0.135345458984375, -0.0933380126953125, -0.05133056640625, -0.0093231201171875, 0.032684326171875, 0.0746917724609375, 0.11669921875, 0.1587066650390625, 0.200714111328125, 0.2427215576171875, 0.28472900390625, 0.3267364501953125, 0.368743896484375, 0.4107513427734375, 0.4527587890625, 0.4947662353515625, 0.536773681640625, 0.5787811279296875, 0.62078857421875, 0.6627960205078125, 0.704803466796875, 0.7468109130859375, 0.788818359375, 0.8308258056640625, 0.872833251953125, 0.9148406982421875, 0.95684814453125, 0.9988555908203125, 1.040863037109375, 1.0828704833984375, 1.1248779296875, 1.1668853759765625, 1.208892822265625, 1.2509002685546875, 1.29290771484375, 1.3349151611328125, 1.376922607421875, 1.4189300537109375, 1.4609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 10.0, 8.0, 13.0, 13.0, 14.0, 19.0, 22.0, 16.0, 25.0, 39.0, 27.0, 32.0, 53.0, 46.0, 43.0, 66.0, 60.0, 60.0, 46.0, 47.0, 40.0, 53.0, 29.0, 38.0, 25.0, 19.0, 24.0, 22.0, 17.0, 15.0, 8.0, 10.0, 7.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.0595550537109375, -1.025360107421875, -0.9911651611328125, -0.95697021484375, -0.9227752685546875, -0.888580322265625, -0.8543853759765625, -0.8201904296875, -0.7859954833984375, -0.751800537109375, -0.7176055908203125, -0.68341064453125, -0.6492156982421875, -0.615020751953125, -0.5808258056640625, -0.546630859375, -0.5124359130859375, -0.478240966796875, -0.4440460205078125, -0.40985107421875, -0.3756561279296875, -0.341461181640625, -0.3072662353515625, -0.2730712890625, -0.2388763427734375, -0.204681396484375, -0.1704864501953125, -0.13629150390625, -0.1020965576171875, -0.067901611328125, -0.0337066650390625, 0.00048828125, 0.0346832275390625, 0.068878173828125, 0.1030731201171875, 0.13726806640625, 0.1714630126953125, 0.205657958984375, 0.2398529052734375, 0.2740478515625, 0.3082427978515625, 0.342437744140625, 0.3766326904296875, 0.41082763671875, 0.4450225830078125, 0.479217529296875, 0.5134124755859375, 0.547607421875, 0.5818023681640625, 0.615997314453125, 0.6501922607421875, 0.68438720703125, 0.7185821533203125, 0.752777099609375, 0.7869720458984375, 0.8211669921875, 0.8553619384765625, 0.889556884765625, 0.9237518310546875, 0.95794677734375, 0.9921417236328125, 1.026336669921875, 1.0605316162109375, 1.0947265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 6.0, 17.0, 13.0, 23.0, 52.0, 67.0, 159.0, 330.0, 863.0, 3888.0, 94861.0, 934626.0, 11120.0, 1560.0, 481.0, 213.0, 100.0, 50.0, 41.0, 27.0, 15.0, 11.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.4100341796875, -4.273193359375, -4.1363525390625, -3.99951171875, -3.8626708984375, -3.725830078125, -3.5889892578125, -3.4521484375, -3.3153076171875, -3.178466796875, -3.0416259765625, -2.90478515625, -2.7679443359375, -2.631103515625, -2.4942626953125, -2.357421875, -2.2205810546875, -2.083740234375, -1.9468994140625, -1.81005859375, -1.6732177734375, -1.536376953125, -1.3995361328125, -1.2626953125, -1.1258544921875, -0.989013671875, -0.8521728515625, -0.71533203125, -0.5784912109375, -0.441650390625, -0.3048095703125, -0.16796875, -0.0311279296875, 0.105712890625, 0.2425537109375, 0.37939453125, 0.5162353515625, 0.653076171875, 0.7899169921875, 0.9267578125, 1.0635986328125, 1.200439453125, 1.3372802734375, 1.47412109375, 1.6109619140625, 1.747802734375, 1.8846435546875, 2.021484375, 2.1583251953125, 2.295166015625, 2.4320068359375, 2.56884765625, 2.7056884765625, 2.842529296875, 2.9793701171875, 3.1162109375, 3.2530517578125, 3.389892578125, 3.5267333984375, 3.66357421875, 3.8004150390625, 3.937255859375, 4.0740966796875, 4.2109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 3.0, 5.0, 11.0, 11.0, 31.0, 30.0, 64.0, 73.0, 182.0, 283.0, 101.0, 67.0, 40.0, 37.0, 20.0, 13.0, 7.0, 3.0, 7.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003609657287597656, -0.00034904852509498596, -0.0003371313214302063, -0.00032521411776542664, -0.00031329691410064697, -0.0003013797104358673, -0.00028946250677108765, -0.000277545303106308, -0.0002656280994415283, -0.00025371089577674866, -0.000241793692111969, -0.00022987648844718933, -0.00021795928478240967, -0.00020604208111763, -0.00019412487745285034, -0.00018220767378807068, -0.00017029047012329102, -0.00015837326645851135, -0.0001464560627937317, -0.00013453885912895203, -0.00012262165546417236, -0.0001107044517993927, -9.878724813461304e-05, -8.687004446983337e-05, -7.495284080505371e-05, -6.303563714027405e-05, -5.1118433475494385e-05, -3.920122981071472e-05, -2.728402614593506e-05, -1.5366822481155396e-05, -3.4496188163757324e-06, 8.46758484840393e-06, 2.0384788513183594e-05, 3.230199217796326e-05, 4.421919584274292e-05, 5.613639950752258e-05, 6.805360317230225e-05, 7.997080683708191e-05, 9.188801050186157e-05, 0.00010380521416664124, 0.0001157224178314209, 0.00012763962149620056, 0.00013955682516098022, 0.0001514740288257599, 0.00016339123249053955, 0.00017530843615531921, 0.00018722563982009888, 0.00019914284348487854, 0.0002110600471496582, 0.00022297725081443787, 0.00023489445447921753, 0.0002468116581439972, 0.00025872886180877686, 0.0002706460654735565, 0.0002825632691383362, 0.00029448047280311584, 0.0003063976764678955, 0.00031831488013267517, 0.00033023208379745483, 0.0003421492874622345, 0.00035406649112701416, 0.0003659836947917938, 0.0003779008984565735, 0.00038981810212135315, 0.0004017353057861328]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 7.0, 10.0, 13.0, 19.0, 29.0, 37.0, 64.0, 107.0, 176.0, 295.0, 532.0, 974.0, 2104.0, 6206.0, 69105.0, 938016.0, 23133.0, 4209.0, 1625.0, 746.0, 422.0, 250.0, 142.0, 90.0, 61.0, 41.0, 30.0, 25.0, 14.0, 9.0, 11.0, 9.0, 4.0, 3.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.828125, -2.73175048828125, -2.6353759765625, -2.53900146484375, -2.442626953125, -2.34625244140625, -2.2498779296875, -2.15350341796875, -2.05712890625, -1.96075439453125, -1.8643798828125, -1.76800537109375, -1.671630859375, -1.57525634765625, -1.4788818359375, -1.38250732421875, -1.2861328125, -1.18975830078125, -1.0933837890625, -0.99700927734375, -0.900634765625, -0.80426025390625, -0.7078857421875, -0.61151123046875, -0.51513671875, -0.41876220703125, -0.3223876953125, -0.22601318359375, -0.129638671875, -0.03326416015625, 0.0631103515625, 0.15948486328125, 0.255859375, 0.35223388671875, 0.4486083984375, 0.54498291015625, 0.641357421875, 0.73773193359375, 0.8341064453125, 0.93048095703125, 1.02685546875, 1.12322998046875, 1.2196044921875, 1.31597900390625, 1.412353515625, 1.50872802734375, 1.6051025390625, 1.70147705078125, 1.7978515625, 1.89422607421875, 1.9906005859375, 2.08697509765625, 2.183349609375, 2.27972412109375, 2.3760986328125, 2.47247314453125, 2.56884765625, 2.66522216796875, 2.7615966796875, 2.85797119140625, 2.954345703125, 3.05072021484375, 3.1470947265625, 3.24346923828125, 3.33984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 26.0, 36.0, 108.0, 247.0, 303.0, 142.0, 63.0, 25.0, 8.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.7400360107421875, -2.673431396484375, -2.6068267822265625, -2.54022216796875, -2.4736175537109375, -2.407012939453125, -2.3404083251953125, -2.2738037109375, -2.2071990966796875, -2.140594482421875, -2.0739898681640625, -2.00738525390625, -1.9407806396484375, -1.874176025390625, -1.8075714111328125, -1.740966796875, -1.6743621826171875, -1.607757568359375, -1.5411529541015625, -1.47454833984375, -1.4079437255859375, -1.341339111328125, -1.2747344970703125, -1.2081298828125, -1.1415252685546875, -1.074920654296875, -1.0083160400390625, -0.94171142578125, -0.8751068115234375, -0.808502197265625, -0.7418975830078125, -0.67529296875, -0.6086883544921875, -0.542083740234375, -0.4754791259765625, -0.40887451171875, -0.3422698974609375, -0.275665283203125, -0.2090606689453125, -0.1424560546875, -0.0758514404296875, -0.009246826171875, 0.0573577880859375, 0.12396240234375, 0.1905670166015625, 0.257171630859375, 0.3237762451171875, 0.390380859375, 0.4569854736328125, 0.523590087890625, 0.5901947021484375, 0.65679931640625, 0.7234039306640625, 0.790008544921875, 0.8566131591796875, 0.9232177734375, 0.9898223876953125, 1.056427001953125, 1.1230316162109375, 1.18963623046875, 1.2562408447265625, 1.322845458984375, 1.3894500732421875, 1.4560546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 18.0, 48.0, 131.0, 254.0, 269.0, 172.0, 73.0, 19.0, 11.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.50525665283203, -27.73777198791504, -26.970287322998047, -26.202802658081055, -25.435317993164062, -24.667831420898438, -23.900348663330078, -23.132862091064453, -22.36537742614746, -21.59789276123047, -20.830408096313477, -20.062923431396484, -19.295438766479492, -18.5279541015625, -17.760467529296875, -16.992982864379883, -16.22549819946289, -15.458013534545898, -14.690528869628906, -13.923044204711914, -13.155558586120605, -12.388073921203613, -11.620589256286621, -10.853103637695312, -10.085620880126953, -9.318136215209961, -8.550651550292969, -7.783166408538818, -7.015681266784668, -6.248196601867676, -5.480711936950684, -4.713226795196533, -3.945741653442383, -3.1782567501068115, -2.4107718467712402, -1.643287181854248, -0.8758022785186768, -0.10831737518310547, 0.6591672897338867, 1.426652431488037, 2.1941370964050293, 2.9616219997406006, 3.729106903076172, 4.496591567993164, 5.264076232910156, 6.031561374664307, 6.799046039581299, 7.566531181335449, 8.334015846252441, 9.101500511169434, 9.868985176086426, 10.636470794677734, 11.403955459594727, 12.171440124511719, 12.938924789428711, 13.706409454345703, 14.473894119262695, 15.241378784179688, 16.00886344909668, 16.776348114013672, 17.543832778930664, 18.311317443847656, 19.07880401611328, 19.846288681030273, 20.613773345947266]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 6.0, 1.0, 7.0, 6.0, 8.0, 12.0, 6.0, 11.0, 14.0, 17.0, 22.0, 13.0, 21.0, 24.0, 30.0, 22.0, 37.0, 26.0, 42.0, 36.0, 49.0, 50.0, 45.0, 52.0, 37.0, 30.0, 44.0, 29.0, 41.0, 33.0, 34.0, 18.0, 24.0, 28.0, 23.0, 11.0, 20.0, 17.0, 15.0, 15.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1119232177734375, -4.931403160095215, -4.75088357925415, -4.570363521575928, -4.389843940734863, -4.209323883056641, -4.028803825378418, -3.8482840061187744, -3.667764186859131, -3.4872443675994873, -3.3067245483398438, -3.126204490661621, -2.9456846714019775, -2.765164852142334, -2.5846447944641113, -2.4041249752044678, -2.223605155944824, -2.0430853366851807, -1.8625653982162476, -1.6820454597473145, -1.501525640487671, -1.3210058212280273, -1.1404858827590942, -0.9599659442901611, -0.7794461250305176, -0.5989262461662292, -0.4184063673019409, -0.2378864884376526, -0.05736660957336426, 0.12315326929092407, 0.3036731481552124, 0.4841930866241455, 0.6647124290466309, 0.8452323079109192, 1.0257521867752075, 1.2062721252441406, 1.3867919445037842, 1.5673117637634277, 1.7478317022323608, 1.928351640701294, 2.1088714599609375, 2.289391279220581, 2.4699110984802246, 2.6504311561584473, 2.830950975418091, 3.0114707946777344, 3.191990852355957, 3.3725106716156006, 3.553030490875244, 3.7335503101348877, 3.9140701293945312, 4.094590187072754, 4.275110244750977, 4.455629825592041, 4.636149883270264, 4.816669464111328, 4.997189521789551, 5.177709579467773, 5.358229160308838, 5.5387492179870605, 5.719268798828125, 5.899788856506348, 6.08030891418457, 6.260828971862793, 6.441348552703857]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 10.0, 22.0, 39.0, 57.0, 106.0, 161.0, 282.0, 526.0, 1011.0, 2324.0, 5712.0, 17077.0, 71619.0, 1597546.0, 2396214.0, 74207.0, 16839.0, 5780.0, 2359.0, 1084.0, 575.0, 290.0, 178.0, 99.0, 56.0, 37.0, 27.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2323760986328125, -1.188385009765625, -1.1443939208984375, -1.10040283203125, -1.0564117431640625, -1.012420654296875, -0.9684295654296875, -0.9244384765625, -0.8804473876953125, -0.836456298828125, -0.7924652099609375, -0.74847412109375, -0.7044830322265625, -0.660491943359375, -0.6165008544921875, -0.572509765625, -0.5285186767578125, -0.484527587890625, -0.4405364990234375, -0.39654541015625, -0.3525543212890625, -0.308563232421875, -0.2645721435546875, -0.2205810546875, -0.1765899658203125, -0.132598876953125, -0.0886077880859375, -0.04461669921875, -0.0006256103515625, 0.043365478515625, 0.0873565673828125, 0.13134765625, 0.1753387451171875, 0.219329833984375, 0.2633209228515625, 0.30731201171875, 0.3513031005859375, 0.395294189453125, 0.4392852783203125, 0.4832763671875, 0.5272674560546875, 0.571258544921875, 0.6152496337890625, 0.65924072265625, 0.7032318115234375, 0.747222900390625, 0.7912139892578125, 0.835205078125, 0.8791961669921875, 0.923187255859375, 0.9671783447265625, 1.01116943359375, 1.0551605224609375, 1.099151611328125, 1.1431427001953125, 1.1871337890625, 1.2311248779296875, 1.275115966796875, 1.3191070556640625, 1.36309814453125, 1.4070892333984375, 1.451080322265625, 1.4950714111328125, 1.5390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 1.0, 9.0, 8.0, 12.0, 11.0, 23.0, 17.0, 31.0, 28.0, 31.0, 43.0, 37.0, 58.0, 61.0, 52.0, 57.0, 50.0, 51.0, 59.0, 43.0, 40.0, 51.0, 48.0, 32.0, 30.0, 22.0, 24.0, 23.0, 15.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24745750427246094, -0.24027633666992188, -0.2330951690673828, -0.22591400146484375, -0.2187328338623047, -0.21155166625976562, -0.20437049865722656, -0.1971893310546875, -0.19000816345214844, -0.18282699584960938, -0.1756458282470703, -0.16846466064453125, -0.1612834930419922, -0.15410232543945312, -0.14692115783691406, -0.139739990234375, -0.13255882263183594, -0.12537765502929688, -0.11819648742675781, -0.11101531982421875, -0.10383415222167969, -0.09665298461914062, -0.08947181701660156, -0.0822906494140625, -0.07510948181152344, -0.06792831420898438, -0.06074714660644531, -0.05356597900390625, -0.04638481140136719, -0.039203643798828125, -0.03202247619628906, -0.02484130859375, -0.017660140991210938, -0.010478973388671875, -0.0032978057861328125, 0.00388336181640625, 0.011064529418945312, 0.018245697021484375, 0.025426864624023438, 0.0326080322265625, 0.03978919982910156, 0.046970367431640625, 0.05415153503417969, 0.06133270263671875, 0.06851387023925781, 0.07569503784179688, 0.08287620544433594, 0.090057373046875, 0.09723854064941406, 0.10441970825195312, 0.11160087585449219, 0.11878204345703125, 0.1259632110595703, 0.13314437866210938, 0.14032554626464844, 0.1475067138671875, 0.15468788146972656, 0.16186904907226562, 0.1690502166748047, 0.17623138427734375, 0.1834125518798828, 0.19059371948242188, 0.19777488708496094, 0.2049560546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 9.0, 7.0, 8.0, 11.0, 22.0, 43.0, 82.0, 105.0, 163.0, 282.0, 480.0, 839.0, 1710.0, 3716.0, 10035.0, 36995.0, 261033.0, 3637752.0, 194431.0, 30824.0, 8715.0, 3406.0, 1572.0, 852.0, 475.0, 281.0, 159.0, 108.0, 63.0, 42.0, 26.0, 14.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6762237548828125, -1.615142822265625, -1.5540618896484375, -1.49298095703125, -1.4319000244140625, -1.370819091796875, -1.3097381591796875, -1.2486572265625, -1.1875762939453125, -1.126495361328125, -1.0654144287109375, -1.00433349609375, -0.9432525634765625, -0.882171630859375, -0.8210906982421875, -0.760009765625, -0.6989288330078125, -0.637847900390625, -0.5767669677734375, -0.51568603515625, -0.4546051025390625, -0.393524169921875, -0.3324432373046875, -0.2713623046875, -0.2102813720703125, -0.149200439453125, -0.0881195068359375, -0.02703857421875, 0.0340423583984375, 0.095123291015625, 0.1562042236328125, 0.21728515625, 0.2783660888671875, 0.339447021484375, 0.4005279541015625, 0.46160888671875, 0.5226898193359375, 0.583770751953125, 0.6448516845703125, 0.7059326171875, 0.7670135498046875, 0.828094482421875, 0.8891754150390625, 0.95025634765625, 1.0113372802734375, 1.072418212890625, 1.1334991455078125, 1.194580078125, 1.2556610107421875, 1.316741943359375, 1.3778228759765625, 1.43890380859375, 1.4999847412109375, 1.561065673828125, 1.6221466064453125, 1.6832275390625, 1.7443084716796875, 1.805389404296875, 1.8664703369140625, 1.92755126953125, 1.9886322021484375, 2.049713134765625, 2.1107940673828125, 2.171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 0.0, 11.0, 8.0, 12.0, 9.0, 19.0, 19.0, 38.0, 56.0, 81.0, 146.0, 268.0, 785.0, 1653.0, 419.0, 214.0, 113.0, 56.0, 44.0, 25.0, 28.0, 17.0, 14.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.83251953125, -0.8088912963867188, -0.7852630615234375, -0.7616348266601562, -0.738006591796875, -0.7143783569335938, -0.6907501220703125, -0.6671218872070312, -0.64349365234375, -0.6198654174804688, -0.5962371826171875, -0.5726089477539062, -0.548980712890625, -0.5253524780273438, -0.5017242431640625, -0.47809600830078125, -0.4544677734375, -0.43083953857421875, -0.4072113037109375, -0.38358306884765625, -0.359954833984375, -0.33632659912109375, -0.3126983642578125, -0.28907012939453125, -0.26544189453125, -0.24181365966796875, -0.2181854248046875, -0.19455718994140625, -0.170928955078125, -0.14730072021484375, -0.1236724853515625, -0.10004425048828125, -0.076416015625, -0.05278778076171875, -0.0291595458984375, -0.00553131103515625, 0.018096923828125, 0.04172515869140625, 0.0653533935546875, 0.08898162841796875, 0.11260986328125, 0.13623809814453125, 0.1598663330078125, 0.18349456787109375, 0.207122802734375, 0.23075103759765625, 0.2543792724609375, 0.27800750732421875, 0.3016357421875, 0.32526397705078125, 0.3488922119140625, 0.37252044677734375, 0.396148681640625, 0.41977691650390625, 0.4434051513671875, 0.46703338623046875, 0.49066162109375, 0.5142898559570312, 0.5379180908203125, 0.5615463256835938, 0.585174560546875, 0.6088027954101562, 0.6324310302734375, 0.6560592651367188, 0.6796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 25.0, 45.0, 95.0, 151.0, 192.0, 168.0, 127.0, 82.0, 59.0, 18.0, 15.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.399649620056152, -5.206660747528076, -5.013671398162842, -4.820682525634766, -4.627693176269531, -4.434704303741455, -4.241715431213379, -4.0487260818481445, -3.8557372093200684, -3.662748098373413, -3.469758987426758, -3.2767701148986816, -3.0837810039520264, -2.890791893005371, -2.697803020477295, -2.5048139095306396, -2.3118247985839844, -2.118835687637329, -1.9258466958999634, -1.7328577041625977, -1.5398685932159424, -1.346879482269287, -1.1538904905319214, -0.9609014987945557, -0.7679123878479004, -0.5749233365058899, -0.3819342851638794, -0.1889452338218689, 0.0040438175201416016, 0.1970328688621521, 0.3900219202041626, 0.5830109119415283, 0.7760000228881836, 0.9689890742301941, 1.1619781255722046, 1.3549671173095703, 1.5479562282562256, 1.7409453392028809, 1.9339343309402466, 2.1269233226776123, 2.3199124336242676, 2.512901544570923, 2.705890655517578, 2.8988795280456543, 3.0918686389923096, 3.284857749938965, 3.477846622467041, 3.6708357334136963, 3.8638248443603516, 4.056813716888428, 4.249803066253662, 4.442791938781738, 4.635781288146973, 4.828770160675049, 5.021759033203125, 5.214748382568359, 5.4077372550964355, 5.600726127624512, 5.793715476989746, 5.986704349517822, 6.179693222045898, 6.372682571411133, 6.565671443939209, 6.758660316467285, 6.9516496658325195]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 12.0, 6.0, 9.0, 14.0, 13.0, 17.0, 18.0, 22.0, 27.0, 28.0, 26.0, 43.0, 37.0, 43.0, 34.0, 38.0, 38.0, 54.0, 55.0, 53.0, 43.0, 44.0, 39.0, 40.0, 31.0, 38.0, 28.0, 18.0, 19.0, 15.0, 18.0, 16.0, 13.0, 6.0, 6.0, 8.0, 9.0, 7.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.3538808822631836, -2.284026861190796, -2.2141730785369873, -2.1443190574645996, -2.074465274810791, -2.0046112537384033, -1.9347573518753052, -1.864903450012207, -1.7950494289398193, -1.7251955270767212, -1.655341625213623, -1.5854876041412354, -1.5156337022781372, -1.445779800415039, -1.375925898551941, -1.3060719966888428, -1.2362180948257446, -1.1663641929626465, -1.0965102910995483, -1.0266563892364502, -0.9568023681640625, -0.8869484663009644, -0.8170945644378662, -0.7472406625747681, -0.6773867011070251, -0.607532799243927, -0.5376788377761841, -0.46782493591308594, -0.3979710042476654, -0.3281170725822449, -0.25826317071914673, -0.1884092390537262, -0.11855530738830566, -0.04870138317346573, 0.021152541041374207, 0.09100645780563354, 0.16086038947105408, 0.2307143211364746, 0.30056822299957275, 0.3704221546649933, 0.4402760863304138, 0.510129988193512, 0.5799839496612549, 0.649837851524353, 0.7196917533874512, 0.7895457148551941, 0.8593996167182922, 0.9292535781860352, 0.9991074800491333, 1.0689613819122314, 1.1388152837753296, 1.2086691856384277, 1.2785232067108154, 1.3483771085739136, 1.4182310104370117, 1.4880849123001099, 1.557938814163208, 1.6277927160263062, 1.6976466178894043, 1.767500638961792, 1.8373545408248901, 1.9072084426879883, 1.9770623445510864, 2.0469162464141846, 2.1167702674865723]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 6.0, 7.0, 12.0, 19.0, 14.0, 38.0, 36.0, 77.0, 84.0, 133.0, 188.0, 287.0, 428.0, 751.0, 1208.0, 2179.0, 4054.0, 7917.0, 16325.0, 33880.0, 76174.0, 282508.0, 434611.0, 103358.0, 42777.0, 20169.0, 9765.0, 4999.0, 2685.0, 1461.0, 883.0, 537.0, 323.0, 182.0, 153.0, 96.0, 63.0, 44.0, 36.0, 27.0, 18.0, 11.0, 15.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-1.001953125, -0.97344970703125, -0.9449462890625, -0.91644287109375, -0.887939453125, -0.85943603515625, -0.8309326171875, -0.80242919921875, -0.77392578125, -0.74542236328125, -0.7169189453125, -0.68841552734375, -0.659912109375, -0.63140869140625, -0.6029052734375, -0.57440185546875, -0.5458984375, -0.51739501953125, -0.4888916015625, -0.46038818359375, -0.431884765625, -0.40338134765625, -0.3748779296875, -0.34637451171875, -0.31787109375, -0.28936767578125, -0.2608642578125, -0.23236083984375, -0.203857421875, -0.17535400390625, -0.1468505859375, -0.11834716796875, -0.08984375, -0.06134033203125, -0.0328369140625, -0.00433349609375, 0.024169921875, 0.05267333984375, 0.0811767578125, 0.10968017578125, 0.13818359375, 0.16668701171875, 0.1951904296875, 0.22369384765625, 0.252197265625, 0.28070068359375, 0.3092041015625, 0.33770751953125, 0.3662109375, 0.39471435546875, 0.4232177734375, 0.45172119140625, 0.480224609375, 0.50872802734375, 0.5372314453125, 0.56573486328125, 0.59423828125, 0.62274169921875, 0.6512451171875, 0.67974853515625, 0.708251953125, 0.73675537109375, 0.7652587890625, 0.79376220703125, 0.822265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 9.0, 6.0, 9.0, 18.0, 23.0, 29.0, 17.0, 36.0, 39.0, 41.0, 34.0, 52.0, 39.0, 44.0, 49.0, 53.0, 49.0, 63.0, 50.0, 62.0, 42.0, 53.0, 31.0, 33.0, 25.0, 23.0, 13.0, 13.0, 16.0, 10.0, 6.0, 2.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289306640625, -0.28157997131347656, -0.2738533020019531, -0.2661266326904297, -0.25839996337890625, -0.2506732940673828, -0.24294662475585938, -0.23521995544433594, -0.2274932861328125, -0.21976661682128906, -0.21203994750976562, -0.2043132781982422, -0.19658660888671875, -0.1888599395751953, -0.18113327026367188, -0.17340660095214844, -0.165679931640625, -0.15795326232910156, -0.15022659301757812, -0.1424999237060547, -0.13477325439453125, -0.1270465850830078, -0.11931991577148438, -0.11159324645996094, -0.1038665771484375, -0.09613990783691406, -0.08841323852539062, -0.08068656921386719, -0.07295989990234375, -0.06523323059082031, -0.057506561279296875, -0.04977989196777344, -0.04205322265625, -0.03432655334472656, -0.026599884033203125, -0.018873214721679688, -0.01114654541015625, -0.0034198760986328125, 0.004306793212890625, 0.012033462524414062, 0.0197601318359375, 0.027486801147460938, 0.035213470458984375, 0.04294013977050781, 0.05066680908203125, 0.05839347839355469, 0.06612014770507812, 0.07384681701660156, 0.081573486328125, 0.08930015563964844, 0.09702682495117188, 0.10475349426269531, 0.11248016357421875, 0.12020683288574219, 0.12793350219726562, 0.13566017150878906, 0.1433868408203125, 0.15111351013183594, 0.15884017944335938, 0.1665668487548828, 0.17429351806640625, 0.1820201873779297, 0.18974685668945312, 0.19747352600097656, 0.2052001953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 6.0, 7.0, 10.0, 14.0, 26.0, 32.0, 35.0, 51.0, 91.0, 137.0, 217.0, 336.0, 549.0, 953.0, 2164.0, 6211.0, 24777.0, 132702.0, 745423.0, 105034.0, 20327.0, 5218.0, 1885.0, 867.0, 507.0, 333.0, 223.0, 121.0, 78.0, 55.0, 45.0, 36.0, 23.0, 16.0, 11.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7179718017578125, -1.661529541015625, -1.6050872802734375, -1.54864501953125, -1.4922027587890625, -1.435760498046875, -1.3793182373046875, -1.3228759765625, -1.2664337158203125, -1.209991455078125, -1.1535491943359375, -1.09710693359375, -1.0406646728515625, -0.984222412109375, -0.9277801513671875, -0.871337890625, -0.8148956298828125, -0.758453369140625, -0.7020111083984375, -0.64556884765625, -0.5891265869140625, -0.532684326171875, -0.4762420654296875, -0.4197998046875, -0.3633575439453125, -0.306915283203125, -0.2504730224609375, -0.19403076171875, -0.1375885009765625, -0.081146240234375, -0.0247039794921875, 0.03173828125, 0.0881805419921875, 0.144622802734375, 0.2010650634765625, 0.25750732421875, 0.3139495849609375, 0.370391845703125, 0.4268341064453125, 0.4832763671875, 0.5397186279296875, 0.596160888671875, 0.6526031494140625, 0.70904541015625, 0.7654876708984375, 0.821929931640625, 0.8783721923828125, 0.934814453125, 0.9912567138671875, 1.047698974609375, 1.1041412353515625, 1.16058349609375, 1.2170257568359375, 1.273468017578125, 1.3299102783203125, 1.3863525390625, 1.4427947998046875, 1.499237060546875, 1.5556793212890625, 1.61212158203125, 1.6685638427734375, 1.725006103515625, 1.7814483642578125, 1.837890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 1.0, 6.0, 9.0, 13.0, 13.0, 21.0, 11.0, 27.0, 31.0, 29.0, 43.0, 33.0, 46.0, 41.0, 42.0, 58.0, 48.0, 58.0, 43.0, 39.0, 41.0, 45.0, 56.0, 42.0, 24.0, 32.0, 17.0, 25.0, 23.0, 16.0, 13.0, 10.0, 9.0, 10.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.0998992919921875, -1.066986083984375, -1.0340728759765625, -1.00115966796875, -0.9682464599609375, -0.935333251953125, -0.9024200439453125, -0.8695068359375, -0.8365936279296875, -0.803680419921875, -0.7707672119140625, -0.73785400390625, -0.7049407958984375, -0.672027587890625, -0.6391143798828125, -0.606201171875, -0.5732879638671875, -0.540374755859375, -0.5074615478515625, -0.47454833984375, -0.4416351318359375, -0.408721923828125, -0.3758087158203125, -0.3428955078125, -0.3099822998046875, -0.277069091796875, -0.2441558837890625, -0.21124267578125, -0.1783294677734375, -0.145416259765625, -0.1125030517578125, -0.07958984375, -0.0466766357421875, -0.013763427734375, 0.0191497802734375, 0.05206298828125, 0.0849761962890625, 0.117889404296875, 0.1508026123046875, 0.1837158203125, 0.2166290283203125, 0.249542236328125, 0.2824554443359375, 0.31536865234375, 0.3482818603515625, 0.381195068359375, 0.4141082763671875, 0.447021484375, 0.4799346923828125, 0.512847900390625, 0.5457611083984375, 0.57867431640625, 0.6115875244140625, 0.644500732421875, 0.6774139404296875, 0.7103271484375, 0.7432403564453125, 0.776153564453125, 0.8090667724609375, 0.84197998046875, 0.8748931884765625, 0.907806396484375, 0.9407196044921875, 0.9736328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 14.0, 22.0, 45.0, 73.0, 121.0, 243.0, 423.0, 882.0, 2808.0, 11932.0, 84468.0, 854791.0, 76827.0, 11341.0, 2788.0, 921.0, 350.0, 169.0, 115.0, 70.0, 45.0, 24.0, 13.0, 11.0, 9.0, 7.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.489227294921875, -1.44036865234375, -1.391510009765625, -1.3426513671875, -1.293792724609375, -1.24493408203125, -1.196075439453125, -1.147216796875, -1.098358154296875, -1.04949951171875, -1.000640869140625, -0.9517822265625, -0.902923583984375, -0.85406494140625, -0.805206298828125, -0.75634765625, -0.707489013671875, -0.65863037109375, -0.609771728515625, -0.5609130859375, -0.512054443359375, -0.46319580078125, -0.414337158203125, -0.365478515625, -0.316619873046875, -0.26776123046875, -0.218902587890625, -0.1700439453125, -0.121185302734375, -0.07232666015625, -0.023468017578125, 0.025390625, 0.074249267578125, 0.12310791015625, 0.171966552734375, 0.2208251953125, 0.269683837890625, 0.31854248046875, 0.367401123046875, 0.416259765625, 0.465118408203125, 0.51397705078125, 0.562835693359375, 0.6116943359375, 0.660552978515625, 0.70941162109375, 0.758270263671875, 0.80712890625, 0.855987548828125, 0.90484619140625, 0.953704833984375, 1.0025634765625, 1.051422119140625, 1.10028076171875, 1.149139404296875, 1.197998046875, 1.246856689453125, 1.29571533203125, 1.344573974609375, 1.3934326171875, 1.442291259765625, 1.49114990234375, 1.540008544921875, 1.5888671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 7.0, 7.0, 7.0, 8.0, 15.0, 17.0, 18.0, 27.0, 40.0, 73.0, 212.0, 240.0, 109.0, 55.0, 20.0, 21.0, 23.0, 25.0, 11.0, 6.0, 14.0, 10.0, 11.0, 5.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021028518676757812, -0.0002035200595855713, -0.00019675493240356445, -0.00018998980522155762, -0.00018322467803955078, -0.00017645955085754395, -0.0001696944236755371, -0.00016292929649353027, -0.00015616416931152344, -0.0001493990421295166, -0.00014263391494750977, -0.00013586878776550293, -0.0001291036605834961, -0.00012233853340148926, -0.00011557340621948242, -0.00010880827903747559, -0.00010204315185546875, -9.527802467346191e-05, -8.851289749145508e-05, -8.174777030944824e-05, -7.49826431274414e-05, -6.821751594543457e-05, -6.145238876342773e-05, -5.46872615814209e-05, -4.792213439941406e-05, -4.1157007217407227e-05, -3.439188003540039e-05, -2.7626752853393555e-05, -2.086162567138672e-05, -1.4096498489379883e-05, -7.331371307373047e-06, -5.662441253662109e-07, 6.198883056640625e-06, 1.2964010238647461e-05, 1.9729137420654297e-05, 2.6494264602661133e-05, 3.325939178466797e-05, 4.0024518966674805e-05, 4.678964614868164e-05, 5.3554773330688477e-05, 6.031990051269531e-05, 6.708502769470215e-05, 7.385015487670898e-05, 8.061528205871582e-05, 8.738040924072266e-05, 9.414553642272949e-05, 0.00010091066360473633, 0.00010767579078674316, 0.00011444091796875, 0.00012120604515075684, 0.00012797117233276367, 0.0001347362995147705, 0.00014150142669677734, 0.00014826655387878418, 0.00015503168106079102, 0.00016179680824279785, 0.0001685619354248047, 0.00017532706260681152, 0.00018209218978881836, 0.0001888573169708252, 0.00019562244415283203, 0.00020238757133483887, 0.0002091526985168457, 0.00021591782569885254, 0.00022268295288085938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 9.0, 24.0, 35.0, 53.0, 67.0, 140.0, 232.0, 478.0, 1170.0, 3819.0, 19812.0, 322040.0, 665451.0, 27776.0, 4854.0, 1424.0, 495.0, 256.0, 154.0, 88.0, 63.0, 34.0, 20.0, 18.0, 7.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7861328125, -1.7379608154296875, -1.689788818359375, -1.6416168212890625, -1.59344482421875, -1.5452728271484375, -1.497100830078125, -1.4489288330078125, -1.4007568359375, -1.3525848388671875, -1.304412841796875, -1.2562408447265625, -1.20806884765625, -1.1598968505859375, -1.111724853515625, -1.0635528564453125, -1.015380859375, -0.9672088623046875, -0.919036865234375, -0.8708648681640625, -0.82269287109375, -0.7745208740234375, -0.726348876953125, -0.6781768798828125, -0.6300048828125, -0.5818328857421875, -0.533660888671875, -0.4854888916015625, -0.43731689453125, -0.3891448974609375, -0.340972900390625, -0.2928009033203125, -0.24462890625, -0.1964569091796875, -0.148284912109375, -0.1001129150390625, -0.05194091796875, -0.0037689208984375, 0.044403076171875, 0.0925750732421875, 0.1407470703125, 0.1889190673828125, 0.237091064453125, 0.2852630615234375, 0.33343505859375, 0.3816070556640625, 0.429779052734375, 0.4779510498046875, 0.526123046875, 0.5742950439453125, 0.622467041015625, 0.6706390380859375, 0.71881103515625, 0.7669830322265625, 0.815155029296875, 0.8633270263671875, 0.9114990234375, 0.9596710205078125, 1.007843017578125, 1.0560150146484375, 1.10418701171875, 1.1523590087890625, 1.200531005859375, 1.2487030029296875, 1.296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 11.0, 7.0, 15.0, 31.0, 37.0, 63.0, 118.0, 156.0, 184.0, 125.0, 62.0, 38.0, 21.0, 15.0, 18.0, 15.0, 11.0, 8.0, 5.0, 5.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6511917114257812, -0.6295318603515625, -0.6078720092773438, -0.586212158203125, -0.5645523071289062, -0.5428924560546875, -0.5212326049804688, -0.49957275390625, -0.47791290283203125, -0.4562530517578125, -0.43459320068359375, -0.412933349609375, -0.39127349853515625, -0.3696136474609375, -0.34795379638671875, -0.3262939453125, -0.30463409423828125, -0.2829742431640625, -0.26131439208984375, -0.239654541015625, -0.21799468994140625, -0.1963348388671875, -0.17467498779296875, -0.15301513671875, -0.13135528564453125, -0.1096954345703125, -0.08803558349609375, -0.066375732421875, -0.04471588134765625, -0.0230560302734375, -0.00139617919921875, 0.020263671875, 0.04192352294921875, 0.0635833740234375, 0.08524322509765625, 0.106903076171875, 0.12856292724609375, 0.1502227783203125, 0.17188262939453125, 0.19354248046875, 0.21520233154296875, 0.2368621826171875, 0.25852203369140625, 0.280181884765625, 0.30184173583984375, 0.3235015869140625, 0.34516143798828125, 0.3668212890625, 0.38848114013671875, 0.4101409912109375, 0.43180084228515625, 0.453460693359375, 0.47512054443359375, 0.4967803955078125, 0.5184402465820312, 0.54010009765625, 0.5617599487304688, 0.5834197998046875, 0.6050796508789062, 0.626739501953125, 0.6483993530273438, 0.6700592041015625, 0.6917190551757812, 0.71337890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 22.0, 57.0, 123.0, 201.0, 220.0, 185.0, 89.0, 45.0, 29.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.820932388305664, -22.3185977935791, -21.81626319885254, -21.313928604125977, -20.811594009399414, -20.30925941467285, -19.80692481994629, -19.304590225219727, -18.802255630493164, -18.2999210357666, -17.79758644104004, -17.295251846313477, -16.792917251586914, -16.29058265686035, -15.788248062133789, -15.285913467407227, -14.783577919006348, -14.281243324279785, -13.778908729553223, -13.27657413482666, -12.774239540100098, -12.271904945373535, -11.769569396972656, -11.267234802246094, -10.764900207519531, -10.262565612792969, -9.760231018066406, -9.257896423339844, -8.755561828613281, -8.253227233886719, -7.750892162322998, -7.2485575675964355, -6.746223449707031, -6.243888854980469, -5.741554260253906, -5.239219665527344, -4.736885070800781, -4.234550476074219, -3.732215404510498, -3.2298808097839355, -2.727546215057373, -2.2252116203308105, -1.7228769063949585, -1.2205421924591064, -0.718207597732544, -0.21587300300598145, 0.28646183013916016, 0.7887964248657227, 1.2911310195922852, 1.7934656143188477, 2.29580020904541, 2.7981350421905518, 3.3004696369171143, 3.8028042316436768, 4.305139064788818, 4.807473659515381, 5.309808254241943, 5.812142848968506, 6.314477443695068, 6.816812515258789, 7.319147109985352, 7.821481704711914, 8.323816299438477, 8.826150894165039, 9.328485488891602]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 5.0, 15.0, 11.0, 18.0, 15.0, 21.0, 29.0, 35.0, 34.0, 40.0, 41.0, 45.0, 35.0, 49.0, 36.0, 48.0, 51.0, 37.0, 45.0, 41.0, 43.0, 32.0, 35.0, 26.0, 28.0, 29.0, 22.0, 16.0, 21.0, 13.0, 17.0, 13.0, 6.0, 4.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.080190658569336, -3.9303290843963623, -3.7804675102233887, -3.630606174468994, -3.4807446002960205, -3.330883026123047, -3.1810216903686523, -3.0311601161956787, -2.881298542022705, -2.7314369678497314, -2.581575393676758, -2.4317140579223633, -2.2818524837493896, -2.131990909576416, -1.982129454612732, -1.8322679996490479, -1.6824064254760742, -1.5325448513031006, -1.3826833963394165, -1.2328219413757324, -1.0829603672027588, -0.9330988526344299, -0.7832373380661011, -0.633375883102417, -0.48351430892944336, -0.3336527943611145, -0.18379127979278564, -0.03392976522445679, 0.11593174934387207, 0.2657932639122009, 0.4156547784805298, 0.5655162334442139, 0.7153773307800293, 0.8652388453483582, 1.015100359916687, 1.164961814880371, 1.3148233890533447, 1.4646849632263184, 1.6145464181900024, 1.7644078731536865, 1.9142694473266602, 2.064131021499634, 2.2139925956726074, 2.363853931427002, 2.5137155055999756, 2.663577079772949, 2.8134384155273438, 2.9632999897003174, 3.113161563873291, 3.2630231380462646, 3.4128847122192383, 3.562746047973633, 3.7126076221466064, 3.86246919631958, 4.012330532073975, 4.162192344665527, 4.312053680419922, 4.461915016174316, 4.611776828765869, 4.761638164520264, 4.911499977111816, 5.061361312866211, 5.2112226486206055, 5.361083984375, 5.510945796966553]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 19.0, 20.0, 27.0, 32.0, 65.0, 118.0, 156.0, 285.0, 462.0, 788.0, 1398.0, 2963.0, 6837.0, 18583.0, 70316.0, 2156016.0, 1835374.0, 68793.0, 18981.0, 6824.0, 2890.0, 1430.0, 743.0, 424.0, 267.0, 154.0, 100.0, 68.0, 52.0, 22.0, 20.0, 16.0, 13.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1519775390625, -1.107666015625, -1.0633544921875, -1.01904296875, -0.9747314453125, -0.930419921875, -0.8861083984375, -0.841796875, -0.7974853515625, -0.753173828125, -0.7088623046875, -0.66455078125, -0.6202392578125, -0.575927734375, -0.5316162109375, -0.4873046875, -0.4429931640625, -0.398681640625, -0.3543701171875, -0.31005859375, -0.2657470703125, -0.221435546875, -0.1771240234375, -0.1328125, -0.0885009765625, -0.044189453125, 0.0001220703125, 0.04443359375, 0.0887451171875, 0.133056640625, 0.1773681640625, 0.2216796875, 0.2659912109375, 0.310302734375, 0.3546142578125, 0.39892578125, 0.4432373046875, 0.487548828125, 0.5318603515625, 0.576171875, 0.6204833984375, 0.664794921875, 0.7091064453125, 0.75341796875, 0.7977294921875, 0.842041015625, 0.8863525390625, 0.9306640625, 0.9749755859375, 1.019287109375, 1.0635986328125, 1.10791015625, 1.1522216796875, 1.196533203125, 1.2408447265625, 1.28515625, 1.3294677734375, 1.373779296875, 1.4180908203125, 1.46240234375, 1.5067138671875, 1.551025390625, 1.5953369140625, 1.6396484375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 7.0, 8.0, 11.0, 13.0, 15.0, 23.0, 35.0, 30.0, 24.0, 32.0, 47.0, 39.0, 37.0, 49.0, 48.0, 45.0, 37.0, 47.0, 59.0, 53.0, 47.0, 48.0, 36.0, 33.0, 28.0, 21.0, 18.0, 24.0, 21.0, 14.0, 13.0, 12.0, 6.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2200927734375, -0.2128582000732422, -0.20562362670898438, -0.19838905334472656, -0.19115447998046875, -0.18391990661621094, -0.17668533325195312, -0.1694507598876953, -0.1622161865234375, -0.1549816131591797, -0.14774703979492188, -0.14051246643066406, -0.13327789306640625, -0.12604331970214844, -0.11880874633789062, -0.11157417297363281, -0.104339599609375, -0.09710502624511719, -0.08987045288085938, -0.08263587951660156, -0.07540130615234375, -0.06816673278808594, -0.060932159423828125, -0.05369758605957031, -0.0464630126953125, -0.03922843933105469, -0.031993865966796875, -0.024759292602539062, -0.01752471923828125, -0.010290145874023438, -0.003055572509765625, 0.0041790008544921875, 0.01141357421875, 0.018648147583007812, 0.025882720947265625, 0.03311729431152344, 0.04035186767578125, 0.04758644104003906, 0.054821014404296875, 0.06205558776855469, 0.0692901611328125, 0.07652473449707031, 0.08375930786132812, 0.09099388122558594, 0.09822845458984375, 0.10546302795410156, 0.11269760131835938, 0.11993217468261719, 0.127166748046875, 0.1344013214111328, 0.14163589477539062, 0.14887046813964844, 0.15610504150390625, 0.16333961486816406, 0.17057418823242188, 0.1778087615966797, 0.1850433349609375, 0.1922779083251953, 0.19951248168945312, 0.20674705505371094, 0.21398162841796875, 0.22121620178222656, 0.22845077514648438, 0.2356853485107422, 0.242919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 14.0, 23.0, 42.0, 77.0, 99.0, 144.0, 268.0, 442.0, 882.0, 1836.0, 4402.0, 15289.0, 100376.0, 3840236.0, 198042.0, 21975.0, 5714.0, 2171.0, 999.0, 540.0, 274.0, 145.0, 92.0, 59.0, 34.0, 30.0, 19.0, 6.0, 5.0, 10.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.19366455078125, -2.1080322265625, -2.02239990234375, -1.936767578125, -1.85113525390625, -1.7655029296875, -1.67987060546875, -1.59423828125, -1.50860595703125, -1.4229736328125, -1.33734130859375, -1.251708984375, -1.16607666015625, -1.0804443359375, -0.99481201171875, -0.9091796875, -0.82354736328125, -0.7379150390625, -0.65228271484375, -0.566650390625, -0.48101806640625, -0.3953857421875, -0.30975341796875, -0.22412109375, -0.13848876953125, -0.0528564453125, 0.03277587890625, 0.118408203125, 0.20404052734375, 0.2896728515625, 0.37530517578125, 0.4609375, 0.54656982421875, 0.6322021484375, 0.71783447265625, 0.803466796875, 0.88909912109375, 0.9747314453125, 1.06036376953125, 1.14599609375, 1.23162841796875, 1.3172607421875, 1.40289306640625, 1.488525390625, 1.57415771484375, 1.6597900390625, 1.74542236328125, 1.8310546875, 1.91668701171875, 2.0023193359375, 2.08795166015625, 2.173583984375, 2.25921630859375, 2.3448486328125, 2.43048095703125, 2.51611328125, 2.60174560546875, 2.6873779296875, 2.77301025390625, 2.858642578125, 2.94427490234375, 3.0299072265625, 3.11553955078125, 3.201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 9.0, 7.0, 11.0, 29.0, 37.0, 61.0, 121.0, 301.0, 2029.0, 955.0, 234.0, 117.0, 47.0, 27.0, 24.0, 18.0, 13.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2265625, -1.1957931518554688, -1.1650238037109375, -1.1342544555664062, -1.103485107421875, -1.0727157592773438, -1.0419464111328125, -1.0111770629882812, -0.98040771484375, -0.9496383666992188, -0.9188690185546875, -0.8880996704101562, -0.857330322265625, -0.8265609741210938, -0.7957916259765625, -0.7650222778320312, -0.7342529296875, -0.7034835815429688, -0.6727142333984375, -0.6419448852539062, -0.611175537109375, -0.5804061889648438, -0.5496368408203125, -0.5188674926757812, -0.48809814453125, -0.45732879638671875, -0.4265594482421875, -0.39579010009765625, -0.365020751953125, -0.33425140380859375, -0.3034820556640625, -0.27271270751953125, -0.241943359375, -0.21117401123046875, -0.1804046630859375, -0.14963531494140625, -0.118865966796875, -0.08809661865234375, -0.0573272705078125, -0.02655792236328125, 0.00421142578125, 0.03498077392578125, 0.0657501220703125, 0.09651947021484375, 0.127288818359375, 0.15805816650390625, 0.1888275146484375, 0.21959686279296875, 0.2503662109375, 0.28113555908203125, 0.3119049072265625, 0.34267425537109375, 0.373443603515625, 0.40421295166015625, 0.4349822998046875, 0.46575164794921875, 0.49652099609375, 0.5272903442382812, 0.5580596923828125, 0.5888290405273438, 0.619598388671875, 0.6503677368164062, 0.6811370849609375, 0.7119064331054688, 0.74267578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 9.0, 6.0, 12.0, 22.0, 45.0, 97.0, 188.0, 208.0, 208.0, 105.0, 44.0, 29.0, 22.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.235668182373047, -8.016654014587402, -7.797639846801758, -7.578625679016113, -7.359611511230469, -7.140597343444824, -6.92158317565918, -6.702568531036377, -6.483554363250732, -6.264540195465088, -6.045526027679443, -5.826511859893799, -5.607497692108154, -5.388483047485352, -5.169468879699707, -4.9504547119140625, -4.731440544128418, -4.512426376342773, -4.293412208557129, -4.074398040771484, -3.8553836345672607, -3.636369466781616, -3.4173552989959717, -3.198340892791748, -2.9793272018432617, -2.760313034057617, -2.5412988662719727, -2.322284698486328, -2.1032702922821045, -1.88425612449646, -1.6652419567108154, -1.4462276697158813, -1.2272133827209473, -1.0081992149353027, -0.7891849279403687, -0.5701707601547241, -0.3511565327644348, -0.1321423053741455, 0.08687186241149902, 0.3058861494064331, 0.5249003171920776, 0.7439145445823669, 0.9629287719726562, 1.1819429397583008, 1.4009571075439453, 1.6199713945388794, 1.838985562324524, 2.057999849319458, 2.2770140171051025, 2.496028184890747, 2.7150423526763916, 2.9340567588806152, 3.1530709266662598, 3.3720850944519043, 3.591099262237549, 3.8101134300231934, 4.029127597808838, 4.248141765594482, 4.467155933380127, 4.6861701011657715, 4.905184268951416, 5.124198913574219, 5.343213081359863, 5.562227249145508, 5.781241416931152]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 11.0, 17.0, 17.0, 22.0, 28.0, 26.0, 25.0, 32.0, 37.0, 38.0, 30.0, 49.0, 57.0, 53.0, 45.0, 68.0, 42.0, 52.0, 39.0, 43.0, 42.0, 39.0, 28.0, 32.0, 24.0, 21.0, 8.0, 14.0, 8.0, 12.0, 3.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3003811836242676, -2.217085123062134, -2.133789300918579, -2.0504932403564453, -1.9671971797943115, -1.8839012384414673, -1.800605297088623, -1.7173092365264893, -1.6340131759643555, -1.5507172346115112, -1.4674211740493774, -1.3841252326965332, -1.3008291721343994, -1.2175332307815552, -1.134237289428711, -1.0509412288665771, -0.9676452875137329, -0.8843492865562439, -0.8010532855987549, -0.7177573442459106, -0.6344612836837769, -0.5511653423309326, -0.4678693413734436, -0.3845733404159546, -0.3012773394584656, -0.21798133850097656, -0.13468535244464874, -0.05138936638832092, 0.03190663456916809, 0.1152026355266571, 0.19849860668182373, 0.28179460763931274, 0.36509060859680176, 0.44838660955429077, 0.5316826105117798, 0.614978551864624, 0.6982746124267578, 0.781570553779602, 0.8648665547370911, 0.9481625556945801, 1.0314586162567139, 1.114754557609558, 1.198050618171692, 1.2813465595245361, 1.36464262008667, 1.4479385614395142, 1.5312345027923584, 1.6145305633544922, 1.6978265047073364, 1.7811224460601807, 1.8644185066223145, 1.9477144479751587, 2.031010389328003, 2.1143064498901367, 2.1976025104522705, 2.2808985710144043, 2.364194393157959, 2.4474904537200928, 2.5307862758636475, 2.6140823364257812, 2.697378396987915, 2.780674457550049, 2.8639702796936035, 2.9472663402557373, 3.030562400817871]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 12.0, 17.0, 31.0, 49.0, 54.0, 140.0, 217.0, 426.0, 919.0, 2096.0, 5166.0, 14019.0, 42265.0, 223219.0, 634888.0, 85785.0, 24539.0, 8668.0, 3236.0, 1417.0, 628.0, 331.0, 151.0, 77.0, 69.0, 42.0, 24.0, 11.0, 20.0, 12.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3026580810546875, -1.259613037109375, -1.2165679931640625, -1.17352294921875, -1.1304779052734375, -1.087432861328125, -1.0443878173828125, -1.0013427734375, -0.9582977294921875, -0.915252685546875, -0.8722076416015625, -0.82916259765625, -0.7861175537109375, -0.743072509765625, -0.7000274658203125, -0.656982421875, -0.6139373779296875, -0.570892333984375, -0.5278472900390625, -0.48480224609375, -0.4417572021484375, -0.398712158203125, -0.3556671142578125, -0.3126220703125, -0.2695770263671875, -0.226531982421875, -0.1834869384765625, -0.14044189453125, -0.0973968505859375, -0.054351806640625, -0.0113067626953125, 0.03173828125, 0.0747833251953125, 0.117828369140625, 0.1608734130859375, 0.20391845703125, 0.2469635009765625, 0.290008544921875, 0.3330535888671875, 0.3760986328125, 0.4191436767578125, 0.462188720703125, 0.5052337646484375, 0.54827880859375, 0.5913238525390625, 0.634368896484375, 0.6774139404296875, 0.720458984375, 0.7635040283203125, 0.806549072265625, 0.8495941162109375, 0.89263916015625, 0.9356842041015625, 0.978729248046875, 1.0217742919921875, 1.0648193359375, 1.1078643798828125, 1.150909423828125, 1.1939544677734375, 1.23699951171875, 1.2800445556640625, 1.323089599609375, 1.3661346435546875, 1.4091796875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 12.0, 18.0, 15.0, 31.0, 32.0, 31.0, 42.0, 48.0, 48.0, 55.0, 47.0, 65.0, 62.0, 48.0, 66.0, 51.0, 53.0, 64.0, 41.0, 34.0, 28.0, 21.0, 20.0, 22.0, 14.0, 6.0, 5.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3230094909667969, -0.31252288818359375, -0.3020362854003906, -0.2915496826171875, -0.2810630798339844, -0.27057647705078125, -0.2600898742675781, -0.249603271484375, -0.23911666870117188, -0.22863006591796875, -0.21814346313476562, -0.2076568603515625, -0.19717025756835938, -0.18668365478515625, -0.17619705200195312, -0.16571044921875, -0.15522384643554688, -0.14473724365234375, -0.13425064086914062, -0.1237640380859375, -0.11327743530273438, -0.10279083251953125, -0.09230422973632812, -0.081817626953125, -0.07133102416992188, -0.06084442138671875, -0.050357818603515625, -0.0398712158203125, -0.029384613037109375, -0.01889801025390625, -0.008411407470703125, 0.0020751953125, 0.012561798095703125, 0.02304840087890625, 0.033535003662109375, 0.0440216064453125, 0.054508209228515625, 0.06499481201171875, 0.07548141479492188, 0.085968017578125, 0.09645462036132812, 0.10694122314453125, 0.11742782592773438, 0.1279144287109375, 0.13840103149414062, 0.14888763427734375, 0.15937423706054688, 0.16986083984375, 0.18034744262695312, 0.19083404541015625, 0.20132064819335938, 0.2118072509765625, 0.22229385375976562, 0.23278045654296875, 0.24326705932617188, 0.253753662109375, 0.2642402648925781, 0.27472686767578125, 0.2852134704589844, 0.2957000732421875, 0.3061866760253906, 0.31667327880859375, 0.3271598815917969, 0.337646484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 4.0, 1.0, 9.0, 8.0, 14.0, 6.0, 15.0, 30.0, 35.0, 51.0, 62.0, 90.0, 167.0, 303.0, 555.0, 1077.0, 2242.0, 5401.0, 14915.0, 46299.0, 445632.0, 459293.0, 47191.0, 14805.0, 5683.0, 2255.0, 1091.0, 546.0, 288.0, 161.0, 103.0, 71.0, 42.0, 35.0, 19.0, 11.0, 10.0, 7.0, 8.0, 10.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.378509521484375, -1.32928466796875, -1.280059814453125, -1.2308349609375, -1.181610107421875, -1.13238525390625, -1.083160400390625, -1.033935546875, -0.984710693359375, -0.93548583984375, -0.886260986328125, -0.8370361328125, -0.787811279296875, -0.73858642578125, -0.689361572265625, -0.64013671875, -0.590911865234375, -0.54168701171875, -0.492462158203125, -0.4432373046875, -0.394012451171875, -0.34478759765625, -0.295562744140625, -0.246337890625, -0.197113037109375, -0.14788818359375, -0.098663330078125, -0.0494384765625, -0.000213623046875, 0.04901123046875, 0.098236083984375, 0.1474609375, 0.196685791015625, 0.24591064453125, 0.295135498046875, 0.3443603515625, 0.393585205078125, 0.44281005859375, 0.492034912109375, 0.541259765625, 0.590484619140625, 0.63970947265625, 0.688934326171875, 0.7381591796875, 0.787384033203125, 0.83660888671875, 0.885833740234375, 0.93505859375, 0.984283447265625, 1.03350830078125, 1.082733154296875, 1.1319580078125, 1.181182861328125, 1.23040771484375, 1.279632568359375, 1.328857421875, 1.378082275390625, 1.42730712890625, 1.476531982421875, 1.5257568359375, 1.574981689453125, 1.62420654296875, 1.673431396484375, 1.72265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 10.0, 8.0, 8.0, 19.0, 12.0, 17.0, 25.0, 27.0, 29.0, 48.0, 42.0, 40.0, 49.0, 49.0, 58.0, 56.0, 62.0, 50.0, 48.0, 63.0, 33.0, 38.0, 37.0, 22.0, 26.0, 22.0, 15.0, 15.0, 15.0, 11.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3427734375, -1.3011932373046875, -1.259613037109375, -1.2180328369140625, -1.17645263671875, -1.1348724365234375, -1.093292236328125, -1.0517120361328125, -1.0101318359375, -0.9685516357421875, -0.926971435546875, -0.8853912353515625, -0.84381103515625, -0.8022308349609375, -0.760650634765625, -0.7190704345703125, -0.677490234375, -0.6359100341796875, -0.594329833984375, -0.5527496337890625, -0.51116943359375, -0.4695892333984375, -0.428009033203125, -0.3864288330078125, -0.3448486328125, -0.3032684326171875, -0.261688232421875, -0.2201080322265625, -0.17852783203125, -0.1369476318359375, -0.095367431640625, -0.0537872314453125, -0.01220703125, 0.0293731689453125, 0.070953369140625, 0.1125335693359375, 0.15411376953125, 0.1956939697265625, 0.237274169921875, 0.2788543701171875, 0.3204345703125, 0.3620147705078125, 0.403594970703125, 0.4451751708984375, 0.48675537109375, 0.5283355712890625, 0.569915771484375, 0.6114959716796875, 0.653076171875, 0.6946563720703125, 0.736236572265625, 0.7778167724609375, 0.81939697265625, 0.8609771728515625, 0.902557373046875, 0.9441375732421875, 0.9857177734375, 1.0272979736328125, 1.068878173828125, 1.1104583740234375, 1.15203857421875, 1.1936187744140625, 1.235198974609375, 1.2767791748046875, 1.318359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 10.0, 12.0, 20.0, 28.0, 51.0, 83.0, 140.0, 222.0, 338.0, 700.0, 1294.0, 2452.0, 4959.0, 10906.0, 26804.0, 82921.0, 708794.0, 146462.0, 35859.0, 13861.0, 6176.0, 2942.0, 1531.0, 855.0, 429.0, 268.0, 157.0, 92.0, 55.0, 40.0, 25.0, 10.0, 12.0, 11.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.83203125, -0.808013916015625, -0.78399658203125, -0.759979248046875, -0.7359619140625, -0.711944580078125, -0.68792724609375, -0.663909912109375, -0.639892578125, -0.615875244140625, -0.59185791015625, -0.567840576171875, -0.5438232421875, -0.519805908203125, -0.49578857421875, -0.471771240234375, -0.44775390625, -0.423736572265625, -0.39971923828125, -0.375701904296875, -0.3516845703125, -0.327667236328125, -0.30364990234375, -0.279632568359375, -0.255615234375, -0.231597900390625, -0.20758056640625, -0.183563232421875, -0.1595458984375, -0.135528564453125, -0.11151123046875, -0.087493896484375, -0.0634765625, -0.039459228515625, -0.01544189453125, 0.008575439453125, 0.0325927734375, 0.056610107421875, 0.08062744140625, 0.104644775390625, 0.128662109375, 0.152679443359375, 0.17669677734375, 0.200714111328125, 0.2247314453125, 0.248748779296875, 0.27276611328125, 0.296783447265625, 0.32080078125, 0.344818115234375, 0.36883544921875, 0.392852783203125, 0.4168701171875, 0.440887451171875, 0.46490478515625, 0.488922119140625, 0.512939453125, 0.536956787109375, 0.56097412109375, 0.584991455078125, 0.6090087890625, 0.633026123046875, 0.65704345703125, 0.681060791015625, 0.705078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 8.0, 9.0, 0.0, 9.0, 18.0, 17.0, 17.0, 35.0, 69.0, 208.0, 319.0, 141.0, 42.0, 17.0, 13.0, 9.0, 11.0, 11.0, 11.0, 5.0, 2.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001919269561767578, -0.0001843571662902832, -0.0001767873764038086, -0.00016921758651733398, -0.00016164779663085938, -0.00015407800674438477, -0.00014650821685791016, -0.00013893842697143555, -0.00013136863708496094, -0.00012379884719848633, -0.00011622905731201172, -0.00010865926742553711, -0.0001010894775390625, -9.351968765258789e-05, -8.594989776611328e-05, -7.838010787963867e-05, -7.081031799316406e-05, -6.324052810668945e-05, -5.5670738220214844e-05, -4.8100948333740234e-05, -4.0531158447265625e-05, -3.2961368560791016e-05, -2.5391578674316406e-05, -1.7821788787841797e-05, -1.0251998901367188e-05, -2.682209014892578e-06, 4.887580871582031e-06, 1.245737075805664e-05, 2.002716064453125e-05, 2.759695053100586e-05, 3.516674041748047e-05, 4.273653030395508e-05, 5.030632019042969e-05, 5.78761100769043e-05, 6.54458999633789e-05, 7.301568984985352e-05, 8.058547973632812e-05, 8.815526962280273e-05, 9.572505950927734e-05, 0.00010329484939575195, 0.00011086463928222656, 0.00011843442916870117, 0.00012600421905517578, 0.0001335740089416504, 0.000141143798828125, 0.0001487135887145996, 0.00015628337860107422, 0.00016385316848754883, 0.00017142295837402344, 0.00017899274826049805, 0.00018656253814697266, 0.00019413232803344727, 0.00020170211791992188, 0.00020927190780639648, 0.0002168416976928711, 0.0002244114875793457, 0.0002319812774658203, 0.00023955106735229492, 0.00024712085723876953, 0.00025469064712524414, 0.00026226043701171875, 0.00026983022689819336, 0.00027740001678466797, 0.0002849698066711426, 0.0002925395965576172]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 11.0, 11.0, 24.0, 42.0, 61.0, 84.0, 172.0, 324.0, 749.0, 1817.0, 5271.0, 20036.0, 138239.0, 816054.0, 49595.0, 10616.0, 3123.0, 1209.0, 518.0, 247.0, 122.0, 79.0, 57.0, 25.0, 14.0, 15.0, 7.0, 7.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4111328125, -1.369964599609375, -1.32879638671875, -1.287628173828125, -1.2464599609375, -1.205291748046875, -1.16412353515625, -1.122955322265625, -1.081787109375, -1.040618896484375, -0.99945068359375, -0.958282470703125, -0.9171142578125, -0.875946044921875, -0.83477783203125, -0.793609619140625, -0.75244140625, -0.711273193359375, -0.67010498046875, -0.628936767578125, -0.5877685546875, -0.546600341796875, -0.50543212890625, -0.464263916015625, -0.423095703125, -0.381927490234375, -0.34075927734375, -0.299591064453125, -0.2584228515625, -0.217254638671875, -0.17608642578125, -0.134918212890625, -0.09375, -0.052581787109375, -0.01141357421875, 0.029754638671875, 0.0709228515625, 0.112091064453125, 0.15325927734375, 0.194427490234375, 0.235595703125, 0.276763916015625, 0.31793212890625, 0.359100341796875, 0.4002685546875, 0.441436767578125, 0.48260498046875, 0.523773193359375, 0.56494140625, 0.606109619140625, 0.64727783203125, 0.688446044921875, 0.7296142578125, 0.770782470703125, 0.81195068359375, 0.853118896484375, 0.894287109375, 0.935455322265625, 0.97662353515625, 1.017791748046875, 1.0589599609375, 1.100128173828125, 1.14129638671875, 1.182464599609375, 1.2236328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 6.0, 6.0, 7.0, 7.0, 11.0, 23.0, 41.0, 72.0, 113.0, 203.0, 182.0, 108.0, 56.0, 26.0, 11.0, 13.0, 14.0, 11.0, 8.0, 16.0, 8.0, 9.0, 3.0, 2.0, 8.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.626251220703125, -0.60211181640625, -0.577972412109375, -0.5538330078125, -0.529693603515625, -0.50555419921875, -0.481414794921875, -0.457275390625, -0.433135986328125, -0.40899658203125, -0.384857177734375, -0.3607177734375, -0.336578369140625, -0.31243896484375, -0.288299560546875, -0.26416015625, -0.240020751953125, -0.21588134765625, -0.191741943359375, -0.1676025390625, -0.143463134765625, -0.11932373046875, -0.095184326171875, -0.071044921875, -0.046905517578125, -0.02276611328125, 0.001373291015625, 0.0255126953125, 0.049652099609375, 0.07379150390625, 0.097930908203125, 0.1220703125, 0.146209716796875, 0.17034912109375, 0.194488525390625, 0.2186279296875, 0.242767333984375, 0.26690673828125, 0.291046142578125, 0.315185546875, 0.339324951171875, 0.36346435546875, 0.387603759765625, 0.4117431640625, 0.435882568359375, 0.46002197265625, 0.484161376953125, 0.50830078125, 0.532440185546875, 0.55657958984375, 0.580718994140625, 0.6048583984375, 0.628997802734375, 0.65313720703125, 0.677276611328125, 0.701416015625, 0.725555419921875, 0.74969482421875, 0.773834228515625, 0.7979736328125, 0.822113037109375, 0.84625244140625, 0.870391845703125, 0.89453125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 9.0, 17.0, 20.0, 42.0, 68.0, 101.0, 129.0, 162.0, 136.0, 134.0, 76.0, 55.0, 25.0, 11.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.525595664978027, -7.181560516357422, -6.837524890899658, -6.493489742279053, -6.149454116821289, -5.805418968200684, -5.461383819580078, -5.117348670959473, -4.773313045501709, -4.4292778968811035, -4.08524227142334, -3.7412071228027344, -3.39717173576355, -3.0531363487243652, -2.7091012001037598, -2.365065813064575, -2.0210304260253906, -1.676995038986206, -1.332959771156311, -0.988924503326416, -0.6448891162872314, -0.3008537292480469, 0.043181419372558594, 0.38721680641174316, 0.7312521934509277, 1.0752875804901123, 1.4193228483200073, 1.7633581161499023, 2.107393503189087, 2.4514288902282715, 2.795464038848877, 3.1394994258880615, 3.4835357666015625, 3.827571153640747, 4.171606540679932, 4.515641689300537, 4.859677314758301, 5.203712463378906, 5.547747611999512, 5.891782760620117, 6.235818386077881, 6.579853534698486, 6.92388916015625, 7.2679243087768555, 7.611959457397461, 7.955995082855225, 8.300029754638672, 8.644065856933594, 8.9881010055542, 9.332136154174805, 9.67617130279541, 10.020206451416016, 10.364242553710938, 10.708277702331543, 11.052312850952148, 11.396347999572754, 11.74038314819336, 12.084418296813965, 12.42845344543457, 12.772489547729492, 13.116524696350098, 13.460559844970703, 13.804594993591309, 14.148630142211914, 14.492666244506836]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 7.0, 5.0, 11.0, 6.0, 12.0, 7.0, 22.0, 12.0, 16.0, 21.0, 18.0, 31.0, 34.0, 25.0, 35.0, 30.0, 33.0, 34.0, 43.0, 43.0, 37.0, 35.0, 32.0, 38.0, 37.0, 37.0, 38.0, 34.0, 32.0, 38.0, 26.0, 18.0, 32.0, 31.0, 16.0, 19.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01706600189209, -4.860353469848633, -4.703640937805176, -4.546928405761719, -4.390215873718262, -4.233503341674805, -4.076790809631348, -3.9200778007507324, -3.7633652687072754, -3.6066527366638184, -3.4499402046203613, -3.2932276725769043, -3.136514902114868, -2.979802370071411, -2.823089838027954, -2.666377067565918, -2.50966477394104, -2.352952241897583, -2.196239709854126, -2.03952693939209, -1.8828144073486328, -1.7261018753051758, -1.5693893432617188, -1.4126766920089722, -1.2559641599655151, -1.099251627922058, -0.9425389766693115, -0.7858264446258545, -0.6291138529777527, -0.4724012613296509, -0.31568872928619385, -0.15897607803344727, -0.0022635459899902344, 0.15444903075695038, 0.311161607503891, 0.4678741693496704, 0.6245867609977722, 0.781299352645874, 0.938011884689331, 1.0947245359420776, 1.2514370679855347, 1.4081496000289917, 1.5648622512817383, 1.7215747833251953, 1.8782873153686523, 2.0349998474121094, 2.1917123794555664, 2.3484251499176025, 2.5051376819610596, 2.6618502140045166, 2.8185627460479736, 2.9752755165100098, 3.131988048553467, 3.288700580596924, 3.445413112640381, 3.602125644683838, 3.758838176727295, 3.915550708770752, 4.072263240814209, 4.228975772857666, 4.385688304901123, 4.542401313781738, 4.699113845825195, 4.855826377868652, 5.012538909912109]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 7.0, 12.0, 12.0, 16.0, 23.0, 27.0, 42.0, 58.0, 89.0, 122.0, 176.0, 246.0, 388.0, 553.0, 816.0, 1260.0, 1980.0, 3291.0, 5744.0, 11010.0, 23570.0, 65709.0, 441698.0, 3442752.0, 125938.0, 35721.0, 15039.0, 7347.0, 4004.0, 2266.0, 1446.0, 959.0, 610.0, 430.0, 262.0, 184.0, 116.0, 104.0, 74.0, 50.0, 29.0, 27.0, 23.0, 15.0, 12.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-1.3505859375, -1.3099365234375, -1.269287109375, -1.2286376953125, -1.18798828125, -1.1473388671875, -1.106689453125, -1.0660400390625, -1.025390625, -0.9847412109375, -0.944091796875, -0.9034423828125, -0.86279296875, -0.8221435546875, -0.781494140625, -0.7408447265625, -0.7001953125, -0.6595458984375, -0.618896484375, -0.5782470703125, -0.53759765625, -0.4969482421875, -0.456298828125, -0.4156494140625, -0.375, -0.3343505859375, -0.293701171875, -0.2530517578125, -0.21240234375, -0.1717529296875, -0.131103515625, -0.0904541015625, -0.0498046875, -0.0091552734375, 0.031494140625, 0.0721435546875, 0.11279296875, 0.1534423828125, 0.194091796875, 0.2347412109375, 0.275390625, 0.3160400390625, 0.356689453125, 0.3973388671875, 0.43798828125, 0.4786376953125, 0.519287109375, 0.5599365234375, 0.6005859375, 0.6412353515625, 0.681884765625, 0.7225341796875, 0.76318359375, 0.8038330078125, 0.844482421875, 0.8851318359375, 0.92578125, 0.9664306640625, 1.007080078125, 1.0477294921875, 1.08837890625, 1.1290283203125, 1.169677734375, 1.2103271484375, 1.2509765625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 11.0, 14.0, 12.0, 15.0, 22.0, 27.0, 27.0, 35.0, 36.0, 36.0, 44.0, 38.0, 37.0, 51.0, 69.0, 52.0, 45.0, 57.0, 44.0, 38.0, 43.0, 38.0, 30.0, 29.0, 25.0, 28.0, 24.0, 21.0, 11.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.2606964111328125, -0.251861572265625, -0.2430267333984375, -0.23419189453125, -0.2253570556640625, -0.216522216796875, -0.2076873779296875, -0.1988525390625, -0.1900177001953125, -0.181182861328125, -0.1723480224609375, -0.16351318359375, -0.1546783447265625, -0.145843505859375, -0.1370086669921875, -0.128173828125, -0.1193389892578125, -0.110504150390625, -0.1016693115234375, -0.09283447265625, -0.0839996337890625, -0.075164794921875, -0.0663299560546875, -0.0574951171875, -0.0486602783203125, -0.039825439453125, -0.0309906005859375, -0.02215576171875, -0.0133209228515625, -0.004486083984375, 0.0043487548828125, 0.01318359375, 0.0220184326171875, 0.030853271484375, 0.0396881103515625, 0.04852294921875, 0.0573577880859375, 0.066192626953125, 0.0750274658203125, 0.0838623046875, 0.0926971435546875, 0.101531982421875, 0.1103668212890625, 0.11920166015625, 0.1280364990234375, 0.136871337890625, 0.1457061767578125, 0.154541015625, 0.1633758544921875, 0.172210693359375, 0.1810455322265625, 0.18988037109375, 0.1987152099609375, 0.207550048828125, 0.2163848876953125, 0.2252197265625, 0.2340545654296875, 0.242889404296875, 0.2517242431640625, 0.26055908203125, 0.2693939208984375, 0.278228759765625, 0.2870635986328125, 0.2958984375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 8.0, 7.0, 7.0, 6.0, 14.0, 33.0, 18.0, 38.0, 67.0, 76.0, 94.0, 153.0, 191.0, 262.0, 368.0, 600.0, 989.0, 1903.0, 4155.0, 10845.0, 38849.0, 317810.0, 3683535.0, 99975.0, 20649.0, 6875.0, 2863.0, 1398.0, 843.0, 491.0, 309.0, 221.0, 169.0, 127.0, 95.0, 48.0, 51.0, 42.0, 28.0, 21.0, 18.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.912109375, -2.8245849609375, -2.737060546875, -2.6495361328125, -2.56201171875, -2.4744873046875, -2.386962890625, -2.2994384765625, -2.2119140625, -2.1243896484375, -2.036865234375, -1.9493408203125, -1.86181640625, -1.7742919921875, -1.686767578125, -1.5992431640625, -1.51171875, -1.4241943359375, -1.336669921875, -1.2491455078125, -1.16162109375, -1.0740966796875, -0.986572265625, -0.8990478515625, -0.8115234375, -0.7239990234375, -0.636474609375, -0.5489501953125, -0.46142578125, -0.3739013671875, -0.286376953125, -0.1988525390625, -0.111328125, -0.0238037109375, 0.063720703125, 0.1512451171875, 0.23876953125, 0.3262939453125, 0.413818359375, 0.5013427734375, 0.5888671875, 0.6763916015625, 0.763916015625, 0.8514404296875, 0.93896484375, 1.0264892578125, 1.114013671875, 1.2015380859375, 1.2890625, 1.3765869140625, 1.464111328125, 1.5516357421875, 1.63916015625, 1.7266845703125, 1.814208984375, 1.9017333984375, 1.9892578125, 2.0767822265625, 2.164306640625, 2.2518310546875, 2.33935546875, 2.4268798828125, 2.514404296875, 2.6019287109375, 2.689453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 10.0, 12.0, 21.0, 31.0, 55.0, 102.0, 266.0, 2301.0, 830.0, 188.0, 97.0, 48.0, 35.0, 25.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.162109375, -1.1231536865234375, -1.084197998046875, -1.0452423095703125, -1.00628662109375, -0.9673309326171875, -0.928375244140625, -0.8894195556640625, -0.8504638671875, -0.8115081787109375, -0.772552490234375, -0.7335968017578125, -0.69464111328125, -0.6556854248046875, -0.616729736328125, -0.5777740478515625, -0.538818359375, -0.4998626708984375, -0.460906982421875, -0.4219512939453125, -0.38299560546875, -0.3440399169921875, -0.305084228515625, -0.2661285400390625, -0.2271728515625, -0.1882171630859375, -0.149261474609375, -0.1103057861328125, -0.07135009765625, -0.0323944091796875, 0.006561279296875, 0.0455169677734375, 0.08447265625, 0.1234283447265625, 0.162384033203125, 0.2013397216796875, 0.24029541015625, 0.2792510986328125, 0.318206787109375, 0.3571624755859375, 0.3961181640625, 0.4350738525390625, 0.474029541015625, 0.5129852294921875, 0.55194091796875, 0.5908966064453125, 0.629852294921875, 0.6688079833984375, 0.707763671875, 0.7467193603515625, 0.785675048828125, 0.8246307373046875, 0.86358642578125, 0.9025421142578125, 0.941497802734375, 0.9804534912109375, 1.0194091796875, 1.0583648681640625, 1.097320556640625, 1.1362762451171875, 1.17523193359375, 1.2141876220703125, 1.253143310546875, 1.2920989990234375, 1.3310546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 9.0, 10.0, 28.0, 38.0, 82.0, 135.0, 179.0, 169.0, 127.0, 97.0, 51.0, 29.0, 19.0, 11.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.762930870056152, -8.532520294189453, -8.302109718322754, -8.071699142456055, -7.841289043426514, -7.610878944396973, -7.380468368530273, -7.150057792663574, -6.919647693634033, -6.689237117767334, -6.458827018737793, -6.228416442871094, -5.9980058670043945, -5.7675957679748535, -5.537185192108154, -5.306775093078613, -5.076364517211914, -4.845953941345215, -4.615543842315674, -4.385133266448975, -4.154722690582275, -3.9243125915527344, -3.693902015686035, -3.463491678237915, -3.2330808639526367, -3.0026705265045166, -2.7722599506378174, -2.5418496131896973, -2.311439275741577, -2.081028938293457, -1.8506183624267578, -1.6202080249786377, -1.3897976875305176, -1.159387230873108, -0.9289768934249878, -0.6985664367675781, -0.46815603971481323, -0.23774564266204834, -0.007335186004638672, 0.22307515144348145, 0.4534856081008911, 0.683896005153656, 0.9143064022064209, 1.1447168588638306, 1.3751273155212402, 1.6055376529693604, 1.83594810962677, 2.0663585662841797, 2.2967689037323, 2.52717924118042, 2.757589817047119, 2.9880001544952393, 3.2184104919433594, 3.4488210678100586, 3.6792314052581787, 3.909641742706299, 4.140052318572998, 4.370462894439697, 4.600872993469238, 4.8312835693359375, 5.061694145202637, 5.292104244232178, 5.522514820098877, 5.752924919128418, 5.983335494995117]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 14.0, 3.0, 12.0, 17.0, 18.0, 11.0, 20.0, 14.0, 19.0, 24.0, 33.0, 22.0, 37.0, 37.0, 38.0, 29.0, 34.0, 40.0, 32.0, 38.0, 42.0, 43.0, 40.0, 33.0, 27.0, 32.0, 26.0, 32.0, 29.0, 25.0, 23.0, 20.0, 23.0, 13.0, 19.0, 15.0, 9.0, 7.0, 13.0, 5.0, 6.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.5090084075927734, -2.4304816722869873, -2.3519551753997803, -2.273428440093994, -2.194901704788208, -2.116374969482422, -2.037848472595215, -1.9593217372894287, -1.8807951211929321, -1.8022685050964355, -1.7237417697906494, -1.6452151536941528, -1.5666885375976562, -1.4881618022918701, -1.4096351861953735, -1.331108570098877, -1.2525818347930908, -1.1740552186965942, -1.095528483390808, -1.0170018672943115, -0.9384751915931702, -0.8599485158920288, -0.7814218997955322, -0.7028952240943909, -0.6243685483932495, -0.5458418726921082, -0.4673152267932892, -0.3887885808944702, -0.31026190519332886, -0.2317352294921875, -0.15320858359336853, -0.07468193769454956, 0.003844738006591797, 0.08237139880657196, 0.16089805960655212, 0.2394247204065323, 0.31795138120651245, 0.3964780569076538, 0.4750047028064728, 0.5535313487052917, 0.6320580244064331, 0.7105847001075745, 0.7891113758087158, 0.8676379919052124, 0.9461646676063538, 1.0246913433074951, 1.1032179594039917, 1.1817445755004883, 1.2602713108062744, 1.338797926902771, 1.4173246622085571, 1.4958512783050537, 1.5743780136108398, 1.6529046297073364, 1.731431245803833, 1.8099579811096191, 1.8884845972061157, 1.9670112133026123, 2.0455379486083984, 2.1240646839141846, 2.2025911808013916, 2.2811179161071777, 2.359644651412964, 2.438171148300171, 2.516697883605957]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 10.0, 11.0, 26.0, 27.0, 45.0, 63.0, 89.0, 105.0, 185.0, 285.0, 453.0, 720.0, 1231.0, 2301.0, 4363.0, 8670.0, 19474.0, 45951.0, 122383.0, 377252.0, 298052.0, 97470.0, 37286.0, 16071.0, 7405.0, 3661.0, 2029.0, 1049.0, 645.0, 426.0, 262.0, 183.0, 110.0, 80.0, 35.0, 34.0, 29.0, 21.0, 11.0, 11.0, 7.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.369140625, -1.3248138427734375, -1.280487060546875, -1.2361602783203125, -1.19183349609375, -1.1475067138671875, -1.103179931640625, -1.0588531494140625, -1.0145263671875, -0.9701995849609375, -0.925872802734375, -0.8815460205078125, -0.83721923828125, -0.7928924560546875, -0.748565673828125, -0.7042388916015625, -0.659912109375, -0.6155853271484375, -0.571258544921875, -0.5269317626953125, -0.48260498046875, -0.4382781982421875, -0.393951416015625, -0.3496246337890625, -0.3052978515625, -0.2609710693359375, -0.216644287109375, -0.1723175048828125, -0.12799072265625, -0.0836639404296875, -0.039337158203125, 0.0049896240234375, 0.04931640625, 0.0936431884765625, 0.137969970703125, 0.1822967529296875, 0.22662353515625, 0.2709503173828125, 0.315277099609375, 0.3596038818359375, 0.4039306640625, 0.4482574462890625, 0.492584228515625, 0.5369110107421875, 0.58123779296875, 0.6255645751953125, 0.669891357421875, 0.7142181396484375, 0.758544921875, 0.8028717041015625, 0.847198486328125, 0.8915252685546875, 0.93585205078125, 0.9801788330078125, 1.024505615234375, 1.0688323974609375, 1.1131591796875, 1.1574859619140625, 1.201812744140625, 1.2461395263671875, 1.29046630859375, 1.3347930908203125, 1.379119873046875, 1.4234466552734375, 1.4677734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 6.0, 15.0, 14.0, 14.0, 19.0, 28.0, 23.0, 31.0, 37.0, 36.0, 36.0, 44.0, 39.0, 41.0, 52.0, 53.0, 51.0, 54.0, 48.0, 35.0, 44.0, 47.0, 33.0, 36.0, 27.0, 25.0, 17.0, 20.0, 18.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313232421875, -0.3026924133300781, -0.29215240478515625, -0.2816123962402344, -0.2710723876953125, -0.2605323791503906, -0.24999237060546875, -0.23945236206054688, -0.228912353515625, -0.21837234497070312, -0.20783233642578125, -0.19729232788085938, -0.1867523193359375, -0.17621231079101562, -0.16567230224609375, -0.15513229370117188, -0.14459228515625, -0.13405227661132812, -0.12351226806640625, -0.11297225952148438, -0.1024322509765625, -0.09189224243164062, -0.08135223388671875, -0.07081222534179688, -0.060272216796875, -0.049732208251953125, -0.03919219970703125, -0.028652191162109375, -0.0181121826171875, -0.007572174072265625, 0.00296783447265625, 0.013507843017578125, 0.0240478515625, 0.034587860107421875, 0.04512786865234375, 0.055667877197265625, 0.0662078857421875, 0.07674789428710938, 0.08728790283203125, 0.09782791137695312, 0.108367919921875, 0.11890792846679688, 0.12944793701171875, 0.13998794555664062, 0.1505279541015625, 0.16106796264648438, 0.17160797119140625, 0.18214797973632812, 0.19268798828125, 0.20322799682617188, 0.21376800537109375, 0.22430801391601562, 0.2348480224609375, 0.24538803100585938, 0.25592803955078125, 0.2664680480957031, 0.277008056640625, 0.2875480651855469, 0.29808807373046875, 0.3086280822753906, 0.3191680908203125, 0.3297080993652344, 0.34024810791015625, 0.3507881164550781, 0.361328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 13.0, 9.0, 10.0, 23.0, 24.0, 32.0, 30.0, 69.0, 100.0, 203.0, 342.0, 549.0, 1077.0, 2277.0, 5443.0, 16494.0, 61345.0, 336335.0, 510186.0, 81444.0, 20322.0, 6798.0, 2680.0, 1230.0, 660.0, 315.0, 202.0, 141.0, 74.0, 39.0, 31.0, 21.0, 18.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.104766845703125, -2.02984619140625, -1.954925537109375, -1.8800048828125, -1.805084228515625, -1.73016357421875, -1.655242919921875, -1.580322265625, -1.505401611328125, -1.43048095703125, -1.355560302734375, -1.2806396484375, -1.205718994140625, -1.13079833984375, -1.055877685546875, -0.98095703125, -0.906036376953125, -0.83111572265625, -0.756195068359375, -0.6812744140625, -0.606353759765625, -0.53143310546875, -0.456512451171875, -0.381591796875, -0.306671142578125, -0.23175048828125, -0.156829833984375, -0.0819091796875, -0.006988525390625, 0.06793212890625, 0.142852783203125, 0.2177734375, 0.292694091796875, 0.36761474609375, 0.442535400390625, 0.5174560546875, 0.592376708984375, 0.66729736328125, 0.742218017578125, 0.817138671875, 0.892059326171875, 0.96697998046875, 1.041900634765625, 1.1168212890625, 1.191741943359375, 1.26666259765625, 1.341583251953125, 1.41650390625, 1.491424560546875, 1.56634521484375, 1.641265869140625, 1.7161865234375, 1.791107177734375, 1.86602783203125, 1.940948486328125, 2.015869140625, 2.090789794921875, 2.16571044921875, 2.240631103515625, 2.3155517578125, 2.390472412109375, 2.46539306640625, 2.540313720703125, 2.615234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 13.0, 13.0, 13.0, 21.0, 25.0, 37.0, 27.0, 36.0, 41.0, 50.0, 38.0, 64.0, 72.0, 64.0, 62.0, 43.0, 50.0, 53.0, 41.0, 33.0, 32.0, 29.0, 21.0, 18.0, 19.0, 19.0, 11.0, 12.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.989349365234375, -1.92596435546875, -1.862579345703125, -1.7991943359375, -1.735809326171875, -1.67242431640625, -1.609039306640625, -1.545654296875, -1.482269287109375, -1.41888427734375, -1.355499267578125, -1.2921142578125, -1.228729248046875, -1.16534423828125, -1.101959228515625, -1.03857421875, -0.975189208984375, -0.91180419921875, -0.848419189453125, -0.7850341796875, -0.721649169921875, -0.65826416015625, -0.594879150390625, -0.531494140625, -0.468109130859375, -0.40472412109375, -0.341339111328125, -0.2779541015625, -0.214569091796875, -0.15118408203125, -0.087799072265625, -0.0244140625, 0.038970947265625, 0.10235595703125, 0.165740966796875, 0.2291259765625, 0.292510986328125, 0.35589599609375, 0.419281005859375, 0.482666015625, 0.546051025390625, 0.60943603515625, 0.672821044921875, 0.7362060546875, 0.799591064453125, 0.86297607421875, 0.926361083984375, 0.98974609375, 1.053131103515625, 1.11651611328125, 1.179901123046875, 1.2432861328125, 1.306671142578125, 1.37005615234375, 1.433441162109375, 1.496826171875, 1.560211181640625, 1.62359619140625, 1.686981201171875, 1.7503662109375, 1.813751220703125, 1.87713623046875, 1.940521240234375, 2.00390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 21.0, 16.0, 26.0, 34.0, 69.0, 86.0, 115.0, 233.0, 387.0, 795.0, 1861.0, 4733.0, 21773.0, 873172.0, 130502.0, 9239.0, 2917.0, 1215.0, 535.0, 280.0, 166.0, 117.0, 76.0, 57.0, 40.0, 20.0, 11.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.388671875, -3.27850341796875, -3.1683349609375, -3.05816650390625, -2.947998046875, -2.83782958984375, -2.7276611328125, -2.61749267578125, -2.50732421875, -2.39715576171875, -2.2869873046875, -2.17681884765625, -2.066650390625, -1.95648193359375, -1.8463134765625, -1.73614501953125, -1.6259765625, -1.51580810546875, -1.4056396484375, -1.29547119140625, -1.185302734375, -1.07513427734375, -0.9649658203125, -0.85479736328125, -0.74462890625, -0.63446044921875, -0.5242919921875, -0.41412353515625, -0.303955078125, -0.19378662109375, -0.0836181640625, 0.02655029296875, 0.13671875, 0.24688720703125, 0.3570556640625, 0.46722412109375, 0.577392578125, 0.68756103515625, 0.7977294921875, 0.90789794921875, 1.01806640625, 1.12823486328125, 1.2384033203125, 1.34857177734375, 1.458740234375, 1.56890869140625, 1.6790771484375, 1.78924560546875, 1.8994140625, 2.00958251953125, 2.1197509765625, 2.22991943359375, 2.340087890625, 2.45025634765625, 2.5604248046875, 2.67059326171875, 2.78076171875, 2.89093017578125, 3.0010986328125, 3.11126708984375, 3.221435546875, 3.33160400390625, 3.4417724609375, 3.55194091796875, 3.662109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 15.0, 21.0, 26.0, 32.0, 60.0, 71.0, 122.0, 286.0, 104.0, 76.0, 56.0, 35.0, 26.0, 15.0, 16.0, 7.0, 3.0, 1.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00037670135498046875, -0.0003630220890045166, -0.00034934282302856445, -0.0003356635570526123, -0.00032198429107666016, -0.000308305025100708, -0.00029462575912475586, -0.0002809464931488037, -0.00026726722717285156, -0.0002535879611968994, -0.00023990869522094727, -0.00022622942924499512, -0.00021255016326904297, -0.00019887089729309082, -0.00018519163131713867, -0.00017151236534118652, -0.00015783309936523438, -0.00014415383338928223, -0.00013047456741333008, -0.00011679530143737793, -0.00010311603546142578, -8.943676948547363e-05, -7.575750350952148e-05, -6.207823753356934e-05, -4.839897155761719e-05, -3.471970558166504e-05, -2.104043960571289e-05, -7.361173629760742e-06, 6.318092346191406e-06, 1.9997358322143555e-05, 3.36766242980957e-05, 4.735589027404785e-05, 6.103515625e-05, 7.471442222595215e-05, 8.83936882019043e-05, 0.00010207295417785645, 0.0001157522201538086, 0.00012943148612976074, 0.0001431107521057129, 0.00015679001808166504, 0.0001704692840576172, 0.00018414855003356934, 0.00019782781600952148, 0.00021150708198547363, 0.00022518634796142578, 0.00023886561393737793, 0.0002525448799133301, 0.0002662241458892822, 0.0002799034118652344, 0.0002935826778411865, 0.00030726194381713867, 0.0003209412097930908, 0.00033462047576904297, 0.0003482997417449951, 0.00036197900772094727, 0.0003756582736968994, 0.00038933753967285156, 0.0004030168056488037, 0.00041669607162475586, 0.000430375337600708, 0.00044405460357666016, 0.0004577338695526123, 0.00047141313552856445, 0.0004850924015045166, 0.0004987716674804688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 8.0, 12.0, 21.0, 22.0, 33.0, 52.0, 53.0, 90.0, 144.0, 239.0, 401.0, 743.0, 1362.0, 2929.0, 7146.0, 27719.0, 625230.0, 350028.0, 20691.0, 6024.0, 2603.0, 1312.0, 645.0, 378.0, 225.0, 145.0, 91.0, 59.0, 34.0, 24.0, 22.0, 12.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1171875, -2.041351318359375, -1.96551513671875, -1.889678955078125, -1.8138427734375, -1.738006591796875, -1.66217041015625, -1.586334228515625, -1.510498046875, -1.434661865234375, -1.35882568359375, -1.282989501953125, -1.2071533203125, -1.131317138671875, -1.05548095703125, -0.979644775390625, -0.90380859375, -0.827972412109375, -0.75213623046875, -0.676300048828125, -0.6004638671875, -0.524627685546875, -0.44879150390625, -0.372955322265625, -0.297119140625, -0.221282958984375, -0.14544677734375, -0.069610595703125, 0.0062255859375, 0.082061767578125, 0.15789794921875, 0.233734130859375, 0.3095703125, 0.385406494140625, 0.46124267578125, 0.537078857421875, 0.6129150390625, 0.688751220703125, 0.76458740234375, 0.840423583984375, 0.916259765625, 0.992095947265625, 1.06793212890625, 1.143768310546875, 1.2196044921875, 1.295440673828125, 1.37127685546875, 1.447113037109375, 1.52294921875, 1.598785400390625, 1.67462158203125, 1.750457763671875, 1.8262939453125, 1.902130126953125, 1.97796630859375, 2.053802490234375, 2.129638671875, 2.205474853515625, 2.28131103515625, 2.357147216796875, 2.4329833984375, 2.508819580078125, 2.58465576171875, 2.660491943359375, 2.736328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 3.0, 11.0, 12.0, 10.0, 18.0, 40.0, 48.0, 88.0, 139.0, 193.0, 165.0, 97.0, 47.0, 29.0, 21.0, 17.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0859375, -2.028778076171875, -1.97161865234375, -1.914459228515625, -1.8572998046875, -1.800140380859375, -1.74298095703125, -1.685821533203125, -1.628662109375, -1.571502685546875, -1.51434326171875, -1.457183837890625, -1.4000244140625, -1.342864990234375, -1.28570556640625, -1.228546142578125, -1.17138671875, -1.114227294921875, -1.05706787109375, -0.999908447265625, -0.9427490234375, -0.885589599609375, -0.82843017578125, -0.771270751953125, -0.714111328125, -0.656951904296875, -0.59979248046875, -0.542633056640625, -0.4854736328125, -0.428314208984375, -0.37115478515625, -0.313995361328125, -0.2568359375, -0.199676513671875, -0.14251708984375, -0.085357666015625, -0.0281982421875, 0.028961181640625, 0.08612060546875, 0.143280029296875, 0.200439453125, 0.257598876953125, 0.31475830078125, 0.371917724609375, 0.4290771484375, 0.486236572265625, 0.54339599609375, 0.600555419921875, 0.65771484375, 0.714874267578125, 0.77203369140625, 0.829193115234375, 0.8863525390625, 0.943511962890625, 1.00067138671875, 1.057830810546875, 1.114990234375, 1.172149658203125, 1.22930908203125, 1.286468505859375, 1.3436279296875, 1.400787353515625, 1.45794677734375, 1.515106201171875, 1.572265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 14.0, 7.0, 9.0, 9.0, 15.0, 16.0, 44.0, 52.0, 70.0, 97.0, 99.0, 113.0, 89.0, 96.0, 82.0, 47.0, 50.0, 35.0, 20.0, 16.0, 6.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.415666580200195, -16.93995475769043, -16.46424102783203, -15.988529205322266, -15.512816429138184, -15.037103652954102, -14.561391830444336, -14.085679054260254, -13.609966278076172, -13.13425350189209, -12.658541679382324, -12.182828903198242, -11.70711612701416, -11.231403350830078, -10.755691528320312, -10.27997875213623, -9.804266929626465, -9.328554153442383, -8.852842330932617, -8.377129554748535, -7.901416778564453, -7.425704479217529, -6.9499921798706055, -6.474279403686523, -5.9985671043396, -5.522854804992676, -5.047142028808594, -4.57142972946167, -4.095717430114746, -3.620004653930664, -3.1442923545837402, -2.6685798168182373, -2.192868232727051, -1.7171556949615479, -1.2414432764053345, -0.7657308578491211, -0.29001832008361816, 0.18569421768188477, 0.6614065170288086, 1.1371190547943115, 1.6128315925598145, 2.0885441303253174, 2.5642566680908203, 3.039968967437744, 3.515681505203247, 3.99139404296875, 4.467106342315674, 4.942818641662598, 5.41853141784668, 5.8942437171936035, 6.3699564933776855, 6.845668792724609, 7.321381568908691, 7.797093868255615, 8.272806167602539, 8.748518943786621, 9.224231719970703, 9.699944496154785, 10.17565631866455, 10.651369094848633, 11.127081871032715, 11.602794647216797, 12.078506469726562, 12.554219245910645, 13.02993106842041]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 17.0, 16.0, 13.0, 19.0, 19.0, 24.0, 21.0, 25.0, 40.0, 35.0, 24.0, 26.0, 47.0, 43.0, 47.0, 41.0, 41.0, 50.0, 46.0, 43.0, 53.0, 33.0, 37.0, 22.0, 27.0, 27.0, 23.0, 20.0, 16.0, 8.0, 11.0, 16.0, 14.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.201085090637207, -9.910774230957031, -9.620463371276855, -9.33015251159668, -9.03984260559082, -8.749531745910645, -8.459220886230469, -8.168910026550293, -7.878599166870117, -7.588288307189941, -7.297977447509766, -7.007667064666748, -6.717356204986572, -6.4270453453063965, -6.136734962463379, -5.846424102783203, -5.556113243103027, -5.265802383422852, -4.975491523742676, -4.685181140899658, -4.394870281219482, -4.104559421539307, -3.81424880027771, -3.5239381790161133, -3.2336273193359375, -2.9433164596557617, -2.653005838394165, -2.3626952171325684, -2.0723843574523926, -1.7820736169815063, -1.4917628765106201, -1.2014522552490234, -0.9111413955688477, -0.6208306550979614, -0.3305199146270752, -0.040209174156188965, 0.25010156631469727, 0.5404123067855835, 0.8307230472564697, 1.1210336685180664, 1.4113445281982422, 1.7016552686691284, 1.9919660091400146, 2.2822766304016113, 2.572587490081787, 2.862898349761963, 3.1532089710235596, 3.4435195922851562, 3.733830451965332, 4.024141311645508, 4.314452171325684, 4.604762554168701, 4.895073413848877, 5.185384273529053, 5.47569465637207, 5.766005516052246, 6.056316375732422, 6.346627235412598, 6.636938095092773, 6.927248477935791, 7.217559337615967, 7.507870197296143, 7.79818058013916, 8.088491439819336, 8.378802299499512]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 13.0, 19.0, 28.0, 40.0, 67.0, 107.0, 188.0, 359.0, 609.0, 1233.0, 2619.0, 5808.0, 15283.0, 52595.0, 464060.0, 3522025.0, 91854.0, 22672.0, 7952.0, 3305.0, 1641.0, 766.0, 406.0, 251.0, 146.0, 76.0, 56.0, 27.0, 22.0, 16.0, 11.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.418975830078125, -2.34381103515625, -2.268646240234375, -2.1934814453125, -2.118316650390625, -2.04315185546875, -1.967987060546875, -1.892822265625, -1.817657470703125, -1.74249267578125, -1.667327880859375, -1.5921630859375, -1.516998291015625, -1.44183349609375, -1.366668701171875, -1.29150390625, -1.216339111328125, -1.14117431640625, -1.066009521484375, -0.9908447265625, -0.915679931640625, -0.84051513671875, -0.765350341796875, -0.690185546875, -0.615020751953125, -0.53985595703125, -0.464691162109375, -0.3895263671875, -0.314361572265625, -0.23919677734375, -0.164031982421875, -0.0888671875, -0.013702392578125, 0.06146240234375, 0.136627197265625, 0.2117919921875, 0.286956787109375, 0.36212158203125, 0.437286376953125, 0.512451171875, 0.587615966796875, 0.66278076171875, 0.737945556640625, 0.8131103515625, 0.888275146484375, 0.96343994140625, 1.038604736328125, 1.11376953125, 1.188934326171875, 1.26409912109375, 1.339263916015625, 1.4144287109375, 1.489593505859375, 1.56475830078125, 1.639923095703125, 1.715087890625, 1.790252685546875, 1.86541748046875, 1.940582275390625, 2.0157470703125, 2.090911865234375, 2.16607666015625, 2.241241455078125, 2.31640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 9.0, 14.0, 21.0, 4.0, 19.0, 24.0, 24.0, 43.0, 25.0, 37.0, 49.0, 46.0, 41.0, 51.0, 56.0, 52.0, 54.0, 56.0, 44.0, 40.0, 43.0, 41.0, 30.0, 35.0, 23.0, 29.0, 18.0, 10.0, 20.0, 10.0, 8.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39501953125, -0.38291168212890625, -0.3708038330078125, -0.35869598388671875, -0.346588134765625, -0.33448028564453125, -0.3223724365234375, -0.31026458740234375, -0.29815673828125, -0.28604888916015625, -0.2739410400390625, -0.26183319091796875, -0.249725341796875, -0.23761749267578125, -0.2255096435546875, -0.21340179443359375, -0.2012939453125, -0.18918609619140625, -0.1770782470703125, -0.16497039794921875, -0.152862548828125, -0.14075469970703125, -0.1286468505859375, -0.11653900146484375, -0.10443115234375, -0.09232330322265625, -0.0802154541015625, -0.06810760498046875, -0.055999755859375, -0.04389190673828125, -0.0317840576171875, -0.01967620849609375, -0.007568359375, 0.00453948974609375, 0.0166473388671875, 0.02875518798828125, 0.040863037109375, 0.05297088623046875, 0.0650787353515625, 0.07718658447265625, 0.08929443359375, 0.10140228271484375, 0.1135101318359375, 0.12561798095703125, 0.137725830078125, 0.14983367919921875, 0.1619415283203125, 0.17404937744140625, 0.1861572265625, 0.19826507568359375, 0.2103729248046875, 0.22248077392578125, 0.234588623046875, 0.24669647216796875, 0.2588043212890625, 0.27091217041015625, 0.28302001953125, 0.29512786865234375, 0.3072357177734375, 0.31934356689453125, 0.331451416015625, 0.34355926513671875, 0.3556671142578125, 0.36777496337890625, 0.3798828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 17.0, 18.0, 17.0, 22.0, 36.0, 58.0, 78.0, 92.0, 126.0, 202.0, 333.0, 452.0, 747.0, 1353.0, 2677.0, 5761.0, 14618.0, 53981.0, 638051.0, 3351713.0, 89338.0, 20021.0, 7159.0, 3224.0, 1658.0, 833.0, 530.0, 358.0, 234.0, 161.0, 113.0, 79.0, 44.0, 37.0, 35.0, 25.0, 24.0, 11.0, 9.0, 6.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.3203125, -3.217010498046875, -3.11370849609375, -3.010406494140625, -2.9071044921875, -2.803802490234375, -2.70050048828125, -2.597198486328125, -2.493896484375, -2.390594482421875, -2.28729248046875, -2.183990478515625, -2.0806884765625, -1.977386474609375, -1.87408447265625, -1.770782470703125, -1.66748046875, -1.564178466796875, -1.46087646484375, -1.357574462890625, -1.2542724609375, -1.150970458984375, -1.04766845703125, -0.944366455078125, -0.841064453125, -0.737762451171875, -0.63446044921875, -0.531158447265625, -0.4278564453125, -0.324554443359375, -0.22125244140625, -0.117950439453125, -0.0146484375, 0.088653564453125, 0.19195556640625, 0.295257568359375, 0.3985595703125, 0.501861572265625, 0.60516357421875, 0.708465576171875, 0.811767578125, 0.915069580078125, 1.01837158203125, 1.121673583984375, 1.2249755859375, 1.328277587890625, 1.43157958984375, 1.534881591796875, 1.63818359375, 1.741485595703125, 1.84478759765625, 1.948089599609375, 2.0513916015625, 2.154693603515625, 2.25799560546875, 2.361297607421875, 2.464599609375, 2.567901611328125, 2.67120361328125, 2.774505615234375, 2.8778076171875, 2.981109619140625, 3.08441162109375, 3.187713623046875, 3.291015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 12.0, 21.0, 24.0, 41.0, 74.0, 172.0, 410.0, 2476.0, 466.0, 178.0, 60.0, 45.0, 18.0, 15.0, 9.0, 9.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.99609375, -1.9365234375, -1.876953125, -1.8173828125, -1.7578125, -1.6982421875, -1.638671875, -1.5791015625, -1.51953125, -1.4599609375, -1.400390625, -1.3408203125, -1.28125, -1.2216796875, -1.162109375, -1.1025390625, -1.04296875, -0.9833984375, -0.923828125, -0.8642578125, -0.8046875, -0.7451171875, -0.685546875, -0.6259765625, -0.56640625, -0.5068359375, -0.447265625, -0.3876953125, -0.328125, -0.2685546875, -0.208984375, -0.1494140625, -0.08984375, -0.0302734375, 0.029296875, 0.0888671875, 0.1484375, 0.2080078125, 0.267578125, 0.3271484375, 0.38671875, 0.4462890625, 0.505859375, 0.5654296875, 0.625, 0.6845703125, 0.744140625, 0.8037109375, 0.86328125, 0.9228515625, 0.982421875, 1.0419921875, 1.1015625, 1.1611328125, 1.220703125, 1.2802734375, 1.33984375, 1.3994140625, 1.458984375, 1.5185546875, 1.578125, 1.6376953125, 1.697265625, 1.7568359375, 1.81640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 24.0, 78.0, 190.0, 366.0, 214.0, 87.0, 24.0, 11.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.99333572387695, -32.28654479980469, -31.579753875732422, -30.872962951660156, -30.166173934936523, -29.459383010864258, -28.752592086791992, -28.045801162719727, -27.33901023864746, -26.632219314575195, -25.92542839050293, -25.218639373779297, -24.51184844970703, -23.805057525634766, -23.0982666015625, -22.391475677490234, -21.68468475341797, -20.977893829345703, -20.271102905273438, -19.564311981201172, -18.85752296447754, -18.150732040405273, -17.443941116333008, -16.737150192260742, -16.03036117553711, -15.323570251464844, -14.616780281066895, -13.909989356994629, -13.203198432922363, -12.496408462524414, -11.789617538452148, -11.082826614379883, -10.376035690307617, -9.669244766235352, -8.962454795837402, -8.255663871765137, -7.548872947692871, -6.842082500457764, -6.135292053222656, -5.428501129150391, -4.721710681915283, -4.014920234680176, -3.30812931060791, -2.6013388633728027, -1.8945481777191162, -1.1877574920654297, -0.48096704483032227, 0.22582387924194336, 0.9326143264770508, 1.6394050121307373, 2.346195697784424, 3.0529861450195312, 3.7597768306732178, 4.466567516326904, 5.173357963562012, 5.880148887634277, 6.586939334869385, 7.293729782104492, 8.000520706176758, 8.707311630249023, 9.414101600646973, 10.120892524719238, 10.827682495117188, 11.534473419189453, 12.241264343261719]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 8.0, 11.0, 14.0, 10.0, 19.0, 26.0, 28.0, 32.0, 38.0, 36.0, 50.0, 43.0, 54.0, 53.0, 49.0, 50.0, 41.0, 43.0, 40.0, 44.0, 63.0, 34.0, 42.0, 41.0, 28.0, 22.0, 15.0, 13.0, 15.0, 12.0, 8.0, 7.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.954738616943359, -5.787208557128906, -5.619678497314453, -5.4521484375, -5.284618377685547, -5.117088317871094, -4.949558258056641, -4.7820281982421875, -4.614498138427734, -4.446968078613281, -4.279438018798828, -4.111907958984375, -3.944377899169922, -3.7768478393554688, -3.6093175411224365, -3.4417874813079834, -3.274257183074951, -3.106727123260498, -2.939197063446045, -2.771667003631592, -2.6041369438171387, -2.4366068840026855, -2.2690765857696533, -2.1015465259552, -1.934016466140747, -1.766486406326294, -1.5989563465118408, -1.4314261674880981, -1.263896107673645, -1.096366047859192, -0.9288358688354492, -0.7613058090209961, -0.5937752723693848, -0.42624518275260925, -0.25871509313583374, -0.09118497371673584, 0.07634508609771729, 0.2438751459121704, 0.4114053249359131, 0.5789353847503662, 0.7464654445648193, 0.9139955043792725, 1.0815255641937256, 1.2490557432174683, 1.4165858030319214, 1.5841158628463745, 1.7516460418701172, 1.9191761016845703, 2.0867061614990234, 2.2542362213134766, 2.4217662811279297, 2.589296340942383, 2.756826400756836, 2.924356460571289, 3.0918867588043213, 3.2594168186187744, 3.4269468784332275, 3.5944769382476807, 3.762006998062134, 3.929537296295166, 4.097067356109619, 4.264597415924072, 4.432127475738525, 4.5996575355529785, 4.767187595367432]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 16.0, 18.0, 43.0, 50.0, 110.0, 205.0, 348.0, 626.0, 1284.0, 2657.0, 6061.0, 15869.0, 48578.0, 178953.0, 496532.0, 210873.0, 55886.0, 17810.0, 6758.0, 2894.0, 1378.0, 726.0, 394.0, 175.0, 107.0, 64.0, 33.0, 22.0, 19.0, 17.0, 10.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9238433837890625, -1.856475830078125, -1.7891082763671875, -1.72174072265625, -1.6543731689453125, -1.587005615234375, -1.5196380615234375, -1.4522705078125, -1.3849029541015625, -1.317535400390625, -1.2501678466796875, -1.18280029296875, -1.1154327392578125, -1.048065185546875, -0.9806976318359375, -0.913330078125, -0.8459625244140625, -0.778594970703125, -0.7112274169921875, -0.64385986328125, -0.5764923095703125, -0.509124755859375, -0.4417572021484375, -0.3743896484375, -0.3070220947265625, -0.239654541015625, -0.1722869873046875, -0.10491943359375, -0.0375518798828125, 0.029815673828125, 0.0971832275390625, 0.16455078125, 0.2319183349609375, 0.299285888671875, 0.3666534423828125, 0.43402099609375, 0.5013885498046875, 0.568756103515625, 0.6361236572265625, 0.7034912109375, 0.7708587646484375, 0.838226318359375, 0.9055938720703125, 0.97296142578125, 1.0403289794921875, 1.107696533203125, 1.1750640869140625, 1.242431640625, 1.3097991943359375, 1.377166748046875, 1.4445343017578125, 1.51190185546875, 1.5792694091796875, 1.646636962890625, 1.7140045166015625, 1.7813720703125, 1.8487396240234375, 1.916107177734375, 1.9834747314453125, 2.05084228515625, 2.1182098388671875, 2.185577392578125, 2.2529449462890625, 2.3203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 12.0, 8.0, 10.0, 7.0, 12.0, 16.0, 18.0, 17.0, 30.0, 34.0, 28.0, 40.0, 33.0, 46.0, 39.0, 51.0, 54.0, 37.0, 53.0, 58.0, 61.0, 52.0, 42.0, 40.0, 32.0, 34.0, 27.0, 24.0, 13.0, 15.0, 15.0, 9.0, 13.0, 8.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4423484802246094, -0.42839813232421875, -0.4144477844238281, -0.4004974365234375, -0.3865470886230469, -0.37259674072265625, -0.3586463928222656, -0.344696044921875, -0.3307456970214844, -0.31679534912109375, -0.3028450012207031, -0.2888946533203125, -0.2749443054199219, -0.26099395751953125, -0.24704360961914062, -0.23309326171875, -0.21914291381835938, -0.20519256591796875, -0.19124221801757812, -0.1772918701171875, -0.16334152221679688, -0.14939117431640625, -0.13544082641601562, -0.121490478515625, -0.10754013061523438, -0.09358978271484375, -0.07963943481445312, -0.0656890869140625, -0.051738739013671875, -0.03778839111328125, -0.023838043212890625, -0.0098876953125, 0.004062652587890625, 0.01801300048828125, 0.031963348388671875, 0.0459136962890625, 0.059864044189453125, 0.07381439208984375, 0.08776473999023438, 0.101715087890625, 0.11566543579101562, 0.12961578369140625, 0.14356613159179688, 0.1575164794921875, 0.17146682739257812, 0.18541717529296875, 0.19936752319335938, 0.21331787109375, 0.22726821899414062, 0.24121856689453125, 0.2551689147949219, 0.2691192626953125, 0.2830696105957031, 0.29701995849609375, 0.3109703063964844, 0.324920654296875, 0.3388710021972656, 0.35282135009765625, 0.3667716979980469, 0.3807220458984375, 0.3946723937988281, 0.40862274169921875, 0.4225730895996094, 0.4365234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 9.0, 4.0, 9.0, 9.0, 15.0, 32.0, 37.0, 60.0, 88.0, 110.0, 187.0, 274.0, 482.0, 822.0, 1630.0, 3683.0, 9896.0, 35774.0, 197752.0, 623607.0, 133025.0, 26543.0, 7946.0, 3090.0, 1448.0, 748.0, 430.0, 288.0, 168.0, 100.0, 76.0, 57.0, 41.0, 30.0, 22.0, 20.0, 7.0, 11.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.68475341796875, -2.5902099609375, -2.49566650390625, -2.401123046875, -2.30657958984375, -2.2120361328125, -2.11749267578125, -2.02294921875, -1.92840576171875, -1.8338623046875, -1.73931884765625, -1.644775390625, -1.55023193359375, -1.4556884765625, -1.36114501953125, -1.2666015625, -1.17205810546875, -1.0775146484375, -0.98297119140625, -0.888427734375, -0.79388427734375, -0.6993408203125, -0.60479736328125, -0.51025390625, -0.41571044921875, -0.3211669921875, -0.22662353515625, -0.132080078125, -0.03753662109375, 0.0570068359375, 0.15155029296875, 0.24609375, 0.34063720703125, 0.4351806640625, 0.52972412109375, 0.624267578125, 0.71881103515625, 0.8133544921875, 0.90789794921875, 1.00244140625, 1.09698486328125, 1.1915283203125, 1.28607177734375, 1.380615234375, 1.47515869140625, 1.5697021484375, 1.66424560546875, 1.7587890625, 1.85333251953125, 1.9478759765625, 2.04241943359375, 2.136962890625, 2.23150634765625, 2.3260498046875, 2.42059326171875, 2.51513671875, 2.60968017578125, 2.7042236328125, 2.79876708984375, 2.893310546875, 2.98785400390625, 3.0823974609375, 3.17694091796875, 3.271484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 9.0, 5.0, 8.0, 15.0, 18.0, 15.0, 13.0, 26.0, 22.0, 24.0, 28.0, 42.0, 39.0, 37.0, 49.0, 43.0, 45.0, 45.0, 48.0, 51.0, 44.0, 42.0, 44.0, 34.0, 39.0, 34.0, 29.0, 19.0, 25.0, 25.0, 17.0, 15.0, 6.0, 5.0, 4.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.74609375, -2.66510009765625, -2.5841064453125, -2.50311279296875, -2.422119140625, -2.34112548828125, -2.2601318359375, -2.17913818359375, -2.09814453125, -2.01715087890625, -1.9361572265625, -1.85516357421875, -1.774169921875, -1.69317626953125, -1.6121826171875, -1.53118896484375, -1.4501953125, -1.36920166015625, -1.2882080078125, -1.20721435546875, -1.126220703125, -1.04522705078125, -0.9642333984375, -0.88323974609375, -0.80224609375, -0.72125244140625, -0.6402587890625, -0.55926513671875, -0.478271484375, -0.39727783203125, -0.3162841796875, -0.23529052734375, -0.154296875, -0.07330322265625, 0.0076904296875, 0.08868408203125, 0.169677734375, 0.25067138671875, 0.3316650390625, 0.41265869140625, 0.49365234375, 0.57464599609375, 0.6556396484375, 0.73663330078125, 0.817626953125, 0.89862060546875, 0.9796142578125, 1.06060791015625, 1.1416015625, 1.22259521484375, 1.3035888671875, 1.38458251953125, 1.465576171875, 1.54656982421875, 1.6275634765625, 1.70855712890625, 1.78955078125, 1.87054443359375, 1.9515380859375, 2.03253173828125, 2.113525390625, 2.19451904296875, 2.2755126953125, 2.35650634765625, 2.4375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 7.0, 9.0, 10.0, 14.0, 10.0, 28.0, 34.0, 41.0, 78.0, 120.0, 229.0, 382.0, 989.0, 2978.0, 18254.0, 751411.0, 260520.0, 9836.0, 2046.0, 683.0, 349.0, 185.0, 96.0, 79.0, 57.0, 34.0, 13.0, 14.0, 10.0, 6.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.693359375, -3.565399169921875, -3.43743896484375, -3.309478759765625, -3.1815185546875, -3.053558349609375, -2.92559814453125, -2.797637939453125, -2.669677734375, -2.541717529296875, -2.41375732421875, -2.285797119140625, -2.1578369140625, -2.029876708984375, -1.90191650390625, -1.773956298828125, -1.64599609375, -1.518035888671875, -1.39007568359375, -1.262115478515625, -1.1341552734375, -1.006195068359375, -0.87823486328125, -0.750274658203125, -0.622314453125, -0.494354248046875, -0.36639404296875, -0.238433837890625, -0.1104736328125, 0.017486572265625, 0.14544677734375, 0.273406982421875, 0.4013671875, 0.529327392578125, 0.65728759765625, 0.785247802734375, 0.9132080078125, 1.041168212890625, 1.16912841796875, 1.297088623046875, 1.425048828125, 1.553009033203125, 1.68096923828125, 1.808929443359375, 1.9368896484375, 2.064849853515625, 2.19281005859375, 2.320770263671875, 2.44873046875, 2.576690673828125, 2.70465087890625, 2.832611083984375, 2.9605712890625, 3.088531494140625, 3.21649169921875, 3.344451904296875, 3.472412109375, 3.600372314453125, 3.72833251953125, 3.856292724609375, 3.9842529296875, 4.112213134765625, 4.24017333984375, 4.368133544921875, 4.49609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 4.0, 12.0, 18.0, 20.0, 30.0, 33.0, 52.0, 71.0, 102.0, 118.0, 123.0, 85.0, 75.0, 82.0, 53.0, 30.0, 27.0, 15.0, 10.0, 2.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003268718719482422, -0.00031601637601852417, -0.00030516088008880615, -0.00029430538415908813, -0.0002834498882293701, -0.0002725943922996521, -0.0002617388963699341, -0.00025088340044021606, -0.00024002790451049805, -0.00022917240858078003, -0.000218316912651062, -0.000207461416721344, -0.00019660592079162598, -0.00018575042486190796, -0.00017489492893218994, -0.00016403943300247192, -0.0001531839370727539, -0.0001423284411430359, -0.00013147294521331787, -0.00012061744928359985, -0.00010976195335388184, -9.890645742416382e-05, -8.80509614944458e-05, -7.719546556472778e-05, -6.633996963500977e-05, -5.548447370529175e-05, -4.462897777557373e-05, -3.377348184585571e-05, -2.2917985916137695e-05, -1.2062489986419678e-05, -1.2069940567016602e-06, 9.648501873016357e-06, 2.0503997802734375e-05, 3.135949373245239e-05, 4.221498966217041e-05, 5.307048559188843e-05, 6.392598152160645e-05, 7.478147745132446e-05, 8.563697338104248e-05, 9.64924693107605e-05, 0.00010734796524047852, 0.00011820346117019653, 0.00012905895709991455, 0.00013991445302963257, 0.00015076994895935059, 0.0001616254448890686, 0.00017248094081878662, 0.00018333643674850464, 0.00019419193267822266, 0.00020504742860794067, 0.0002159029245376587, 0.0002267584204673767, 0.00023761391639709473, 0.00024846941232681274, 0.00025932490825653076, 0.0002701804041862488, 0.0002810359001159668, 0.0002918913960456848, 0.00030274689197540283, 0.00031360238790512085, 0.00032445788383483887, 0.0003353133797645569, 0.0003461688756942749, 0.0003570243716239929, 0.00036787986755371094]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 18.0, 25.0, 34.0, 50.0, 60.0, 100.0, 156.0, 268.0, 443.0, 766.0, 1596.0, 3288.0, 8443.0, 28137.0, 178263.0, 679161.0, 113405.0, 21442.0, 6871.0, 2807.0, 1409.0, 691.0, 412.0, 213.0, 144.0, 98.0, 67.0, 50.0, 30.0, 20.0, 11.0, 9.0, 8.0, 9.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.57421875, -1.51458740234375, -1.4549560546875, -1.39532470703125, -1.335693359375, -1.27606201171875, -1.2164306640625, -1.15679931640625, -1.09716796875, -1.03753662109375, -0.9779052734375, -0.91827392578125, -0.858642578125, -0.79901123046875, -0.7393798828125, -0.67974853515625, -0.6201171875, -0.56048583984375, -0.5008544921875, -0.44122314453125, -0.381591796875, -0.32196044921875, -0.2623291015625, -0.20269775390625, -0.14306640625, -0.08343505859375, -0.0238037109375, 0.03582763671875, 0.095458984375, 0.15509033203125, 0.2147216796875, 0.27435302734375, 0.333984375, 0.39361572265625, 0.4532470703125, 0.51287841796875, 0.572509765625, 0.63214111328125, 0.6917724609375, 0.75140380859375, 0.81103515625, 0.87066650390625, 0.9302978515625, 0.98992919921875, 1.049560546875, 1.10919189453125, 1.1688232421875, 1.22845458984375, 1.2880859375, 1.34771728515625, 1.4073486328125, 1.46697998046875, 1.526611328125, 1.58624267578125, 1.6458740234375, 1.70550537109375, 1.76513671875, 1.82476806640625, 1.8843994140625, 1.94403076171875, 2.003662109375, 2.06329345703125, 2.1229248046875, 2.18255615234375, 2.2421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 17.0, 29.0, 41.0, 51.0, 66.0, 99.0, 106.0, 115.0, 102.0, 88.0, 61.0, 56.0, 32.0, 19.0, 20.0, 8.0, 14.0, 8.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.517608642578125, -1.46881103515625, -1.420013427734375, -1.3712158203125, -1.322418212890625, -1.27362060546875, -1.224822998046875, -1.176025390625, -1.127227783203125, -1.07843017578125, -1.029632568359375, -0.9808349609375, -0.932037353515625, -0.88323974609375, -0.834442138671875, -0.78564453125, -0.736846923828125, -0.68804931640625, -0.639251708984375, -0.5904541015625, -0.541656494140625, -0.49285888671875, -0.444061279296875, -0.395263671875, -0.346466064453125, -0.29766845703125, -0.248870849609375, -0.2000732421875, -0.151275634765625, -0.10247802734375, -0.053680419921875, -0.0048828125, 0.043914794921875, 0.09271240234375, 0.141510009765625, 0.1903076171875, 0.239105224609375, 0.28790283203125, 0.336700439453125, 0.385498046875, 0.434295654296875, 0.48309326171875, 0.531890869140625, 0.5806884765625, 0.629486083984375, 0.67828369140625, 0.727081298828125, 0.77587890625, 0.824676513671875, 0.87347412109375, 0.922271728515625, 0.9710693359375, 1.019866943359375, 1.06866455078125, 1.117462158203125, 1.166259765625, 1.215057373046875, 1.26385498046875, 1.312652587890625, 1.3614501953125, 1.410247802734375, 1.45904541015625, 1.507843017578125, 1.556640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 26.0, 42.0, 82.0, 132.0, 146.0, 159.0, 134.0, 101.0, 70.0, 41.0, 22.0, 13.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.737228393554688, -23.920413970947266, -23.103599548339844, -22.286785125732422, -21.469970703125, -20.653156280517578, -19.83634376525879, -19.019529342651367, -18.202714920043945, -17.385900497436523, -16.5690860748291, -15.752272605895996, -14.935458183288574, -14.118643760681152, -13.301830291748047, -12.485015869140625, -11.668201446533203, -10.851387023925781, -10.03457260131836, -9.217759132385254, -8.400944709777832, -7.58413028717041, -6.7673163414001465, -5.950502395629883, -5.133687973022461, -4.316873550415039, -3.5000596046447754, -2.6832454204559326, -1.8664312362670898, -1.049616813659668, -0.2328028678894043, 0.5840110778808594, 1.4008235931396484, 2.217637777328491, 3.034451961517334, 3.8512661457061768, 4.6680803298950195, 5.484894752502441, 6.301708698272705, 7.118522644042969, 7.935337066650391, 8.752151489257812, 9.568965911865234, 10.38577938079834, 11.202593803405762, 12.019408226013184, 12.836221694946289, 13.653036117553711, 14.469850540161133, 15.286664962768555, 16.103479385375977, 16.9202938079834, 17.737106323242188, 18.55392074584961, 19.37073516845703, 20.187549591064453, 21.004364013671875, 21.821178436279297, 22.63799285888672, 23.45480728149414, 24.271621704101562, 25.088436126708984, 25.905248641967773, 26.722063064575195, 27.538877487182617]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 9.0, 7.0, 12.0, 12.0, 13.0, 17.0, 17.0, 20.0, 13.0, 23.0, 30.0, 30.0, 32.0, 34.0, 49.0, 52.0, 35.0, 45.0, 61.0, 46.0, 46.0, 34.0, 37.0, 26.0, 36.0, 31.0, 27.0, 18.0, 27.0, 25.0, 25.0, 13.0, 10.0, 10.0, 15.0, 11.0, 7.0, 11.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.96211051940918, -11.571186065673828, -11.180262565612793, -10.789338111877441, -10.398414611816406, -10.007490158081055, -9.616565704345703, -9.225641250610352, -8.834717750549316, -8.443793296813965, -8.05286979675293, -7.661945343017578, -7.271021366119385, -6.880097389221191, -6.48917293548584, -6.0982489585876465, -5.707324981689453, -5.31640100479126, -4.925477027893066, -4.534552574157715, -4.1436285972595215, -3.752704620361328, -3.3617804050445557, -2.970856189727783, -2.57993221282959, -2.1890082359313965, -1.798084020614624, -1.4071599245071411, -1.0162358283996582, -0.6253117322921753, -0.23438763618469238, 0.15653657913208008, 0.5474615097045898, 0.9383856058120728, 1.3293097019195557, 1.7202337980270386, 2.1111578941345215, 2.502081871032715, 2.8930060863494873, 3.2839303016662598, 3.674854278564453, 4.0657782554626465, 4.45670223236084, 4.847626686096191, 5.238550662994385, 5.629474639892578, 6.02039909362793, 6.411323070526123, 6.802247047424316, 7.19317102432251, 7.584095001220703, 7.975019454956055, 8.365943908691406, 8.756867408752441, 9.147791862487793, 9.538715362548828, 9.92963981628418, 10.320564270019531, 10.711487770080566, 11.102412223815918, 11.493335723876953, 11.884260177612305, 12.275184631347656, 12.666109085083008, 13.057032585144043]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 14.0, 11.0, 17.0, 22.0, 45.0, 61.0, 99.0, 155.0, 265.0, 464.0, 915.0, 2081.0, 6340.0, 50171.0, 4107762.0, 18705.0, 3999.0, 1465.0, 700.0, 385.0, 211.0, 124.0, 102.0, 52.0, 31.0, 21.0, 17.0, 9.0, 8.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.744140625, -5.5546875, -5.365234375, -5.17578125, -4.986328125, -4.796875, -4.607421875, -4.41796875, -4.228515625, -4.0390625, -3.849609375, -3.66015625, -3.470703125, -3.28125, -3.091796875, -2.90234375, -2.712890625, -2.5234375, -2.333984375, -2.14453125, -1.955078125, -1.765625, -1.576171875, -1.38671875, -1.197265625, -1.0078125, -0.818359375, -0.62890625, -0.439453125, -0.25, -0.060546875, 0.12890625, 0.318359375, 0.5078125, 0.697265625, 0.88671875, 1.076171875, 1.265625, 1.455078125, 1.64453125, 1.833984375, 2.0234375, 2.212890625, 2.40234375, 2.591796875, 2.78125, 2.970703125, 3.16015625, 3.349609375, 3.5390625, 3.728515625, 3.91796875, 4.107421875, 4.296875, 4.486328125, 4.67578125, 4.865234375, 5.0546875, 5.244140625, 5.43359375, 5.623046875, 5.8125, 6.001953125, 6.19140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 13.0, 8.0, 11.0, 11.0, 22.0, 12.0, 28.0, 24.0, 24.0, 39.0, 31.0, 40.0, 43.0, 38.0, 59.0, 45.0, 37.0, 57.0, 45.0, 52.0, 37.0, 43.0, 34.0, 28.0, 22.0, 27.0, 26.0, 17.0, 12.0, 9.0, 13.0, 6.0, 7.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.41162109375, -0.397979736328125, -0.38433837890625, -0.370697021484375, -0.3570556640625, -0.343414306640625, -0.32977294921875, -0.316131591796875, -0.302490234375, -0.288848876953125, -0.27520751953125, -0.261566162109375, -0.2479248046875, -0.234283447265625, -0.22064208984375, -0.207000732421875, -0.193359375, -0.179718017578125, -0.16607666015625, -0.152435302734375, -0.1387939453125, -0.125152587890625, -0.11151123046875, -0.097869873046875, -0.084228515625, -0.070587158203125, -0.05694580078125, -0.043304443359375, -0.0296630859375, -0.016021728515625, -0.00238037109375, 0.011260986328125, 0.02490234375, 0.038543701171875, 0.05218505859375, 0.065826416015625, 0.0794677734375, 0.093109130859375, 0.10675048828125, 0.120391845703125, 0.134033203125, 0.147674560546875, 0.16131591796875, 0.174957275390625, 0.1885986328125, 0.202239990234375, 0.21588134765625, 0.229522705078125, 0.2431640625, 0.256805419921875, 0.27044677734375, 0.284088134765625, 0.2977294921875, 0.311370849609375, 0.32501220703125, 0.338653564453125, 0.352294921875, 0.365936279296875, 0.37957763671875, 0.393218994140625, 0.4068603515625, 0.420501708984375, 0.43414306640625, 0.447784423828125, 0.46142578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 14.0, 23.0, 37.0, 67.0, 135.0, 284.0, 627.0, 1673.0, 6704.0, 1735980.0, 2438948.0, 6935.0, 1714.0, 591.0, 278.0, 128.0, 70.0, 32.0, 19.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.296875, -13.939453125, -13.58203125, -13.224609375, -12.8671875, -12.509765625, -12.15234375, -11.794921875, -11.4375, -11.080078125, -10.72265625, -10.365234375, -10.0078125, -9.650390625, -9.29296875, -8.935546875, -8.578125, -8.220703125, -7.86328125, -7.505859375, -7.1484375, -6.791015625, -6.43359375, -6.076171875, -5.71875, -5.361328125, -5.00390625, -4.646484375, -4.2890625, -3.931640625, -3.57421875, -3.216796875, -2.859375, -2.501953125, -2.14453125, -1.787109375, -1.4296875, -1.072265625, -0.71484375, -0.357421875, 0.0, 0.357421875, 0.71484375, 1.072265625, 1.4296875, 1.787109375, 2.14453125, 2.501953125, 2.859375, 3.216796875, 3.57421875, 3.931640625, 4.2890625, 4.646484375, 5.00390625, 5.361328125, 5.71875, 6.076171875, 6.43359375, 6.791015625, 7.1484375, 7.505859375, 7.86328125, 8.220703125, 8.578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 17.0, 46.0, 172.0, 3552.0, 142.0, 53.0, 18.0, 15.0, 16.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.2925338745117188, -1.2588958740234375, -1.2252578735351562, -1.191619873046875, -1.1579818725585938, -1.1243438720703125, -1.0907058715820312, -1.05706787109375, -1.0234298706054688, -0.9897918701171875, -0.9561538696289062, -0.922515869140625, -0.8888778686523438, -0.8552398681640625, -0.8216018676757812, -0.7879638671875, -0.7543258666992188, -0.7206878662109375, -0.6870498657226562, -0.653411865234375, -0.6197738647460938, -0.5861358642578125, -0.5524978637695312, -0.51885986328125, -0.48522186279296875, -0.4515838623046875, -0.41794586181640625, -0.384307861328125, -0.35066986083984375, -0.3170318603515625, -0.28339385986328125, -0.249755859375, -0.21611785888671875, -0.1824798583984375, -0.14884185791015625, -0.115203857421875, -0.08156585693359375, -0.0479278564453125, -0.01428985595703125, 0.01934814453125, 0.05298614501953125, 0.0866241455078125, 0.12026214599609375, 0.153900146484375, 0.18753814697265625, 0.2211761474609375, 0.25481414794921875, 0.2884521484375, 0.32209014892578125, 0.3557281494140625, 0.38936614990234375, 0.423004150390625, 0.45664215087890625, 0.4902801513671875, 0.5239181518554688, 0.55755615234375, 0.5911941528320312, 0.6248321533203125, 0.6584701538085938, 0.692108154296875, 0.7257461547851562, 0.7593841552734375, 0.7930221557617188, 0.82666015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 12.0, 20.0, 37.0, 60.0, 95.0, 123.0, 141.0, 135.0, 122.0, 76.0, 62.0, 43.0, 18.0, 12.0, 14.0, 7.0, 4.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8458211421966553, -2.724628448486328, -2.603435754776001, -2.482243061065674, -2.3610503673553467, -2.2398576736450195, -2.1186647415161133, -1.9974721670150757, -1.8762794733047485, -1.7550867795944214, -1.6338940858840942, -1.5127012729644775, -1.3915085792541504, -1.2703158855438232, -1.149123191833496, -1.027930498123169, -0.9067378044128418, -0.7855451107025146, -0.6643524169921875, -0.5431596636772156, -0.4219669699668884, -0.3007742762565613, -0.17958152294158936, -0.05838882923126221, 0.06280386447906494, 0.18399657309055328, 0.3051892817020416, 0.42638200521469116, 0.5475746989250183, 0.6687673926353455, 0.7899601459503174, 0.9111528396606445, 1.0323452949523926, 1.1535379886627197, 1.2747306823730469, 1.395923376083374, 1.5171160697937012, 1.6383087635040283, 1.759501576423645, 1.8806942701339722, 2.0018868446350098, 2.123079538345337, 2.244272232055664, 2.365464925765991, 2.4866576194763184, 2.6078503131866455, 2.7290430068969727, 2.850235939025879, 2.971428632736206, 3.092621326446533, 3.2138140201568604, 3.3350067138671875, 3.4561994075775146, 3.577392101287842, 3.698585033416748, 3.819777488708496, 3.9409704208374023, 4.062163352966309, 4.183355808258057, 4.304548740386963, 4.425741195678711, 4.546934127807617, 4.668126583099365, 4.7893195152282715, 4.9105119705200195]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 9.0, 4.0, 11.0, 18.0, 13.0, 17.0, 26.0, 15.0, 27.0, 15.0, 36.0, 37.0, 35.0, 37.0, 36.0, 47.0, 35.0, 39.0, 37.0, 40.0, 45.0, 41.0, 33.0, 32.0, 35.0, 30.0, 28.0, 25.0, 28.0, 25.0, 22.0, 9.0, 18.0, 18.0, 11.0, 15.0, 9.0, 7.0, 7.0, 5.0, 7.0, 3.0, 0.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.8350119590759277, -1.7821900844573975, -1.7293682098388672, -1.676546335220337, -1.6237245798110962, -1.570902705192566, -1.5180808305740356, -1.4652589559555054, -1.4124372005462646, -1.3596153259277344, -1.306793451309204, -1.2539715766906738, -1.201149821281433, -1.1483279466629028, -1.0955060720443726, -1.0426841974258423, -0.989862322807312, -0.9370404481887817, -0.8842186331748962, -0.831396758556366, -0.7785749435424805, -0.7257530689239502, -0.6729311943054199, -0.6201093196868896, -0.5672875046730042, -0.5144656300544739, -0.4616438150405884, -0.4088219404220581, -0.3560000956058502, -0.30317825078964233, -0.25035637617111206, -0.19753453135490417, -0.1447126865386963, -0.0918908342719078, -0.039068982005119324, 0.013752877712249756, 0.06657472252845764, 0.11939656734466553, 0.1722184419631958, 0.2250402867794037, 0.2778621315956116, 0.33068397641181946, 0.38350582122802734, 0.4363276958465576, 0.4891495406627655, 0.5419713854789734, 0.5947932600975037, 0.6476150751113892, 0.7004369497299194, 0.7532588243484497, 0.8060806393623352, 0.8589025139808655, 0.911724328994751, 0.9645462036132812, 1.0173680782318115, 1.0701899528503418, 1.123011827468872, 1.1758337020874023, 1.2286555767059326, 1.281477451324463, 1.3342992067337036, 1.3871210813522339, 1.4399429559707642, 1.4927648305892944, 1.5455865859985352]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 3.0, 7.0, 16.0, 22.0, 21.0, 37.0, 67.0, 70.0, 85.0, 146.0, 230.0, 344.0, 451.0, 679.0, 1119.0, 1745.0, 2960.0, 5012.0, 8902.0, 16628.0, 32621.0, 69545.0, 159147.0, 306174.0, 236358.0, 105911.0, 47746.0, 23302.0, 12268.0, 6765.0, 3818.0, 2277.0, 1384.0, 872.0, 573.0, 406.0, 282.0, 166.0, 109.0, 54.0, 66.0, 44.0, 34.0, 22.0, 17.0, 15.0, 11.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0], "bins": [-1.6298828125, -1.5801239013671875, -1.530364990234375, -1.4806060791015625, -1.43084716796875, -1.3810882568359375, -1.331329345703125, -1.2815704345703125, -1.2318115234375, -1.1820526123046875, -1.132293701171875, -1.0825347900390625, -1.03277587890625, -0.9830169677734375, -0.933258056640625, -0.8834991455078125, -0.833740234375, -0.7839813232421875, -0.734222412109375, -0.6844635009765625, -0.63470458984375, -0.5849456787109375, -0.535186767578125, -0.4854278564453125, -0.4356689453125, -0.3859100341796875, -0.336151123046875, -0.2863922119140625, -0.23663330078125, -0.1868743896484375, -0.137115478515625, -0.0873565673828125, -0.03759765625, 0.0121612548828125, 0.061920166015625, 0.1116790771484375, 0.16143798828125, 0.2111968994140625, 0.260955810546875, 0.3107147216796875, 0.3604736328125, 0.4102325439453125, 0.459991455078125, 0.5097503662109375, 0.55950927734375, 0.6092681884765625, 0.659027099609375, 0.7087860107421875, 0.758544921875, 0.8083038330078125, 0.858062744140625, 0.9078216552734375, 0.95758056640625, 1.0073394775390625, 1.057098388671875, 1.1068572998046875, 1.1566162109375, 1.2063751220703125, 1.256134033203125, 1.3058929443359375, 1.35565185546875, 1.4054107666015625, 1.455169677734375, 1.5049285888671875, 1.5546875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 16.0, 12.0, 11.0, 14.0, 17.0, 25.0, 30.0, 37.0, 29.0, 36.0, 46.0, 38.0, 50.0, 48.0, 65.0, 56.0, 45.0, 43.0, 45.0, 44.0, 40.0, 39.0, 33.0, 35.0, 19.0, 22.0, 20.0, 10.0, 14.0, 9.0, 7.0, 8.0, 8.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6181640625, -0.6001358032226562, -0.5821075439453125, -0.5640792846679688, -0.546051025390625, -0.5280227661132812, -0.5099945068359375, -0.49196624755859375, -0.47393798828125, -0.45590972900390625, -0.4378814697265625, -0.41985321044921875, -0.401824951171875, -0.38379669189453125, -0.3657684326171875, -0.34774017333984375, -0.3297119140625, -0.31168365478515625, -0.2936553955078125, -0.27562713623046875, -0.257598876953125, -0.23957061767578125, -0.2215423583984375, -0.20351409912109375, -0.18548583984375, -0.16745758056640625, -0.1494293212890625, -0.13140106201171875, -0.113372802734375, -0.09534454345703125, -0.0773162841796875, -0.05928802490234375, -0.041259765625, -0.02323150634765625, -0.0052032470703125, 0.01282501220703125, 0.030853271484375, 0.04888153076171875, 0.0669097900390625, 0.08493804931640625, 0.10296630859375, 0.12099456787109375, 0.1390228271484375, 0.15705108642578125, 0.175079345703125, 0.19310760498046875, 0.2111358642578125, 0.22916412353515625, 0.2471923828125, 0.26522064208984375, 0.2832489013671875, 0.30127716064453125, 0.319305419921875, 0.33733367919921875, 0.3553619384765625, 0.37339019775390625, 0.39141845703125, 0.40944671630859375, 0.4274749755859375, 0.44550323486328125, 0.463531494140625, 0.48155975341796875, 0.4995880126953125, 0.5176162719726562, 0.53564453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 14.0, 16.0, 15.0, 23.0, 43.0, 54.0, 63.0, 102.0, 138.0, 155.0, 269.0, 399.0, 696.0, 1131.0, 2128.0, 4503.0, 10649.0, 28852.0, 100509.0, 426286.0, 347159.0, 82318.0, 24710.0, 9431.0, 4104.0, 1897.0, 1036.0, 553.0, 369.0, 273.0, 172.0, 110.0, 81.0, 59.0, 57.0, 30.0, 41.0, 19.0, 21.0, 15.0, 5.0, 3.0, 7.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.658203125, -2.58209228515625, -2.5059814453125, -2.42987060546875, -2.353759765625, -2.27764892578125, -2.2015380859375, -2.12542724609375, -2.04931640625, -1.97320556640625, -1.8970947265625, -1.82098388671875, -1.744873046875, -1.66876220703125, -1.5926513671875, -1.51654052734375, -1.4404296875, -1.36431884765625, -1.2882080078125, -1.21209716796875, -1.135986328125, -1.05987548828125, -0.9837646484375, -0.90765380859375, -0.83154296875, -0.75543212890625, -0.6793212890625, -0.60321044921875, -0.527099609375, -0.45098876953125, -0.3748779296875, -0.29876708984375, -0.22265625, -0.14654541015625, -0.0704345703125, 0.00567626953125, 0.081787109375, 0.15789794921875, 0.2340087890625, 0.31011962890625, 0.38623046875, 0.46234130859375, 0.5384521484375, 0.61456298828125, 0.690673828125, 0.76678466796875, 0.8428955078125, 0.91900634765625, 0.9951171875, 1.07122802734375, 1.1473388671875, 1.22344970703125, 1.299560546875, 1.37567138671875, 1.4517822265625, 1.52789306640625, 1.60400390625, 1.68011474609375, 1.7562255859375, 1.83233642578125, 1.908447265625, 1.98455810546875, 2.0606689453125, 2.13677978515625, 2.212890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 8.0, 5.0, 6.0, 9.0, 9.0, 13.0, 17.0, 19.0, 11.0, 19.0, 20.0, 29.0, 25.0, 38.0, 39.0, 37.0, 35.0, 40.0, 37.0, 40.0, 42.0, 47.0, 35.0, 35.0, 44.0, 48.0, 36.0, 41.0, 27.0, 35.0, 23.0, 16.0, 23.0, 16.0, 12.0, 7.0, 13.0, 6.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.70703125, -2.62091064453125, -2.5347900390625, -2.44866943359375, -2.362548828125, -2.27642822265625, -2.1903076171875, -2.10418701171875, -2.01806640625, -1.93194580078125, -1.8458251953125, -1.75970458984375, -1.673583984375, -1.58746337890625, -1.5013427734375, -1.41522216796875, -1.3291015625, -1.24298095703125, -1.1568603515625, -1.07073974609375, -0.984619140625, -0.89849853515625, -0.8123779296875, -0.72625732421875, -0.64013671875, -0.55401611328125, -0.4678955078125, -0.38177490234375, -0.295654296875, -0.20953369140625, -0.1234130859375, -0.03729248046875, 0.048828125, 0.13494873046875, 0.2210693359375, 0.30718994140625, 0.393310546875, 0.47943115234375, 0.5655517578125, 0.65167236328125, 0.73779296875, 0.82391357421875, 0.9100341796875, 0.99615478515625, 1.082275390625, 1.16839599609375, 1.2545166015625, 1.34063720703125, 1.4267578125, 1.51287841796875, 1.5989990234375, 1.68511962890625, 1.771240234375, 1.85736083984375, 1.9434814453125, 2.02960205078125, 2.11572265625, 2.20184326171875, 2.2879638671875, 2.37408447265625, 2.460205078125, 2.54632568359375, 2.6324462890625, 2.71856689453125, 2.8046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 23.0, 14.0, 35.0, 49.0, 84.0, 110.0, 222.0, 431.0, 939.0, 2456.0, 7670.0, 45753.0, 785925.0, 183191.0, 14942.0, 3875.0, 1472.0, 608.0, 273.0, 147.0, 102.0, 47.0, 41.0, 27.0, 19.0, 10.0, 18.0, 15.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.522308349609375, -2.43133544921875, -2.340362548828125, -2.2493896484375, -2.158416748046875, -2.06744384765625, -1.976470947265625, -1.885498046875, -1.794525146484375, -1.70355224609375, -1.612579345703125, -1.5216064453125, -1.430633544921875, -1.33966064453125, -1.248687744140625, -1.15771484375, -1.066741943359375, -0.97576904296875, -0.884796142578125, -0.7938232421875, -0.702850341796875, -0.61187744140625, -0.520904541015625, -0.429931640625, -0.338958740234375, -0.24798583984375, -0.157012939453125, -0.0660400390625, 0.024932861328125, 0.11590576171875, 0.206878662109375, 0.2978515625, 0.388824462890625, 0.47979736328125, 0.570770263671875, 0.6617431640625, 0.752716064453125, 0.84368896484375, 0.934661865234375, 1.025634765625, 1.116607666015625, 1.20758056640625, 1.298553466796875, 1.3895263671875, 1.480499267578125, 1.57147216796875, 1.662445068359375, 1.75341796875, 1.844390869140625, 1.93536376953125, 2.026336669921875, 2.1173095703125, 2.208282470703125, 2.29925537109375, 2.390228271484375, 2.481201171875, 2.572174072265625, 2.66314697265625, 2.754119873046875, 2.8450927734375, 2.936065673828125, 3.02703857421875, 3.118011474609375, 3.208984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 14.0, 21.0, 29.0, 57.0, 82.0, 123.0, 139.0, 155.0, 115.0, 87.0, 59.0, 32.0, 27.0, 11.0, 12.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004200935363769531, -0.0004064999520778656, -0.0003929063677787781, -0.00037931278347969055, -0.00036571919918060303, -0.0003521256148815155, -0.000338532030582428, -0.00032493844628334045, -0.00031134486198425293, -0.0002977512776851654, -0.0002841576933860779, -0.00027056410908699036, -0.00025697052478790283, -0.0002433769404888153, -0.00022978335618972778, -0.00021618977189064026, -0.00020259618759155273, -0.0001890026032924652, -0.00017540901899337769, -0.00016181543469429016, -0.00014822185039520264, -0.0001346282660961151, -0.00012103468179702759, -0.00010744109749794006, -9.384751319885254e-05, -8.025392889976501e-05, -6.666034460067749e-05, -5.3066760301589966e-05, -3.947317600250244e-05, -2.5879591703414917e-05, -1.2286007404327393e-05, 1.3075768947601318e-06, 1.4901161193847656e-05, 2.849474549293518e-05, 4.2088329792022705e-05, 5.568191409111023e-05, 6.927549839019775e-05, 8.286908268928528e-05, 9.64626669883728e-05, 0.00011005625128746033, 0.00012364983558654785, 0.00013724341988563538, 0.0001508370041847229, 0.00016443058848381042, 0.00017802417278289795, 0.00019161775708198547, 0.000205211341381073, 0.00021880492568016052, 0.00023239850997924805, 0.00024599209427833557, 0.0002595856785774231, 0.0002731792628765106, 0.00028677284717559814, 0.00030036643147468567, 0.0003139600157737732, 0.0003275536000728607, 0.00034114718437194824, 0.00035474076867103577, 0.0003683343529701233, 0.0003819279372692108, 0.00039552152156829834, 0.00040911510586738586, 0.0004227086901664734, 0.0004363022744655609, 0.00044989585876464844]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 9.0, 13.0, 19.0, 33.0, 44.0, 66.0, 111.0, 200.0, 397.0, 850.0, 2179.0, 7222.0, 69884.0, 899660.0, 57501.0, 6665.0, 2008.0, 808.0, 399.0, 194.0, 96.0, 57.0, 32.0, 30.0, 22.0, 9.0, 8.0, 13.0, 4.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.20745849609375, -3.0906982421875, -2.97393798828125, -2.857177734375, -2.74041748046875, -2.6236572265625, -2.50689697265625, -2.39013671875, -2.27337646484375, -2.1566162109375, -2.03985595703125, -1.923095703125, -1.80633544921875, -1.6895751953125, -1.57281494140625, -1.4560546875, -1.33929443359375, -1.2225341796875, -1.10577392578125, -0.989013671875, -0.87225341796875, -0.7554931640625, -0.63873291015625, -0.52197265625, -0.40521240234375, -0.2884521484375, -0.17169189453125, -0.054931640625, 0.06182861328125, 0.1785888671875, 0.29534912109375, 0.412109375, 0.52886962890625, 0.6456298828125, 0.76239013671875, 0.879150390625, 0.99591064453125, 1.1126708984375, 1.22943115234375, 1.34619140625, 1.46295166015625, 1.5797119140625, 1.69647216796875, 1.813232421875, 1.92999267578125, 2.0467529296875, 2.16351318359375, 2.2802734375, 2.39703369140625, 2.5137939453125, 2.63055419921875, 2.747314453125, 2.86407470703125, 2.9808349609375, 3.09759521484375, 3.21435546875, 3.33111572265625, 3.4478759765625, 3.56463623046875, 3.681396484375, 3.79815673828125, 3.9149169921875, 4.03167724609375, 4.1484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 8.0, 5.0, 7.0, 20.0, 20.0, 55.0, 70.0, 131.0, 182.0, 184.0, 116.0, 81.0, 42.0, 33.0, 12.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.28515625, -3.196319580078125, -3.10748291015625, -3.018646240234375, -2.9298095703125, -2.840972900390625, -2.75213623046875, -2.663299560546875, -2.574462890625, -2.485626220703125, -2.39678955078125, -2.307952880859375, -2.2191162109375, -2.130279541015625, -2.04144287109375, -1.952606201171875, -1.86376953125, -1.774932861328125, -1.68609619140625, -1.597259521484375, -1.5084228515625, -1.419586181640625, -1.33074951171875, -1.241912841796875, -1.153076171875, -1.064239501953125, -0.97540283203125, -0.886566162109375, -0.7977294921875, -0.708892822265625, -0.62005615234375, -0.531219482421875, -0.4423828125, -0.353546142578125, -0.26470947265625, -0.175872802734375, -0.0870361328125, 0.001800537109375, 0.09063720703125, 0.179473876953125, 0.268310546875, 0.357147216796875, 0.44598388671875, 0.534820556640625, 0.6236572265625, 0.712493896484375, 0.80133056640625, 0.890167236328125, 0.97900390625, 1.067840576171875, 1.15667724609375, 1.245513916015625, 1.3343505859375, 1.423187255859375, 1.51202392578125, 1.600860595703125, 1.689697265625, 1.778533935546875, 1.86737060546875, 1.956207275390625, 2.0450439453125, 2.133880615234375, 2.22271728515625, 2.311553955078125, 2.400390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 13.0, 20.0, 60.0, 99.0, 171.0, 194.0, 180.0, 120.0, 72.0, 34.0, 16.0, 11.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.37241744995117, -34.2209358215332, -33.0694580078125, -31.91797637939453, -30.766494750976562, -29.615013122558594, -28.463533401489258, -27.312053680419922, -26.160572052001953, -25.009090423583984, -23.85761070251465, -22.706130981445312, -21.554649353027344, -20.403167724609375, -19.25168800354004, -18.100208282470703, -16.948726654052734, -15.797245979309082, -14.64576530456543, -13.494284629821777, -12.342803955078125, -11.191323280334473, -10.03984260559082, -8.888361930847168, -7.736881256103516, -6.585400581359863, -5.433919906616211, -4.282439231872559, -3.1309585571289062, -1.979477882385254, -0.8279972076416016, 0.3234834671020508, 1.4749679565429688, 2.626448631286621, 3.7779293060302734, 4.929409980773926, 6.080890655517578, 7.2323713302612305, 8.383852005004883, 9.535332679748535, 10.686813354492188, 11.83829402923584, 12.989774703979492, 14.141255378723145, 15.292736053466797, 16.444217681884766, 17.5956974029541, 18.747177124023438, 19.898658752441406, 21.050140380859375, 22.20162010192871, 23.353099822998047, 24.504581451416016, 25.656063079833984, 26.80754280090332, 27.959022521972656, 29.110504150390625, 30.261985778808594, 31.41346549987793, 32.564945220947266, 33.716426849365234, 34.8679084777832, 36.019386291503906, 37.170867919921875, 38.322349548339844]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 8.0, 11.0, 8.0, 8.0, 14.0, 16.0, 20.0, 13.0, 20.0, 29.0, 35.0, 32.0, 30.0, 50.0, 53.0, 40.0, 39.0, 57.0, 56.0, 52.0, 50.0, 36.0, 48.0, 37.0, 32.0, 33.0, 27.0, 24.0, 22.0, 14.0, 16.0, 20.0, 6.0, 13.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.56295394897461, -17.0260009765625, -16.48904800415039, -15.952094078063965, -15.415141105651855, -14.878188133239746, -14.34123420715332, -13.804281234741211, -13.267328262329102, -12.730375289916992, -12.193422317504883, -11.656468391418457, -11.119515419006348, -10.582562446594238, -10.045608520507812, -9.508655548095703, -8.971702575683594, -8.434749603271484, -7.897796154022217, -7.360842704772949, -6.82388973236084, -6.2869367599487305, -5.749983310699463, -5.213029861450195, -4.676076889038086, -4.139123916625977, -3.602170467376709, -3.0652172565460205, -2.528264045715332, -1.9913108348846436, -1.454357624053955, -0.9174044132232666, -0.3804512023925781, 0.15650200843811035, 0.6934552192687988, 1.2304084300994873, 1.7673616409301758, 2.3043148517608643, 2.8412680625915527, 3.378221273422241, 3.9151744842529297, 4.452127456665039, 4.989080905914307, 5.526034355163574, 6.062987327575684, 6.599940299987793, 7.1368937492370605, 7.673847198486328, 8.210800170898438, 8.747753143310547, 9.284706115722656, 9.821660041809082, 10.358613014221191, 10.8955659866333, 11.432519912719727, 11.969472885131836, 12.506425857543945, 13.043378829956055, 13.580331802368164, 14.11728572845459, 14.6542387008667, 15.191191673278809, 15.728145599365234, 16.265098571777344, 16.802051544189453]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 17.0, 19.0, 25.0, 35.0, 51.0, 67.0, 92.0, 175.0, 224.0, 389.0, 577.0, 877.0, 1613.0, 2903.0, 6558.0, 18244.0, 125570.0, 3981877.0, 35572.0, 10014.0, 4047.0, 2108.0, 1115.0, 697.0, 450.0, 325.0, 202.0, 116.0, 100.0, 60.0, 44.0, 28.0, 25.0, 14.0, 11.0, 13.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.741363525390625, -2.65069580078125, -2.560028076171875, -2.4693603515625, -2.378692626953125, -2.28802490234375, -2.197357177734375, -2.106689453125, -2.016021728515625, -1.92535400390625, -1.834686279296875, -1.7440185546875, -1.653350830078125, -1.56268310546875, -1.472015380859375, -1.38134765625, -1.290679931640625, -1.20001220703125, -1.109344482421875, -1.0186767578125, -0.928009033203125, -0.83734130859375, -0.746673583984375, -0.656005859375, -0.565338134765625, -0.47467041015625, -0.384002685546875, -0.2933349609375, -0.202667236328125, -0.11199951171875, -0.021331787109375, 0.0693359375, 0.160003662109375, 0.25067138671875, 0.341339111328125, 0.4320068359375, 0.522674560546875, 0.61334228515625, 0.704010009765625, 0.794677734375, 0.885345458984375, 0.97601318359375, 1.066680908203125, 1.1573486328125, 1.248016357421875, 1.33868408203125, 1.429351806640625, 1.52001953125, 1.610687255859375, 1.70135498046875, 1.792022705078125, 1.8826904296875, 1.973358154296875, 2.06402587890625, 2.154693603515625, 2.245361328125, 2.336029052734375, 2.42669677734375, 2.517364501953125, 2.6080322265625, 2.698699951171875, 2.78936767578125, 2.880035400390625, 2.970703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 13.0, 13.0, 19.0, 13.0, 18.0, 18.0, 21.0, 28.0, 32.0, 45.0, 40.0, 60.0, 57.0, 45.0, 58.0, 58.0, 64.0, 58.0, 56.0, 32.0, 38.0, 35.0, 34.0, 21.0, 25.0, 24.0, 16.0, 11.0, 10.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.502166748046875, -0.48138427734375, -0.460601806640625, -0.4398193359375, -0.419036865234375, -0.39825439453125, -0.377471923828125, -0.356689453125, -0.335906982421875, -0.31512451171875, -0.294342041015625, -0.2735595703125, -0.252777099609375, -0.23199462890625, -0.211212158203125, -0.1904296875, -0.169647216796875, -0.14886474609375, -0.128082275390625, -0.1072998046875, -0.086517333984375, -0.06573486328125, -0.044952392578125, -0.024169921875, -0.003387451171875, 0.01739501953125, 0.038177490234375, 0.0589599609375, 0.079742431640625, 0.10052490234375, 0.121307373046875, 0.14208984375, 0.162872314453125, 0.18365478515625, 0.204437255859375, 0.2252197265625, 0.246002197265625, 0.26678466796875, 0.287567138671875, 0.308349609375, 0.329132080078125, 0.34991455078125, 0.370697021484375, 0.3914794921875, 0.412261962890625, 0.43304443359375, 0.453826904296875, 0.474609375, 0.495391845703125, 0.51617431640625, 0.536956787109375, 0.5577392578125, 0.578521728515625, 0.59930419921875, 0.620086669921875, 0.640869140625, 0.661651611328125, 0.68243408203125, 0.703216552734375, 0.7239990234375, 0.744781494140625, 0.76556396484375, 0.786346435546875, 0.80712890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 15.0, 9.0, 22.0, 26.0, 28.0, 41.0, 58.0, 80.0, 88.0, 105.0, 154.0, 207.0, 299.0, 380.0, 631.0, 1023.0, 1736.0, 3402.0, 7628.0, 22610.0, 207995.0, 3885264.0, 41246.0, 10715.0, 4447.0, 2312.0, 1231.0, 751.0, 465.0, 345.0, 239.0, 181.0, 135.0, 95.0, 77.0, 56.0, 39.0, 47.0, 23.0, 23.0, 13.0, 15.0, 1.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.142333984375, -3.03466796875, -2.927001953125, -2.8193359375, -2.711669921875, -2.60400390625, -2.496337890625, -2.388671875, -2.281005859375, -2.17333984375, -2.065673828125, -1.9580078125, -1.850341796875, -1.74267578125, -1.635009765625, -1.52734375, -1.419677734375, -1.31201171875, -1.204345703125, -1.0966796875, -0.989013671875, -0.88134765625, -0.773681640625, -0.666015625, -0.558349609375, -0.45068359375, -0.343017578125, -0.2353515625, -0.127685546875, -0.02001953125, 0.087646484375, 0.1953125, 0.302978515625, 0.41064453125, 0.518310546875, 0.6259765625, 0.733642578125, 0.84130859375, 0.948974609375, 1.056640625, 1.164306640625, 1.27197265625, 1.379638671875, 1.4873046875, 1.594970703125, 1.70263671875, 1.810302734375, 1.91796875, 2.025634765625, 2.13330078125, 2.240966796875, 2.3486328125, 2.456298828125, 2.56396484375, 2.671630859375, 2.779296875, 2.886962890625, 2.99462890625, 3.102294921875, 3.2099609375, 3.317626953125, 3.42529296875, 3.532958984375, 3.640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 13.0, 42.0, 59.0, 171.0, 3411.0, 208.0, 61.0, 32.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -1.015655517578125, -0.98345947265625, -0.951263427734375, -0.9190673828125, -0.886871337890625, -0.85467529296875, -0.822479248046875, -0.790283203125, -0.758087158203125, -0.72589111328125, -0.693695068359375, -0.6614990234375, -0.629302978515625, -0.59710693359375, -0.564910888671875, -0.53271484375, -0.500518798828125, -0.46832275390625, -0.436126708984375, -0.4039306640625, -0.371734619140625, -0.33953857421875, -0.307342529296875, -0.275146484375, -0.242950439453125, -0.21075439453125, -0.178558349609375, -0.1463623046875, -0.114166259765625, -0.08197021484375, -0.049774169921875, -0.017578125, 0.014617919921875, 0.04681396484375, 0.079010009765625, 0.1112060546875, 0.143402099609375, 0.17559814453125, 0.207794189453125, 0.239990234375, 0.272186279296875, 0.30438232421875, 0.336578369140625, 0.3687744140625, 0.400970458984375, 0.43316650390625, 0.465362548828125, 0.49755859375, 0.529754638671875, 0.56195068359375, 0.594146728515625, 0.6263427734375, 0.658538818359375, 0.69073486328125, 0.722930908203125, 0.755126953125, 0.787322998046875, 0.81951904296875, 0.851715087890625, 0.8839111328125, 0.916107177734375, 0.94830322265625, 0.980499267578125, 1.0126953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 14.0, 19.0, 20.0, 21.0, 48.0, 42.0, 68.0, 79.0, 98.0, 111.0, 98.0, 93.0, 61.0, 63.0, 50.0, 34.0, 19.0, 13.0, 9.0, 10.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2817435264587402, -3.187826156616211, -3.0939085483551025, -2.9999911785125732, -2.906073570251465, -2.8121562004089355, -2.7182388305664062, -2.624321222305298, -2.5304036140441895, -2.43648624420166, -2.3425686359405518, -2.2486512660980225, -2.154733657836914, -2.0608162879943848, -1.966898798942566, -1.872981309890747, -1.7790639400482178, -1.685146450996399, -1.59122896194458, -1.4973115921020508, -1.4033939838409424, -1.309476613998413, -1.2155591249465942, -1.1216416358947754, -1.0277241468429565, -0.9338066577911377, -0.8398891687393188, -0.7459717392921448, -0.6520542502403259, -0.5581367611885071, -0.464219331741333, -0.37030184268951416, -0.2763843536376953, -0.18246687948703766, -0.08854940533638, 0.005368053913116455, 0.0992855429649353, 0.19320303201675415, 0.2871204614639282, 0.38103795051574707, 0.4749554395675659, 0.5688729286193848, 0.6627904176712036, 0.7567078471183777, 0.8506253361701965, 0.9445428252220154, 1.0384602546691895, 1.1323777437210083, 1.2262952327728271, 1.320212721824646, 1.4141302108764648, 1.5080475807189941, 1.6019651889801025, 1.6958825588226318, 1.7898000478744507, 1.8837175369262695, 1.9776350259780884, 2.0715525150299072, 2.1654698848724365, 2.259387493133545, 2.353304862976074, 2.4472224712371826, 2.541139841079712, 2.6350574493408203, 2.7289748191833496]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 11.0, 8.0, 4.0, 12.0, 11.0, 13.0, 18.0, 26.0, 22.0, 22.0, 20.0, 27.0, 25.0, 33.0, 35.0, 37.0, 28.0, 33.0, 32.0, 48.0, 30.0, 38.0, 52.0, 35.0, 38.0, 34.0, 44.0, 20.0, 26.0, 21.0, 23.0, 19.0, 18.0, 12.0, 10.0, 14.0, 12.0, 18.0, 13.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-1.6309796571731567, -1.5815048217773438, -1.5320299863815308, -1.4825551509857178, -1.4330801963806152, -1.3836053609848022, -1.3341305255889893, -1.2846556901931763, -1.2351808547973633, -1.1857060194015503, -1.1362311840057373, -1.0867562294006348, -1.0372813940048218, -0.9878065586090088, -0.9383317232131958, -0.8888568878173828, -0.8393819332122803, -0.7899070978164673, -0.7404322028160095, -0.6909573674201965, -0.6414824724197388, -0.5920076370239258, -0.5425328016281128, -0.4930579364299774, -0.44358307123184204, -0.39410820603370667, -0.3446333408355713, -0.2951585054397583, -0.24568364024162292, -0.19620877504348755, -0.14673393964767456, -0.09725907444953918, -0.04778420925140381, 0.0016906484961509705, 0.05116550624370575, 0.10064035654067993, 0.1501152217388153, 0.19959008693695068, 0.24906492233276367, 0.29853978753089905, 0.3480146527290344, 0.3974895179271698, 0.4469643831253052, 0.49643921852111816, 0.5459140539169312, 0.5953889489173889, 0.6448637843132019, 0.6943386793136597, 0.7438135147094727, 0.7932883501052856, 0.8427632451057434, 0.8922380805015564, 0.9417129755020142, 0.9911878108978271, 1.0406626462936401, 1.0901374816894531, 1.1396124362945557, 1.1890872716903687, 1.2385621070861816, 1.2880370616912842, 1.3375118970870972, 1.3869867324829102, 1.4364615678787231, 1.4859364032745361, 1.5354112386703491]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 18.0, 26.0, 36.0, 64.0, 106.0, 159.0, 239.0, 404.0, 632.0, 1082.0, 1958.0, 3747.0, 7034.0, 14263.0, 31075.0, 72924.0, 176460.0, 332472.0, 230683.0, 96706.0, 40942.0, 18449.0, 8781.0, 4404.0, 2513.0, 1362.0, 737.0, 471.0, 302.0, 170.0, 106.0, 66.0, 59.0, 27.0, 16.0, 16.0, 9.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4326171875, -1.385894775390625, -1.33917236328125, -1.292449951171875, -1.2457275390625, -1.199005126953125, -1.15228271484375, -1.105560302734375, -1.058837890625, -1.012115478515625, -0.96539306640625, -0.918670654296875, -0.8719482421875, -0.825225830078125, -0.77850341796875, -0.731781005859375, -0.68505859375, -0.638336181640625, -0.59161376953125, -0.544891357421875, -0.4981689453125, -0.451446533203125, -0.40472412109375, -0.358001708984375, -0.311279296875, -0.264556884765625, -0.21783447265625, -0.171112060546875, -0.1243896484375, -0.077667236328125, -0.03094482421875, 0.015777587890625, 0.0625, 0.109222412109375, 0.15594482421875, 0.202667236328125, 0.2493896484375, 0.296112060546875, 0.34283447265625, 0.389556884765625, 0.436279296875, 0.483001708984375, 0.52972412109375, 0.576446533203125, 0.6231689453125, 0.669891357421875, 0.71661376953125, 0.763336181640625, 0.81005859375, 0.856781005859375, 0.90350341796875, 0.950225830078125, 0.9969482421875, 1.043670654296875, 1.09039306640625, 1.137115478515625, 1.183837890625, 1.230560302734375, 1.27728271484375, 1.324005126953125, 1.3707275390625, 1.417449951171875, 1.46417236328125, 1.510894775390625, 1.5576171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 6.0, 17.0, 11.0, 15.0, 20.0, 26.0, 35.0, 31.0, 45.0, 40.0, 58.0, 38.0, 45.0, 51.0, 49.0, 63.0, 60.0, 51.0, 48.0, 49.0, 38.0, 28.0, 26.0, 20.0, 29.0, 20.0, 13.0, 15.0, 6.0, 12.0, 8.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71826171875, -0.6962051391601562, -0.6741485595703125, -0.6520919799804688, -0.630035400390625, -0.6079788208007812, -0.5859222412109375, -0.5638656616210938, -0.54180908203125, -0.5197525024414062, -0.4976959228515625, -0.47563934326171875, -0.453582763671875, -0.43152618408203125, -0.4094696044921875, -0.38741302490234375, -0.3653564453125, -0.34329986572265625, -0.3212432861328125, -0.29918670654296875, -0.277130126953125, -0.25507354736328125, -0.2330169677734375, -0.21096038818359375, -0.18890380859375, -0.16684722900390625, -0.1447906494140625, -0.12273406982421875, -0.100677490234375, -0.07862091064453125, -0.0565643310546875, -0.03450775146484375, -0.012451171875, 0.00960540771484375, 0.0316619873046875, 0.05371856689453125, 0.075775146484375, 0.09783172607421875, 0.1198883056640625, 0.14194488525390625, 0.16400146484375, 0.18605804443359375, 0.2081146240234375, 0.23017120361328125, 0.252227783203125, 0.27428436279296875, 0.2963409423828125, 0.31839752197265625, 0.3404541015625, 0.36251068115234375, 0.3845672607421875, 0.40662384033203125, 0.428680419921875, 0.45073699951171875, 0.4727935791015625, 0.49485015869140625, 0.51690673828125, 0.5389633178710938, 0.5610198974609375, 0.5830764770507812, 0.605133056640625, 0.6271896362304688, 0.6492462158203125, 0.6713027954101562, 0.693359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 7.0, 7.0, 8.0, 12.0, 18.0, 29.0, 44.0, 44.0, 86.0, 122.0, 176.0, 306.0, 465.0, 827.0, 1769.0, 4449.0, 15372.0, 83846.0, 593826.0, 292402.0, 39535.0, 9020.0, 3079.0, 1299.0, 676.0, 365.0, 237.0, 193.0, 104.0, 64.0, 41.0, 40.0, 28.0, 16.0, 8.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.921875, -2.826995849609375, -2.73211669921875, -2.637237548828125, -2.5423583984375, -2.447479248046875, -2.35260009765625, -2.257720947265625, -2.162841796875, -2.067962646484375, -1.97308349609375, -1.878204345703125, -1.7833251953125, -1.688446044921875, -1.59356689453125, -1.498687744140625, -1.40380859375, -1.308929443359375, -1.21405029296875, -1.119171142578125, -1.0242919921875, -0.929412841796875, -0.83453369140625, -0.739654541015625, -0.644775390625, -0.549896240234375, -0.45501708984375, -0.360137939453125, -0.2652587890625, -0.170379638671875, -0.07550048828125, 0.019378662109375, 0.1142578125, 0.209136962890625, 0.30401611328125, 0.398895263671875, 0.4937744140625, 0.588653564453125, 0.68353271484375, 0.778411865234375, 0.873291015625, 0.968170166015625, 1.06304931640625, 1.157928466796875, 1.2528076171875, 1.347686767578125, 1.44256591796875, 1.537445068359375, 1.63232421875, 1.727203369140625, 1.82208251953125, 1.916961669921875, 2.0118408203125, 2.106719970703125, 2.20159912109375, 2.296478271484375, 2.391357421875, 2.486236572265625, 2.58111572265625, 2.675994873046875, 2.7708740234375, 2.865753173828125, 2.96063232421875, 3.055511474609375, 3.150390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 10.0, 9.0, 11.0, 16.0, 15.0, 19.0, 18.0, 23.0, 28.0, 32.0, 31.0, 33.0, 37.0, 43.0, 40.0, 41.0, 39.0, 38.0, 41.0, 31.0, 35.0, 35.0, 46.0, 41.0, 25.0, 31.0, 27.0, 32.0, 27.0, 19.0, 21.0, 22.0, 12.0, 11.0, 8.0, 12.0, 7.0, 6.0, 3.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.798431396484375, -2.70819091796875, -2.617950439453125, -2.5277099609375, -2.437469482421875, -2.34722900390625, -2.256988525390625, -2.166748046875, -2.076507568359375, -1.98626708984375, -1.896026611328125, -1.8057861328125, -1.715545654296875, -1.62530517578125, -1.535064697265625, -1.44482421875, -1.354583740234375, -1.26434326171875, -1.174102783203125, -1.0838623046875, -0.993621826171875, -0.90338134765625, -0.813140869140625, -0.722900390625, -0.632659912109375, -0.54241943359375, -0.452178955078125, -0.3619384765625, -0.271697998046875, -0.18145751953125, -0.091217041015625, -0.0009765625, 0.089263916015625, 0.17950439453125, 0.269744873046875, 0.3599853515625, 0.450225830078125, 0.54046630859375, 0.630706787109375, 0.720947265625, 0.811187744140625, 0.90142822265625, 0.991668701171875, 1.0819091796875, 1.172149658203125, 1.26239013671875, 1.352630615234375, 1.44287109375, 1.533111572265625, 1.62335205078125, 1.713592529296875, 1.8038330078125, 1.894073486328125, 1.98431396484375, 2.074554443359375, 2.164794921875, 2.255035400390625, 2.34527587890625, 2.435516357421875, 2.5257568359375, 2.615997314453125, 2.70623779296875, 2.796478271484375, 2.88671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 10.0, 15.0, 16.0, 34.0, 74.0, 104.0, 246.0, 493.0, 1500.0, 6297.0, 60388.0, 814120.0, 150702.0, 11065.0, 2113.0, 766.0, 283.0, 128.0, 68.0, 37.0, 11.0, 20.0, 22.0, 8.0, 4.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.4982757568359375, -2.428192138671875, -2.3581085205078125, -2.28802490234375, -2.2179412841796875, -2.147857666015625, -2.0777740478515625, -2.0076904296875, -1.9376068115234375, -1.867523193359375, -1.7974395751953125, -1.72735595703125, -1.6572723388671875, -1.587188720703125, -1.5171051025390625, -1.447021484375, -1.3769378662109375, -1.306854248046875, -1.2367706298828125, -1.16668701171875, -1.0966033935546875, -1.026519775390625, -0.9564361572265625, -0.8863525390625, -0.8162689208984375, -0.746185302734375, -0.6761016845703125, -0.60601806640625, -0.5359344482421875, -0.465850830078125, -0.3957672119140625, -0.32568359375, -0.2555999755859375, -0.185516357421875, -0.1154327392578125, -0.04534912109375, 0.0247344970703125, 0.094818115234375, 0.1649017333984375, 0.2349853515625, 0.3050689697265625, 0.375152587890625, 0.4452362060546875, 0.51531982421875, 0.5854034423828125, 0.655487060546875, 0.7255706787109375, 0.795654296875, 0.8657379150390625, 0.935821533203125, 1.0059051513671875, 1.07598876953125, 1.1460723876953125, 1.216156005859375, 1.2862396240234375, 1.3563232421875, 1.4264068603515625, 1.496490478515625, 1.5665740966796875, 1.63665771484375, 1.7067413330078125, 1.776824951171875, 1.8469085693359375, 1.9169921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 8.0, 8.0, 7.0, 8.0, 13.0, 22.0, 21.0, 35.0, 45.0, 54.0, 66.0, 84.0, 89.0, 105.0, 97.0, 68.0, 66.0, 38.0, 36.0, 17.0, 30.0, 23.0, 11.0, 6.0, 13.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001964569091796875, -0.0001887008547782898, -0.0001809448003768921, -0.00017318874597549438, -0.00016543269157409668, -0.00015767663717269897, -0.00014992058277130127, -0.00014216452836990356, -0.00013440847396850586, -0.00012665241956710815, -0.00011889636516571045, -0.00011114031076431274, -0.00010338425636291504, -9.562820196151733e-05, -8.787214756011963e-05, -8.011609315872192e-05, -7.236003875732422e-05, -6.460398435592651e-05, -5.684792995452881e-05, -4.9091875553131104e-05, -4.13358211517334e-05, -3.357976675033569e-05, -2.5823712348937988e-05, -1.8067657947540283e-05, -1.0311603546142578e-05, -2.555549144744873e-06, 5.200505256652832e-06, 1.2956559658050537e-05, 2.0712614059448242e-05, 2.8468668460845947e-05, 3.622472286224365e-05, 4.398077726364136e-05, 5.173683166503906e-05, 5.949288606643677e-05, 6.724894046783447e-05, 7.500499486923218e-05, 8.276104927062988e-05, 9.051710367202759e-05, 9.827315807342529e-05, 0.000106029212474823, 0.0001137852668762207, 0.00012154132127761841, 0.0001292973756790161, 0.00013705343008041382, 0.00014480948448181152, 0.00015256553888320923, 0.00016032159328460693, 0.00016807764768600464, 0.00017583370208740234, 0.00018358975648880005, 0.00019134581089019775, 0.00019910186529159546, 0.00020685791969299316, 0.00021461397409439087, 0.00022237002849578857, 0.00023012608289718628, 0.00023788213729858398, 0.0002456381916999817, 0.0002533942461013794, 0.0002611503005027771, 0.0002689063549041748, 0.0002766624093055725, 0.0002844184637069702, 0.0002921745181083679, 0.0002999305725097656]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 7.0, 12.0, 5.0, 5.0, 17.0, 15.0, 33.0, 54.0, 94.0, 120.0, 223.0, 343.0, 681.0, 1378.0, 3247.0, 9862.0, 46583.0, 376765.0, 522921.0, 66409.0, 12513.0, 3812.0, 1635.0, 766.0, 409.0, 260.0, 127.0, 85.0, 47.0, 38.0, 18.0, 18.0, 19.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.455078125, -1.4082794189453125, -1.361480712890625, -1.3146820068359375, -1.26788330078125, -1.2210845947265625, -1.174285888671875, -1.1274871826171875, -1.0806884765625, -1.0338897705078125, -0.987091064453125, -0.9402923583984375, -0.89349365234375, -0.8466949462890625, -0.799896240234375, -0.7530975341796875, -0.706298828125, -0.6595001220703125, -0.612701416015625, -0.5659027099609375, -0.51910400390625, -0.4723052978515625, -0.425506591796875, -0.3787078857421875, -0.3319091796875, -0.2851104736328125, -0.238311767578125, -0.1915130615234375, -0.14471435546875, -0.0979156494140625, -0.051116943359375, -0.0043182373046875, 0.04248046875, 0.0892791748046875, 0.136077880859375, 0.1828765869140625, 0.22967529296875, 0.2764739990234375, 0.323272705078125, 0.3700714111328125, 0.4168701171875, 0.4636688232421875, 0.510467529296875, 0.5572662353515625, 0.60406494140625, 0.6508636474609375, 0.697662353515625, 0.7444610595703125, 0.791259765625, 0.8380584716796875, 0.884857177734375, 0.9316558837890625, 0.97845458984375, 1.0252532958984375, 1.072052001953125, 1.1188507080078125, 1.1656494140625, 1.2124481201171875, 1.259246826171875, 1.3060455322265625, 1.35284423828125, 1.3996429443359375, 1.446441650390625, 1.4932403564453125, 1.5400390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 10.0, 18.0, 28.0, 35.0, 53.0, 51.0, 63.0, 75.0, 73.0, 100.0, 81.0, 59.0, 67.0, 42.0, 46.0, 45.0, 25.0, 18.0, 16.0, 12.0, 13.0, 6.0, 4.0, 2.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2441864013671875, -1.208099365234375, -1.1720123291015625, -1.13592529296875, -1.0998382568359375, -1.063751220703125, -1.0276641845703125, -0.9915771484375, -0.9554901123046875, -0.919403076171875, -0.8833160400390625, -0.84722900390625, -0.8111419677734375, -0.775054931640625, -0.7389678955078125, -0.702880859375, -0.6667938232421875, -0.630706787109375, -0.5946197509765625, -0.55853271484375, -0.5224456787109375, -0.486358642578125, -0.4502716064453125, -0.4141845703125, -0.3780975341796875, -0.342010498046875, -0.3059234619140625, -0.26983642578125, -0.2337493896484375, -0.197662353515625, -0.1615753173828125, -0.12548828125, -0.0894012451171875, -0.053314208984375, -0.0172271728515625, 0.01885986328125, 0.0549468994140625, 0.091033935546875, 0.1271209716796875, 0.1632080078125, 0.1992950439453125, 0.235382080078125, 0.2714691162109375, 0.30755615234375, 0.3436431884765625, 0.379730224609375, 0.4158172607421875, 0.451904296875, 0.4879913330078125, 0.524078369140625, 0.5601654052734375, 0.59625244140625, 0.6323394775390625, 0.668426513671875, 0.7045135498046875, 0.7406005859375, 0.7766876220703125, 0.812774658203125, 0.8488616943359375, 0.88494873046875, 0.9210357666015625, 0.957122802734375, 0.9932098388671875, 1.029296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 17.0, 42.0, 107.0, 155.0, 228.0, 214.0, 135.0, 56.0, 24.0, 13.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.38730239868164, -38.2537841796875, -37.120269775390625, -35.986751556396484, -34.853233337402344, -33.71971893310547, -32.58620071411133, -31.45268440246582, -30.319168090820312, -29.185651779174805, -28.052135467529297, -26.918617248535156, -25.78510093688965, -24.65158462524414, -23.51806640625, -22.384550094604492, -21.251033782958984, -20.117517471313477, -18.98400115966797, -17.850482940673828, -16.71696662902832, -15.583450317382812, -14.449933052062988, -13.316415786743164, -12.182899475097656, -11.049383163452148, -9.915865898132324, -8.7823486328125, -7.648832321166992, -6.515315532684326, -5.38179874420166, -4.248281955718994, -3.1147689819335938, -1.9812521934509277, -0.8477354049682617, 0.2857813835144043, 1.4192981719970703, 2.5528149604797363, 3.6863317489624023, 4.819848537445068, 5.953365325927734, 7.0868821144104, 8.220398902893066, 9.35391616821289, 10.487432479858398, 11.620948791503906, 12.75446605682373, 13.887983322143555, 15.021499633789062, 16.15501594543457, 17.288532257080078, 18.42205047607422, 19.555566787719727, 20.689083099365234, 21.822601318359375, 22.956117630004883, 24.08963394165039, 25.2231502532959, 26.356666564941406, 27.490184783935547, 28.623701095581055, 29.757217407226562, 30.890735626220703, 32.02425003051758, 33.15776824951172]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 6.0, 8.0, 11.0, 15.0, 19.0, 25.0, 26.0, 36.0, 36.0, 28.0, 38.0, 46.0, 46.0, 63.0, 53.0, 59.0, 58.0, 47.0, 53.0, 41.0, 45.0, 47.0, 38.0, 24.0, 23.0, 15.0, 19.0, 17.0, 12.0, 11.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.001277923583984, -17.47834587097168, -16.955413818359375, -16.432483673095703, -15.909551620483398, -15.386619567871094, -14.863687515258789, -14.340755462646484, -13.817824363708496, -13.294892311096191, -12.771961212158203, -12.249029159545898, -11.726097106933594, -11.203166007995605, -10.6802339553833, -10.157302856445312, -9.634370803833008, -9.111438751220703, -8.588507652282715, -8.06557559967041, -7.542644023895264, -7.019712448120117, -6.4967803955078125, -5.973848819732666, -5.4509172439575195, -4.927985668182373, -4.405054092407227, -3.882122039794922, -3.3591904640197754, -2.836258888244629, -2.3133270740509033, -1.7903952598571777, -1.267465591430664, -0.744533896446228, -0.221602201461792, 0.30132949352264404, 0.8242611885070801, 1.3471927642822266, 1.8701245784759521, 2.3930563926696777, 2.915987968444824, 3.4389195442199707, 3.9618513584136963, 4.484783172607422, 5.007714748382568, 5.530646324157715, 6.0535783767700195, 6.576509952545166, 7.0994415283203125, 7.622373104095459, 8.145304679870605, 8.66823673248291, 9.191167831420898, 9.714099884033203, 10.237031936645508, 10.759963989257812, 11.2828950881958, 11.805827140808105, 12.328758239746094, 12.851690292358398, 13.374622344970703, 13.897553443908691, 14.420485496520996, 14.943416595458984, 15.466348648071289]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 7.0, 9.0, 21.0, 21.0, 27.0, 33.0, 47.0, 80.0, 109.0, 122.0, 186.0, 264.0, 376.0, 655.0, 1018.0, 1774.0, 3389.0, 9228.0, 55607.0, 4082874.0, 25455.0, 6304.0, 2704.0, 1443.0, 865.0, 522.0, 316.0, 198.0, 166.0, 119.0, 66.0, 64.0, 40.0, 42.0, 28.0, 18.0, 9.0, 10.0, 14.0, 10.0, 5.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.439453125, -3.33306884765625, -3.2266845703125, -3.12030029296875, -3.013916015625, -2.90753173828125, -2.8011474609375, -2.69476318359375, -2.58837890625, -2.48199462890625, -2.3756103515625, -2.26922607421875, -2.162841796875, -2.05645751953125, -1.9500732421875, -1.84368896484375, -1.7373046875, -1.63092041015625, -1.5245361328125, -1.41815185546875, -1.311767578125, -1.20538330078125, -1.0989990234375, -0.99261474609375, -0.88623046875, -0.77984619140625, -0.6734619140625, -0.56707763671875, -0.460693359375, -0.35430908203125, -0.2479248046875, -0.14154052734375, -0.03515625, 0.07122802734375, 0.1776123046875, 0.28399658203125, 0.390380859375, 0.49676513671875, 0.6031494140625, 0.70953369140625, 0.81591796875, 0.92230224609375, 1.0286865234375, 1.13507080078125, 1.241455078125, 1.34783935546875, 1.4542236328125, 1.56060791015625, 1.6669921875, 1.77337646484375, 1.8797607421875, 1.98614501953125, 2.092529296875, 2.19891357421875, 2.3052978515625, 2.41168212890625, 2.51806640625, 2.62445068359375, 2.7308349609375, 2.83721923828125, 2.943603515625, 3.04998779296875, 3.1563720703125, 3.26275634765625, 3.369140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 11.0, 8.0, 7.0, 10.0, 12.0, 20.0, 18.0, 16.0, 24.0, 43.0, 37.0, 41.0, 52.0, 42.0, 51.0, 49.0, 54.0, 51.0, 66.0, 53.0, 44.0, 42.0, 48.0, 32.0, 25.0, 24.0, 23.0, 10.0, 15.0, 17.0, 9.0, 9.0, 9.0, 1.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.662109375, -0.640533447265625, -0.61895751953125, -0.597381591796875, -0.5758056640625, -0.554229736328125, -0.53265380859375, -0.511077880859375, -0.489501953125, -0.467926025390625, -0.44635009765625, -0.424774169921875, -0.4031982421875, -0.381622314453125, -0.36004638671875, -0.338470458984375, -0.31689453125, -0.295318603515625, -0.27374267578125, -0.252166748046875, -0.2305908203125, -0.209014892578125, -0.18743896484375, -0.165863037109375, -0.144287109375, -0.122711181640625, -0.10113525390625, -0.079559326171875, -0.0579833984375, -0.036407470703125, -0.01483154296875, 0.006744384765625, 0.0283203125, 0.049896240234375, 0.07147216796875, 0.093048095703125, 0.1146240234375, 0.136199951171875, 0.15777587890625, 0.179351806640625, 0.200927734375, 0.222503662109375, 0.24407958984375, 0.265655517578125, 0.2872314453125, 0.308807373046875, 0.33038330078125, 0.351959228515625, 0.37353515625, 0.395111083984375, 0.41668701171875, 0.438262939453125, 0.4598388671875, 0.481414794921875, 0.50299072265625, 0.524566650390625, 0.546142578125, 0.567718505859375, 0.58929443359375, 0.610870361328125, 0.6324462890625, 0.654022216796875, 0.67559814453125, 0.697174072265625, 0.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 10.0, 15.0, 16.0, 23.0, 26.0, 51.0, 71.0, 111.0, 197.0, 267.0, 482.0, 874.0, 1528.0, 2817.0, 6067.0, 16426.0, 110097.0, 4005691.0, 31776.0, 9247.0, 3895.0, 1941.0, 1054.0, 589.0, 374.0, 213.0, 143.0, 84.0, 56.0, 42.0, 26.0, 30.0, 15.0, 11.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.26397705078125, -3.1627197265625, -3.06146240234375, -2.960205078125, -2.85894775390625, -2.7576904296875, -2.65643310546875, -2.55517578125, -2.45391845703125, -2.3526611328125, -2.25140380859375, -2.150146484375, -2.04888916015625, -1.9476318359375, -1.84637451171875, -1.7451171875, -1.64385986328125, -1.5426025390625, -1.44134521484375, -1.340087890625, -1.23883056640625, -1.1375732421875, -1.03631591796875, -0.93505859375, -0.83380126953125, -0.7325439453125, -0.63128662109375, -0.530029296875, -0.42877197265625, -0.3275146484375, -0.22625732421875, -0.125, -0.02374267578125, 0.0775146484375, 0.17877197265625, 0.280029296875, 0.38128662109375, 0.4825439453125, 0.58380126953125, 0.68505859375, 0.78631591796875, 0.8875732421875, 0.98883056640625, 1.090087890625, 1.19134521484375, 1.2926025390625, 1.39385986328125, 1.4951171875, 1.59637451171875, 1.6976318359375, 1.79888916015625, 1.900146484375, 2.00140380859375, 2.1026611328125, 2.20391845703125, 2.30517578125, 2.40643310546875, 2.5076904296875, 2.60894775390625, 2.710205078125, 2.81146240234375, 2.9127197265625, 3.01397705078125, 3.115234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 8.0, 14.0, 20.0, 18.0, 47.0, 175.0, 3543.0, 116.0, 43.0, 24.0, 14.0, 4.0, 7.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84375, -0.8205413818359375, -0.797332763671875, -0.7741241455078125, -0.75091552734375, -0.7277069091796875, -0.704498291015625, -0.6812896728515625, -0.6580810546875, -0.6348724365234375, -0.611663818359375, -0.5884552001953125, -0.56524658203125, -0.5420379638671875, -0.518829345703125, -0.4956207275390625, -0.472412109375, -0.4492034912109375, -0.425994873046875, -0.4027862548828125, -0.37957763671875, -0.3563690185546875, -0.333160400390625, -0.3099517822265625, -0.2867431640625, -0.2635345458984375, -0.240325927734375, -0.2171173095703125, -0.19390869140625, -0.1707000732421875, -0.147491455078125, -0.1242828369140625, -0.10107421875, -0.0778656005859375, -0.054656982421875, -0.0314483642578125, -0.00823974609375, 0.0149688720703125, 0.038177490234375, 0.0613861083984375, 0.0845947265625, 0.1078033447265625, 0.131011962890625, 0.1542205810546875, 0.17742919921875, 0.2006378173828125, 0.223846435546875, 0.2470550537109375, 0.270263671875, 0.2934722900390625, 0.316680908203125, 0.3398895263671875, 0.36309814453125, 0.3863067626953125, 0.409515380859375, 0.4327239990234375, 0.4559326171875, 0.4791412353515625, 0.502349853515625, 0.5255584716796875, 0.54876708984375, 0.5719757080078125, 0.595184326171875, 0.6183929443359375, 0.6416015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 6.0, 7.0, 11.0, 28.0, 53.0, 64.0, 104.0, 136.0, 152.0, 165.0, 127.0, 58.0, 39.0, 22.0, 15.0, 10.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.265946388244629, -4.1496381759643555, -4.03333044052124, -3.917022228240967, -3.8007142543792725, -3.684406042098999, -3.5680980682373047, -3.4517898559570312, -3.335481882095337, -3.2191739082336426, -3.102865695953369, -2.986557722091675, -2.8702497482299805, -2.753941535949707, -2.6376335620880127, -2.5213255882263184, -2.405017375946045, -2.2887094020843506, -2.172401189804077, -2.056093215942383, -1.939785122871399, -1.823477029800415, -1.7071690559387207, -1.5908609628677368, -1.474553108215332, -1.3582450151443481, -1.2419370412826538, -1.12562894821167, -1.009320855140686, -0.8930128216743469, -0.7767047882080078, -0.6603966951370239, -0.54408860206604, -0.42778053879737854, -0.31147247552871704, -0.19516444206237793, -0.07885637879371643, 0.03745168447494507, 0.15375971794128418, 0.27006781101226807, 0.3863758444786072, 0.5026838779449463, 0.6189919710159302, 0.7353000044822693, 0.8516080379486084, 0.9679161310195923, 1.0842242240905762, 1.2005321979522705, 1.3168402910232544, 1.4331483840942383, 1.5494563579559326, 1.6657644510269165, 1.7820725440979004, 1.8983805179595947, 2.014688491821289, 2.1309967041015625, 2.247304677963257, 2.363612651824951, 2.4799208641052246, 2.596228837966919, 2.7125368118286133, 2.8288450241088867, 2.945152997970581, 3.0614609718322754, 3.177769184112549]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 8.0, 10.0, 9.0, 9.0, 21.0, 15.0, 30.0, 23.0, 38.0, 31.0, 26.0, 31.0, 33.0, 39.0, 36.0, 54.0, 51.0, 46.0, 39.0, 33.0, 42.0, 48.0, 42.0, 29.0, 31.0, 31.0, 24.0, 26.0, 22.0, 12.0, 14.0, 13.0, 7.0, 14.0, 7.0, 7.0, 9.0, 2.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.281733512878418, -1.2431830167770386, -1.2046325206756592, -1.1660820245742798, -1.1275315284729004, -1.0889809131622314, -1.050430417060852, -1.0118799209594727, -0.9733294248580933, -0.9347789287567139, -0.8962284326553345, -0.8576778769493103, -0.8191273808479309, -0.7805768847465515, -0.7420263290405273, -0.703475832939148, -0.6649253368377686, -0.6263748407363892, -0.5878243446350098, -0.5492737889289856, -0.5107232928276062, -0.4721727967262268, -0.433622270822525, -0.39507174491882324, -0.35652124881744385, -0.31797075271606445, -0.27942022681236267, -0.24086971580982208, -0.2023192048072815, -0.1637686938047409, -0.12521818280220032, -0.08666765689849854, -0.04811704158782959, -0.009566530585289001, 0.028983980417251587, 0.06753449141979218, 0.10608500242233276, 0.14463551342487335, 0.18318602442741394, 0.22173655033111572, 0.2602870464324951, 0.2988375425338745, 0.3373880684375763, 0.3759385943412781, 0.41448909044265747, 0.45303958654403687, 0.49159011244773865, 0.5301406383514404, 0.5686911344528198, 0.6072416305541992, 0.6457921266555786, 0.6843426823616028, 0.7228931784629822, 0.7614436745643616, 0.7999942302703857, 0.8385447263717651, 0.8770952224731445, 0.9156457185745239, 0.9541962146759033, 0.9927467703819275, 1.031297206878662, 1.069847822189331, 1.1083983182907104, 1.1469488143920898, 1.1854993104934692]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 17.0, 30.0, 33.0, 74.0, 109.0, 146.0, 285.0, 450.0, 873.0, 1640.0, 3264.0, 6747.0, 14554.0, 34617.0, 86327.0, 232098.0, 377419.0, 174185.0, 65777.0, 26938.0, 11760.0, 5416.0, 2627.0, 1370.0, 741.0, 420.0, 231.0, 114.0, 95.0, 51.0, 28.0, 21.0, 21.0, 8.0, 9.0, 4.0, 9.0, 4.0, 3.0, 0.0, 3.0, 2.0], "bins": [-1.9091796875, -1.859405517578125, -1.80963134765625, -1.759857177734375, -1.7100830078125, -1.660308837890625, -1.61053466796875, -1.560760498046875, -1.510986328125, -1.461212158203125, -1.41143798828125, -1.361663818359375, -1.3118896484375, -1.262115478515625, -1.21234130859375, -1.162567138671875, -1.11279296875, -1.063018798828125, -1.01324462890625, -0.963470458984375, -0.9136962890625, -0.863922119140625, -0.81414794921875, -0.764373779296875, -0.714599609375, -0.664825439453125, -0.61505126953125, -0.565277099609375, -0.5155029296875, -0.465728759765625, -0.41595458984375, -0.366180419921875, -0.31640625, -0.266632080078125, -0.21685791015625, -0.167083740234375, -0.1173095703125, -0.067535400390625, -0.01776123046875, 0.032012939453125, 0.081787109375, 0.131561279296875, 0.18133544921875, 0.231109619140625, 0.2808837890625, 0.330657958984375, 0.38043212890625, 0.430206298828125, 0.47998046875, 0.529754638671875, 0.57952880859375, 0.629302978515625, 0.6790771484375, 0.728851318359375, 0.77862548828125, 0.828399658203125, 0.878173828125, 0.927947998046875, 0.97772216796875, 1.027496337890625, 1.0772705078125, 1.127044677734375, 1.17681884765625, 1.226593017578125, 1.2763671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 14.0, 8.0, 8.0, 13.0, 7.0, 14.0, 11.0, 21.0, 22.0, 32.0, 33.0, 33.0, 40.0, 37.0, 45.0, 45.0, 53.0, 49.0, 45.0, 36.0, 64.0, 47.0, 44.0, 37.0, 34.0, 32.0, 30.0, 17.0, 19.0, 14.0, 14.0, 14.0, 11.0, 6.0, 8.0, 5.0, 5.0, 8.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6471481323242188, -0.6263275146484375, -0.6055068969726562, -0.584686279296875, -0.5638656616210938, -0.5430450439453125, -0.5222244262695312, -0.50140380859375, -0.48058319091796875, -0.4597625732421875, -0.43894195556640625, -0.418121337890625, -0.39730072021484375, -0.3764801025390625, -0.35565948486328125, -0.3348388671875, -0.31401824951171875, -0.2931976318359375, -0.27237701416015625, -0.251556396484375, -0.23073577880859375, -0.2099151611328125, -0.18909454345703125, -0.16827392578125, -0.14745330810546875, -0.1266326904296875, -0.10581207275390625, -0.084991455078125, -0.06417083740234375, -0.0433502197265625, -0.02252960205078125, -0.001708984375, 0.01911163330078125, 0.0399322509765625, 0.06075286865234375, 0.081573486328125, 0.10239410400390625, 0.1232147216796875, 0.14403533935546875, 0.16485595703125, 0.18567657470703125, 0.2064971923828125, 0.22731781005859375, 0.248138427734375, 0.26895904541015625, 0.2897796630859375, 0.31060028076171875, 0.3314208984375, 0.35224151611328125, 0.3730621337890625, 0.39388275146484375, 0.414703369140625, 0.43552398681640625, 0.4563446044921875, 0.47716522216796875, 0.49798583984375, 0.5188064575195312, 0.5396270751953125, 0.5604476928710938, 0.581268310546875, 0.6020889282226562, 0.6229095458984375, 0.6437301635742188, 0.66455078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 8.0, 9.0, 23.0, 23.0, 28.0, 45.0, 82.0, 103.0, 148.0, 232.0, 352.0, 550.0, 963.0, 1975.0, 5425.0, 21351.0, 153115.0, 734202.0, 104606.0, 16585.0, 4482.0, 1799.0, 922.0, 528.0, 327.0, 223.0, 148.0, 76.0, 56.0, 49.0, 41.0, 28.0, 12.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0859375, -2.99627685546875, -2.9066162109375, -2.81695556640625, -2.727294921875, -2.63763427734375, -2.5479736328125, -2.45831298828125, -2.36865234375, -2.27899169921875, -2.1893310546875, -2.09967041015625, -2.010009765625, -1.92034912109375, -1.8306884765625, -1.74102783203125, -1.6513671875, -1.56170654296875, -1.4720458984375, -1.38238525390625, -1.292724609375, -1.20306396484375, -1.1134033203125, -1.02374267578125, -0.93408203125, -0.84442138671875, -0.7547607421875, -0.66510009765625, -0.575439453125, -0.48577880859375, -0.3961181640625, -0.30645751953125, -0.216796875, -0.12713623046875, -0.0374755859375, 0.05218505859375, 0.141845703125, 0.23150634765625, 0.3211669921875, 0.41082763671875, 0.50048828125, 0.59014892578125, 0.6798095703125, 0.76947021484375, 0.859130859375, 0.94879150390625, 1.0384521484375, 1.12811279296875, 1.2177734375, 1.30743408203125, 1.3970947265625, 1.48675537109375, 1.576416015625, 1.66607666015625, 1.7557373046875, 1.84539794921875, 1.93505859375, 2.02471923828125, 2.1143798828125, 2.20404052734375, 2.293701171875, 2.38336181640625, 2.4730224609375, 2.56268310546875, 2.65234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 10.0, 11.0, 14.0, 12.0, 23.0, 22.0, 19.0, 28.0, 19.0, 24.0, 31.0, 37.0, 39.0, 29.0, 40.0, 43.0, 39.0, 49.0, 35.0, 48.0, 44.0, 34.0, 44.0, 35.0, 31.0, 22.0, 32.0, 20.0, 31.0, 21.0, 11.0, 14.0, 15.0, 12.0, 6.0, 11.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.185760498046875, -2.10003662109375, -2.014312744140625, -1.9285888671875, -1.842864990234375, -1.75714111328125, -1.671417236328125, -1.585693359375, -1.499969482421875, -1.41424560546875, -1.328521728515625, -1.2427978515625, -1.157073974609375, -1.07135009765625, -0.985626220703125, -0.89990234375, -0.814178466796875, -0.72845458984375, -0.642730712890625, -0.5570068359375, -0.471282958984375, -0.38555908203125, -0.299835205078125, -0.214111328125, -0.128387451171875, -0.04266357421875, 0.043060302734375, 0.1287841796875, 0.214508056640625, 0.30023193359375, 0.385955810546875, 0.4716796875, 0.557403564453125, 0.64312744140625, 0.728851318359375, 0.8145751953125, 0.900299072265625, 0.98602294921875, 1.071746826171875, 1.157470703125, 1.243194580078125, 1.32891845703125, 1.414642333984375, 1.5003662109375, 1.586090087890625, 1.67181396484375, 1.757537841796875, 1.84326171875, 1.928985595703125, 2.01470947265625, 2.100433349609375, 2.1861572265625, 2.271881103515625, 2.35760498046875, 2.443328857421875, 2.529052734375, 2.614776611328125, 2.70050048828125, 2.786224365234375, 2.8719482421875, 2.957672119140625, 3.04339599609375, 3.129119873046875, 3.21484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 11.0, 12.0, 44.0, 38.0, 76.0, 153.0, 292.0, 760.0, 3038.0, 24781.0, 847482.0, 161674.0, 7718.0, 1494.0, 491.0, 225.0, 96.0, 64.0, 36.0, 13.0, 7.0, 8.0, 10.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.252288818359375, -3.15301513671875, -3.053741455078125, -2.9544677734375, -2.855194091796875, -2.75592041015625, -2.656646728515625, -2.557373046875, -2.458099365234375, -2.35882568359375, -2.259552001953125, -2.1602783203125, -2.061004638671875, -1.96173095703125, -1.862457275390625, -1.76318359375, -1.663909912109375, -1.56463623046875, -1.465362548828125, -1.3660888671875, -1.266815185546875, -1.16754150390625, -1.068267822265625, -0.968994140625, -0.869720458984375, -0.77044677734375, -0.671173095703125, -0.5718994140625, -0.472625732421875, -0.37335205078125, -0.274078369140625, -0.1748046875, -0.075531005859375, 0.02374267578125, 0.123016357421875, 0.2222900390625, 0.321563720703125, 0.42083740234375, 0.520111083984375, 0.619384765625, 0.718658447265625, 0.81793212890625, 0.917205810546875, 1.0164794921875, 1.115753173828125, 1.21502685546875, 1.314300537109375, 1.41357421875, 1.512847900390625, 1.61212158203125, 1.711395263671875, 1.8106689453125, 1.909942626953125, 2.00921630859375, 2.108489990234375, 2.207763671875, 2.307037353515625, 2.40631103515625, 2.505584716796875, 2.6048583984375, 2.704132080078125, 2.80340576171875, 2.902679443359375, 3.001953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 14.0, 17.0, 23.0, 29.0, 46.0, 79.0, 113.0, 141.0, 122.0, 127.0, 83.0, 47.0, 33.0, 22.0, 22.0, 12.0, 16.0, 9.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0004382133483886719, -0.0004282817244529724, -0.00041835010051727295, -0.0004084184765815735, -0.000398486852645874, -0.00038855522871017456, -0.0003786236047744751, -0.00036869198083877563, -0.00035876035690307617, -0.0003488287329673767, -0.00033889710903167725, -0.0003289654850959778, -0.0003190338611602783, -0.00030910223722457886, -0.0002991706132888794, -0.00028923898935317993, -0.00027930736541748047, -0.000269375741481781, -0.00025944411754608154, -0.0002495124936103821, -0.00023958086967468262, -0.00022964924573898315, -0.0002197176218032837, -0.00020978599786758423, -0.00019985437393188477, -0.0001899227499961853, -0.00017999112606048584, -0.00017005950212478638, -0.00016012787818908691, -0.00015019625425338745, -0.000140264630317688, -0.00013033300638198853, -0.00012040138244628906, -0.0001104697585105896, -0.00010053813457489014, -9.060651063919067e-05, -8.067488670349121e-05, -7.074326276779175e-05, -6.0811638832092285e-05, -5.088001489639282e-05, -4.094839096069336e-05, -3.1016767024993896e-05, -2.1085143089294434e-05, -1.115351915359497e-05, -1.2218952178955078e-06, 8.709728717803955e-06, 1.8641352653503418e-05, 2.857297658920288e-05, 3.8504600524902344e-05, 4.843622446060181e-05, 5.836784839630127e-05, 6.829947233200073e-05, 7.82310962677002e-05, 8.816272020339966e-05, 9.809434413909912e-05, 0.00010802596807479858, 0.00011795759201049805, 0.0001278892159461975, 0.00013782083988189697, 0.00014775246381759644, 0.0001576840877532959, 0.00016761571168899536, 0.00017754733562469482, 0.0001874789595603943, 0.00019741058349609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 10.0, 7.0, 13.0, 22.0, 33.0, 45.0, 78.0, 170.0, 340.0, 684.0, 1931.0, 6949.0, 55858.0, 825453.0, 141116.0, 11363.0, 2660.0, 939.0, 396.0, 198.0, 108.0, 56.0, 35.0, 25.0, 13.0, 18.0, 9.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.432891845703125, -2.35601806640625, -2.279144287109375, -2.2022705078125, -2.125396728515625, -2.04852294921875, -1.971649169921875, -1.894775390625, -1.817901611328125, -1.74102783203125, -1.664154052734375, -1.5872802734375, -1.510406494140625, -1.43353271484375, -1.356658935546875, -1.27978515625, -1.202911376953125, -1.12603759765625, -1.049163818359375, -0.9722900390625, -0.895416259765625, -0.81854248046875, -0.741668701171875, -0.664794921875, -0.587921142578125, -0.51104736328125, -0.434173583984375, -0.3572998046875, -0.280426025390625, -0.20355224609375, -0.126678466796875, -0.0498046875, 0.027069091796875, 0.10394287109375, 0.180816650390625, 0.2576904296875, 0.334564208984375, 0.41143798828125, 0.488311767578125, 0.565185546875, 0.642059326171875, 0.71893310546875, 0.795806884765625, 0.8726806640625, 0.949554443359375, 1.02642822265625, 1.103302001953125, 1.18017578125, 1.257049560546875, 1.33392333984375, 1.410797119140625, 1.4876708984375, 1.564544677734375, 1.64141845703125, 1.718292236328125, 1.795166015625, 1.872039794921875, 1.94891357421875, 2.025787353515625, 2.1026611328125, 2.179534912109375, 2.25640869140625, 2.333282470703125, 2.41015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 13.0, 23.0, 28.0, 38.0, 63.0, 94.0, 138.0, 138.0, 124.0, 117.0, 80.0, 57.0, 29.0, 15.0, 16.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.514312744140625, -1.44464111328125, -1.374969482421875, -1.3052978515625, -1.235626220703125, -1.16595458984375, -1.096282958984375, -1.026611328125, -0.956939697265625, -0.88726806640625, -0.817596435546875, -0.7479248046875, -0.678253173828125, -0.60858154296875, -0.538909912109375, -0.46923828125, -0.399566650390625, -0.32989501953125, -0.260223388671875, -0.1905517578125, -0.120880126953125, -0.05120849609375, 0.018463134765625, 0.088134765625, 0.157806396484375, 0.22747802734375, 0.297149658203125, 0.3668212890625, 0.436492919921875, 0.50616455078125, 0.575836181640625, 0.6455078125, 0.715179443359375, 0.78485107421875, 0.854522705078125, 0.9241943359375, 0.993865966796875, 1.06353759765625, 1.133209228515625, 1.202880859375, 1.272552490234375, 1.34222412109375, 1.411895751953125, 1.4815673828125, 1.551239013671875, 1.62091064453125, 1.690582275390625, 1.76025390625, 1.829925537109375, 1.89959716796875, 1.969268798828125, 2.0389404296875, 2.108612060546875, 2.17828369140625, 2.247955322265625, 2.317626953125, 2.387298583984375, 2.45697021484375, 2.526641845703125, 2.5963134765625, 2.665985107421875, 2.73565673828125, 2.805328369140625, 2.875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 12.0, 18.0, 26.0, 54.0, 67.0, 82.0, 106.0, 119.0, 149.0, 86.0, 88.0, 55.0, 48.0, 25.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-17.27664566040039, -16.702539443969727, -16.128433227539062, -15.554327964782715, -14.98022174835205, -14.406115531921387, -13.832010269165039, -13.257904052734375, -12.683797836303711, -12.109691619873047, -11.535585403442383, -10.961480140686035, -10.387373924255371, -9.813267707824707, -9.23916244506836, -8.665056228637695, -8.090950012207031, -7.516843795776367, -6.942738056182861, -6.3686323165893555, -5.794526100158691, -5.220419883728027, -4.6463141441345215, -4.072208404541016, -3.4981021881103516, -2.9239962100982666, -2.3498902320861816, -1.7757842540740967, -1.2016782760620117, -0.6275722980499268, -0.0534663200378418, 0.5206394195556641, 1.0947437286376953, 1.6688497066497803, 2.2429556846618652, 2.81706166267395, 3.391167640686035, 3.96527361869812, 4.539379596710205, 5.113485336303711, 5.687591552734375, 6.261697769165039, 6.835803508758545, 7.409909248352051, 7.984015464782715, 8.558121681213379, 9.132226943969727, 9.70633316040039, 10.280439376831055, 10.854545593261719, 11.428651809692383, 12.00275707244873, 12.576863288879395, 13.150969505310059, 13.725074768066406, 14.29918098449707, 14.873287200927734, 15.447393417358398, 16.021499633789062, 16.595605850219727, 17.16971206665039, 17.743816375732422, 18.317922592163086, 18.89202880859375, 19.466135025024414]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 12.0, 11.0, 7.0, 24.0, 10.0, 24.0, 31.0, 23.0, 27.0, 33.0, 30.0, 34.0, 37.0, 51.0, 54.0, 48.0, 49.0, 49.0, 35.0, 42.0, 35.0, 40.0, 39.0, 28.0, 22.0, 33.0, 26.0, 14.0, 23.0, 16.0, 13.0, 10.0, 19.0, 10.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.908052444458008, -12.49710464477539, -12.08615779876709, -11.675209999084473, -11.264263153076172, -10.853315353393555, -10.442367553710938, -10.03141975402832, -9.62047290802002, -9.209525108337402, -8.798578262329102, -8.387630462646484, -7.976683139801025, -7.565735816955566, -7.154788017272949, -6.74384069442749, -6.332893371582031, -5.921946048736572, -5.510998725891113, -5.100050926208496, -4.689103603363037, -4.278156280517578, -3.86720871925354, -3.456261157989502, -3.045313835144043, -2.634366512298584, -2.223418951034546, -1.8124715089797974, -1.4015240669250488, -0.9905767440795898, -0.5796291828155518, -0.16868162155151367, 0.2422647476196289, 0.6532121896743774, 1.064159631729126, 1.4751070737838745, 1.886054515838623, 2.297001838684082, 2.70794939994812, 3.118896961212158, 3.529844284057617, 3.940791606903076, 4.351738929748535, 4.762686729431152, 5.173634052276611, 5.58458137512207, 5.9955291748046875, 6.4064764976501465, 6.8174238204956055, 7.2283711433410645, 7.639318466186523, 8.05026626586914, 8.461214065551758, 8.872160911560059, 9.283108711242676, 9.694055557250977, 10.105003356933594, 10.515951156616211, 10.926898002624512, 11.337845802307129, 11.74879264831543, 12.159740447998047, 12.570688247680664, 12.981636047363281, 13.392582893371582]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 6.0, 8.0, 13.0, 20.0, 24.0, 30.0, 44.0, 47.0, 80.0, 99.0, 135.0, 186.0, 284.0, 422.0, 629.0, 1021.0, 1725.0, 3250.0, 7555.0, 23855.0, 275341.0, 3826585.0, 34693.0, 9189.0, 3840.0, 1969.0, 1094.0, 715.0, 417.0, 302.0, 193.0, 161.0, 102.0, 61.0, 59.0, 32.0, 33.0, 18.0, 21.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.259765625, -3.17193603515625, -3.0841064453125, -2.99627685546875, -2.908447265625, -2.82061767578125, -2.7327880859375, -2.64495849609375, -2.55712890625, -2.46929931640625, -2.3814697265625, -2.29364013671875, -2.205810546875, -2.11798095703125, -2.0301513671875, -1.94232177734375, -1.8544921875, -1.76666259765625, -1.6788330078125, -1.59100341796875, -1.503173828125, -1.41534423828125, -1.3275146484375, -1.23968505859375, -1.15185546875, -1.06402587890625, -0.9761962890625, -0.88836669921875, -0.800537109375, -0.71270751953125, -0.6248779296875, -0.53704833984375, -0.44921875, -0.36138916015625, -0.2735595703125, -0.18572998046875, -0.097900390625, -0.01007080078125, 0.0777587890625, 0.16558837890625, 0.25341796875, 0.34124755859375, 0.4290771484375, 0.51690673828125, 0.604736328125, 0.69256591796875, 0.7803955078125, 0.86822509765625, 0.9560546875, 1.04388427734375, 1.1317138671875, 1.21954345703125, 1.307373046875, 1.39520263671875, 1.4830322265625, 1.57086181640625, 1.65869140625, 1.74652099609375, 1.8343505859375, 1.92218017578125, 2.010009765625, 2.09783935546875, 2.1856689453125, 2.27349853515625, 2.361328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 9.0, 10.0, 13.0, 11.0, 12.0, 17.0, 27.0, 29.0, 24.0, 27.0, 34.0, 44.0, 49.0, 48.0, 68.0, 59.0, 66.0, 58.0, 57.0, 47.0, 32.0, 51.0, 34.0, 38.0, 30.0, 24.0, 18.0, 14.0, 8.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7369918823242188, -0.7132415771484375, -0.6894912719726562, -0.665740966796875, -0.6419906616210938, -0.6182403564453125, -0.5944900512695312, -0.57073974609375, -0.5469894409179688, -0.5232391357421875, -0.49948883056640625, -0.475738525390625, -0.45198822021484375, -0.4282379150390625, -0.40448760986328125, -0.3807373046875, -0.35698699951171875, -0.3332366943359375, -0.30948638916015625, -0.285736083984375, -0.26198577880859375, -0.2382354736328125, -0.21448516845703125, -0.19073486328125, -0.16698455810546875, -0.1432342529296875, -0.11948394775390625, -0.095733642578125, -0.07198333740234375, -0.0482330322265625, -0.02448272705078125, -0.000732421875, 0.02301788330078125, 0.0467681884765625, 0.07051849365234375, 0.094268798828125, 0.11801910400390625, 0.1417694091796875, 0.16551971435546875, 0.18927001953125, 0.21302032470703125, 0.2367706298828125, 0.26052093505859375, 0.284271240234375, 0.30802154541015625, 0.3317718505859375, 0.35552215576171875, 0.3792724609375, 0.40302276611328125, 0.4267730712890625, 0.45052337646484375, 0.474273681640625, 0.49802398681640625, 0.5217742919921875, 0.5455245971679688, 0.56927490234375, 0.5930252075195312, 0.6167755126953125, 0.6405258178710938, 0.664276123046875, 0.6880264282226562, 0.7117767333984375, 0.7355270385742188, 0.75927734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 9.0, 9.0, 23.0, 27.0, 51.0, 82.0, 90.0, 171.0, 268.0, 406.0, 791.0, 1424.0, 2764.0, 5898.0, 17095.0, 97387.0, 3951984.0, 87277.0, 16430.0, 5991.0, 2757.0, 1420.0, 775.0, 436.0, 252.0, 170.0, 100.0, 70.0, 41.0, 25.0, 21.0, 15.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.85552978515625, -2.7618408203125, -2.66815185546875, -2.574462890625, -2.48077392578125, -2.3870849609375, -2.29339599609375, -2.19970703125, -2.10601806640625, -2.0123291015625, -1.91864013671875, -1.824951171875, -1.73126220703125, -1.6375732421875, -1.54388427734375, -1.4501953125, -1.35650634765625, -1.2628173828125, -1.16912841796875, -1.075439453125, -0.98175048828125, -0.8880615234375, -0.79437255859375, -0.70068359375, -0.60699462890625, -0.5133056640625, -0.41961669921875, -0.325927734375, -0.23223876953125, -0.1385498046875, -0.04486083984375, 0.048828125, 0.14251708984375, 0.2362060546875, 0.32989501953125, 0.423583984375, 0.51727294921875, 0.6109619140625, 0.70465087890625, 0.79833984375, 0.89202880859375, 0.9857177734375, 1.07940673828125, 1.173095703125, 1.26678466796875, 1.3604736328125, 1.45416259765625, 1.5478515625, 1.64154052734375, 1.7352294921875, 1.82891845703125, 1.922607421875, 2.01629638671875, 2.1099853515625, 2.20367431640625, 2.29736328125, 2.39105224609375, 2.4847412109375, 2.57843017578125, 2.672119140625, 2.76580810546875, 2.8594970703125, 2.95318603515625, 3.046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 4.0, 10.0, 16.0, 34.0, 62.0, 184.0, 2691.0, 727.0, 127.0, 61.0, 44.0, 24.0, 16.0, 10.0, 11.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1396484375, -1.101531982421875, -1.06341552734375, -1.025299072265625, -0.9871826171875, -0.949066162109375, -0.91094970703125, -0.872833251953125, -0.834716796875, -0.796600341796875, -0.75848388671875, -0.720367431640625, -0.6822509765625, -0.644134521484375, -0.60601806640625, -0.567901611328125, -0.52978515625, -0.491668701171875, -0.45355224609375, -0.415435791015625, -0.3773193359375, -0.339202880859375, -0.30108642578125, -0.262969970703125, -0.224853515625, -0.186737060546875, -0.14862060546875, -0.110504150390625, -0.0723876953125, -0.034271240234375, 0.00384521484375, 0.041961669921875, 0.080078125, 0.118194580078125, 0.15631103515625, 0.194427490234375, 0.2325439453125, 0.270660400390625, 0.30877685546875, 0.346893310546875, 0.385009765625, 0.423126220703125, 0.46124267578125, 0.499359130859375, 0.5374755859375, 0.575592041015625, 0.61370849609375, 0.651824951171875, 0.68994140625, 0.728057861328125, 0.76617431640625, 0.804290771484375, 0.8424072265625, 0.880523681640625, 0.91864013671875, 0.956756591796875, 0.994873046875, 1.032989501953125, 1.07110595703125, 1.109222412109375, 1.1473388671875, 1.185455322265625, 1.22357177734375, 1.261688232421875, 1.2998046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 9.0, 28.0, 62.0, 95.0, 118.0, 147.0, 145.0, 110.0, 89.0, 70.0, 35.0, 23.0, 12.0, 2.0, 15.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.244816303253174, -3.0666351318359375, -2.8884541988372803, -2.710273027420044, -2.5320920944213867, -2.3539109230041504, -2.175729751586914, -1.9975486993789673, -1.8193676471710205, -1.6411865949630737, -1.463005542755127, -1.2848243713378906, -1.1066433191299438, -0.9284622669219971, -0.7502810955047607, -0.572100043296814, -0.3939189910888672, -0.21573790907859802, -0.03755682706832886, 0.1406242847442627, 0.3188053369522095, 0.49698638916015625, 0.6751675605773926, 0.8533486127853394, 1.0315296649932861, 1.209710717201233, 1.3878917694091797, 1.566072940826416, 1.7442539930343628, 1.9224350452423096, 2.100616216659546, 2.278797149658203, 2.4569787979125977, 2.635159969329834, 2.813340902328491, 2.9915220737457275, 3.1697030067443848, 3.347884178161621, 3.5260653495788574, 3.7042465209960938, 3.882427453994751, 4.060608386993408, 4.2387895584106445, 4.416970729827881, 4.595151901245117, 4.773332595825195, 4.95151424407959, 5.129694938659668, 5.307876110076904, 5.486057281494141, 5.664238452911377, 5.842419624328613, 6.020600318908691, 6.198781490325928, 6.376962661743164, 6.5551438331604, 6.733325004577637, 6.911506175994873, 7.089687347412109, 7.2678680419921875, 7.446049213409424, 7.62423038482666, 7.8024115562438965, 7.980592727661133, 8.158773422241211]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 16.0, 11.0, 9.0, 15.0, 19.0, 22.0, 20.0, 24.0, 22.0, 26.0, 35.0, 30.0, 45.0, 38.0, 35.0, 35.0, 42.0, 31.0, 35.0, 36.0, 36.0, 38.0, 36.0, 39.0, 31.0, 34.0, 37.0, 37.0, 19.0, 23.0, 17.0, 17.0, 13.0, 9.0, 13.0, 8.0, 8.0, 7.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.1991825103759766, -3.1076595783233643, -3.016136407852173, -2.9246134757995605, -2.833090305328369, -2.741567373275757, -2.6500444412231445, -2.558521270751953, -2.466998338699341, -2.3754754066467285, -2.283952236175537, -2.192429304122925, -2.1009063720703125, -2.009383201599121, -1.9178602695465088, -1.826337218284607, -1.734814167022705, -1.6432911157608032, -1.5517680644989014, -1.460245132446289, -1.3687220811843872, -1.2771990299224854, -1.185676097869873, -1.0941530466079712, -1.0026299953460693, -0.9111069440841675, -0.8195839524269104, -0.7280609607696533, -0.6365379095077515, -0.5450148582458496, -0.45349186658859253, -0.36196887493133545, -0.2704458236694336, -0.17892280220985413, -0.08739978075027466, 0.00412324070930481, 0.09564626216888428, 0.18716928362846375, 0.2786923050880432, 0.3702152967453003, 0.46173834800720215, 0.553261399269104, 0.6447843909263611, 0.7363073825836182, 0.82783043384552, 0.9193534851074219, 1.0108764171600342, 1.102399468421936, 1.193922519683838, 1.2854455709457397, 1.3769686222076416, 1.468491554260254, 1.5600146055221558, 1.6515376567840576, 1.74306058883667, 1.8345836400985718, 1.9261066913604736, 2.017629623413086, 2.1091527938842773, 2.2006757259368896, 2.292198657989502, 2.3837218284606934, 2.4752447605133057, 2.566767692565918, 2.6582908630371094]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 15.0, 26.0, 26.0, 35.0, 68.0, 101.0, 127.0, 206.0, 321.0, 528.0, 890.0, 1432.0, 2731.0, 5117.0, 10145.0, 22142.0, 51924.0, 130003.0, 340541.0, 291007.0, 108820.0, 43965.0, 18950.0, 9056.0, 4522.0, 2385.0, 1343.0, 790.0, 490.0, 294.0, 168.0, 135.0, 66.0, 55.0, 40.0, 25.0, 14.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.060546875, -2.0031585693359375, -1.945770263671875, -1.8883819580078125, -1.83099365234375, -1.7736053466796875, -1.716217041015625, -1.6588287353515625, -1.6014404296875, -1.5440521240234375, -1.486663818359375, -1.4292755126953125, -1.37188720703125, -1.3144989013671875, -1.257110595703125, -1.1997222900390625, -1.142333984375, -1.0849456787109375, -1.027557373046875, -0.9701690673828125, -0.91278076171875, -0.8553924560546875, -0.798004150390625, -0.7406158447265625, -0.6832275390625, -0.6258392333984375, -0.568450927734375, -0.5110626220703125, -0.45367431640625, -0.3962860107421875, -0.338897705078125, -0.2815093994140625, -0.22412109375, -0.1667327880859375, -0.109344482421875, -0.0519561767578125, 0.00543212890625, 0.0628204345703125, 0.120208740234375, 0.1775970458984375, 0.2349853515625, 0.2923736572265625, 0.349761962890625, 0.4071502685546875, 0.46453857421875, 0.5219268798828125, 0.579315185546875, 0.6367034912109375, 0.694091796875, 0.7514801025390625, 0.808868408203125, 0.8662567138671875, 0.92364501953125, 0.9810333251953125, 1.038421630859375, 1.0958099365234375, 1.1531982421875, 1.2105865478515625, 1.267974853515625, 1.3253631591796875, 1.38275146484375, 1.4401397705078125, 1.497528076171875, 1.5549163818359375, 1.6123046875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 3.0, 4.0, 14.0, 13.0, 11.0, 15.0, 15.0, 30.0, 21.0, 27.0, 32.0, 43.0, 38.0, 48.0, 54.0, 51.0, 57.0, 56.0, 59.0, 52.0, 54.0, 44.0, 44.0, 38.0, 29.0, 24.0, 34.0, 15.0, 18.0, 10.0, 12.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.79638671875, -0.7715530395507812, -0.7467193603515625, -0.7218856811523438, -0.697052001953125, -0.6722183227539062, -0.6473846435546875, -0.6225509643554688, -0.59771728515625, -0.5728836059570312, -0.5480499267578125, -0.5232162475585938, -0.498382568359375, -0.47354888916015625, -0.4487152099609375, -0.42388153076171875, -0.3990478515625, -0.37421417236328125, -0.3493804931640625, -0.32454681396484375, -0.299713134765625, -0.27487945556640625, -0.2500457763671875, -0.22521209716796875, -0.20037841796875, -0.17554473876953125, -0.1507110595703125, -0.12587738037109375, -0.101043701171875, -0.07621002197265625, -0.0513763427734375, -0.02654266357421875, -0.001708984375, 0.02312469482421875, 0.0479583740234375, 0.07279205322265625, 0.097625732421875, 0.12245941162109375, 0.1472930908203125, 0.17212677001953125, 0.19696044921875, 0.22179412841796875, 0.2466278076171875, 0.27146148681640625, 0.296295166015625, 0.32112884521484375, 0.3459625244140625, 0.37079620361328125, 0.3956298828125, 0.42046356201171875, 0.4452972412109375, 0.47013092041015625, 0.494964599609375, 0.5197982788085938, 0.5446319580078125, 0.5694656372070312, 0.59429931640625, 0.6191329956054688, 0.6439666748046875, 0.6688003540039062, 0.693634033203125, 0.7184677124023438, 0.7433013916015625, 0.7681350708007812, 0.79296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 7.0, 13.0, 15.0, 23.0, 30.0, 51.0, 69.0, 115.0, 167.0, 235.0, 355.0, 532.0, 1011.0, 1880.0, 4373.0, 15370.0, 90376.0, 647952.0, 240717.0, 31706.0, 7464.0, 2751.0, 1338.0, 749.0, 418.0, 252.0, 187.0, 116.0, 81.0, 53.0, 32.0, 32.0, 30.0, 17.0, 6.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.31005859375, -3.2119140625, -3.11376953125, -3.015625, -2.91748046875, -2.8193359375, -2.72119140625, -2.623046875, -2.52490234375, -2.4267578125, -2.32861328125, -2.23046875, -2.13232421875, -2.0341796875, -1.93603515625, -1.837890625, -1.73974609375, -1.6416015625, -1.54345703125, -1.4453125, -1.34716796875, -1.2490234375, -1.15087890625, -1.052734375, -0.95458984375, -0.8564453125, -0.75830078125, -0.66015625, -0.56201171875, -0.4638671875, -0.36572265625, -0.267578125, -0.16943359375, -0.0712890625, 0.02685546875, 0.125, 0.22314453125, 0.3212890625, 0.41943359375, 0.517578125, 0.61572265625, 0.7138671875, 0.81201171875, 0.91015625, 1.00830078125, 1.1064453125, 1.20458984375, 1.302734375, 1.40087890625, 1.4990234375, 1.59716796875, 1.6953125, 1.79345703125, 1.8916015625, 1.98974609375, 2.087890625, 2.18603515625, 2.2841796875, 2.38232421875, 2.48046875, 2.57861328125, 2.6767578125, 2.77490234375, 2.873046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 5.0, 8.0, 19.0, 13.0, 15.0, 22.0, 18.0, 29.0, 26.0, 33.0, 32.0, 42.0, 42.0, 31.0, 55.0, 51.0, 50.0, 56.0, 51.0, 36.0, 42.0, 44.0, 45.0, 34.0, 36.0, 18.0, 29.0, 18.0, 19.0, 13.0, 12.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9453125, -2.839385986328125, -2.73345947265625, -2.627532958984375, -2.5216064453125, -2.415679931640625, -2.30975341796875, -2.203826904296875, -2.097900390625, -1.991973876953125, -1.88604736328125, -1.780120849609375, -1.6741943359375, -1.568267822265625, -1.46234130859375, -1.356414794921875, -1.25048828125, -1.144561767578125, -1.03863525390625, -0.932708740234375, -0.8267822265625, -0.720855712890625, -0.61492919921875, -0.509002685546875, -0.403076171875, -0.297149658203125, -0.19122314453125, -0.085296630859375, 0.0206298828125, 0.126556396484375, 0.23248291015625, 0.338409423828125, 0.4443359375, 0.550262451171875, 0.65618896484375, 0.762115478515625, 0.8680419921875, 0.973968505859375, 1.07989501953125, 1.185821533203125, 1.291748046875, 1.397674560546875, 1.50360107421875, 1.609527587890625, 1.7154541015625, 1.821380615234375, 1.92730712890625, 2.033233642578125, 2.13916015625, 2.245086669921875, 2.35101318359375, 2.456939697265625, 2.5628662109375, 2.668792724609375, 2.77471923828125, 2.880645751953125, 2.986572265625, 3.092498779296875, 3.19842529296875, 3.304351806640625, 3.4102783203125, 3.516204833984375, 3.62213134765625, 3.728057861328125, 3.833984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 14.0, 20.0, 41.0, 73.0, 173.0, 639.0, 4883.0, 224844.0, 805325.0, 11032.0, 1092.0, 230.0, 82.0, 43.0, 18.0, 18.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.30169677734375, -4.1971435546875, -4.09259033203125, -3.988037109375, -3.88348388671875, -3.7789306640625, -3.67437744140625, -3.56982421875, -3.46527099609375, -3.3607177734375, -3.25616455078125, -3.151611328125, -3.04705810546875, -2.9425048828125, -2.83795166015625, -2.7333984375, -2.62884521484375, -2.5242919921875, -2.41973876953125, -2.315185546875, -2.21063232421875, -2.1060791015625, -2.00152587890625, -1.89697265625, -1.79241943359375, -1.6878662109375, -1.58331298828125, -1.478759765625, -1.37420654296875, -1.2696533203125, -1.16510009765625, -1.060546875, -0.95599365234375, -0.8514404296875, -0.74688720703125, -0.642333984375, -0.53778076171875, -0.4332275390625, -0.32867431640625, -0.22412109375, -0.11956787109375, -0.0150146484375, 0.08953857421875, 0.194091796875, 0.29864501953125, 0.4031982421875, 0.50775146484375, 0.6123046875, 0.71685791015625, 0.8214111328125, 0.92596435546875, 1.030517578125, 1.13507080078125, 1.2396240234375, 1.34417724609375, 1.44873046875, 1.55328369140625, 1.6578369140625, 1.76239013671875, 1.866943359375, 1.97149658203125, 2.0760498046875, 2.18060302734375, 2.28515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 8.0, 15.0, 14.0, 24.0, 25.0, 38.0, 39.0, 64.0, 96.0, 132.0, 149.0, 102.0, 94.0, 48.0, 36.0, 22.0, 22.0, 11.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002865791320800781, -0.0002761036157608032, -0.0002656280994415283, -0.0002551525831222534, -0.0002446770668029785, -0.0002342015504837036, -0.0002237260341644287, -0.0002132505178451538, -0.0002027750015258789, -0.000192299485206604, -0.0001818239688873291, -0.0001713484525680542, -0.0001608729362487793, -0.0001503974199295044, -0.0001399219036102295, -0.0001294463872909546, -0.00011897087097167969, -0.00010849535465240479, -9.801983833312988e-05, -8.754432201385498e-05, -7.706880569458008e-05, -6.659328937530518e-05, -5.6117773056030273e-05, -4.564225673675537e-05, -3.516674041748047e-05, -2.4691224098205566e-05, -1.4215707778930664e-05, -3.7401914596557617e-06, 6.735324859619141e-06, 1.7210841178894043e-05, 2.7686357498168945e-05, 3.816187381744385e-05, 4.863739013671875e-05, 5.911290645599365e-05, 6.958842277526855e-05, 8.006393909454346e-05, 9.053945541381836e-05, 0.00010101497173309326, 0.00011149048805236816, 0.00012196600437164307, 0.00013244152069091797, 0.00014291703701019287, 0.00015339255332946777, 0.00016386806964874268, 0.00017434358596801758, 0.00018481910228729248, 0.00019529461860656738, 0.00020577013492584229, 0.0002162456512451172, 0.0002267211675643921, 0.000237196683883667, 0.0002476722002029419, 0.0002581477165222168, 0.0002686232328414917, 0.0002790987491607666, 0.0002895742654800415, 0.0003000497817993164, 0.0003105252981185913, 0.0003210008144378662, 0.0003314763307571411, 0.000341951847076416, 0.0003524273633956909, 0.0003629028797149658, 0.0003733783960342407, 0.0003838539123535156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 3.0, 4.0, 8.0, 16.0, 18.0, 29.0, 59.0, 104.0, 199.0, 401.0, 878.0, 2547.0, 9582.0, 89649.0, 819718.0, 110003.0, 10619.0, 2816.0, 997.0, 426.0, 194.0, 109.0, 53.0, 36.0, 27.0, 16.0, 9.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9345703125, -1.880126953125, -1.82568359375, -1.771240234375, -1.716796875, -1.662353515625, -1.60791015625, -1.553466796875, -1.4990234375, -1.444580078125, -1.39013671875, -1.335693359375, -1.28125, -1.226806640625, -1.17236328125, -1.117919921875, -1.0634765625, -1.009033203125, -0.95458984375, -0.900146484375, -0.845703125, -0.791259765625, -0.73681640625, -0.682373046875, -0.6279296875, -0.573486328125, -0.51904296875, -0.464599609375, -0.41015625, -0.355712890625, -0.30126953125, -0.246826171875, -0.1923828125, -0.137939453125, -0.08349609375, -0.029052734375, 0.025390625, 0.079833984375, 0.13427734375, 0.188720703125, 0.2431640625, 0.297607421875, 0.35205078125, 0.406494140625, 0.4609375, 0.515380859375, 0.56982421875, 0.624267578125, 0.6787109375, 0.733154296875, 0.78759765625, 0.842041015625, 0.896484375, 0.950927734375, 1.00537109375, 1.059814453125, 1.1142578125, 1.168701171875, 1.22314453125, 1.277587890625, 1.33203125, 1.386474609375, 1.44091796875, 1.495361328125, 1.5498046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 5.0, 12.0, 31.0, 32.0, 49.0, 62.0, 90.0, 108.0, 132.0, 137.0, 102.0, 78.0, 44.0, 41.0, 25.0, 13.0, 11.0, 11.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2678070068359375, -1.216278076171875, -1.1647491455078125, -1.11322021484375, -1.0616912841796875, -1.010162353515625, -0.9586334228515625, -0.9071044921875, -0.8555755615234375, -0.804046630859375, -0.7525177001953125, -0.70098876953125, -0.6494598388671875, -0.597930908203125, -0.5464019775390625, -0.494873046875, -0.4433441162109375, -0.391815185546875, -0.3402862548828125, -0.28875732421875, -0.2372283935546875, -0.185699462890625, -0.1341705322265625, -0.0826416015625, -0.0311126708984375, 0.020416259765625, 0.0719451904296875, 0.12347412109375, 0.1750030517578125, 0.226531982421875, 0.2780609130859375, 0.32958984375, 0.3811187744140625, 0.432647705078125, 0.4841766357421875, 0.53570556640625, 0.5872344970703125, 0.638763427734375, 0.6902923583984375, 0.7418212890625, 0.7933502197265625, 0.844879150390625, 0.8964080810546875, 0.94793701171875, 0.9994659423828125, 1.050994873046875, 1.1025238037109375, 1.154052734375, 1.2055816650390625, 1.257110595703125, 1.3086395263671875, 1.36016845703125, 1.4116973876953125, 1.463226318359375, 1.5147552490234375, 1.5662841796875, 1.6178131103515625, 1.669342041015625, 1.7208709716796875, 1.77239990234375, 1.8239288330078125, 1.875457763671875, 1.9269866943359375, 1.978515625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 6.0, 21.0, 52.0, 102.0, 159.0, 237.0, 180.0, 114.0, 60.0, 20.0, 27.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.781608581542969, -14.770590782165527, -13.759572982788086, -12.748554229736328, -11.737537384033203, -10.726518630981445, -9.715500831604004, -8.704483032226562, -7.693465232849121, -6.68244743347168, -5.671429634094238, -4.660411357879639, -3.6493935585021973, -2.638375759124756, -1.6273574829101562, -0.6163396835327148, 0.39467811584472656, 1.4056960344314575, 2.4167139530181885, 3.427731990814209, 4.43874979019165, 5.449767589569092, 6.460785865783691, 7.471803665161133, 8.482821464538574, 9.493839263916016, 10.504857063293457, 11.515874862670898, 12.526893615722656, 13.537910461425781, 14.548929214477539, 15.55994701385498, 16.570964813232422, 17.58198356628418, 18.593000411987305, 19.604019165039062, 20.615036010742188, 21.626054763793945, 22.637073516845703, 23.648090362548828, 24.659107208251953, 25.67012596130371, 26.681142807006836, 27.692161560058594, 28.70317840576172, 29.714197158813477, 30.725215911865234, 31.73623275756836, 32.74725341796875, 33.758270263671875, 34.769290924072266, 35.78030776977539, 36.791324615478516, 37.80234146118164, 38.81336212158203, 39.824378967285156, 40.83539581298828, 41.846412658691406, 42.8574333190918, 43.86845016479492, 44.87946701049805, 45.89048385620117, 46.90150451660156, 47.91252136230469, 48.92353820800781]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 10.0, 13.0, 14.0, 15.0, 21.0, 28.0, 22.0, 24.0, 39.0, 41.0, 38.0, 40.0, 37.0, 47.0, 63.0, 66.0, 68.0, 44.0, 46.0, 42.0, 39.0, 32.0, 27.0, 43.0, 29.0, 20.0, 12.0, 9.0, 11.0, 12.0, 6.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.186368942260742, -15.684624671936035, -15.182881355285645, -14.681137084960938, -14.179393768310547, -13.67764949798584, -13.175905227661133, -12.674161911010742, -12.172417640686035, -11.670673370361328, -11.168930053710938, -10.66718578338623, -10.165441513061523, -9.663698196411133, -9.161953926086426, -8.660209655761719, -8.158466339111328, -7.656722545623779, -7.1549787521362305, -6.653234481811523, -6.151490688323975, -5.649746894836426, -5.148002624511719, -4.64625883102417, -4.144515037536621, -3.6427712440490723, -3.1410272121429443, -2.6392831802368164, -2.1375393867492676, -1.6357955932617188, -1.1340515613555908, -0.6323075294494629, -0.13056373596191406, 0.3711801767349243, 0.8729240894317627, 1.374668002128601, 1.8764119148254395, 2.3781557083129883, 2.879899740219116, 3.381643772125244, 3.883387565612793, 4.385131359100342, 4.886875152587891, 5.388619422912598, 5.8903632164001465, 6.392107009887695, 6.893851280212402, 7.395595073699951, 7.8973388671875, 8.399083137512207, 8.900826454162598, 9.402570724487305, 9.904314041137695, 10.406058311462402, 10.90780258178711, 11.4095458984375, 11.911290168762207, 12.413034439086914, 12.914777755737305, 13.416522026062012, 13.918266296386719, 14.42000961303711, 14.921753883361816, 15.423498153686523, 15.925241470336914]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 14.0, 15.0, 23.0, 33.0, 45.0, 57.0, 86.0, 148.0, 212.0, 342.0, 531.0, 837.0, 1480.0, 2705.0, 5185.0, 11022.0, 26076.0, 82349.0, 587903.0, 3101358.0, 277715.0, 57542.0, 20162.0, 8782.0, 4288.0, 2213.0, 1224.0, 729.0, 421.0, 231.0, 195.0, 111.0, 79.0, 39.0, 45.0, 23.0, 12.0, 16.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-1.9560546875, -1.9036865234375, -1.851318359375, -1.7989501953125, -1.74658203125, -1.6942138671875, -1.641845703125, -1.5894775390625, -1.537109375, -1.4847412109375, -1.432373046875, -1.3800048828125, -1.32763671875, -1.2752685546875, -1.222900390625, -1.1705322265625, -1.1181640625, -1.0657958984375, -1.013427734375, -0.9610595703125, -0.90869140625, -0.8563232421875, -0.803955078125, -0.7515869140625, -0.69921875, -0.6468505859375, -0.594482421875, -0.5421142578125, -0.48974609375, -0.4373779296875, -0.385009765625, -0.3326416015625, -0.2802734375, -0.2279052734375, -0.175537109375, -0.1231689453125, -0.07080078125, -0.0184326171875, 0.033935546875, 0.0863037109375, 0.138671875, 0.1910400390625, 0.243408203125, 0.2957763671875, 0.34814453125, 0.4005126953125, 0.452880859375, 0.5052490234375, 0.5576171875, 0.6099853515625, 0.662353515625, 0.7147216796875, 0.76708984375, 0.8194580078125, 0.871826171875, 0.9241943359375, 0.9765625, 1.0289306640625, 1.081298828125, 1.1336669921875, 1.18603515625, 1.2384033203125, 1.290771484375, 1.3431396484375, 1.3955078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 4.0, 11.0, 22.0, 23.0, 23.0, 33.0, 36.0, 35.0, 36.0, 50.0, 34.0, 43.0, 54.0, 62.0, 56.0, 68.0, 60.0, 48.0, 40.0, 39.0, 32.0, 31.0, 25.0, 30.0, 18.0, 15.0, 16.0, 9.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8125, -0.789215087890625, -0.76593017578125, -0.742645263671875, -0.7193603515625, -0.696075439453125, -0.67279052734375, -0.649505615234375, -0.626220703125, -0.602935791015625, -0.57965087890625, -0.556365966796875, -0.5330810546875, -0.509796142578125, -0.48651123046875, -0.463226318359375, -0.43994140625, -0.416656494140625, -0.39337158203125, -0.370086669921875, -0.3468017578125, -0.323516845703125, -0.30023193359375, -0.276947021484375, -0.253662109375, -0.230377197265625, -0.20709228515625, -0.183807373046875, -0.1605224609375, -0.137237548828125, -0.11395263671875, -0.090667724609375, -0.0673828125, -0.044097900390625, -0.02081298828125, 0.002471923828125, 0.0257568359375, 0.049041748046875, 0.07232666015625, 0.095611572265625, 0.118896484375, 0.142181396484375, 0.16546630859375, 0.188751220703125, 0.2120361328125, 0.235321044921875, 0.25860595703125, 0.281890869140625, 0.30517578125, 0.328460693359375, 0.35174560546875, 0.375030517578125, 0.3983154296875, 0.421600341796875, 0.44488525390625, 0.468170166015625, 0.491455078125, 0.514739990234375, 0.53802490234375, 0.561309814453125, 0.5845947265625, 0.607879638671875, 0.63116455078125, 0.654449462890625, 0.677734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 9.0, 13.0, 23.0, 28.0, 62.0, 118.0, 166.0, 292.0, 536.0, 1164.0, 3165.0, 11138.0, 57744.0, 1214379.0, 2805553.0, 79600.0, 13730.0, 3870.0, 1383.0, 597.0, 261.0, 170.0, 91.0, 57.0, 34.0, 37.0, 13.0, 10.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.498046875, -2.3984375, -2.298828125, -2.19921875, -2.099609375, -2.0, -1.900390625, -1.80078125, -1.701171875, -1.6015625, -1.501953125, -1.40234375, -1.302734375, -1.203125, -1.103515625, -1.00390625, -0.904296875, -0.8046875, -0.705078125, -0.60546875, -0.505859375, -0.40625, -0.306640625, -0.20703125, -0.107421875, -0.0078125, 0.091796875, 0.19140625, 0.291015625, 0.390625, 0.490234375, 0.58984375, 0.689453125, 0.7890625, 0.888671875, 0.98828125, 1.087890625, 1.1875, 1.287109375, 1.38671875, 1.486328125, 1.5859375, 1.685546875, 1.78515625, 1.884765625, 1.984375, 2.083984375, 2.18359375, 2.283203125, 2.3828125, 2.482421875, 2.58203125, 2.681640625, 2.78125, 2.880859375, 2.98046875, 3.080078125, 3.1796875, 3.279296875, 3.37890625, 3.478515625, 3.578125, 3.677734375, 3.77734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 11.0, 12.0, 15.0, 21.0, 24.0, 39.0, 67.0, 83.0, 146.0, 303.0, 775.0, 1287.0, 605.0, 247.0, 151.0, 74.0, 60.0, 39.0, 31.0, 21.0, 12.0, 6.0, 5.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.366943359375, -3.27685546875, -3.186767578125, -3.0966796875, -3.006591796875, -2.91650390625, -2.826416015625, -2.736328125, -2.646240234375, -2.55615234375, -2.466064453125, -2.3759765625, -2.285888671875, -2.19580078125, -2.105712890625, -2.015625, -1.925537109375, -1.83544921875, -1.745361328125, -1.6552734375, -1.565185546875, -1.47509765625, -1.385009765625, -1.294921875, -1.204833984375, -1.11474609375, -1.024658203125, -0.9345703125, -0.844482421875, -0.75439453125, -0.664306640625, -0.57421875, -0.484130859375, -0.39404296875, -0.303955078125, -0.2138671875, -0.123779296875, -0.03369140625, 0.056396484375, 0.146484375, 0.236572265625, 0.32666015625, 0.416748046875, 0.5068359375, 0.596923828125, 0.68701171875, 0.777099609375, 0.8671875, 0.957275390625, 1.04736328125, 1.137451171875, 1.2275390625, 1.317626953125, 1.40771484375, 1.497802734375, 1.587890625, 1.677978515625, 1.76806640625, 1.858154296875, 1.9482421875, 2.038330078125, 2.12841796875, 2.218505859375, 2.30859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 20.0, 53.0, 147.0, 291.0, 297.0, 112.0, 48.0, 16.0, 1.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.45870590209961, -15.191529273986816, -13.924352645874023, -12.657175064086914, -11.389998435974121, -10.122821807861328, -8.855644226074219, -7.588467597961426, -6.321290969848633, -5.05411434173584, -3.7869372367858887, -2.5197603702545166, -1.2525835037231445, 0.014593124389648438, 1.2817702293395996, 2.548947334289551, 3.8161239624023438, 5.083300590515137, 6.350477695465088, 7.617654800415039, 8.884831428527832, 10.152008056640625, 11.419185638427734, 12.686362266540527, 13.95353889465332, 15.220715522766113, 16.487892150878906, 17.755069732666016, 19.022247314453125, 20.2894229888916, 21.55660057067871, 22.823776245117188, 24.090957641601562, 25.358135223388672, 26.62531089782715, 27.892488479614258, 29.159664154052734, 30.426841735839844, 31.694019317626953, 32.96119689941406, 34.228370666503906, 35.495548248291016, 36.762725830078125, 38.02989959716797, 39.29707717895508, 40.56425476074219, 41.8314323425293, 43.098609924316406, 44.365787506103516, 45.632965087890625, 46.900142669677734, 48.16731643676758, 49.43449401855469, 50.7016716003418, 51.968849182128906, 53.236026763916016, 54.503204345703125, 55.770381927490234, 57.037559509277344, 58.30473327636719, 59.5719108581543, 60.839088439941406, 62.106266021728516, 63.373443603515625, 64.64061737060547]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 2.0, 3.0, 8.0, 5.0, 9.0, 14.0, 11.0, 12.0, 21.0, 18.0, 23.0, 23.0, 21.0, 31.0, 29.0, 34.0, 28.0, 32.0, 40.0, 43.0, 61.0, 44.0, 44.0, 45.0, 33.0, 50.0, 54.0, 36.0, 20.0, 27.0, 28.0, 24.0, 20.0, 21.0, 14.0, 10.0, 7.0, 10.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.347648620605469, -9.04265308380127, -8.73765754699707, -8.432662963867188, -8.127667427062988, -7.822671890258789, -7.51767635345459, -7.212680816650391, -6.90768575668335, -6.60269021987915, -6.297695159912109, -5.99269962310791, -5.687704086303711, -5.38270902633667, -5.077713489532471, -4.77271842956543, -4.4677228927612305, -4.162727355957031, -3.8577322959899902, -3.552736759185791, -3.247741460800171, -2.942746162414551, -2.6377506256103516, -2.3327553272247314, -2.0277600288391113, -1.7227647304534912, -1.4177693128585815, -1.1127738952636719, -0.8077785968780518, -0.5027832984924316, -0.19778788089752197, 0.1072075366973877, 0.4122018814086914, 0.7171972393989563, 1.0221925973892212, 1.3271880149841309, 1.632183313369751, 1.937178611755371, 2.2421741485595703, 2.5471694469451904, 2.8521647453308105, 3.1571600437164307, 3.462155342102051, 3.76715087890625, 4.072146415710449, 4.37714147567749, 4.6821370124816895, 4.9871320724487305, 5.29212760925293, 5.597123146057129, 5.90211820602417, 6.207113742828369, 6.51210880279541, 6.817104339599609, 7.122099876403809, 7.427095413208008, 7.732090473175049, 8.03708553314209, 8.342081069946289, 8.647076606750488, 8.952072143554688, 9.25706672668457, 9.56206226348877, 9.867057800292969, 10.172053337097168]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 15.0, 38.0, 45.0, 70.0, 103.0, 171.0, 291.0, 417.0, 708.0, 1243.0, 2536.0, 4763.0, 10496.0, 24762.0, 67734.0, 270896.0, 479122.0, 118280.0, 37711.0, 15103.0, 6752.0, 3257.0, 1684.0, 925.0, 556.0, 318.0, 176.0, 130.0, 80.0, 59.0, 27.0, 22.0, 12.0, 15.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.99237060546875, -1.9241943359375, -1.85601806640625, -1.787841796875, -1.71966552734375, -1.6514892578125, -1.58331298828125, -1.51513671875, -1.44696044921875, -1.3787841796875, -1.31060791015625, -1.242431640625, -1.17425537109375, -1.1060791015625, -1.03790283203125, -0.9697265625, -0.90155029296875, -0.8333740234375, -0.76519775390625, -0.697021484375, -0.62884521484375, -0.5606689453125, -0.49249267578125, -0.42431640625, -0.35614013671875, -0.2879638671875, -0.21978759765625, -0.151611328125, -0.08343505859375, -0.0152587890625, 0.05291748046875, 0.12109375, 0.18927001953125, 0.2574462890625, 0.32562255859375, 0.393798828125, 0.46197509765625, 0.5301513671875, 0.59832763671875, 0.66650390625, 0.73468017578125, 0.8028564453125, 0.87103271484375, 0.939208984375, 1.00738525390625, 1.0755615234375, 1.14373779296875, 1.2119140625, 1.28009033203125, 1.3482666015625, 1.41644287109375, 1.484619140625, 1.55279541015625, 1.6209716796875, 1.68914794921875, 1.75732421875, 1.82550048828125, 1.8936767578125, 1.96185302734375, 2.030029296875, 2.09820556640625, 2.1663818359375, 2.23455810546875, 2.302734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 12.0, 19.0, 18.0, 24.0, 29.0, 33.0, 33.0, 42.0, 59.0, 45.0, 53.0, 42.0, 49.0, 55.0, 48.0, 51.0, 47.0, 45.0, 43.0, 40.0, 33.0, 29.0, 22.0, 19.0, 18.0, 12.0, 21.0, 8.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86181640625, -0.83673095703125, -0.8116455078125, -0.78656005859375, -0.761474609375, -0.73638916015625, -0.7113037109375, -0.68621826171875, -0.6611328125, -0.63604736328125, -0.6109619140625, -0.58587646484375, -0.560791015625, -0.53570556640625, -0.5106201171875, -0.48553466796875, -0.46044921875, -0.43536376953125, -0.4102783203125, -0.38519287109375, -0.360107421875, -0.33502197265625, -0.3099365234375, -0.28485107421875, -0.259765625, -0.23468017578125, -0.2095947265625, -0.18450927734375, -0.159423828125, -0.13433837890625, -0.1092529296875, -0.08416748046875, -0.05908203125, -0.03399658203125, -0.0089111328125, 0.01617431640625, 0.041259765625, 0.06634521484375, 0.0914306640625, 0.11651611328125, 0.1416015625, 0.16668701171875, 0.1917724609375, 0.21685791015625, 0.241943359375, 0.26702880859375, 0.2921142578125, 0.31719970703125, 0.34228515625, 0.36737060546875, 0.3924560546875, 0.41754150390625, 0.442626953125, 0.46771240234375, 0.4927978515625, 0.51788330078125, 0.54296875, 0.56805419921875, 0.5931396484375, 0.61822509765625, 0.643310546875, 0.66839599609375, 0.6934814453125, 0.71856689453125, 0.74365234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 6.0, 11.0, 15.0, 18.0, 26.0, 20.0, 40.0, 64.0, 87.0, 105.0, 173.0, 313.0, 436.0, 823.0, 1598.0, 4020.0, 13695.0, 81095.0, 806968.0, 113560.0, 16744.0, 4572.0, 1872.0, 898.0, 475.0, 271.0, 183.0, 113.0, 87.0, 79.0, 36.0, 35.0, 29.0, 17.0, 9.0, 13.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.53515625, -3.40692138671875, -3.2786865234375, -3.15045166015625, -3.022216796875, -2.89398193359375, -2.7657470703125, -2.63751220703125, -2.50927734375, -2.38104248046875, -2.2528076171875, -2.12457275390625, -1.996337890625, -1.86810302734375, -1.7398681640625, -1.61163330078125, -1.4833984375, -1.35516357421875, -1.2269287109375, -1.09869384765625, -0.970458984375, -0.84222412109375, -0.7139892578125, -0.58575439453125, -0.45751953125, -0.32928466796875, -0.2010498046875, -0.07281494140625, 0.055419921875, 0.18365478515625, 0.3118896484375, 0.44012451171875, 0.568359375, 0.69659423828125, 0.8248291015625, 0.95306396484375, 1.081298828125, 1.20953369140625, 1.3377685546875, 1.46600341796875, 1.59423828125, 1.72247314453125, 1.8507080078125, 1.97894287109375, 2.107177734375, 2.23541259765625, 2.3636474609375, 2.49188232421875, 2.6201171875, 2.74835205078125, 2.8765869140625, 3.00482177734375, 3.133056640625, 3.26129150390625, 3.3895263671875, 3.51776123046875, 3.64599609375, 3.77423095703125, 3.9024658203125, 4.03070068359375, 4.158935546875, 4.28717041015625, 4.4154052734375, 4.54364013671875, 4.671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 14.0, 16.0, 16.0, 27.0, 35.0, 34.0, 41.0, 58.0, 52.0, 60.0, 55.0, 59.0, 61.0, 50.0, 63.0, 50.0, 52.0, 46.0, 28.0, 34.0, 28.0, 28.0, 22.0, 12.0, 7.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.162841796875, -4.01708984375, -3.871337890625, -3.7255859375, -3.579833984375, -3.43408203125, -3.288330078125, -3.142578125, -2.996826171875, -2.85107421875, -2.705322265625, -2.5595703125, -2.413818359375, -2.26806640625, -2.122314453125, -1.9765625, -1.830810546875, -1.68505859375, -1.539306640625, -1.3935546875, -1.247802734375, -1.10205078125, -0.956298828125, -0.810546875, -0.664794921875, -0.51904296875, -0.373291015625, -0.2275390625, -0.081787109375, 0.06396484375, 0.209716796875, 0.35546875, 0.501220703125, 0.64697265625, 0.792724609375, 0.9384765625, 1.084228515625, 1.22998046875, 1.375732421875, 1.521484375, 1.667236328125, 1.81298828125, 1.958740234375, 2.1044921875, 2.250244140625, 2.39599609375, 2.541748046875, 2.6875, 2.833251953125, 2.97900390625, 3.124755859375, 3.2705078125, 3.416259765625, 3.56201171875, 3.707763671875, 3.853515625, 3.999267578125, 4.14501953125, 4.290771484375, 4.4365234375, 4.582275390625, 4.72802734375, 4.873779296875, 5.01953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 8.0, 2.0, 4.0, 19.0, 11.0, 21.0, 35.0, 52.0, 50.0, 94.0, 170.0, 230.0, 497.0, 868.0, 2012.0, 4855.0, 15351.0, 84789.0, 783404.0, 125920.0, 19744.0, 5836.0, 2217.0, 1024.0, 545.0, 272.0, 195.0, 115.0, 67.0, 44.0, 41.0, 15.0, 15.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.921966552734375, -1.86639404296875, -1.810821533203125, -1.7552490234375, -1.699676513671875, -1.64410400390625, -1.588531494140625, -1.532958984375, -1.477386474609375, -1.42181396484375, -1.366241455078125, -1.3106689453125, -1.255096435546875, -1.19952392578125, -1.143951416015625, -1.08837890625, -1.032806396484375, -0.97723388671875, -0.921661376953125, -0.8660888671875, -0.810516357421875, -0.75494384765625, -0.699371337890625, -0.643798828125, -0.588226318359375, -0.53265380859375, -0.477081298828125, -0.4215087890625, -0.365936279296875, -0.31036376953125, -0.254791259765625, -0.19921875, -0.143646240234375, -0.08807373046875, -0.032501220703125, 0.0230712890625, 0.078643798828125, 0.13421630859375, 0.189788818359375, 0.245361328125, 0.300933837890625, 0.35650634765625, 0.412078857421875, 0.4676513671875, 0.523223876953125, 0.57879638671875, 0.634368896484375, 0.68994140625, 0.745513916015625, 0.80108642578125, 0.856658935546875, 0.9122314453125, 0.967803955078125, 1.02337646484375, 1.078948974609375, 1.134521484375, 1.190093994140625, 1.24566650390625, 1.301239013671875, 1.3568115234375, 1.412384033203125, 1.46795654296875, 1.523529052734375, 1.5791015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 13.0, 10.0, 12.0, 29.0, 34.0, 53.0, 104.0, 152.0, 206.0, 140.0, 79.0, 47.0, 30.0, 13.0, 15.0, 9.0, 5.0, 3.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0005998611450195312, -0.0005850009620189667, -0.0005701407790184021, -0.0005552805960178375, -0.000540420413017273, -0.0005255602300167084, -0.0005107000470161438, -0.0004958398640155792, -0.00048097968101501465, -0.0004661194980144501, -0.0004512593150138855, -0.0004363991320133209, -0.00042153894901275635, -0.00040667876601219177, -0.0003918185830116272, -0.0003769584000110626, -0.00036209821701049805, -0.00034723803400993347, -0.0003323778510093689, -0.0003175176680088043, -0.00030265748500823975, -0.00028779730200767517, -0.0002729371190071106, -0.000258076936006546, -0.00024321675300598145, -0.00022835657000541687, -0.0002134963870048523, -0.00019863620400428772, -0.00018377602100372314, -0.00016891583800315857, -0.000154055655002594, -0.00013919547200202942, -0.00012433528900146484, -0.00010947510600090027, -9.46149230003357e-05, -7.975473999977112e-05, -6.489455699920654e-05, -5.003437399864197e-05, -3.517419099807739e-05, -2.0314007997512817e-05, -5.453824996948242e-06, 9.406358003616333e-06, 2.4266541004180908e-05, 3.9126724004745483e-05, 5.398690700531006e-05, 6.884709000587463e-05, 8.370727300643921e-05, 9.856745600700378e-05, 0.00011342763900756836, 0.00012828782200813293, 0.0001431480050086975, 0.00015800818800926208, 0.00017286837100982666, 0.00018772855401039124, 0.0002025887370109558, 0.00021744892001152039, 0.00023230910301208496, 0.00024716928601264954, 0.0002620294690132141, 0.0002768896520137787, 0.00029174983501434326, 0.00030661001801490784, 0.0003214702010154724, 0.000336330384016037, 0.00035119056701660156]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 15.0, 13.0, 27.0, 27.0, 39.0, 49.0, 45.0, 91.0, 160.0, 225.0, 358.0, 733.0, 1520.0, 4087.0, 14565.0, 122642.0, 810964.0, 75515.0, 11130.0, 3336.0, 1347.0, 628.0, 321.0, 230.0, 157.0, 81.0, 59.0, 44.0, 33.0, 18.0, 15.0, 14.0, 11.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.791015625, -1.7339935302734375, -1.676971435546875, -1.6199493408203125, -1.56292724609375, -1.5059051513671875, -1.448883056640625, -1.3918609619140625, -1.3348388671875, -1.2778167724609375, -1.220794677734375, -1.1637725830078125, -1.10675048828125, -1.0497283935546875, -0.992706298828125, -0.9356842041015625, -0.878662109375, -0.8216400146484375, -0.764617919921875, -0.7075958251953125, -0.65057373046875, -0.5935516357421875, -0.536529541015625, -0.4795074462890625, -0.4224853515625, -0.3654632568359375, -0.308441162109375, -0.2514190673828125, -0.19439697265625, -0.1373748779296875, -0.080352783203125, -0.0233306884765625, 0.03369140625, 0.0907135009765625, 0.147735595703125, 0.2047576904296875, 0.26177978515625, 0.3188018798828125, 0.375823974609375, 0.4328460693359375, 0.4898681640625, 0.5468902587890625, 0.603912353515625, 0.6609344482421875, 0.71795654296875, 0.7749786376953125, 0.832000732421875, 0.8890228271484375, 0.946044921875, 1.0030670166015625, 1.060089111328125, 1.1171112060546875, 1.17413330078125, 1.2311553955078125, 1.288177490234375, 1.3451995849609375, 1.4022216796875, 1.4592437744140625, 1.516265869140625, 1.5732879638671875, 1.63031005859375, 1.6873321533203125, 1.744354248046875, 1.8013763427734375, 1.8583984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 13.0, 9.0, 23.0, 17.0, 19.0, 27.0, 30.0, 41.0, 69.0, 72.0, 113.0, 102.0, 86.0, 83.0, 53.0, 53.0, 33.0, 35.0, 28.0, 14.0, 12.0, 15.0, 6.0, 7.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.595703125, -1.545318603515625, -1.49493408203125, -1.444549560546875, -1.3941650390625, -1.343780517578125, -1.29339599609375, -1.243011474609375, -1.192626953125, -1.142242431640625, -1.09185791015625, -1.041473388671875, -0.9910888671875, -0.940704345703125, -0.89031982421875, -0.839935302734375, -0.78955078125, -0.739166259765625, -0.68878173828125, -0.638397216796875, -0.5880126953125, -0.537628173828125, -0.48724365234375, -0.436859130859375, -0.386474609375, -0.336090087890625, -0.28570556640625, -0.235321044921875, -0.1849365234375, -0.134552001953125, -0.08416748046875, -0.033782958984375, 0.0166015625, 0.066986083984375, 0.11737060546875, 0.167755126953125, 0.2181396484375, 0.268524169921875, 0.31890869140625, 0.369293212890625, 0.419677734375, 0.470062255859375, 0.52044677734375, 0.570831298828125, 0.6212158203125, 0.671600341796875, 0.72198486328125, 0.772369384765625, 0.82275390625, 0.873138427734375, 0.92352294921875, 0.973907470703125, 1.0242919921875, 1.074676513671875, 1.12506103515625, 1.175445556640625, 1.225830078125, 1.276214599609375, 1.32659912109375, 1.376983642578125, 1.4273681640625, 1.477752685546875, 1.52813720703125, 1.578521728515625, 1.62890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 11.0, 22.0, 109.0, 277.0, 366.0, 142.0, 50.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.76612091064453, -18.912282943725586, -17.058446884155273, -15.204608917236328, -13.3507719039917, -11.49693489074707, -9.643096923828125, -7.789259910583496, -5.935422897338867, -4.081585884094238, -2.227748394012451, -0.37391090393066406, 1.4799261093139648, 3.3337631225585938, 5.187601089477539, 7.041438102722168, 8.895275115966797, 10.749112129211426, 12.602949142456055, 14.456787109375, 16.310623168945312, 18.164461135864258, 20.018299102783203, 21.872135162353516, 23.72597312927246, 25.579811096191406, 27.43364715576172, 29.287485122680664, 31.14132308959961, 32.99515914916992, 34.8489990234375, 36.70283508300781, 38.556671142578125, 40.41050720214844, 42.264347076416016, 44.11818313598633, 45.97201919555664, 47.82585906982422, 49.67969512939453, 51.533531188964844, 53.387367248535156, 55.24120330810547, 57.09504318237305, 58.94887924194336, 60.80271530151367, 62.65655517578125, 64.51039123535156, 66.36422729492188, 68.21806335449219, 70.0718994140625, 71.92573547363281, 73.77957153320312, 75.63341522216797, 77.48725128173828, 79.3410873413086, 81.1949234008789, 83.04876708984375, 84.90260314941406, 86.75643920898438, 88.61027526855469, 90.46411895751953, 92.31795501708984, 94.17179107666016, 96.02562713623047, 97.87946319580078]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 11.0, 15.0, 8.0, 13.0, 22.0, 16.0, 17.0, 31.0, 26.0, 32.0, 24.0, 28.0, 35.0, 41.0, 38.0, 48.0, 41.0, 50.0, 48.0, 40.0, 54.0, 36.0, 46.0, 35.0, 22.0, 27.0, 27.0, 22.0, 14.0, 20.0, 14.0, 14.0, 14.0, 14.0, 8.0, 10.0, 8.0, 2.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.20739459991455, -11.807621002197266, -11.407846450805664, -11.008072853088379, -10.608299255371094, -10.208524703979492, -9.808751106262207, -9.408977508544922, -9.00920295715332, -8.609429359436035, -8.209654808044434, -7.809881210327148, -7.410107612609863, -7.01033353805542, -6.610559463500977, -6.210785865783691, -5.811012268066406, -5.411238193511963, -5.011464595794678, -4.611690521240234, -4.211916923522949, -3.812142848968506, -3.4123687744140625, -3.0125949382781982, -2.612821102142334, -2.2130472660064697, -1.813273310661316, -1.413499355316162, -1.0137255191802979, -0.6139516830444336, -0.21417760848999023, 0.18559622764587402, 0.5853691101074219, 0.9851430058479309, 1.38491690158844, 1.7846908569335938, 2.184464693069458, 2.5842385292053223, 2.9840126037597656, 3.38378643989563, 3.783560276031494, 4.1833343505859375, 4.583107948303223, 4.982882022857666, 5.382656097412109, 5.7824296951293945, 6.182203769683838, 6.581977844238281, 6.981751441955566, 7.38152551651001, 7.781299114227295, 8.181073188781738, 8.580846786499023, 8.980621337890625, 9.38039493560791, 9.780168533325195, 10.179943084716797, 10.579716682434082, 10.979491233825684, 11.379264831542969, 11.779038429260254, 12.178812026977539, 12.57858657836914, 12.978360176086426, 13.378133773803711]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 4.0, 11.0, 12.0, 22.0, 21.0, 31.0, 45.0, 48.0, 89.0, 162.0, 249.0, 726.0, 2897.0, 24829.0, 2930324.0, 1213016.0, 18085.0, 2353.0, 634.0, 245.0, 156.0, 88.0, 63.0, 39.0, 33.0, 18.0, 17.0, 17.0, 10.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.920166015625, -3.79345703125, -3.666748046875, -3.5400390625, -3.413330078125, -3.28662109375, -3.159912109375, -3.033203125, -2.906494140625, -2.77978515625, -2.653076171875, -2.5263671875, -2.399658203125, -2.27294921875, -2.146240234375, -2.01953125, -1.892822265625, -1.76611328125, -1.639404296875, -1.5126953125, -1.385986328125, -1.25927734375, -1.132568359375, -1.005859375, -0.879150390625, -0.75244140625, -0.625732421875, -0.4990234375, -0.372314453125, -0.24560546875, -0.118896484375, 0.0078125, 0.134521484375, 0.26123046875, 0.387939453125, 0.5146484375, 0.641357421875, 0.76806640625, 0.894775390625, 1.021484375, 1.148193359375, 1.27490234375, 1.401611328125, 1.5283203125, 1.655029296875, 1.78173828125, 1.908447265625, 2.03515625, 2.161865234375, 2.28857421875, 2.415283203125, 2.5419921875, 2.668701171875, 2.79541015625, 2.922119140625, 3.048828125, 3.175537109375, 3.30224609375, 3.428955078125, 3.5556640625, 3.682373046875, 3.80908203125, 3.935791015625, 4.0625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 10.0, 16.0, 3.0, 15.0, 16.0, 20.0, 38.0, 25.0, 33.0, 40.0, 39.0, 38.0, 56.0, 36.0, 49.0, 54.0, 54.0, 47.0, 52.0, 53.0, 47.0, 35.0, 38.0, 33.0, 26.0, 26.0, 24.0, 17.0, 11.0, 6.0, 6.0, 4.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.77099609375, -0.7472686767578125, -0.723541259765625, -0.6998138427734375, -0.67608642578125, -0.6523590087890625, -0.628631591796875, -0.6049041748046875, -0.5811767578125, -0.5574493408203125, -0.533721923828125, -0.5099945068359375, -0.48626708984375, -0.4625396728515625, -0.438812255859375, -0.4150848388671875, -0.391357421875, -0.3676300048828125, -0.343902587890625, -0.3201751708984375, -0.29644775390625, -0.2727203369140625, -0.248992919921875, -0.2252655029296875, -0.2015380859375, -0.1778106689453125, -0.154083251953125, -0.1303558349609375, -0.10662841796875, -0.0829010009765625, -0.059173583984375, -0.0354461669921875, -0.01171875, 0.0120086669921875, 0.035736083984375, 0.0594635009765625, 0.08319091796875, 0.1069183349609375, 0.130645751953125, 0.1543731689453125, 0.1781005859375, 0.2018280029296875, 0.225555419921875, 0.2492828369140625, 0.27301025390625, 0.2967376708984375, 0.320465087890625, 0.3441925048828125, 0.367919921875, 0.3916473388671875, 0.415374755859375, 0.4391021728515625, 0.46282958984375, 0.4865570068359375, 0.510284423828125, 0.5340118408203125, 0.5577392578125, 0.5814666748046875, 0.605194091796875, 0.6289215087890625, 0.65264892578125, 0.6763763427734375, 0.700103759765625, 0.7238311767578125, 0.74755859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 8.0, 4.0, 7.0, 10.0, 14.0, 10.0, 27.0, 25.0, 41.0, 56.0, 80.0, 117.0, 248.0, 505.0, 1139.0, 3006.0, 9471.0, 40522.0, 384852.0, 3513525.0, 201247.0, 28181.0, 7230.0, 2309.0, 819.0, 367.0, 174.0, 93.0, 56.0, 38.0, 32.0, 23.0, 20.0, 5.0, 2.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.342864990234375, -2.25408935546875, -2.165313720703125, -2.0765380859375, -1.987762451171875, -1.89898681640625, -1.810211181640625, -1.721435546875, -1.632659912109375, -1.54388427734375, -1.455108642578125, -1.3663330078125, -1.277557373046875, -1.18878173828125, -1.100006103515625, -1.01123046875, -0.922454833984375, -0.83367919921875, -0.744903564453125, -0.6561279296875, -0.567352294921875, -0.47857666015625, -0.389801025390625, -0.301025390625, -0.212249755859375, -0.12347412109375, -0.034698486328125, 0.0540771484375, 0.142852783203125, 0.23162841796875, 0.320404052734375, 0.4091796875, 0.497955322265625, 0.58673095703125, 0.675506591796875, 0.7642822265625, 0.853057861328125, 0.94183349609375, 1.030609130859375, 1.119384765625, 1.208160400390625, 1.29693603515625, 1.385711669921875, 1.4744873046875, 1.563262939453125, 1.65203857421875, 1.740814208984375, 1.82958984375, 1.918365478515625, 2.00714111328125, 2.095916748046875, 2.1846923828125, 2.273468017578125, 2.36224365234375, 2.451019287109375, 2.539794921875, 2.628570556640625, 2.71734619140625, 2.806121826171875, 2.8948974609375, 2.983673095703125, 3.07244873046875, 3.161224365234375, 3.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 8.0, 15.0, 23.0, 37.0, 44.0, 107.0, 227.0, 575.0, 1507.0, 890.0, 332.0, 129.0, 57.0, 47.0, 19.0, 22.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.1947021484375, -5.072998046875, -4.9512939453125, -4.82958984375, -4.7078857421875, -4.586181640625, -4.4644775390625, -4.3427734375, -4.2210693359375, -4.099365234375, -3.9776611328125, -3.85595703125, -3.7342529296875, -3.612548828125, -3.4908447265625, -3.369140625, -3.2474365234375, -3.125732421875, -3.0040283203125, -2.88232421875, -2.7606201171875, -2.638916015625, -2.5172119140625, -2.3955078125, -2.2738037109375, -2.152099609375, -2.0303955078125, -1.90869140625, -1.7869873046875, -1.665283203125, -1.5435791015625, -1.421875, -1.3001708984375, -1.178466796875, -1.0567626953125, -0.93505859375, -0.8133544921875, -0.691650390625, -0.5699462890625, -0.4482421875, -0.3265380859375, -0.204833984375, -0.0831298828125, 0.03857421875, 0.1602783203125, 0.281982421875, 0.4036865234375, 0.525390625, 0.6470947265625, 0.768798828125, 0.8905029296875, 1.01220703125, 1.1339111328125, 1.255615234375, 1.3773193359375, 1.4990234375, 1.6207275390625, 1.742431640625, 1.8641357421875, 1.98583984375, 2.1075439453125, 2.229248046875, 2.3509521484375, 2.47265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 19.0, 69.0, 158.0, 278.0, 251.0, 120.0, 56.0, 10.0, 11.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.7574348449707, -39.707603454589844, -38.65777587890625, -37.60794448852539, -36.55811309814453, -35.50828552246094, -34.45845413208008, -33.408626556396484, -32.358795166015625, -31.3089656829834, -30.259136199951172, -29.209304809570312, -28.159475326538086, -27.10964584350586, -26.059814453125, -25.009984970092773, -23.960155487060547, -22.91032600402832, -21.860496520996094, -20.810665130615234, -19.760835647583008, -18.71100616455078, -17.661174774169922, -16.611345291137695, -15.561515808105469, -14.511686325073242, -13.4618558883667, -12.412025451660156, -11.36219596862793, -10.312366485595703, -9.26253604888916, -8.212705612182617, -7.162876129150391, -6.113046169281006, -5.063216209411621, -4.013386249542236, -2.9635562896728516, -1.9137263298034668, -0.863896369934082, 0.18593358993530273, 1.2357635498046875, 2.2855935096740723, 3.335423469543457, 4.385253429412842, 5.435083389282227, 6.484913349151611, 7.534743309020996, 8.584573745727539, 9.634403228759766, 10.684232711791992, 11.734063148498535, 12.783893585205078, 13.833723068237305, 14.883552551269531, 15.933382987976074, 16.983213424682617, 18.033042907714844, 19.08287239074707, 20.132701873779297, 21.182533264160156, 22.232362747192383, 23.28219223022461, 24.33202362060547, 25.381853103637695, 26.431682586669922]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 8.0, 9.0, 15.0, 17.0, 23.0, 33.0, 26.0, 27.0, 42.0, 32.0, 35.0, 45.0, 47.0, 47.0, 48.0, 48.0, 54.0, 49.0, 46.0, 47.0, 36.0, 46.0, 31.0, 35.0, 26.0, 19.0, 25.0, 13.0, 13.0, 4.0, 9.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.534239768981934, -10.21699333190918, -9.899747848510742, -9.582501411437988, -9.265254974365234, -8.94800853729248, -8.630763053894043, -8.313516616821289, -7.996270179748535, -7.6790242195129395, -7.3617777824401855, -7.04453182220459, -6.727285385131836, -6.41003942489624, -6.0927934646606445, -5.775547027587891, -5.458301067352295, -5.141055107116699, -4.823808670043945, -4.50656270980835, -4.189316272735596, -3.8720703125, -3.554824113845825, -3.2375779151916504, -2.9203317165374756, -2.603085517883301, -2.285839319229126, -1.9685932397842407, -1.651347041130066, -1.3341008424758911, -1.0168547630310059, -0.699608564376831, -0.38236236572265625, -0.06511619687080383, 0.2521299719810486, 0.5693761110305786, 0.8866223096847534, 1.2038685083389282, 1.5211145877838135, 1.8383607864379883, 2.155606985092163, 2.472853183746338, 2.7900993824005127, 3.1073455810546875, 3.424591541290283, 3.741837978363037, 4.059083938598633, 4.376330375671387, 4.693576335906982, 5.010822296142578, 5.328068733215332, 5.645314693450928, 5.962561130523682, 6.279807090759277, 6.597053527832031, 6.914299488067627, 7.231545448303223, 7.548791408538818, 7.866037845611572, 8.183283805847168, 8.500530242919922, 8.817776679992676, 9.135022163391113, 9.452268600463867, 9.769515037536621]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 18.0, 19.0, 18.0, 52.0, 73.0, 150.0, 240.0, 403.0, 736.0, 1334.0, 2816.0, 6081.0, 14272.0, 37391.0, 132209.0, 526493.0, 235461.0, 55228.0, 19863.0, 8147.0, 3686.0, 1777.0, 925.0, 450.0, 270.0, 140.0, 113.0, 68.0, 43.0, 33.0, 10.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9775390625, -1.9109039306640625, -1.844268798828125, -1.7776336669921875, -1.71099853515625, -1.6443634033203125, -1.577728271484375, -1.5110931396484375, -1.4444580078125, -1.3778228759765625, -1.311187744140625, -1.2445526123046875, -1.17791748046875, -1.1112823486328125, -1.044647216796875, -0.9780120849609375, -0.911376953125, -0.8447418212890625, -0.778106689453125, -0.7114715576171875, -0.64483642578125, -0.5782012939453125, -0.511566162109375, -0.4449310302734375, -0.3782958984375, -0.3116607666015625, -0.245025634765625, -0.1783905029296875, -0.11175537109375, -0.0451202392578125, 0.021514892578125, 0.0881500244140625, 0.15478515625, 0.2214202880859375, 0.288055419921875, 0.3546905517578125, 0.42132568359375, 0.4879608154296875, 0.554595947265625, 0.6212310791015625, 0.6878662109375, 0.7545013427734375, 0.821136474609375, 0.8877716064453125, 0.95440673828125, 1.0210418701171875, 1.087677001953125, 1.1543121337890625, 1.220947265625, 1.2875823974609375, 1.354217529296875, 1.4208526611328125, 1.48748779296875, 1.5541229248046875, 1.620758056640625, 1.6873931884765625, 1.7540283203125, 1.8206634521484375, 1.887298583984375, 1.9539337158203125, 2.02056884765625, 2.0872039794921875, 2.153839111328125, 2.2204742431640625, 2.287109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 3.0, 12.0, 11.0, 10.0, 10.0, 16.0, 17.0, 20.0, 29.0, 27.0, 29.0, 36.0, 36.0, 38.0, 55.0, 43.0, 37.0, 27.0, 45.0, 53.0, 53.0, 54.0, 39.0, 41.0, 39.0, 36.0, 23.0, 22.0, 22.0, 18.0, 19.0, 11.0, 10.0, 7.0, 11.0, 4.0, 9.0, 6.0, 2.0, 5.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.765625, -0.74267578125, -0.7197265625, -0.69677734375, -0.673828125, -0.65087890625, -0.6279296875, -0.60498046875, -0.58203125, -0.55908203125, -0.5361328125, -0.51318359375, -0.490234375, -0.46728515625, -0.4443359375, -0.42138671875, -0.3984375, -0.37548828125, -0.3525390625, -0.32958984375, -0.306640625, -0.28369140625, -0.2607421875, -0.23779296875, -0.21484375, -0.19189453125, -0.1689453125, -0.14599609375, -0.123046875, -0.10009765625, -0.0771484375, -0.05419921875, -0.03125, -0.00830078125, 0.0146484375, 0.03759765625, 0.060546875, 0.08349609375, 0.1064453125, 0.12939453125, 0.15234375, 0.17529296875, 0.1982421875, 0.22119140625, 0.244140625, 0.26708984375, 0.2900390625, 0.31298828125, 0.3359375, 0.35888671875, 0.3818359375, 0.40478515625, 0.427734375, 0.45068359375, 0.4736328125, 0.49658203125, 0.51953125, 0.54248046875, 0.5654296875, 0.58837890625, 0.611328125, 0.63427734375, 0.6572265625, 0.68017578125, 0.703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 4.0, 9.0, 8.0, 19.0, 15.0, 28.0, 41.0, 53.0, 103.0, 128.0, 258.0, 427.0, 742.0, 1548.0, 3845.0, 13603.0, 71863.0, 770607.0, 153505.0, 21850.0, 5607.0, 2093.0, 948.0, 478.0, 276.0, 147.0, 99.0, 72.0, 47.0, 29.0, 31.0, 13.0, 10.0, 14.0, 7.0, 5.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.92633056640625, -3.8096923828125, -3.69305419921875, -3.576416015625, -3.45977783203125, -3.3431396484375, -3.22650146484375, -3.10986328125, -2.99322509765625, -2.8765869140625, -2.75994873046875, -2.643310546875, -2.52667236328125, -2.4100341796875, -2.29339599609375, -2.1767578125, -2.06011962890625, -1.9434814453125, -1.82684326171875, -1.710205078125, -1.59356689453125, -1.4769287109375, -1.36029052734375, -1.24365234375, -1.12701416015625, -1.0103759765625, -0.89373779296875, -0.777099609375, -0.66046142578125, -0.5438232421875, -0.42718505859375, -0.310546875, -0.19390869140625, -0.0772705078125, 0.03936767578125, 0.156005859375, 0.27264404296875, 0.3892822265625, 0.50592041015625, 0.62255859375, 0.73919677734375, 0.8558349609375, 0.97247314453125, 1.089111328125, 1.20574951171875, 1.3223876953125, 1.43902587890625, 1.5556640625, 1.67230224609375, 1.7889404296875, 1.90557861328125, 2.022216796875, 2.13885498046875, 2.2554931640625, 2.37213134765625, 2.48876953125, 2.60540771484375, 2.7220458984375, 2.83868408203125, 2.955322265625, 3.07196044921875, 3.1885986328125, 3.30523681640625, 3.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 7.0, 11.0, 13.0, 15.0, 17.0, 25.0, 31.0, 34.0, 43.0, 39.0, 60.0, 57.0, 67.0, 68.0, 87.0, 57.0, 57.0, 50.0, 51.0, 43.0, 37.0, 19.0, 16.0, 29.0, 11.0, 8.0, 9.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.300262451171875, -3.16107177734375, -3.021881103515625, -2.8826904296875, -2.743499755859375, -2.60430908203125, -2.465118408203125, -2.325927734375, -2.186737060546875, -2.04754638671875, -1.908355712890625, -1.7691650390625, -1.629974365234375, -1.49078369140625, -1.351593017578125, -1.21240234375, -1.073211669921875, -0.93402099609375, -0.794830322265625, -0.6556396484375, -0.516448974609375, -0.37725830078125, -0.238067626953125, -0.098876953125, 0.040313720703125, 0.17950439453125, 0.318695068359375, 0.4578857421875, 0.597076416015625, 0.73626708984375, 0.875457763671875, 1.0146484375, 1.153839111328125, 1.29302978515625, 1.432220458984375, 1.5714111328125, 1.710601806640625, 1.84979248046875, 1.988983154296875, 2.128173828125, 2.267364501953125, 2.40655517578125, 2.545745849609375, 2.6849365234375, 2.824127197265625, 2.96331787109375, 3.102508544921875, 3.24169921875, 3.380889892578125, 3.52008056640625, 3.659271240234375, 3.7984619140625, 3.937652587890625, 4.07684326171875, 4.216033935546875, 4.355224609375, 4.494415283203125, 4.63360595703125, 4.772796630859375, 4.9119873046875, 5.051177978515625, 5.19036865234375, 5.329559326171875, 5.46875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 5.0, 6.0, 15.0, 18.0, 23.0, 43.0, 73.0, 102.0, 195.0, 388.0, 1045.0, 3269.0, 13825.0, 114867.0, 791944.0, 104808.0, 12960.0, 2990.0, 1025.0, 427.0, 219.0, 103.0, 67.0, 38.0, 27.0, 15.0, 14.0, 12.0, 2.0, 8.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.509765625, -2.446197509765625, -2.38262939453125, -2.319061279296875, -2.2554931640625, -2.191925048828125, -2.12835693359375, -2.064788818359375, -2.001220703125, -1.937652587890625, -1.87408447265625, -1.810516357421875, -1.7469482421875, -1.683380126953125, -1.61981201171875, -1.556243896484375, -1.49267578125, -1.429107666015625, -1.36553955078125, -1.301971435546875, -1.2384033203125, -1.174835205078125, -1.11126708984375, -1.047698974609375, -0.984130859375, -0.920562744140625, -0.85699462890625, -0.793426513671875, -0.7298583984375, -0.666290283203125, -0.60272216796875, -0.539154052734375, -0.4755859375, -0.412017822265625, -0.34844970703125, -0.284881591796875, -0.2213134765625, -0.157745361328125, -0.09417724609375, -0.030609130859375, 0.032958984375, 0.096527099609375, 0.16009521484375, 0.223663330078125, 0.2872314453125, 0.350799560546875, 0.41436767578125, 0.477935791015625, 0.54150390625, 0.605072021484375, 0.66864013671875, 0.732208251953125, 0.7957763671875, 0.859344482421875, 0.92291259765625, 0.986480712890625, 1.050048828125, 1.113616943359375, 1.17718505859375, 1.240753173828125, 1.3043212890625, 1.367889404296875, 1.43145751953125, 1.495025634765625, 1.55859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 9.0, 8.0, 6.0, 14.0, 21.0, 19.0, 42.0, 55.0, 95.0, 132.0, 166.0, 116.0, 104.0, 77.0, 37.0, 30.0, 18.0, 10.0, 16.0, 9.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003952980041503906, -0.00038191676139831543, -0.00036853551864624023, -0.00035515427589416504, -0.00034177303314208984, -0.00032839179039001465, -0.00031501054763793945, -0.00030162930488586426, -0.00028824806213378906, -0.00027486681938171387, -0.00026148557662963867, -0.0002481043338775635, -0.00023472309112548828, -0.00022134184837341309, -0.0002079606056213379, -0.0001945793628692627, -0.0001811981201171875, -0.0001678168773651123, -0.0001544356346130371, -0.00014105439186096191, -0.00012767314910888672, -0.00011429190635681152, -0.00010091066360473633, -8.752942085266113e-05, -7.414817810058594e-05, -6.076693534851074e-05, -4.738569259643555e-05, -3.400444984436035e-05, -2.0623207092285156e-05, -7.241964340209961e-06, 6.139278411865234e-06, 1.952052116394043e-05, 3.2901763916015625e-05, 4.628300666809082e-05, 5.9664249420166016e-05, 7.304549217224121e-05, 8.64267349243164e-05, 9.98079776763916e-05, 0.0001131892204284668, 0.000126570463180542, 0.0001399517059326172, 0.00015333294868469238, 0.00016671419143676758, 0.00018009543418884277, 0.00019347667694091797, 0.00020685791969299316, 0.00022023916244506836, 0.00023362040519714355, 0.00024700164794921875, 0.00026038289070129395, 0.00027376413345336914, 0.00028714537620544434, 0.00030052661895751953, 0.0003139078617095947, 0.0003272891044616699, 0.0003406703472137451, 0.0003540515899658203, 0.0003674328327178955, 0.0003808140754699707, 0.0003941953182220459, 0.0004075765609741211, 0.0004209578037261963, 0.0004343390464782715, 0.0004477202892303467, 0.0004611015319824219]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 3.0, 7.0, 9.0, 10.0, 22.0, 39.0, 41.0, 52.0, 94.0, 138.0, 184.0, 315.0, 557.0, 1170.0, 2491.0, 5983.0, 19825.0, 104235.0, 649327.0, 215325.0, 33336.0, 8849.0, 3253.0, 1464.0, 740.0, 394.0, 206.0, 142.0, 111.0, 54.0, 43.0, 28.0, 19.0, 23.0, 7.0, 11.0, 14.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5107421875, -1.4683990478515625, -1.426055908203125, -1.3837127685546875, -1.34136962890625, -1.2990264892578125, -1.256683349609375, -1.2143402099609375, -1.1719970703125, -1.1296539306640625, -1.087310791015625, -1.0449676513671875, -1.00262451171875, -0.9602813720703125, -0.917938232421875, -0.8755950927734375, -0.833251953125, -0.7909088134765625, -0.748565673828125, -0.7062225341796875, -0.66387939453125, -0.6215362548828125, -0.579193115234375, -0.5368499755859375, -0.4945068359375, -0.4521636962890625, -0.409820556640625, -0.3674774169921875, -0.32513427734375, -0.2827911376953125, -0.240447998046875, -0.1981048583984375, -0.15576171875, -0.1134185791015625, -0.071075439453125, -0.0287322998046875, 0.01361083984375, 0.0559539794921875, 0.098297119140625, 0.1406402587890625, 0.1829833984375, 0.2253265380859375, 0.267669677734375, 0.3100128173828125, 0.35235595703125, 0.3946990966796875, 0.437042236328125, 0.4793853759765625, 0.521728515625, 0.5640716552734375, 0.606414794921875, 0.6487579345703125, 0.69110107421875, 0.7334442138671875, 0.775787353515625, 0.8181304931640625, 0.8604736328125, 0.9028167724609375, 0.945159912109375, 0.9875030517578125, 1.02984619140625, 1.0721893310546875, 1.114532470703125, 1.1568756103515625, 1.19921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 5.0, 6.0, 12.0, 14.0, 8.0, 22.0, 24.0, 37.0, 40.0, 36.0, 43.0, 53.0, 63.0, 72.0, 67.0, 64.0, 72.0, 56.0, 43.0, 40.0, 35.0, 46.0, 19.0, 16.0, 19.0, 16.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.19921875, -1.1649703979492188, -1.1307220458984375, -1.0964736938476562, -1.062225341796875, -1.0279769897460938, -0.9937286376953125, -0.9594802856445312, -0.92523193359375, -0.8909835815429688, -0.8567352294921875, -0.8224868774414062, -0.788238525390625, -0.7539901733398438, -0.7197418212890625, -0.6854934692382812, -0.6512451171875, -0.6169967651367188, -0.5827484130859375, -0.5485000610351562, -0.514251708984375, -0.48000335693359375, -0.4457550048828125, -0.41150665283203125, -0.37725830078125, -0.34300994873046875, -0.3087615966796875, -0.27451324462890625, -0.240264892578125, -0.20601654052734375, -0.1717681884765625, -0.13751983642578125, -0.103271484375, -0.06902313232421875, -0.0347747802734375, -0.00052642822265625, 0.033721923828125, 0.06797027587890625, 0.1022186279296875, 0.13646697998046875, 0.17071533203125, 0.20496368408203125, 0.2392120361328125, 0.27346038818359375, 0.307708740234375, 0.34195709228515625, 0.3762054443359375, 0.41045379638671875, 0.4447021484375, 0.47895050048828125, 0.5131988525390625, 0.5474472045898438, 0.581695556640625, 0.6159439086914062, 0.6501922607421875, 0.6844406127929688, 0.71868896484375, 0.7529373168945312, 0.7871856689453125, 0.8214340209960938, 0.855682373046875, 0.8899307250976562, 0.9241790771484375, 0.9584274291992188, 0.99267578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 18.0, 64.0, 148.0, 223.0, 283.0, 144.0, 53.0, 28.0, 11.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.971389770507812, -23.79489517211914, -22.61840057373047, -21.441905975341797, -20.265411376953125, -19.088916778564453, -17.912424087524414, -16.735929489135742, -15.55943489074707, -14.382940292358398, -13.206445693969727, -12.029952049255371, -10.8534574508667, -9.676962852478027, -8.500469207763672, -7.323974609375, -6.147480010986328, -4.970985412597656, -3.7944912910461426, -2.61799693107605, -1.441502571105957, -0.26500797271728516, 0.9114861488342285, 2.087980270385742, 3.264474868774414, 4.440969467163086, 5.6174635887146, 6.793957710266113, 7.970452308654785, 9.146946907043457, 10.323440551757812, 11.499935150146484, 12.676429748535156, 13.852924346923828, 15.0294189453125, 16.205913543701172, 17.382408142089844, 18.558902740478516, 19.735395431518555, 20.911890029907227, 22.0883846282959, 23.26487922668457, 24.441373825073242, 25.617868423461914, 26.794361114501953, 27.970855712890625, 29.147350311279297, 30.32384490966797, 31.50033950805664, 32.67683410644531, 33.853328704833984, 35.029823303222656, 36.20631790161133, 37.3828125, 38.55930709838867, 39.735801696777344, 40.91229248046875, 42.08878707885742, 43.265281677246094, 44.441776275634766, 45.61827087402344, 46.79476547241211, 47.97126007080078, 49.14775085449219, 50.324249267578125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 10.0, 11.0, 10.0, 11.0, 11.0, 19.0, 16.0, 19.0, 26.0, 29.0, 23.0, 30.0, 26.0, 22.0, 39.0, 40.0, 42.0, 53.0, 52.0, 54.0, 41.0, 47.0, 35.0, 35.0, 40.0, 28.0, 22.0, 28.0, 34.0, 30.0, 16.0, 13.0, 10.0, 13.0, 11.0, 5.0, 6.0, 8.0, 4.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.466285705566406, -12.071855545043945, -11.6774263381958, -11.282997131347656, -10.888566970825195, -10.494136810302734, -10.09970760345459, -9.705278396606445, -9.310848236083984, -8.916418075561523, -8.521988868713379, -8.127559661865234, -7.733129501342773, -7.338699817657471, -6.944270133972168, -6.549840450286865, -6.1554107666015625, -5.76098108291626, -5.366551399230957, -4.972121715545654, -4.577692031860352, -4.183262348175049, -3.788832664489746, -3.3944029808044434, -2.9999732971191406, -2.605543613433838, -2.211113929748535, -1.8166842460632324, -1.4222545623779297, -1.027824878692627, -0.6333951950073242, -0.23896551132202148, 0.15546417236328125, 0.549893856048584, 0.9443235397338867, 1.3387532234191895, 1.7331829071044922, 2.127612590789795, 2.5220422744750977, 2.9164719581604004, 3.310901641845703, 3.705331325531006, 4.099761009216309, 4.494190692901611, 4.888620376586914, 5.283050060272217, 5.6774797439575195, 6.071909427642822, 6.466339111328125, 6.860768795013428, 7.2551984786987305, 7.649628162384033, 8.044057846069336, 8.438488006591797, 8.832917213439941, 9.227346420288086, 9.621776580810547, 10.016206741333008, 10.410635948181152, 10.805065155029297, 11.199495315551758, 11.593925476074219, 11.988354682922363, 12.382783889770508, 12.777214050292969]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 7.0, 17.0, 18.0, 25.0, 35.0, 59.0, 93.0, 135.0, 192.0, 351.0, 553.0, 922.0, 1605.0, 3045.0, 6236.0, 13816.0, 36490.0, 121244.0, 580172.0, 2355893.0, 832298.0, 161949.0, 46787.0, 17235.0, 7332.0, 3425.0, 1791.0, 1052.0, 593.0, 324.0, 207.0, 141.0, 88.0, 50.0, 33.0, 15.0, 12.0, 9.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.357421875, -1.3181915283203125, -1.278961181640625, -1.2397308349609375, -1.20050048828125, -1.1612701416015625, -1.122039794921875, -1.0828094482421875, -1.0435791015625, -1.0043487548828125, -0.965118408203125, -0.9258880615234375, -0.88665771484375, -0.8474273681640625, -0.808197021484375, -0.7689666748046875, -0.729736328125, -0.6905059814453125, -0.651275634765625, -0.6120452880859375, -0.57281494140625, -0.5335845947265625, -0.494354248046875, -0.4551239013671875, -0.4158935546875, -0.3766632080078125, -0.337432861328125, -0.2982025146484375, -0.25897216796875, -0.2197418212890625, -0.180511474609375, -0.1412811279296875, -0.10205078125, -0.0628204345703125, -0.023590087890625, 0.0156402587890625, 0.05487060546875, 0.0941009521484375, 0.133331298828125, 0.1725616455078125, 0.2117919921875, 0.2510223388671875, 0.290252685546875, 0.3294830322265625, 0.36871337890625, 0.4079437255859375, 0.447174072265625, 0.4864044189453125, 0.525634765625, 0.5648651123046875, 0.604095458984375, 0.6433258056640625, 0.68255615234375, 0.7217864990234375, 0.761016845703125, 0.8002471923828125, 0.8394775390625, 0.8787078857421875, 0.917938232421875, 0.9571685791015625, 0.99639892578125, 1.0356292724609375, 1.074859619140625, 1.1140899658203125, 1.1533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 7.0, 4.0, 8.0, 6.0, 14.0, 18.0, 15.0, 19.0, 12.0, 29.0, 31.0, 39.0, 32.0, 30.0, 41.0, 39.0, 29.0, 41.0, 50.0, 44.0, 45.0, 41.0, 38.0, 33.0, 42.0, 33.0, 26.0, 30.0, 22.0, 26.0, 24.0, 20.0, 9.0, 16.0, 18.0, 10.0, 10.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.65869140625, -0.6383743286132812, -0.6180572509765625, -0.5977401733398438, -0.577423095703125, -0.5571060180664062, -0.5367889404296875, -0.5164718627929688, -0.49615478515625, -0.47583770751953125, -0.4555206298828125, -0.43520355224609375, -0.414886474609375, -0.39456939697265625, -0.3742523193359375, -0.35393524169921875, -0.3336181640625, -0.31330108642578125, -0.2929840087890625, -0.27266693115234375, -0.252349853515625, -0.23203277587890625, -0.2117156982421875, -0.19139862060546875, -0.17108154296875, -0.15076446533203125, -0.1304473876953125, -0.11013031005859375, -0.089813232421875, -0.06949615478515625, -0.0491790771484375, -0.02886199951171875, -0.008544921875, 0.01177215576171875, 0.0320892333984375, 0.05240631103515625, 0.072723388671875, 0.09304046630859375, 0.1133575439453125, 0.13367462158203125, 0.15399169921875, 0.17430877685546875, 0.1946258544921875, 0.21494293212890625, 0.235260009765625, 0.25557708740234375, 0.2758941650390625, 0.29621124267578125, 0.3165283203125, 0.33684539794921875, 0.3571624755859375, 0.37747955322265625, 0.397796630859375, 0.41811370849609375, 0.4384307861328125, 0.45874786376953125, 0.47906494140625, 0.49938201904296875, 0.5196990966796875, 0.5400161743164062, 0.560333251953125, 0.5806503295898438, 0.6009674072265625, 0.6212844848632812, 0.6416015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 10.0, 13.0, 29.0, 33.0, 55.0, 68.0, 109.0, 158.0, 238.0, 426.0, 767.0, 1465.0, 3591.0, 12211.0, 68842.0, 1237490.0, 2726952.0, 116103.0, 17999.0, 4491.0, 1602.0, 720.0, 355.0, 210.0, 122.0, 70.0, 42.0, 27.0, 19.0, 12.0, 7.0, 3.0, 5.0, 7.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.79150390625, -2.6845703125, -2.57763671875, -2.470703125, -2.36376953125, -2.2568359375, -2.14990234375, -2.04296875, -1.93603515625, -1.8291015625, -1.72216796875, -1.615234375, -1.50830078125, -1.4013671875, -1.29443359375, -1.1875, -1.08056640625, -0.9736328125, -0.86669921875, -0.759765625, -0.65283203125, -0.5458984375, -0.43896484375, -0.33203125, -0.22509765625, -0.1181640625, -0.01123046875, 0.095703125, 0.20263671875, 0.3095703125, 0.41650390625, 0.5234375, 0.63037109375, 0.7373046875, 0.84423828125, 0.951171875, 1.05810546875, 1.1650390625, 1.27197265625, 1.37890625, 1.48583984375, 1.5927734375, 1.69970703125, 1.806640625, 1.91357421875, 2.0205078125, 2.12744140625, 2.234375, 2.34130859375, 2.4482421875, 2.55517578125, 2.662109375, 2.76904296875, 2.8759765625, 2.98291015625, 3.08984375, 3.19677734375, 3.3037109375, 3.41064453125, 3.517578125, 3.62451171875, 3.7314453125, 3.83837890625, 3.9453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 4.0, 20.0, 48.0, 56.0, 101.0, 224.0, 654.0, 1487.0, 817.0, 311.0, 157.0, 82.0, 45.0, 30.0, 8.0, 13.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.09735107421875, -6.9134521484375, -6.72955322265625, -6.545654296875, -6.36175537109375, -6.1778564453125, -5.99395751953125, -5.81005859375, -5.62615966796875, -5.4422607421875, -5.25836181640625, -5.074462890625, -4.89056396484375, -4.7066650390625, -4.52276611328125, -4.3388671875, -4.15496826171875, -3.9710693359375, -3.78717041015625, -3.603271484375, -3.41937255859375, -3.2354736328125, -3.05157470703125, -2.86767578125, -2.68377685546875, -2.4998779296875, -2.31597900390625, -2.132080078125, -1.94818115234375, -1.7642822265625, -1.58038330078125, -1.396484375, -1.21258544921875, -1.0286865234375, -0.84478759765625, -0.660888671875, -0.47698974609375, -0.2930908203125, -0.10919189453125, 0.07470703125, 0.25860595703125, 0.4425048828125, 0.62640380859375, 0.810302734375, 0.99420166015625, 1.1781005859375, 1.36199951171875, 1.5458984375, 1.72979736328125, 1.9136962890625, 2.09759521484375, 2.281494140625, 2.46539306640625, 2.6492919921875, 2.83319091796875, 3.01708984375, 3.20098876953125, 3.3848876953125, 3.56878662109375, 3.752685546875, 3.93658447265625, 4.1204833984375, 4.30438232421875, 4.48828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 9.0, 13.0, 19.0, 29.0, 68.0, 131.0, 184.0, 191.0, 180.0, 85.0, 37.0, 20.0, 5.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.32672882080078, -38.319305419921875, -37.311885833740234, -36.30446243286133, -35.29704284667969, -34.28961944580078, -33.282196044921875, -32.274776458740234, -31.267353057861328, -30.259931564331055, -29.25251007080078, -28.245086669921875, -27.2376651763916, -26.230243682861328, -25.222822189331055, -24.21540069580078, -23.207979202270508, -22.200557708740234, -21.19313621520996, -20.185714721679688, -19.17829132080078, -18.170869827270508, -17.163448333740234, -16.15602684020996, -15.148604393005371, -14.141182899475098, -13.133760452270508, -12.126338958740234, -11.118917465209961, -10.111495018005371, -9.104073524475098, -8.096651077270508, -7.089229583740234, -6.081807613372803, -5.074385643005371, -4.066964149475098, -3.059542179107666, -2.0521202087402344, -1.044698715209961, -0.0372767448425293, 0.9701452255249023, 1.9775670766830444, 2.9849889278411865, 3.992410659790039, 4.999832630157471, 6.007254600524902, 7.014676094055176, 8.022098541259766, 9.029520034790039, 10.036941528320312, 11.044363975524902, 12.051785469055176, 13.059207916259766, 14.066629409790039, 15.074050903320312, 16.081472396850586, 17.08889389038086, 18.096315383911133, 19.103736877441406, 20.111160278320312, 21.118581771850586, 22.12600326538086, 23.133424758911133, 24.140846252441406, 25.148269653320312]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 11.0, 16.0, 19.0, 24.0, 16.0, 30.0, 26.0, 32.0, 42.0, 46.0, 49.0, 44.0, 57.0, 56.0, 43.0, 61.0, 56.0, 45.0, 48.0, 46.0, 25.0, 27.0, 23.0, 40.0, 22.0, 15.0, 11.0, 10.0, 6.0, 11.0, 10.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.264878273010254, -13.729978561401367, -13.19507884979248, -12.660179138183594, -12.125280380249023, -11.590380668640137, -11.05548095703125, -10.520581245422363, -9.985681533813477, -9.45078182220459, -8.915882110595703, -8.380983352661133, -7.846083641052246, -7.311183929443359, -6.776284217834473, -6.241384506225586, -5.706485748291016, -5.171586036682129, -4.6366868019104, -4.101787090301514, -3.566887617111206, -3.0319881439208984, -2.4970884323120117, -1.962188959121704, -1.4272894859313965, -0.8923899531364441, -0.3574904203414917, 0.17740917205810547, 0.7123086452484131, 1.2472081184387207, 1.7821078300476074, 2.317007303237915, 2.851907730102539, 3.3868072032928467, 3.9217066764831543, 4.456606388092041, 4.9915056228637695, 5.526405334472656, 6.061305046081543, 6.59620475769043, 7.131103992462158, 7.666003704071045, 8.200902938842773, 8.73580265045166, 9.270702362060547, 9.805601119995117, 10.34050178527832, 10.87540054321289, 11.410300254821777, 11.945199966430664, 12.48009967803955, 13.014999389648438, 13.549898147583008, 14.084797859191895, 14.619697570800781, 15.154597282409668, 15.689496994018555, 16.224395751953125, 16.759296417236328, 17.2941951751709, 17.8290958404541, 18.363994598388672, 18.898895263671875, 19.433794021606445, 19.968692779541016]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 6.0, 11.0, 10.0, 15.0, 27.0, 32.0, 54.0, 62.0, 135.0, 181.0, 315.0, 502.0, 923.0, 1922.0, 3836.0, 8305.0, 20311.0, 54647.0, 169888.0, 474348.0, 207192.0, 64161.0, 23454.0, 9346.0, 4233.0, 2069.0, 1038.0, 567.0, 349.0, 206.0, 143.0, 74.0, 55.0, 30.0, 39.0, 15.0, 13.0, 6.0, 9.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.146759033203125, -2.06890869140625, -1.991058349609375, -1.9132080078125, -1.835357666015625, -1.75750732421875, -1.679656982421875, -1.601806640625, -1.523956298828125, -1.44610595703125, -1.368255615234375, -1.2904052734375, -1.212554931640625, -1.13470458984375, -1.056854248046875, -0.97900390625, -0.901153564453125, -0.82330322265625, -0.745452880859375, -0.6676025390625, -0.589752197265625, -0.51190185546875, -0.434051513671875, -0.356201171875, -0.278350830078125, -0.20050048828125, -0.122650146484375, -0.0447998046875, 0.033050537109375, 0.11090087890625, 0.188751220703125, 0.2666015625, 0.344451904296875, 0.42230224609375, 0.500152587890625, 0.5780029296875, 0.655853271484375, 0.73370361328125, 0.811553955078125, 0.889404296875, 0.967254638671875, 1.04510498046875, 1.122955322265625, 1.2008056640625, 1.278656005859375, 1.35650634765625, 1.434356689453125, 1.51220703125, 1.590057373046875, 1.66790771484375, 1.745758056640625, 1.8236083984375, 1.901458740234375, 1.97930908203125, 2.057159423828125, 2.135009765625, 2.212860107421875, 2.29071044921875, 2.368560791015625, 2.4464111328125, 2.524261474609375, 2.60211181640625, 2.679962158203125, 2.7578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 7.0, 9.0, 8.0, 9.0, 7.0, 12.0, 18.0, 15.0, 22.0, 31.0, 32.0, 39.0, 48.0, 48.0, 59.0, 53.0, 45.0, 67.0, 44.0, 46.0, 49.0, 34.0, 52.0, 35.0, 30.0, 30.0, 23.0, 30.0, 23.0, 13.0, 10.0, 10.0, 8.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.833526611328125, -0.80377197265625, -0.774017333984375, -0.7442626953125, -0.714508056640625, -0.68475341796875, -0.654998779296875, -0.625244140625, -0.595489501953125, -0.56573486328125, -0.535980224609375, -0.5062255859375, -0.476470947265625, -0.44671630859375, -0.416961669921875, -0.38720703125, -0.357452392578125, -0.32769775390625, -0.297943115234375, -0.2681884765625, -0.238433837890625, -0.20867919921875, -0.178924560546875, -0.149169921875, -0.119415283203125, -0.08966064453125, -0.059906005859375, -0.0301513671875, -0.000396728515625, 0.02935791015625, 0.059112548828125, 0.0888671875, 0.118621826171875, 0.14837646484375, 0.178131103515625, 0.2078857421875, 0.237640380859375, 0.26739501953125, 0.297149658203125, 0.326904296875, 0.356658935546875, 0.38641357421875, 0.416168212890625, 0.4459228515625, 0.475677490234375, 0.50543212890625, 0.535186767578125, 0.56494140625, 0.594696044921875, 0.62445068359375, 0.654205322265625, 0.6839599609375, 0.713714599609375, 0.74346923828125, 0.773223876953125, 0.802978515625, 0.832733154296875, 0.86248779296875, 0.892242431640625, 0.9219970703125, 0.951751708984375, 0.98150634765625, 1.011260986328125, 1.041015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 14.0, 12.0, 26.0, 31.0, 63.0, 78.0, 150.0, 261.0, 545.0, 1232.0, 3176.0, 13741.0, 220398.0, 777792.0, 23763.0, 4339.0, 1504.0, 653.0, 259.0, 197.0, 108.0, 55.0, 46.0, 25.0, 22.0, 18.0, 7.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -8.0120849609375, -7.727294921875, -7.4425048828125, -7.15771484375, -6.8729248046875, -6.588134765625, -6.3033447265625, -6.0185546875, -5.7337646484375, -5.448974609375, -5.1641845703125, -4.87939453125, -4.5946044921875, -4.309814453125, -4.0250244140625, -3.740234375, -3.4554443359375, -3.170654296875, -2.8858642578125, -2.60107421875, -2.3162841796875, -2.031494140625, -1.7467041015625, -1.4619140625, -1.1771240234375, -0.892333984375, -0.6075439453125, -0.32275390625, -0.0379638671875, 0.246826171875, 0.5316162109375, 0.81640625, 1.1011962890625, 1.385986328125, 1.6707763671875, 1.95556640625, 2.2403564453125, 2.525146484375, 2.8099365234375, 3.0947265625, 3.3795166015625, 3.664306640625, 3.9490966796875, 4.23388671875, 4.5186767578125, 4.803466796875, 5.0882568359375, 5.373046875, 5.6578369140625, 5.942626953125, 6.2274169921875, 6.51220703125, 6.7969970703125, 7.081787109375, 7.3665771484375, 7.6513671875, 7.9361572265625, 8.220947265625, 8.5057373046875, 8.79052734375, 9.0753173828125, 9.360107421875, 9.6448974609375, 9.9296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 5.0, 17.0, 12.0, 23.0, 23.0, 28.0, 37.0, 44.0, 60.0, 64.0, 76.0, 66.0, 84.0, 70.0, 68.0, 61.0, 60.0, 42.0, 33.0, 31.0, 30.0, 16.0, 12.0, 8.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.859375, -6.63409423828125, -6.4088134765625, -6.18353271484375, -5.958251953125, -5.73297119140625, -5.5076904296875, -5.28240966796875, -5.05712890625, -4.83184814453125, -4.6065673828125, -4.38128662109375, -4.156005859375, -3.93072509765625, -3.7054443359375, -3.48016357421875, -3.2548828125, -3.02960205078125, -2.8043212890625, -2.57904052734375, -2.353759765625, -2.12847900390625, -1.9031982421875, -1.67791748046875, -1.45263671875, -1.22735595703125, -1.0020751953125, -0.77679443359375, -0.551513671875, -0.32623291015625, -0.1009521484375, 0.12432861328125, 0.349609375, 0.57489013671875, 0.8001708984375, 1.02545166015625, 1.250732421875, 1.47601318359375, 1.7012939453125, 1.92657470703125, 2.15185546875, 2.37713623046875, 2.6024169921875, 2.82769775390625, 3.052978515625, 3.27825927734375, 3.5035400390625, 3.72882080078125, 3.9541015625, 4.17938232421875, 4.4046630859375, 4.62994384765625, 4.855224609375, 5.08050537109375, 5.3057861328125, 5.53106689453125, 5.75634765625, 5.98162841796875, 6.2069091796875, 6.43218994140625, 6.657470703125, 6.88275146484375, 7.1080322265625, 7.33331298828125, 7.55859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 6.0, 14.0, 6.0, 11.0, 19.0, 18.0, 40.0, 60.0, 84.0, 125.0, 223.0, 343.0, 564.0, 974.0, 1870.0, 3909.0, 9240.0, 24892.0, 78723.0, 487133.0, 328910.0, 72053.0, 22918.0, 8659.0, 3755.0, 1719.0, 877.0, 529.0, 293.0, 200.0, 101.0, 97.0, 58.0, 35.0, 32.0, 16.0, 10.0, 8.0, 13.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1415863037109375, -1.103485107421875, -1.0653839111328125, -1.02728271484375, -0.9891815185546875, -0.951080322265625, -0.9129791259765625, -0.8748779296875, -0.8367767333984375, -0.798675537109375, -0.7605743408203125, -0.72247314453125, -0.6843719482421875, -0.646270751953125, -0.6081695556640625, -0.570068359375, -0.5319671630859375, -0.493865966796875, -0.4557647705078125, -0.41766357421875, -0.3795623779296875, -0.341461181640625, -0.3033599853515625, -0.2652587890625, -0.2271575927734375, -0.189056396484375, -0.1509552001953125, -0.11285400390625, -0.0747528076171875, -0.036651611328125, 0.0014495849609375, 0.03955078125, 0.0776519775390625, 0.115753173828125, 0.1538543701171875, 0.19195556640625, 0.2300567626953125, 0.268157958984375, 0.3062591552734375, 0.3443603515625, 0.3824615478515625, 0.420562744140625, 0.4586639404296875, 0.49676513671875, 0.5348663330078125, 0.572967529296875, 0.6110687255859375, 0.649169921875, 0.6872711181640625, 0.725372314453125, 0.7634735107421875, 0.80157470703125, 0.8396759033203125, 0.877777099609375, 0.9158782958984375, 0.9539794921875, 0.9920806884765625, 1.030181884765625, 1.0682830810546875, 1.10638427734375, 1.1444854736328125, 1.182586669921875, 1.2206878662109375, 1.2587890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 7.0, 10.0, 7.0, 6.0, 9.0, 15.0, 15.0, 11.0, 21.0, 29.0, 33.0, 39.0, 44.0, 66.0, 109.0, 126.0, 116.0, 59.0, 45.0, 37.0, 31.0, 32.0, 20.0, 22.0, 15.0, 13.0, 14.0, 10.0, 3.0, 5.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037097930908203125, -0.00035958364605903625, -0.00034818798303604126, -0.00033679232001304626, -0.00032539665699005127, -0.0003140009939670563, -0.0003026053309440613, -0.0002912096679210663, -0.0002798140048980713, -0.0002684183418750763, -0.0002570226788520813, -0.0002456270158290863, -0.0002342313528060913, -0.0002228356897830963, -0.00021144002676010132, -0.00020004436373710632, -0.00018864870071411133, -0.00017725303769111633, -0.00016585737466812134, -0.00015446171164512634, -0.00014306604862213135, -0.00013167038559913635, -0.00012027472257614136, -0.00010887905955314636, -9.748339653015137e-05, -8.608773350715637e-05, -7.469207048416138e-05, -6.329640746116638e-05, -5.190074443817139e-05, -4.050508141517639e-05, -2.9109418392181396e-05, -1.77137553691864e-05, -6.318092346191406e-06, 5.077570676803589e-06, 1.6473233699798584e-05, 2.786889672279358e-05, 3.9264559745788574e-05, 5.066022276878357e-05, 6.205588579177856e-05, 7.345154881477356e-05, 8.484721183776855e-05, 9.624287486076355e-05, 0.00010763853788375854, 0.00011903420090675354, 0.00013042986392974854, 0.00014182552695274353, 0.00015322118997573853, 0.00016461685299873352, 0.00017601251602172852, 0.0001874081790447235, 0.0001988038420677185, 0.0002101995050907135, 0.0002215951681137085, 0.0002329908311367035, 0.0002443864941596985, 0.0002557821571826935, 0.0002671778202056885, 0.00027857348322868347, 0.00028996914625167847, 0.00030136480927467346, 0.00031276047229766846, 0.00032415613532066345, 0.00033555179834365845, 0.00034694746136665344, 0.00035834312438964844]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 9.0, 9.0, 15.0, 12.0, 23.0, 42.0, 63.0, 97.0, 181.0, 305.0, 574.0, 1131.0, 2874.0, 9633.0, 57659.0, 724692.0, 218520.0, 23658.0, 5283.0, 1889.0, 778.0, 449.0, 247.0, 139.0, 98.0, 57.0, 30.0, 27.0, 21.0, 10.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.388671875, -2.3270721435546875, -2.265472412109375, -2.2038726806640625, -2.14227294921875, -2.0806732177734375, -2.019073486328125, -1.9574737548828125, -1.8958740234375, -1.8342742919921875, -1.772674560546875, -1.7110748291015625, -1.64947509765625, -1.5878753662109375, -1.526275634765625, -1.4646759033203125, -1.403076171875, -1.3414764404296875, -1.279876708984375, -1.2182769775390625, -1.15667724609375, -1.0950775146484375, -1.033477783203125, -0.9718780517578125, -0.9102783203125, -0.8486785888671875, -0.787078857421875, -0.7254791259765625, -0.66387939453125, -0.6022796630859375, -0.540679931640625, -0.4790802001953125, -0.41748046875, -0.3558807373046875, -0.294281005859375, -0.2326812744140625, -0.17108154296875, -0.1094818115234375, -0.047882080078125, 0.0137176513671875, 0.0753173828125, 0.1369171142578125, 0.198516845703125, 0.2601165771484375, 0.32171630859375, 0.3833160400390625, 0.444915771484375, 0.5065155029296875, 0.568115234375, 0.6297149658203125, 0.691314697265625, 0.7529144287109375, 0.81451416015625, 0.8761138916015625, 0.937713623046875, 0.9993133544921875, 1.0609130859375, 1.1225128173828125, 1.184112548828125, 1.2457122802734375, 1.30731201171875, 1.3689117431640625, 1.430511474609375, 1.4921112060546875, 1.5537109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 6.0, 12.0, 11.0, 17.0, 18.0, 18.0, 27.0, 31.0, 37.0, 45.0, 60.0, 81.0, 105.0, 84.0, 79.0, 59.0, 51.0, 41.0, 40.0, 35.0, 19.0, 25.0, 19.0, 11.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.142486572265625, -1.09454345703125, -1.046600341796875, -0.9986572265625, -0.950714111328125, -0.90277099609375, -0.854827880859375, -0.806884765625, -0.758941650390625, -0.71099853515625, -0.663055419921875, -0.6151123046875, -0.567169189453125, -0.51922607421875, -0.471282958984375, -0.42333984375, -0.375396728515625, -0.32745361328125, -0.279510498046875, -0.2315673828125, -0.183624267578125, -0.13568115234375, -0.087738037109375, -0.039794921875, 0.008148193359375, 0.05609130859375, 0.104034423828125, 0.1519775390625, 0.199920654296875, 0.24786376953125, 0.295806884765625, 0.34375, 0.391693115234375, 0.43963623046875, 0.487579345703125, 0.5355224609375, 0.583465576171875, 0.63140869140625, 0.679351806640625, 0.727294921875, 0.775238037109375, 0.82318115234375, 0.871124267578125, 0.9190673828125, 0.967010498046875, 1.01495361328125, 1.062896728515625, 1.11083984375, 1.158782958984375, 1.20672607421875, 1.254669189453125, 1.3026123046875, 1.350555419921875, 1.39849853515625, 1.446441650390625, 1.494384765625, 1.542327880859375, 1.59027099609375, 1.638214111328125, 1.6861572265625, 1.734100341796875, 1.78204345703125, 1.829986572265625, 1.8779296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 8.0, 17.0, 17.0, 32.0, 48.0, 103.0, 125.0, 156.0, 174.0, 114.0, 66.0, 43.0, 28.0, 9.0, 16.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.91774559020996, -29.951597213745117, -28.98544692993164, -28.019298553466797, -27.053150177001953, -26.08700180053711, -25.120851516723633, -24.15470314025879, -23.188552856445312, -22.22240447998047, -21.256254196166992, -20.29010581970215, -19.323957443237305, -18.357807159423828, -17.391658782958984, -16.42551040649414, -15.459362030029297, -14.493212699890137, -13.527064323425293, -12.560914993286133, -11.594766616821289, -10.628617286682129, -9.662467956542969, -8.696319580078125, -7.730170249938965, -6.764021396636963, -5.797872543334961, -4.831723213195801, -3.865574359893799, -2.899425506591797, -1.9332761764526367, -0.9671273231506348, -0.000980377197265625, 0.9651685953140259, 1.9313175678253174, 2.8974666595458984, 3.8636155128479004, 4.829764366149902, 5.7959136962890625, 6.7620625495910645, 7.728211402893066, 8.694360733032227, 9.66050910949707, 10.62665843963623, 11.59280776977539, 12.558956146240234, 13.525105476379395, 14.491254806518555, 15.457403182983398, 16.423551559448242, 17.38970184326172, 18.355850219726562, 19.321998596191406, 20.28814697265625, 21.254297256469727, 22.22044563293457, 23.186595916748047, 24.15274429321289, 25.118894577026367, 26.08504295349121, 27.051191329956055, 28.01734161376953, 28.983489990234375, 29.94963836669922, 30.915786743164062]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 8.0, 2.0, 13.0, 7.0, 10.0, 11.0, 15.0, 22.0, 16.0, 23.0, 36.0, 35.0, 24.0, 33.0, 37.0, 45.0, 48.0, 54.0, 76.0, 69.0, 64.0, 46.0, 42.0, 42.0, 35.0, 22.0, 30.0, 27.0, 18.0, 23.0, 21.0, 15.0, 6.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.426401138305664, -19.834808349609375, -19.243215560913086, -18.65162467956543, -18.06003189086914, -17.46843910217285, -16.876846313476562, -16.285253524780273, -15.6936616897583, -15.102068901062012, -14.510477066040039, -13.91888427734375, -13.327291488647461, -12.735699653625488, -12.1441068649292, -11.552515029907227, -10.960922241210938, -10.369329452514648, -9.777737617492676, -9.186144828796387, -8.594552993774414, -8.002960205078125, -7.411367416381836, -6.819775104522705, -6.228182792663574, -5.636590480804443, -5.0449981689453125, -4.453405380249023, -3.8618130683898926, -3.2702207565307617, -2.6786282062530518, -2.087035655975342, -1.4954414367675781, -0.9038490056991577, -0.3122565746307373, 0.2793358564376831, 0.8709282875061035, 1.4625205993652344, 2.0541131496429443, 2.6457056999206543, 3.237298011779785, 3.828890323638916, 4.420482635498047, 5.012075424194336, 5.603667736053467, 6.195260047912598, 6.786852836608887, 7.378445148468018, 7.970037460327148, 8.561630249023438, 9.15322208404541, 9.7448148727417, 10.336406707763672, 10.927999496459961, 11.51959228515625, 12.111185073852539, 12.702776908874512, 13.2943696975708, 13.885961532592773, 14.477554321289062, 15.069147109985352, 15.660738945007324, 16.252330780029297, 16.843923568725586, 17.435516357421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 11.0, 12.0, 14.0, 25.0, 42.0, 45.0, 73.0, 94.0, 181.0, 300.0, 448.0, 813.0, 1656.0, 3819.0, 9955.0, 32202.0, 152775.0, 1534959.0, 2184403.0, 210759.0, 40952.0, 12181.0, 4523.0, 1923.0, 971.0, 423.0, 280.0, 165.0, 89.0, 56.0, 44.0, 22.0, 19.0, 15.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-2.34375, -2.2852783203125, -2.226806640625, -2.1683349609375, -2.10986328125, -2.0513916015625, -1.992919921875, -1.9344482421875, -1.8759765625, -1.8175048828125, -1.759033203125, -1.7005615234375, -1.64208984375, -1.5836181640625, -1.525146484375, -1.4666748046875, -1.408203125, -1.3497314453125, -1.291259765625, -1.2327880859375, -1.17431640625, -1.1158447265625, -1.057373046875, -0.9989013671875, -0.9404296875, -0.8819580078125, -0.823486328125, -0.7650146484375, -0.70654296875, -0.6480712890625, -0.589599609375, -0.5311279296875, -0.47265625, -0.4141845703125, -0.355712890625, -0.2972412109375, -0.23876953125, -0.1802978515625, -0.121826171875, -0.0633544921875, -0.0048828125, 0.0535888671875, 0.112060546875, 0.1705322265625, 0.22900390625, 0.2874755859375, 0.345947265625, 0.4044189453125, 0.462890625, 0.5213623046875, 0.579833984375, 0.6383056640625, 0.69677734375, 0.7552490234375, 0.813720703125, 0.8721923828125, 0.9306640625, 0.9891357421875, 1.047607421875, 1.1060791015625, 1.16455078125, 1.2230224609375, 1.281494140625, 1.3399658203125, 1.3984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 4.0, 10.0, 10.0, 10.0, 18.0, 21.0, 27.0, 21.0, 32.0, 35.0, 37.0, 35.0, 49.0, 52.0, 48.0, 51.0, 48.0, 44.0, 59.0, 46.0, 40.0, 45.0, 39.0, 45.0, 25.0, 20.0, 26.0, 22.0, 16.0, 8.0, 8.0, 8.0, 4.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9755859375, -0.9456329345703125, -0.915679931640625, -0.8857269287109375, -0.85577392578125, -0.8258209228515625, -0.795867919921875, -0.7659149169921875, -0.7359619140625, -0.7060089111328125, -0.676055908203125, -0.6461029052734375, -0.61614990234375, -0.5861968994140625, -0.556243896484375, -0.5262908935546875, -0.496337890625, -0.4663848876953125, -0.436431884765625, -0.4064788818359375, -0.37652587890625, -0.3465728759765625, -0.316619873046875, -0.2866668701171875, -0.2567138671875, -0.2267608642578125, -0.196807861328125, -0.1668548583984375, -0.13690185546875, -0.1069488525390625, -0.076995849609375, -0.0470428466796875, -0.01708984375, 0.0128631591796875, 0.042816162109375, 0.0727691650390625, 0.10272216796875, 0.1326751708984375, 0.162628173828125, 0.1925811767578125, 0.2225341796875, 0.2524871826171875, 0.282440185546875, 0.3123931884765625, 0.34234619140625, 0.3722991943359375, 0.402252197265625, 0.4322052001953125, 0.462158203125, 0.4921112060546875, 0.522064208984375, 0.5520172119140625, 0.58197021484375, 0.6119232177734375, 0.641876220703125, 0.6718292236328125, 0.7017822265625, 0.7317352294921875, 0.761688232421875, 0.7916412353515625, 0.82159423828125, 0.8515472412109375, 0.881500244140625, 0.9114532470703125, 0.94140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 9.0, 8.0, 16.0, 14.0, 22.0, 36.0, 55.0, 80.0, 143.0, 243.0, 551.0, 1241.0, 3781.0, 16964.0, 246745.0, 3772900.0, 134553.0, 12714.0, 2734.0, 802.0, 337.0, 158.0, 78.0, 33.0, 26.0, 11.0, 10.0, 11.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.30035400390625, -4.1241455078125, -3.94793701171875, -3.771728515625, -3.59552001953125, -3.4193115234375, -3.24310302734375, -3.06689453125, -2.89068603515625, -2.7144775390625, -2.53826904296875, -2.362060546875, -2.18585205078125, -2.0096435546875, -1.83343505859375, -1.6572265625, -1.48101806640625, -1.3048095703125, -1.12860107421875, -0.952392578125, -0.77618408203125, -0.5999755859375, -0.42376708984375, -0.24755859375, -0.07135009765625, 0.1048583984375, 0.28106689453125, 0.457275390625, 0.63348388671875, 0.8096923828125, 0.98590087890625, 1.162109375, 1.33831787109375, 1.5145263671875, 1.69073486328125, 1.866943359375, 2.04315185546875, 2.2193603515625, 2.39556884765625, 2.57177734375, 2.74798583984375, 2.9241943359375, 3.10040283203125, 3.276611328125, 3.45281982421875, 3.6290283203125, 3.80523681640625, 3.9814453125, 4.15765380859375, 4.3338623046875, 4.51007080078125, 4.686279296875, 4.86248779296875, 5.0386962890625, 5.21490478515625, 5.39111328125, 5.56732177734375, 5.7435302734375, 5.91973876953125, 6.095947265625, 6.27215576171875, 6.4483642578125, 6.62457275390625, 6.80078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 7.0, 4.0, 11.0, 11.0, 33.0, 37.0, 88.0, 190.0, 446.0, 1174.0, 1141.0, 468.0, 210.0, 114.0, 42.0, 44.0, 17.0, 14.0, 8.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.42303466796875, -7.2327880859375, -7.04254150390625, -6.852294921875, -6.66204833984375, -6.4718017578125, -6.28155517578125, -6.09130859375, -5.90106201171875, -5.7108154296875, -5.52056884765625, -5.330322265625, -5.14007568359375, -4.9498291015625, -4.75958251953125, -4.5693359375, -4.37908935546875, -4.1888427734375, -3.99859619140625, -3.808349609375, -3.61810302734375, -3.4278564453125, -3.23760986328125, -3.04736328125, -2.85711669921875, -2.6668701171875, -2.47662353515625, -2.286376953125, -2.09613037109375, -1.9058837890625, -1.71563720703125, -1.525390625, -1.33514404296875, -1.1448974609375, -0.95465087890625, -0.764404296875, -0.57415771484375, -0.3839111328125, -0.19366455078125, -0.00341796875, 0.18682861328125, 0.3770751953125, 0.56732177734375, 0.757568359375, 0.94781494140625, 1.1380615234375, 1.32830810546875, 1.5185546875, 1.70880126953125, 1.8990478515625, 2.08929443359375, 2.279541015625, 2.46978759765625, 2.6600341796875, 2.85028076171875, 3.04052734375, 3.23077392578125, 3.4210205078125, 3.61126708984375, 3.801513671875, 3.99176025390625, 4.1820068359375, 4.37225341796875, 4.5625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 40.0, 60.0, 126.0, 227.0, 233.0, 161.0, 66.0, 34.0, 11.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.90185546875, -36.49960708618164, -35.09735870361328, -33.69511413574219, -32.29286575317383, -30.89061737060547, -29.48836898803711, -28.086122512817383, -26.683876037597656, -25.281627655029297, -23.87938117980957, -22.47713279724121, -21.074886322021484, -19.672637939453125, -18.270389556884766, -16.86814308166504, -15.46589469909668, -14.063647270202637, -12.661399841308594, -11.259151458740234, -9.856904983520508, -8.454656600952148, -7.0524091720581055, -5.6501617431640625, -4.2479143142700195, -2.8456668853759766, -1.4434192180633545, -0.04117155075073242, 1.3610758781433105, 2.7633233070373535, 4.165571212768555, 5.567818641662598, 6.970066070556641, 8.372313499450684, 9.774560928344727, 11.176809310913086, 12.579055786132812, 13.981304168701172, 15.383551597595215, 16.785799026489258, 18.188045501708984, 19.590293884277344, 20.99254035949707, 22.39478874206543, 23.797035217285156, 25.199283599853516, 26.601531982421875, 28.0037784576416, 29.40602684020996, 30.80827522277832, 32.21052169799805, 33.612770080566406, 35.015018463134766, 36.41726303100586, 37.81951141357422, 39.22175979614258, 40.62400817871094, 42.0262565612793, 43.428504943847656, 44.83074951171875, 46.23299789428711, 47.63524627685547, 49.03749465942383, 50.43974304199219, 51.84198760986328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 10.0, 9.0, 15.0, 19.0, 14.0, 22.0, 28.0, 16.0, 34.0, 19.0, 41.0, 41.0, 48.0, 41.0, 52.0, 62.0, 58.0, 56.0, 41.0, 46.0, 38.0, 50.0, 41.0, 35.0, 26.0, 19.0, 18.0, 19.0, 14.0, 10.0, 9.0, 7.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.757925033569336, -17.172780990600586, -16.587636947631836, -16.002490997314453, -15.417346954345703, -14.832202911376953, -14.247058868408203, -13.661914825439453, -13.076769828796387, -12.491625785827637, -11.90648078918457, -11.32133674621582, -10.73619270324707, -10.151047706604004, -9.565903663635254, -8.980758666992188, -8.395614624023438, -7.810470104217529, -7.225325584411621, -6.640181541442871, -6.055037021636963, -5.469892501831055, -4.884748458862305, -4.2996039390563965, -3.7144594192504883, -3.12931489944458, -2.544170618057251, -1.9590262174606323, -1.3738818168640137, -0.7887372970581055, -0.20359301567077637, 0.38155126571655273, 0.9666976928710938, 1.5518420934677124, 2.136986494064331, 2.72213077545166, 3.3072752952575684, 3.8924198150634766, 4.477563858032227, 5.062708377838135, 5.647852897644043, 6.232997417449951, 6.818141937255859, 7.403285980224609, 7.988430500030518, 8.573575019836426, 9.158719062805176, 9.743864059448242, 10.329008102416992, 10.914152145385742, 11.499297142028809, 12.084441184997559, 12.669586181640625, 13.254730224609375, 13.839874267578125, 14.425018310546875, 15.010163307189941, 15.595307350158691, 16.180452346801758, 16.765596389770508, 17.350740432739258, 17.93588638305664, 18.52103042602539, 19.10617446899414, 19.69131851196289]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 14.0, 7.0, 18.0, 41.0, 43.0, 64.0, 86.0, 140.0, 206.0, 332.0, 524.0, 841.0, 1381.0, 2312.0, 4200.0, 7961.0, 15555.0, 34397.0, 98860.0, 372533.0, 351067.0, 92557.0, 32789.0, 14799.0, 7580.0, 4229.0, 2412.0, 1321.0, 811.0, 530.0, 323.0, 198.0, 107.0, 97.0, 63.0, 34.0, 35.0, 13.0, 15.0, 13.0, 10.0, 5.0, 6.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.353515625, -2.28424072265625, -2.2149658203125, -2.14569091796875, -2.076416015625, -2.00714111328125, -1.9378662109375, -1.86859130859375, -1.79931640625, -1.73004150390625, -1.6607666015625, -1.59149169921875, -1.522216796875, -1.45294189453125, -1.3836669921875, -1.31439208984375, -1.2451171875, -1.17584228515625, -1.1065673828125, -1.03729248046875, -0.968017578125, -0.89874267578125, -0.8294677734375, -0.76019287109375, -0.69091796875, -0.62164306640625, -0.5523681640625, -0.48309326171875, -0.413818359375, -0.34454345703125, -0.2752685546875, -0.20599365234375, -0.13671875, -0.06744384765625, 0.0018310546875, 0.07110595703125, 0.140380859375, 0.20965576171875, 0.2789306640625, 0.34820556640625, 0.41748046875, 0.48675537109375, 0.5560302734375, 0.62530517578125, 0.694580078125, 0.76385498046875, 0.8331298828125, 0.90240478515625, 0.9716796875, 1.04095458984375, 1.1102294921875, 1.17950439453125, 1.248779296875, 1.31805419921875, 1.3873291015625, 1.45660400390625, 1.52587890625, 1.59515380859375, 1.6644287109375, 1.73370361328125, 1.802978515625, 1.87225341796875, 1.9415283203125, 2.01080322265625, 2.080078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 4.0, 9.0, 13.0, 9.0, 23.0, 20.0, 26.0, 33.0, 37.0, 30.0, 43.0, 48.0, 53.0, 52.0, 43.0, 61.0, 51.0, 56.0, 49.0, 57.0, 37.0, 33.0, 32.0, 29.0, 26.0, 17.0, 24.0, 19.0, 12.0, 13.0, 9.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.0973968505859375, -1.061981201171875, -1.0265655517578125, -0.99114990234375, -0.9557342529296875, -0.920318603515625, -0.8849029541015625, -0.8494873046875, -0.8140716552734375, -0.778656005859375, -0.7432403564453125, -0.70782470703125, -0.6724090576171875, -0.636993408203125, -0.6015777587890625, -0.566162109375, -0.5307464599609375, -0.495330810546875, -0.4599151611328125, -0.42449951171875, -0.3890838623046875, -0.353668212890625, -0.3182525634765625, -0.2828369140625, -0.2474212646484375, -0.212005615234375, -0.1765899658203125, -0.14117431640625, -0.1057586669921875, -0.070343017578125, -0.0349273681640625, 0.00048828125, 0.0359039306640625, 0.071319580078125, 0.1067352294921875, 0.14215087890625, 0.1775665283203125, 0.212982177734375, 0.2483978271484375, 0.2838134765625, 0.3192291259765625, 0.354644775390625, 0.3900604248046875, 0.42547607421875, 0.4608917236328125, 0.496307373046875, 0.5317230224609375, 0.567138671875, 0.6025543212890625, 0.637969970703125, 0.6733856201171875, 0.70880126953125, 0.7442169189453125, 0.779632568359375, 0.8150482177734375, 0.8504638671875, 0.8858795166015625, 0.921295166015625, 0.9567108154296875, 0.99212646484375, 1.0275421142578125, 1.062957763671875, 1.0983734130859375, 1.1337890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 5.0, 6.0, 9.0, 15.0, 16.0, 20.0, 33.0, 36.0, 49.0, 64.0, 105.0, 138.0, 217.0, 319.0, 475.0, 888.0, 1580.0, 3619.0, 10024.0, 39097.0, 341211.0, 583541.0, 47135.0, 11485.0, 4120.0, 1772.0, 946.0, 528.0, 311.0, 233.0, 136.0, 106.0, 70.0, 68.0, 35.0, 21.0, 23.0, 19.0, 13.0, 12.0, 11.0, 10.0, 5.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.54296875, -4.409576416015625, -4.27618408203125, -4.142791748046875, -4.0093994140625, -3.876007080078125, -3.74261474609375, -3.609222412109375, -3.475830078125, -3.342437744140625, -3.20904541015625, -3.075653076171875, -2.9422607421875, -2.808868408203125, -2.67547607421875, -2.542083740234375, -2.40869140625, -2.275299072265625, -2.14190673828125, -2.008514404296875, -1.8751220703125, -1.741729736328125, -1.60833740234375, -1.474945068359375, -1.341552734375, -1.208160400390625, -1.07476806640625, -0.941375732421875, -0.8079833984375, -0.674591064453125, -0.54119873046875, -0.407806396484375, -0.2744140625, -0.141021728515625, -0.00762939453125, 0.125762939453125, 0.2591552734375, 0.392547607421875, 0.52593994140625, 0.659332275390625, 0.792724609375, 0.926116943359375, 1.05950927734375, 1.192901611328125, 1.3262939453125, 1.459686279296875, 1.59307861328125, 1.726470947265625, 1.85986328125, 1.993255615234375, 2.12664794921875, 2.260040283203125, 2.3934326171875, 2.526824951171875, 2.66021728515625, 2.793609619140625, 2.927001953125, 3.060394287109375, 3.19378662109375, 3.327178955078125, 3.4605712890625, 3.593963623046875, 3.72735595703125, 3.860748291015625, 3.994140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 11.0, 16.0, 13.0, 18.0, 13.0, 29.0, 33.0, 43.0, 24.0, 46.0, 43.0, 41.0, 54.0, 61.0, 59.0, 60.0, 55.0, 43.0, 37.0, 44.0, 34.0, 45.0, 20.0, 31.0, 20.0, 15.0, 19.0, 7.0, 9.0, 7.0, 6.0, 8.0, 3.0, 6.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5447998046875, -4.386474609375, -4.2281494140625, -4.06982421875, -3.9114990234375, -3.753173828125, -3.5948486328125, -3.4365234375, -3.2781982421875, -3.119873046875, -2.9615478515625, -2.80322265625, -2.6448974609375, -2.486572265625, -2.3282470703125, -2.169921875, -2.0115966796875, -1.853271484375, -1.6949462890625, -1.53662109375, -1.3782958984375, -1.219970703125, -1.0616455078125, -0.9033203125, -0.7449951171875, -0.586669921875, -0.4283447265625, -0.27001953125, -0.1116943359375, 0.046630859375, 0.2049560546875, 0.36328125, 0.5216064453125, 0.679931640625, 0.8382568359375, 0.99658203125, 1.1549072265625, 1.313232421875, 1.4715576171875, 1.6298828125, 1.7882080078125, 1.946533203125, 2.1048583984375, 2.26318359375, 2.4215087890625, 2.579833984375, 2.7381591796875, 2.896484375, 3.0548095703125, 3.213134765625, 3.3714599609375, 3.52978515625, 3.6881103515625, 3.846435546875, 4.0047607421875, 4.1630859375, 4.3214111328125, 4.479736328125, 4.6380615234375, 4.79638671875, 4.9547119140625, 5.113037109375, 5.2713623046875, 5.4296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 6.0, 17.0, 20.0, 23.0, 41.0, 57.0, 93.0, 143.0, 254.0, 380.0, 732.0, 1523.0, 3401.0, 8923.0, 29708.0, 130453.0, 663136.0, 157578.0, 34502.0, 10344.0, 3726.0, 1623.0, 723.0, 432.0, 233.0, 148.0, 117.0, 63.0, 36.0, 20.0, 28.0, 17.0, 16.0, 7.0, 6.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25, -1.2046356201171875, -1.159271240234375, -1.1139068603515625, -1.06854248046875, -1.0231781005859375, -0.977813720703125, -0.9324493408203125, -0.8870849609375, -0.8417205810546875, -0.796356201171875, -0.7509918212890625, -0.70562744140625, -0.6602630615234375, -0.614898681640625, -0.5695343017578125, -0.524169921875, -0.4788055419921875, -0.433441162109375, -0.3880767822265625, -0.34271240234375, -0.2973480224609375, -0.251983642578125, -0.2066192626953125, -0.1612548828125, -0.1158905029296875, -0.070526123046875, -0.0251617431640625, 0.02020263671875, 0.0655670166015625, 0.110931396484375, 0.1562957763671875, 0.20166015625, 0.2470245361328125, 0.292388916015625, 0.3377532958984375, 0.38311767578125, 0.4284820556640625, 0.473846435546875, 0.5192108154296875, 0.5645751953125, 0.6099395751953125, 0.655303955078125, 0.7006683349609375, 0.74603271484375, 0.7913970947265625, 0.836761474609375, 0.8821258544921875, 0.927490234375, 0.9728546142578125, 1.018218994140625, 1.0635833740234375, 1.10894775390625, 1.1543121337890625, 1.199676513671875, 1.2450408935546875, 1.2904052734375, 1.3357696533203125, 1.381134033203125, 1.4264984130859375, 1.47186279296875, 1.5172271728515625, 1.562591552734375, 1.6079559326171875, 1.6533203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 9.0, 12.0, 21.0, 11.0, 17.0, 32.0, 35.0, 61.0, 101.0, 134.0, 139.0, 119.0, 87.0, 60.0, 36.0, 29.0, 19.0, 16.0, 14.0, 5.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035119056701660156, -0.0003355257213115692, -0.00031986087560653687, -0.0003041960299015045, -0.00028853118419647217, -0.0002728663384914398, -0.00025720149278640747, -0.00024153664708137512, -0.00022587180137634277, -0.00021020695567131042, -0.00019454210996627808, -0.00017887726426124573, -0.00016321241855621338, -0.00014754757285118103, -0.00013188272714614868, -0.00011621788144111633, -0.00010055303573608398, -8.488819003105164e-05, -6.922334432601929e-05, -5.355849862098694e-05, -3.789365291595459e-05, -2.222880721092224e-05, -6.563961505889893e-06, 9.100884199142456e-06, 2.4765729904174805e-05, 4.043057560920715e-05, 5.60954213142395e-05, 7.176026701927185e-05, 8.74251127243042e-05, 0.00010308995842933655, 0.0001187548041343689, 0.00013441964983940125, 0.0001500844955444336, 0.00016574934124946594, 0.0001814141869544983, 0.00019707903265953064, 0.000212743878364563, 0.00022840872406959534, 0.00024407356977462769, 0.00025973841547966003, 0.0002754032611846924, 0.00029106810688972473, 0.0003067329525947571, 0.00032239779829978943, 0.0003380626440048218, 0.0003537274897098541, 0.0003693923354148865, 0.0003850571811199188, 0.00040072202682495117, 0.0004163868725299835, 0.00043205171823501587, 0.0004477165639400482, 0.00046338140964508057, 0.0004790462553501129, 0.0004947111010551453, 0.0005103759467601776, 0.00052604079246521, 0.0005417056381702423, 0.0005573704838752747, 0.000573035329580307, 0.0005887001752853394, 0.0006043650209903717, 0.000620029866695404, 0.0006356947124004364, 0.0006513595581054688]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 9.0, 9.0, 16.0, 16.0, 28.0, 30.0, 44.0, 81.0, 154.0, 222.0, 361.0, 684.0, 1495.0, 3914.0, 13003.0, 72491.0, 708146.0, 209275.0, 27672.0, 6446.0, 2236.0, 1039.0, 439.0, 262.0, 157.0, 95.0, 75.0, 46.0, 27.0, 22.0, 16.0, 11.0, 7.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.837890625, -1.7817535400390625, -1.725616455078125, -1.6694793701171875, -1.61334228515625, -1.5572052001953125, -1.501068115234375, -1.4449310302734375, -1.3887939453125, -1.3326568603515625, -1.276519775390625, -1.2203826904296875, -1.16424560546875, -1.1081085205078125, -1.051971435546875, -0.9958343505859375, -0.939697265625, -0.8835601806640625, -0.827423095703125, -0.7712860107421875, -0.71514892578125, -0.6590118408203125, -0.602874755859375, -0.5467376708984375, -0.4906005859375, -0.4344635009765625, -0.378326416015625, -0.3221893310546875, -0.26605224609375, -0.2099151611328125, -0.153778076171875, -0.0976409912109375, -0.04150390625, 0.0146331787109375, 0.070770263671875, 0.1269073486328125, 0.18304443359375, 0.2391815185546875, 0.295318603515625, 0.3514556884765625, 0.4075927734375, 0.4637298583984375, 0.519866943359375, 0.5760040283203125, 0.63214111328125, 0.6882781982421875, 0.744415283203125, 0.8005523681640625, 0.856689453125, 0.9128265380859375, 0.968963623046875, 1.0251007080078125, 1.08123779296875, 1.1373748779296875, 1.193511962890625, 1.2496490478515625, 1.3057861328125, 1.3619232177734375, 1.418060302734375, 1.4741973876953125, 1.53033447265625, 1.5864715576171875, 1.642608642578125, 1.6987457275390625, 1.7548828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 8.0, 11.0, 21.0, 23.0, 32.0, 51.0, 40.0, 46.0, 62.0, 70.0, 98.0, 97.0, 103.0, 76.0, 58.0, 55.0, 35.0, 28.0, 20.0, 12.0, 8.0, 11.0, 6.0, 7.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2509765625, -1.2013702392578125, -1.151763916015625, -1.1021575927734375, -1.05255126953125, -1.0029449462890625, -0.953338623046875, -0.9037322998046875, -0.8541259765625, -0.8045196533203125, -0.754913330078125, -0.7053070068359375, -0.65570068359375, -0.6060943603515625, -0.556488037109375, -0.5068817138671875, -0.457275390625, -0.4076690673828125, -0.358062744140625, -0.3084564208984375, -0.25885009765625, -0.2092437744140625, -0.159637451171875, -0.1100311279296875, -0.0604248046875, -0.0108184814453125, 0.038787841796875, 0.0883941650390625, 0.13800048828125, 0.1876068115234375, 0.237213134765625, 0.2868194580078125, 0.33642578125, 0.3860321044921875, 0.435638427734375, 0.4852447509765625, 0.53485107421875, 0.5844573974609375, 0.634063720703125, 0.6836700439453125, 0.7332763671875, 0.7828826904296875, 0.832489013671875, 0.8820953369140625, 0.93170166015625, 0.9813079833984375, 1.030914306640625, 1.0805206298828125, 1.130126953125, 1.1797332763671875, 1.229339599609375, 1.2789459228515625, 1.32855224609375, 1.3781585693359375, 1.427764892578125, 1.4773712158203125, 1.5269775390625, 1.5765838623046875, 1.626190185546875, 1.6757965087890625, 1.72540283203125, 1.7750091552734375, 1.824615478515625, 1.8742218017578125, 1.923828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 20.0, 45.0, 137.0, 259.0, 332.0, 118.0, 42.0, 13.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.91419982910156, -43.257564544677734, -41.600929260253906, -39.94429016113281, -38.287654876708984, -36.631019592285156, -34.97438430786133, -33.3177490234375, -31.661113739013672, -30.004478454589844, -28.347841262817383, -26.691205978393555, -25.034570693969727, -23.377933502197266, -21.721298217773438, -20.06466293334961, -18.40802574157715, -16.75139045715332, -15.094754219055176, -13.438117980957031, -11.781482696533203, -10.124846458435059, -8.468210220336914, -6.811574935913086, -5.154938697814941, -3.498302936553955, -1.8416669368743896, -0.18503093719482422, 1.471604824066162, 3.1282405853271484, 4.784876823425293, 6.441512107849121, 8.098148345947266, 9.75478458404541, 11.411419868469238, 13.068056106567383, 14.724691390991211, 16.381328582763672, 18.0379638671875, 19.694599151611328, 21.351234436035156, 23.007869720458984, 24.664506912231445, 26.321142196655273, 27.9777774810791, 29.634414672851562, 31.29104995727539, 32.94768524169922, 34.60432434082031, 36.26095962524414, 37.91759490966797, 39.57423400878906, 41.23086929321289, 42.88750457763672, 44.54413986206055, 46.200775146484375, 47.8574104309082, 49.51404571533203, 51.17068099975586, 52.82731628417969, 54.48395538330078, 56.14059066772461, 57.79722595214844, 59.453861236572266, 61.110496520996094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 7.0, 5.0, 3.0, 11.0, 13.0, 14.0, 18.0, 20.0, 18.0, 24.0, 28.0, 31.0, 21.0, 36.0, 39.0, 45.0, 75.0, 61.0, 72.0, 54.0, 47.0, 44.0, 40.0, 47.0, 37.0, 29.0, 21.0, 23.0, 18.0, 19.0, 5.0, 7.0, 13.0, 7.0, 5.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.38871955871582, -19.800575256347656, -19.21242904663086, -18.624284744262695, -18.03614044189453, -17.447994232177734, -16.85984992980957, -16.271705627441406, -15.683560371398926, -15.095415115356445, -14.507270812988281, -13.9191255569458, -13.33098030090332, -12.742835998535156, -12.154690742492676, -11.566545486450195, -10.978401184082031, -10.39025592803955, -9.802111625671387, -9.213966369628906, -8.625822067260742, -8.037676811218262, -7.449531555175781, -6.861386775970459, -6.273241996765137, -5.6850972175598145, -5.096952438354492, -4.508807182312012, -3.9206624031066895, -3.332517623901367, -2.744372606277466, -2.1562275886535645, -1.5680828094482422, -0.9799379110336304, -0.39179301261901855, 0.19635188579559326, 0.7844967842102051, 1.3726415634155273, 1.9607865810394287, 2.54893159866333, 3.1370763778686523, 3.7252211570739746, 4.313365936279297, 4.901511192321777, 5.4896559715271, 6.077800750732422, 6.665946006774902, 7.254090785980225, 7.842235565185547, 8.430380821228027, 9.018525123596191, 9.606670379638672, 10.194814682006836, 10.782959938049316, 11.371105194091797, 11.959249496459961, 12.547394752502441, 13.135540008544922, 13.723684310913086, 14.311829566955566, 14.899974822998047, 15.488119125366211, 16.076263427734375, 16.664409637451172, 17.252553939819336]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 14.0, 4.0, 17.0, 14.0, 32.0, 46.0, 65.0, 105.0, 171.0, 347.0, 572.0, 1116.0, 2285.0, 5187.0, 13885.0, 46669.0, 280810.0, 2857123.0, 860164.0, 88308.0, 22341.0, 8054.0, 3509.0, 1555.0, 809.0, 431.0, 237.0, 139.0, 103.0, 47.0, 36.0, 26.0, 17.0, 11.0, 7.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.322265625, -2.2606964111328125, -2.199127197265625, -2.1375579833984375, -2.07598876953125, -2.0144195556640625, -1.952850341796875, -1.8912811279296875, -1.8297119140625, -1.7681427001953125, -1.706573486328125, -1.6450042724609375, -1.58343505859375, -1.5218658447265625, -1.460296630859375, -1.3987274169921875, -1.337158203125, -1.2755889892578125, -1.214019775390625, -1.1524505615234375, -1.09088134765625, -1.0293121337890625, -0.967742919921875, -0.9061737060546875, -0.8446044921875, -0.7830352783203125, -0.721466064453125, -0.6598968505859375, -0.59832763671875, -0.5367584228515625, -0.475189208984375, -0.4136199951171875, -0.35205078125, -0.2904815673828125, -0.228912353515625, -0.1673431396484375, -0.10577392578125, -0.0442047119140625, 0.017364501953125, 0.0789337158203125, 0.1405029296875, 0.2020721435546875, 0.263641357421875, 0.3252105712890625, 0.38677978515625, 0.4483489990234375, 0.509918212890625, 0.5714874267578125, 0.633056640625, 0.6946258544921875, 0.756195068359375, 0.8177642822265625, 0.87933349609375, 0.9409027099609375, 1.002471923828125, 1.0640411376953125, 1.1256103515625, 1.1871795654296875, 1.248748779296875, 1.3103179931640625, 1.37188720703125, 1.4334564208984375, 1.495025634765625, 1.5565948486328125, 1.6181640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 6.0, 8.0, 7.0, 12.0, 22.0, 18.0, 21.0, 9.0, 27.0, 44.0, 29.0, 57.0, 44.0, 38.0, 39.0, 40.0, 48.0, 56.0, 44.0, 47.0, 36.0, 30.0, 42.0, 34.0, 34.0, 27.0, 33.0, 17.0, 19.0, 21.0, 19.0, 18.0, 5.0, 13.0, 3.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.974609375, -0.946258544921875, -0.91790771484375, -0.889556884765625, -0.8612060546875, -0.832855224609375, -0.80450439453125, -0.776153564453125, -0.747802734375, -0.719451904296875, -0.69110107421875, -0.662750244140625, -0.6343994140625, -0.606048583984375, -0.57769775390625, -0.549346923828125, -0.52099609375, -0.492645263671875, -0.46429443359375, -0.435943603515625, -0.4075927734375, -0.379241943359375, -0.35089111328125, -0.322540283203125, -0.294189453125, -0.265838623046875, -0.23748779296875, -0.209136962890625, -0.1807861328125, -0.152435302734375, -0.12408447265625, -0.095733642578125, -0.0673828125, -0.039031982421875, -0.01068115234375, 0.017669677734375, 0.0460205078125, 0.074371337890625, 0.10272216796875, 0.131072998046875, 0.159423828125, 0.187774658203125, 0.21612548828125, 0.244476318359375, 0.2728271484375, 0.301177978515625, 0.32952880859375, 0.357879638671875, 0.38623046875, 0.414581298828125, 0.44293212890625, 0.471282958984375, 0.4996337890625, 0.527984619140625, 0.55633544921875, 0.584686279296875, 0.613037109375, 0.641387939453125, 0.66973876953125, 0.698089599609375, 0.7264404296875, 0.754791259765625, 0.78314208984375, 0.811492919921875, 0.83984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 11.0, 7.0, 14.0, 19.0, 33.0, 52.0, 112.0, 202.0, 403.0, 977.0, 2686.0, 10145.0, 71027.0, 3358187.0, 709422.0, 31857.0, 6075.0, 1750.0, 642.0, 284.0, 156.0, 78.0, 51.0, 28.0, 21.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.77734375, -5.6114501953125, -5.445556640625, -5.2796630859375, -5.11376953125, -4.9478759765625, -4.781982421875, -4.6160888671875, -4.4501953125, -4.2843017578125, -4.118408203125, -3.9525146484375, -3.78662109375, -3.6207275390625, -3.454833984375, -3.2889404296875, -3.123046875, -2.9571533203125, -2.791259765625, -2.6253662109375, -2.45947265625, -2.2935791015625, -2.127685546875, -1.9617919921875, -1.7958984375, -1.6300048828125, -1.464111328125, -1.2982177734375, -1.13232421875, -0.9664306640625, -0.800537109375, -0.6346435546875, -0.46875, -0.3028564453125, -0.136962890625, 0.0289306640625, 0.19482421875, 0.3607177734375, 0.526611328125, 0.6925048828125, 0.8583984375, 1.0242919921875, 1.190185546875, 1.3560791015625, 1.52197265625, 1.6878662109375, 1.853759765625, 2.0196533203125, 2.185546875, 2.3514404296875, 2.517333984375, 2.6832275390625, 2.84912109375, 3.0150146484375, 3.180908203125, 3.3468017578125, 3.5126953125, 3.6785888671875, 3.844482421875, 4.0103759765625, 4.17626953125, 4.3421630859375, 4.508056640625, 4.6739501953125, 4.83984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 5.0, 11.0, 7.0, 15.0, 22.0, 26.0, 48.0, 91.0, 165.0, 365.0, 837.0, 1236.0, 639.0, 259.0, 138.0, 62.0, 50.0, 28.0, 23.0, 10.0, 9.0, 4.0, 8.0, 2.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.87078857421875, -3.7181396484375, -3.56549072265625, -3.412841796875, -3.26019287109375, -3.1075439453125, -2.95489501953125, -2.80224609375, -2.64959716796875, -2.4969482421875, -2.34429931640625, -2.191650390625, -2.03900146484375, -1.8863525390625, -1.73370361328125, -1.5810546875, -1.42840576171875, -1.2757568359375, -1.12310791015625, -0.970458984375, -0.81781005859375, -0.6651611328125, -0.51251220703125, -0.35986328125, -0.20721435546875, -0.0545654296875, 0.09808349609375, 0.250732421875, 0.40338134765625, 0.5560302734375, 0.70867919921875, 0.861328125, 1.01397705078125, 1.1666259765625, 1.31927490234375, 1.471923828125, 1.62457275390625, 1.7772216796875, 1.92987060546875, 2.08251953125, 2.23516845703125, 2.3878173828125, 2.54046630859375, 2.693115234375, 2.84576416015625, 2.9984130859375, 3.15106201171875, 3.3037109375, 3.45635986328125, 3.6090087890625, 3.76165771484375, 3.914306640625, 4.06695556640625, 4.2196044921875, 4.37225341796875, 4.52490234375, 4.67755126953125, 4.8302001953125, 4.98284912109375, 5.135498046875, 5.28814697265625, 5.4407958984375, 5.59344482421875, 5.74609375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 7.0, 29.0, 38.0, 85.0, 214.0, 274.0, 201.0, 83.0, 42.0, 9.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.968963623046875, -46.44316864013672, -44.9173698425293, -43.39157485961914, -41.86577606201172, -40.33998107910156, -38.814186096191406, -37.288387298583984, -35.76258850097656, -34.236793518066406, -32.710994720458984, -31.185199737548828, -29.659400939941406, -28.13360595703125, -26.60780906677246, -25.082012176513672, -23.556217193603516, -22.030420303344727, -20.504623413085938, -18.97882843017578, -17.45302963256836, -15.927233695983887, -14.401437759399414, -12.875640869140625, -11.349843978881836, -9.824047088623047, -8.298250198364258, -6.772454261779785, -5.246657371520996, -3.720860481262207, -2.1950645446777344, -0.6692676544189453, 0.8565292358398438, 2.3823258876800537, 3.9081225395202637, 5.4339189529418945, 6.959715843200684, 8.485512733459473, 10.011308670043945, 11.537105560302734, 13.062902450561523, 14.588699340820312, 16.1144962310791, 17.64029312133789, 19.166088104248047, 20.69188690185547, 22.217681884765625, 23.743478775024414, 25.269275665283203, 26.795072555541992, 28.32086944580078, 29.846664428710938, 31.37246322631836, 32.898258209228516, 34.42405700683594, 35.949851989746094, 37.47564697265625, 39.001441955566406, 40.52724075317383, 42.053035736083984, 43.578834533691406, 45.10462951660156, 46.63042449951172, 48.15622329711914, 49.68202209472656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 6.0, 2.0, 7.0, 10.0, 10.0, 11.0, 21.0, 24.0, 26.0, 32.0, 33.0, 35.0, 39.0, 54.0, 45.0, 48.0, 45.0, 52.0, 52.0, 54.0, 51.0, 45.0, 34.0, 40.0, 44.0, 23.0, 28.0, 23.0, 18.0, 13.0, 15.0, 15.0, 6.0, 9.0, 11.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.264839172363281, -14.776976585388184, -14.289114952087402, -13.801252365112305, -13.313390731811523, -12.825528144836426, -12.337665557861328, -11.849803924560547, -11.36194133758545, -10.874078750610352, -10.38621711730957, -9.898354530334473, -9.410491943359375, -8.922630310058594, -8.434767723083496, -7.946905612945557, -7.459043502807617, -6.971181392669678, -6.483319282531738, -5.995456695556641, -5.507594585418701, -5.019732475280762, -4.531869888305664, -4.044007778167725, -3.556145668029785, -3.0682835578918457, -2.580421209335327, -2.0925588607788086, -1.6046967506408691, -1.1168346405029297, -0.6289722919464111, -0.14110994338989258, 0.3467531204223633, 0.8346153497695923, 1.3224775791168213, 1.8103398084640503, 2.2982020378112793, 2.7860641479492188, 3.2739264965057373, 3.761788845062256, 4.249650955200195, 4.737513065338135, 5.225375175476074, 5.713237762451172, 6.201099872589111, 6.688961982727051, 7.176824569702148, 7.664686679840088, 8.152548789978027, 8.640411376953125, 9.128273010253906, 9.616135597229004, 10.103998184204102, 10.591859817504883, 11.07972240447998, 11.567584991455078, 12.05544662475586, 12.543309211730957, 13.031170845031738, 13.519033432006836, 14.006895065307617, 14.494757652282715, 14.982620239257812, 15.470481872558594, 15.958344459533691]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 13.0, 8.0, 17.0, 17.0, 31.0, 49.0, 73.0, 109.0, 182.0, 347.0, 600.0, 1132.0, 2320.0, 4842.0, 13206.0, 55373.0, 384043.0, 485018.0, 74362.0, 15833.0, 5630.0, 2475.0, 1240.0, 664.0, 349.0, 237.0, 127.0, 81.0, 50.0, 38.0, 23.0, 19.0, 6.0, 7.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7734375, -2.686981201171875, -2.60052490234375, -2.514068603515625, -2.4276123046875, -2.341156005859375, -2.25469970703125, -2.168243408203125, -2.081787109375, -1.995330810546875, -1.90887451171875, -1.822418212890625, -1.7359619140625, -1.649505615234375, -1.56304931640625, -1.476593017578125, -1.39013671875, -1.303680419921875, -1.21722412109375, -1.130767822265625, -1.0443115234375, -0.957855224609375, -0.87139892578125, -0.784942626953125, -0.698486328125, -0.612030029296875, -0.52557373046875, -0.439117431640625, -0.3526611328125, -0.266204833984375, -0.17974853515625, -0.093292236328125, -0.0068359375, 0.079620361328125, 0.16607666015625, 0.252532958984375, 0.3389892578125, 0.425445556640625, 0.51190185546875, 0.598358154296875, 0.684814453125, 0.771270751953125, 0.85772705078125, 0.944183349609375, 1.0306396484375, 1.117095947265625, 1.20355224609375, 1.290008544921875, 1.37646484375, 1.462921142578125, 1.54937744140625, 1.635833740234375, 1.7222900390625, 1.808746337890625, 1.89520263671875, 1.981658935546875, 2.068115234375, 2.154571533203125, 2.24102783203125, 2.327484130859375, 2.4139404296875, 2.500396728515625, 2.58685302734375, 2.673309326171875, 2.759765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 7.0, 3.0, 7.0, 7.0, 9.0, 17.0, 13.0, 22.0, 18.0, 27.0, 31.0, 34.0, 38.0, 38.0, 44.0, 46.0, 47.0, 38.0, 44.0, 51.0, 53.0, 44.0, 49.0, 34.0, 33.0, 43.0, 28.0, 39.0, 23.0, 21.0, 21.0, 15.0, 11.0, 9.0, 6.0, 12.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.16796875, -1.1329345703125, -1.097900390625, -1.0628662109375, -1.02783203125, -0.9927978515625, -0.957763671875, -0.9227294921875, -0.8876953125, -0.8526611328125, -0.817626953125, -0.7825927734375, -0.74755859375, -0.7125244140625, -0.677490234375, -0.6424560546875, -0.607421875, -0.5723876953125, -0.537353515625, -0.5023193359375, -0.46728515625, -0.4322509765625, -0.397216796875, -0.3621826171875, -0.3271484375, -0.2921142578125, -0.257080078125, -0.2220458984375, -0.18701171875, -0.1519775390625, -0.116943359375, -0.0819091796875, -0.046875, -0.0118408203125, 0.023193359375, 0.0582275390625, 0.09326171875, 0.1282958984375, 0.163330078125, 0.1983642578125, 0.2333984375, 0.2684326171875, 0.303466796875, 0.3385009765625, 0.37353515625, 0.4085693359375, 0.443603515625, 0.4786376953125, 0.513671875, 0.5487060546875, 0.583740234375, 0.6187744140625, 0.65380859375, 0.6888427734375, 0.723876953125, 0.7589111328125, 0.7939453125, 0.8289794921875, 0.864013671875, 0.8990478515625, 0.93408203125, 0.9691162109375, 1.004150390625, 1.0391845703125, 1.07421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 13.0, 18.0, 16.0, 50.0, 68.0, 111.0, 229.0, 418.0, 998.0, 2671.0, 10662.0, 158252.0, 831789.0, 35182.0, 5263.0, 1571.0, 612.0, 280.0, 142.0, 77.0, 42.0, 32.0, 10.0, 11.0, 7.0, 4.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.92132568359375, -3.7528076171875, -3.58428955078125, -3.415771484375, -3.24725341796875, -3.0787353515625, -2.91021728515625, -2.74169921875, -2.57318115234375, -2.4046630859375, -2.23614501953125, -2.067626953125, -1.89910888671875, -1.7305908203125, -1.56207275390625, -1.3935546875, -1.22503662109375, -1.0565185546875, -0.88800048828125, -0.719482421875, -0.55096435546875, -0.3824462890625, -0.21392822265625, -0.04541015625, 0.12310791015625, 0.2916259765625, 0.46014404296875, 0.628662109375, 0.79718017578125, 0.9656982421875, 1.13421630859375, 1.302734375, 1.47125244140625, 1.6397705078125, 1.80828857421875, 1.976806640625, 2.14532470703125, 2.3138427734375, 2.48236083984375, 2.65087890625, 2.81939697265625, 2.9879150390625, 3.15643310546875, 3.324951171875, 3.49346923828125, 3.6619873046875, 3.83050537109375, 3.9990234375, 4.16754150390625, 4.3360595703125, 4.50457763671875, 4.673095703125, 4.84161376953125, 5.0101318359375, 5.17864990234375, 5.34716796875, 5.51568603515625, 5.6842041015625, 5.85272216796875, 6.021240234375, 6.18975830078125, 6.3582763671875, 6.52679443359375, 6.6953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 5.0, 17.0, 20.0, 25.0, 33.0, 47.0, 42.0, 47.0, 63.0, 59.0, 71.0, 63.0, 71.0, 76.0, 56.0, 59.0, 54.0, 40.0, 33.0, 28.0, 20.0, 16.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.63427734375, -7.4287109375, -7.22314453125, -7.017578125, -6.81201171875, -6.6064453125, -6.40087890625, -6.1953125, -5.98974609375, -5.7841796875, -5.57861328125, -5.373046875, -5.16748046875, -4.9619140625, -4.75634765625, -4.55078125, -4.34521484375, -4.1396484375, -3.93408203125, -3.728515625, -3.52294921875, -3.3173828125, -3.11181640625, -2.90625, -2.70068359375, -2.4951171875, -2.28955078125, -2.083984375, -1.87841796875, -1.6728515625, -1.46728515625, -1.26171875, -1.05615234375, -0.8505859375, -0.64501953125, -0.439453125, -0.23388671875, -0.0283203125, 0.17724609375, 0.3828125, 0.58837890625, 0.7939453125, 0.99951171875, 1.205078125, 1.41064453125, 1.6162109375, 1.82177734375, 2.02734375, 2.23291015625, 2.4384765625, 2.64404296875, 2.849609375, 3.05517578125, 3.2607421875, 3.46630859375, 3.671875, 3.87744140625, 4.0830078125, 4.28857421875, 4.494140625, 4.69970703125, 4.9052734375, 5.11083984375, 5.31640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 11.0, 16.0, 19.0, 37.0, 44.0, 65.0, 132.0, 235.0, 516.0, 1061.0, 2983.0, 8356.0, 30517.0, 155096.0, 677365.0, 132679.0, 27119.0, 7545.0, 2762.0, 997.0, 459.0, 209.0, 117.0, 78.0, 43.0, 26.0, 17.0, 7.0, 17.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4931640625, -1.4485321044921875, -1.403900146484375, -1.3592681884765625, -1.31463623046875, -1.2700042724609375, -1.225372314453125, -1.1807403564453125, -1.1361083984375, -1.0914764404296875, -1.046844482421875, -1.0022125244140625, -0.95758056640625, -0.9129486083984375, -0.868316650390625, -0.8236846923828125, -0.779052734375, -0.7344207763671875, -0.689788818359375, -0.6451568603515625, -0.60052490234375, -0.5558929443359375, -0.511260986328125, -0.4666290283203125, -0.4219970703125, -0.3773651123046875, -0.332733154296875, -0.2881011962890625, -0.24346923828125, -0.1988372802734375, -0.154205322265625, -0.1095733642578125, -0.06494140625, -0.0203094482421875, 0.024322509765625, 0.0689544677734375, 0.11358642578125, 0.1582183837890625, 0.202850341796875, 0.2474822998046875, 0.2921142578125, 0.3367462158203125, 0.381378173828125, 0.4260101318359375, 0.47064208984375, 0.5152740478515625, 0.559906005859375, 0.6045379638671875, 0.649169921875, 0.6938018798828125, 0.738433837890625, 0.7830657958984375, 0.82769775390625, 0.8723297119140625, 0.916961669921875, 0.9615936279296875, 1.0062255859375, 1.0508575439453125, 1.095489501953125, 1.1401214599609375, 1.18475341796875, 1.2293853759765625, 1.274017333984375, 1.3186492919921875, 1.36328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 14.0, 24.0, 14.0, 18.0, 25.0, 38.0, 54.0, 67.0, 95.0, 123.0, 109.0, 95.0, 96.0, 60.0, 37.0, 21.0, 23.0, 12.0, 13.0, 7.0, 9.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003027915954589844, -0.0002917088568210602, -0.000280626118183136, -0.0002695433795452118, -0.0002584606409072876, -0.0002473779022693634, -0.0002362951636314392, -0.00022521242499351501, -0.00021412968635559082, -0.00020304694771766663, -0.00019196420907974243, -0.00018088147044181824, -0.00016979873180389404, -0.00015871599316596985, -0.00014763325452804565, -0.00013655051589012146, -0.00012546777725219727, -0.00011438503861427307, -0.00010330229997634888, -9.221956133842468e-05, -8.113682270050049e-05, -7.00540840625763e-05, -5.89713454246521e-05, -4.7888606786727905e-05, -3.680586814880371e-05, -2.5723129510879517e-05, -1.4640390872955322e-05, -3.557652235031128e-06, 7.525086402893066e-06, 1.860782504081726e-05, 2.9690563678741455e-05, 4.077330231666565e-05, 5.1856040954589844e-05, 6.293877959251404e-05, 7.402151823043823e-05, 8.510425686836243e-05, 9.618699550628662e-05, 0.00010726973414421082, 0.00011835247278213501, 0.0001294352114200592, 0.0001405179500579834, 0.0001516006886959076, 0.0001626834273338318, 0.00017376616597175598, 0.00018484890460968018, 0.00019593164324760437, 0.00020701438188552856, 0.00021809712052345276, 0.00022917985916137695, 0.00024026259779930115, 0.00025134533643722534, 0.00026242807507514954, 0.00027351081371307373, 0.0002845935523509979, 0.0002956762909889221, 0.0003067590296268463, 0.0003178417682647705, 0.0003289245069026947, 0.0003400072455406189, 0.0003510899841785431, 0.0003621727228164673, 0.0003732554614543915, 0.0003843382000923157, 0.00039542093873023987, 0.00040650367736816406]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 5.0, 10.0, 8.0, 19.0, 27.0, 43.0, 77.0, 184.0, 414.0, 1089.0, 3897.0, 19213.0, 192914.0, 756605.0, 61739.0, 8902.0, 2194.0, 697.0, 260.0, 120.0, 55.0, 33.0, 17.0, 19.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.740234375, -1.67138671875, -1.6025390625, -1.53369140625, -1.46484375, -1.39599609375, -1.3271484375, -1.25830078125, -1.189453125, -1.12060546875, -1.0517578125, -0.98291015625, -0.9140625, -0.84521484375, -0.7763671875, -0.70751953125, -0.638671875, -0.56982421875, -0.5009765625, -0.43212890625, -0.36328125, -0.29443359375, -0.2255859375, -0.15673828125, -0.087890625, -0.01904296875, 0.0498046875, 0.11865234375, 0.1875, 0.25634765625, 0.3251953125, 0.39404296875, 0.462890625, 0.53173828125, 0.6005859375, 0.66943359375, 0.73828125, 0.80712890625, 0.8759765625, 0.94482421875, 1.013671875, 1.08251953125, 1.1513671875, 1.22021484375, 1.2890625, 1.35791015625, 1.4267578125, 1.49560546875, 1.564453125, 1.63330078125, 1.7021484375, 1.77099609375, 1.83984375, 1.90869140625, 1.9775390625, 2.04638671875, 2.115234375, 2.18408203125, 2.2529296875, 2.32177734375, 2.390625, 2.45947265625, 2.5283203125, 2.59716796875, 2.666015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 7.0, 5.0, 12.0, 18.0, 20.0, 22.0, 39.0, 53.0, 74.0, 101.0, 108.0, 98.0, 91.0, 100.0, 63.0, 51.0, 35.0, 34.0, 18.0, 12.0, 12.0, 9.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.250518798828125, -1.19927978515625, -1.148040771484375, -1.0968017578125, -1.045562744140625, -0.99432373046875, -0.943084716796875, -0.891845703125, -0.840606689453125, -0.78936767578125, -0.738128662109375, -0.6868896484375, -0.635650634765625, -0.58441162109375, -0.533172607421875, -0.48193359375, -0.430694580078125, -0.37945556640625, -0.328216552734375, -0.2769775390625, -0.225738525390625, -0.17449951171875, -0.123260498046875, -0.072021484375, -0.020782470703125, 0.03045654296875, 0.081695556640625, 0.1329345703125, 0.184173583984375, 0.23541259765625, 0.286651611328125, 0.337890625, 0.389129638671875, 0.44036865234375, 0.491607666015625, 0.5428466796875, 0.594085693359375, 0.64532470703125, 0.696563720703125, 0.747802734375, 0.799041748046875, 0.85028076171875, 0.901519775390625, 0.9527587890625, 1.003997802734375, 1.05523681640625, 1.106475830078125, 1.15771484375, 1.208953857421875, 1.26019287109375, 1.311431884765625, 1.3626708984375, 1.413909912109375, 1.46514892578125, 1.516387939453125, 1.567626953125, 1.618865966796875, 1.67010498046875, 1.721343994140625, 1.7725830078125, 1.823822021484375, 1.87506103515625, 1.926300048828125, 1.9775390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 15.0, 22.0, 52.0, 84.0, 188.0, 295.0, 157.0, 79.0, 46.0, 17.0, 9.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.103439331054688, -23.07608985900879, -22.04874038696289, -21.02138900756836, -19.99403953552246, -18.966690063476562, -17.93933868408203, -16.911989212036133, -15.884639739990234, -14.857290267944336, -13.829939842224121, -12.802589416503906, -11.775239944458008, -10.74789047241211, -9.720540046691895, -8.69318962097168, -7.665840148925781, -6.638490200042725, -5.611140251159668, -4.583790302276611, -3.5564403533935547, -2.529090404510498, -1.5017404556274414, -0.47439050674438477, 0.5529594421386719, 1.5803093910217285, 2.607659339904785, 3.635009288787842, 4.662359237670898, 5.689709186553955, 6.717059135437012, 7.744409084320068, 8.771759033203125, 9.799108505249023, 10.826458930969238, 11.853809356689453, 12.881158828735352, 13.90850830078125, 14.935858726501465, 15.96320915222168, 16.990558624267578, 18.017908096313477, 19.045257568359375, 20.072608947753906, 21.099958419799805, 22.127307891845703, 23.154659271240234, 24.182008743286133, 25.20935821533203, 26.23670768737793, 27.264057159423828, 28.29140853881836, 29.318758010864258, 30.346107482910156, 31.373458862304688, 32.40080642700195, 33.428157806396484, 34.455509185791016, 35.48285675048828, 36.51020812988281, 37.537559509277344, 38.56490707397461, 39.59225845336914, 40.619606018066406, 41.64695739746094]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 10.0, 6.0, 5.0, 4.0, 13.0, 8.0, 17.0, 17.0, 15.0, 17.0, 22.0, 31.0, 27.0, 22.0, 32.0, 44.0, 57.0, 56.0, 59.0, 67.0, 69.0, 62.0, 44.0, 35.0, 33.0, 33.0, 20.0, 24.0, 25.0, 15.0, 16.0, 16.0, 14.0, 16.0, 10.0, 5.0, 9.0, 5.0, 8.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.634265899658203, -18.070852279663086, -17.507436752319336, -16.94402313232422, -16.38060760498047, -15.817193984985352, -15.253779411315918, -14.690364837646484, -14.12695026397705, -13.563535690307617, -13.000121116638184, -12.43670654296875, -11.873292922973633, -11.309877395629883, -10.746463775634766, -10.183049201965332, -9.619634628295898, -9.056220054626465, -8.492805480957031, -7.929391384124756, -7.365976810455322, -6.802562236785889, -6.239148139953613, -5.67573356628418, -5.112318992614746, -4.5489044189453125, -3.985490083694458, -3.4220757484436035, -2.85866117477417, -2.2952466011047363, -1.7318322658538818, -1.1684179306030273, -0.6050033569335938, -0.04158890247344971, 0.5218255519866943, 1.0852400064468384, 1.6486544609069824, 2.212069034576416, 2.7754833698272705, 3.338897705078125, 3.9023122787475586, 4.465726852416992, 5.029141426086426, 5.592555522918701, 6.155970096588135, 6.719384670257568, 7.282798767089844, 7.846213340759277, 8.409627914428711, 8.973042488098145, 9.536457061767578, 10.099871635437012, 10.663286209106445, 11.226699829101562, 11.790114402770996, 12.35352897644043, 12.916943550109863, 13.480358123779297, 14.04377269744873, 14.607187271118164, 15.170600891113281, 15.734016418457031, 16.29743003845215, 16.860843658447266, 17.424259185791016]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 14.0, 28.0, 27.0, 46.0, 88.0, 152.0, 310.0, 832.0, 2611.0, 11224.0, 95201.0, 3506553.0, 544080.0, 25539.0, 5020.0, 1481.0, 550.0, 250.0, 111.0, 57.0, 36.0, 18.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.16143798828125, -4.0416259765625, -3.92181396484375, -3.802001953125, -3.68218994140625, -3.5623779296875, -3.44256591796875, -3.32275390625, -3.20294189453125, -3.0831298828125, -2.96331787109375, -2.843505859375, -2.72369384765625, -2.6038818359375, -2.48406982421875, -2.3642578125, -2.24444580078125, -2.1246337890625, -2.00482177734375, -1.885009765625, -1.76519775390625, -1.6453857421875, -1.52557373046875, -1.40576171875, -1.28594970703125, -1.1661376953125, -1.04632568359375, -0.926513671875, -0.80670166015625, -0.6868896484375, -0.56707763671875, -0.447265625, -0.32745361328125, -0.2076416015625, -0.08782958984375, 0.031982421875, 0.15179443359375, 0.2716064453125, 0.39141845703125, 0.51123046875, 0.63104248046875, 0.7508544921875, 0.87066650390625, 0.990478515625, 1.11029052734375, 1.2301025390625, 1.34991455078125, 1.4697265625, 1.58953857421875, 1.7093505859375, 1.82916259765625, 1.948974609375, 2.06878662109375, 2.1885986328125, 2.30841064453125, 2.42822265625, 2.54803466796875, 2.6678466796875, 2.78765869140625, 2.907470703125, 3.02728271484375, 3.1470947265625, 3.26690673828125, 3.38671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 9.0, 11.0, 8.0, 18.0, 19.0, 20.0, 29.0, 21.0, 32.0, 37.0, 36.0, 46.0, 53.0, 45.0, 52.0, 56.0, 52.0, 49.0, 49.0, 45.0, 34.0, 39.0, 42.0, 36.0, 26.0, 23.0, 19.0, 15.0, 15.0, 11.0, 11.0, 12.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0403900146484375, -1.004608154296875, -0.9688262939453125, -0.93304443359375, -0.8972625732421875, -0.861480712890625, -0.8256988525390625, -0.7899169921875, -0.7541351318359375, -0.718353271484375, -0.6825714111328125, -0.64678955078125, -0.6110076904296875, -0.575225830078125, -0.5394439697265625, -0.503662109375, -0.4678802490234375, -0.432098388671875, -0.3963165283203125, -0.36053466796875, -0.3247528076171875, -0.288970947265625, -0.2531890869140625, -0.2174072265625, -0.1816253662109375, -0.145843505859375, -0.1100616455078125, -0.07427978515625, -0.0384979248046875, -0.002716064453125, 0.0330657958984375, 0.06884765625, 0.1046295166015625, 0.140411376953125, 0.1761932373046875, 0.21197509765625, 0.2477569580078125, 0.283538818359375, 0.3193206787109375, 0.3551025390625, 0.3908843994140625, 0.426666259765625, 0.4624481201171875, 0.49822998046875, 0.5340118408203125, 0.569793701171875, 0.6055755615234375, 0.641357421875, 0.6771392822265625, 0.712921142578125, 0.7487030029296875, 0.78448486328125, 0.8202667236328125, 0.856048583984375, 0.8918304443359375, 0.9276123046875, 0.9633941650390625, 0.999176025390625, 1.0349578857421875, 1.07073974609375, 1.1065216064453125, 1.142303466796875, 1.1780853271484375, 1.2138671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 3.0, 7.0, 10.0, 18.0, 20.0, 39.0, 49.0, 80.0, 170.0, 469.0, 1664.0, 7655.0, 64405.0, 3448975.0, 638635.0, 26201.0, 4183.0, 1031.0, 324.0, 130.0, 61.0, 45.0, 28.0, 20.0, 14.0, 11.0, 6.0, 6.0, 3.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.183349609375, -5.01513671875, -4.846923828125, -4.6787109375, -4.510498046875, -4.34228515625, -4.174072265625, -4.005859375, -3.837646484375, -3.66943359375, -3.501220703125, -3.3330078125, -3.164794921875, -2.99658203125, -2.828369140625, -2.66015625, -2.491943359375, -2.32373046875, -2.155517578125, -1.9873046875, -1.819091796875, -1.65087890625, -1.482666015625, -1.314453125, -1.146240234375, -0.97802734375, -0.809814453125, -0.6416015625, -0.473388671875, -0.30517578125, -0.136962890625, 0.03125, 0.199462890625, 0.36767578125, 0.535888671875, 0.7041015625, 0.872314453125, 1.04052734375, 1.208740234375, 1.376953125, 1.545166015625, 1.71337890625, 1.881591796875, 2.0498046875, 2.218017578125, 2.38623046875, 2.554443359375, 2.72265625, 2.890869140625, 3.05908203125, 3.227294921875, 3.3955078125, 3.563720703125, 3.73193359375, 3.900146484375, 4.068359375, 4.236572265625, 4.40478515625, 4.572998046875, 4.7412109375, 4.909423828125, 5.07763671875, 5.245849609375, 5.4140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 5.0, 9.0, 16.0, 14.0, 17.0, 19.0, 39.0, 55.0, 60.0, 110.0, 196.0, 406.0, 721.0, 930.0, 598.0, 323.0, 183.0, 125.0, 62.0, 49.0, 30.0, 25.0, 19.0, 15.0, 14.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.74609375, -3.64031982421875, -3.5345458984375, -3.42877197265625, -3.322998046875, -3.21722412109375, -3.1114501953125, -3.00567626953125, -2.89990234375, -2.79412841796875, -2.6883544921875, -2.58258056640625, -2.476806640625, -2.37103271484375, -2.2652587890625, -2.15948486328125, -2.0537109375, -1.94793701171875, -1.8421630859375, -1.73638916015625, -1.630615234375, -1.52484130859375, -1.4190673828125, -1.31329345703125, -1.20751953125, -1.10174560546875, -0.9959716796875, -0.89019775390625, -0.784423828125, -0.67864990234375, -0.5728759765625, -0.46710205078125, -0.361328125, -0.25555419921875, -0.1497802734375, -0.04400634765625, 0.061767578125, 0.16754150390625, 0.2733154296875, 0.37908935546875, 0.48486328125, 0.59063720703125, 0.6964111328125, 0.80218505859375, 0.907958984375, 1.01373291015625, 1.1195068359375, 1.22528076171875, 1.3310546875, 1.43682861328125, 1.5426025390625, 1.64837646484375, 1.754150390625, 1.85992431640625, 1.9656982421875, 2.07147216796875, 2.17724609375, 2.28302001953125, 2.3887939453125, 2.49456787109375, 2.600341796875, 2.70611572265625, 2.8118896484375, 2.91766357421875, 3.0234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 10.0, 19.0, 20.0, 43.0, 82.0, 156.0, 217.0, 176.0, 124.0, 73.0, 40.0, 12.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.242881774902344, -24.273448944091797, -23.304014205932617, -22.33458137512207, -21.36514663696289, -20.395713806152344, -19.426280975341797, -18.45684814453125, -17.48741340637207, -16.517980575561523, -15.548545837402344, -14.579113006591797, -13.609679222106934, -12.64024543762207, -11.670812606811523, -10.70137882232666, -9.731945037841797, -8.762511253356934, -7.7930779457092285, -6.823644638061523, -5.85421085357666, -4.884777069091797, -3.915343761444092, -2.9459104537963867, -1.9764766693115234, -1.0070431232452393, -0.03760957717895508, 0.9318239688873291, 1.9012575149536133, 2.8706912994384766, 3.8401246070861816, 4.809557914733887, 5.77899169921875, 6.748425483703613, 7.717858791351318, 8.687292098999023, 9.656725883483887, 10.62615966796875, 11.595592498779297, 12.56502628326416, 13.534460067749023, 14.503893852233887, 15.47332763671875, 16.442760467529297, 17.412193298339844, 18.381628036499023, 19.35106086730957, 20.32049560546875, 21.289928436279297, 22.259361267089844, 23.228796005249023, 24.19822883605957, 25.16766357421875, 26.137096405029297, 27.106529235839844, 28.07596206665039, 29.04539680480957, 30.014829635620117, 30.984264373779297, 31.953697204589844, 32.92313003540039, 33.89256286621094, 34.86199951171875, 35.8314323425293, 36.800865173339844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 11.0, 14.0, 5.0, 10.0, 12.0, 19.0, 14.0, 18.0, 27.0, 21.0, 33.0, 39.0, 31.0, 37.0, 45.0, 59.0, 34.0, 35.0, 40.0, 46.0, 53.0, 35.0, 34.0, 22.0, 34.0, 28.0, 27.0, 18.0, 23.0, 14.0, 26.0, 27.0, 13.0, 11.0, 8.0, 11.0, 6.0, 6.0, 7.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-11.434929847717285, -11.08916187286377, -10.74339485168457, -10.397626876831055, -10.051858901977539, -9.70609188079834, -9.360323905944824, -9.014556884765625, -8.66878890991211, -8.323020935058594, -7.9772539138793945, -7.631485939025879, -7.2857184410095215, -6.939950942993164, -6.594182968139648, -6.248415470123291, -5.902647972106934, -5.556880474090576, -5.211112976074219, -4.865345001220703, -4.519577503204346, -4.173810005187988, -3.8280422687530518, -3.4822745323181152, -3.136507034301758, -2.7907395362854004, -2.444971799850464, -2.0992040634155273, -1.75343656539917, -1.407668948173523, -1.061901330947876, -0.7161335945129395, -0.3703651428222656, -0.024597525596618652, 0.3211700916290283, 0.6669377088546753, 1.0127053260803223, 1.3584729433059692, 1.7042405605316162, 2.0500082969665527, 2.39577579498291, 2.7415432929992676, 3.087311029434204, 3.4330787658691406, 3.778846263885498, 4.1246137619018555, 4.470381736755371, 4.8161492347717285, 5.161916732788086, 5.507684230804443, 5.853451728820801, 6.199219703674316, 6.544987201690674, 6.890754699707031, 7.236522674560547, 7.582290172576904, 7.928057670593262, 8.273825645446777, 8.619592666625977, 8.965360641479492, 9.311128616333008, 9.656895637512207, 10.002663612365723, 10.348430633544922, 10.694198608398438]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 13.0, 11.0, 24.0, 36.0, 67.0, 115.0, 213.0, 381.0, 783.0, 1841.0, 5128.0, 21661.0, 240071.0, 700760.0, 62369.0, 9708.0, 2893.0, 1311.0, 530.0, 249.0, 164.0, 68.0, 55.0, 31.0, 21.0, 10.0, 10.0, 8.0, 8.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.35546875, -4.235321044921875, -4.11517333984375, -3.995025634765625, -3.8748779296875, -3.754730224609375, -3.63458251953125, -3.514434814453125, -3.394287109375, -3.274139404296875, -3.15399169921875, -3.033843994140625, -2.9136962890625, -2.793548583984375, -2.67340087890625, -2.553253173828125, -2.43310546875, -2.312957763671875, -2.19281005859375, -2.072662353515625, -1.9525146484375, -1.832366943359375, -1.71221923828125, -1.592071533203125, -1.471923828125, -1.351776123046875, -1.23162841796875, -1.111480712890625, -0.9913330078125, -0.871185302734375, -0.75103759765625, -0.630889892578125, -0.5107421875, -0.390594482421875, -0.27044677734375, -0.150299072265625, -0.0301513671875, 0.089996337890625, 0.21014404296875, 0.330291748046875, 0.450439453125, 0.570587158203125, 0.69073486328125, 0.810882568359375, 0.9310302734375, 1.051177978515625, 1.17132568359375, 1.291473388671875, 1.41162109375, 1.531768798828125, 1.65191650390625, 1.772064208984375, 1.8922119140625, 2.012359619140625, 2.13250732421875, 2.252655029296875, 2.372802734375, 2.492950439453125, 2.61309814453125, 2.733245849609375, 2.8533935546875, 2.973541259765625, 3.09368896484375, 3.213836669921875, 3.333984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 9.0, 6.0, 9.0, 8.0, 12.0, 12.0, 14.0, 15.0, 31.0, 26.0, 32.0, 35.0, 38.0, 41.0, 43.0, 49.0, 43.0, 53.0, 42.0, 64.0, 30.0, 56.0, 53.0, 40.0, 41.0, 27.0, 22.0, 27.0, 19.0, 21.0, 14.0, 16.0, 15.0, 8.0, 13.0, 3.0, 4.0, 6.0, 0.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9137039184570312, -0.8747711181640625, -0.8358383178710938, -0.796905517578125, -0.7579727172851562, -0.7190399169921875, -0.6801071166992188, -0.64117431640625, -0.6022415161132812, -0.5633087158203125, -0.5243759155273438, -0.485443115234375, -0.44651031494140625, -0.4075775146484375, -0.36864471435546875, -0.3297119140625, -0.29077911376953125, -0.2518463134765625, -0.21291351318359375, -0.173980712890625, -0.13504791259765625, -0.0961151123046875, -0.05718231201171875, -0.01824951171875, 0.02068328857421875, 0.0596160888671875, 0.09854888916015625, 0.137481689453125, 0.17641448974609375, 0.2153472900390625, 0.25428009033203125, 0.293212890625, 0.33214569091796875, 0.3710784912109375, 0.41001129150390625, 0.448944091796875, 0.48787689208984375, 0.5268096923828125, 0.5657424926757812, 0.60467529296875, 0.6436080932617188, 0.6825408935546875, 0.7214736938476562, 0.760406494140625, 0.7993392944335938, 0.8382720947265625, 0.8772048950195312, 0.9161376953125, 0.9550704956054688, 0.9940032958984375, 1.0329360961914062, 1.071868896484375, 1.1108016967773438, 1.1497344970703125, 1.1886672973632812, 1.22760009765625, 1.2665328979492188, 1.3054656982421875, 1.3443984985351562, 1.383331298828125, 1.4222640991210938, 1.4611968994140625, 1.5001296997070312, 1.5390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 22.0, 31.0, 43.0, 74.0, 121.0, 232.0, 491.0, 1112.0, 3246.0, 21969.0, 884376.0, 126691.0, 6877.0, 1769.0, 660.0, 374.0, 181.0, 90.0, 53.0, 43.0, 31.0, 22.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.7254638671875, -5.532958984375, -5.3404541015625, -5.14794921875, -4.9554443359375, -4.762939453125, -4.5704345703125, -4.3779296875, -4.1854248046875, -3.992919921875, -3.8004150390625, -3.60791015625, -3.4154052734375, -3.222900390625, -3.0303955078125, -2.837890625, -2.6453857421875, -2.452880859375, -2.2603759765625, -2.06787109375, -1.8753662109375, -1.682861328125, -1.4903564453125, -1.2978515625, -1.1053466796875, -0.912841796875, -0.7203369140625, -0.52783203125, -0.3353271484375, -0.142822265625, 0.0496826171875, 0.2421875, 0.4346923828125, 0.627197265625, 0.8197021484375, 1.01220703125, 1.2047119140625, 1.397216796875, 1.5897216796875, 1.7822265625, 1.9747314453125, 2.167236328125, 2.3597412109375, 2.55224609375, 2.7447509765625, 2.937255859375, 3.1297607421875, 3.322265625, 3.5147705078125, 3.707275390625, 3.8997802734375, 4.09228515625, 4.2847900390625, 4.477294921875, 4.6697998046875, 4.8623046875, 5.0548095703125, 5.247314453125, 5.4398193359375, 5.63232421875, 5.8248291015625, 6.017333984375, 6.2098388671875, 6.40234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 5.0, 12.0, 5.0, 10.0, 6.0, 8.0, 12.0, 25.0, 19.0, 25.0, 32.0, 34.0, 41.0, 46.0, 53.0, 55.0, 49.0, 52.0, 59.0, 54.0, 55.0, 55.0, 47.0, 44.0, 36.0, 29.0, 21.0, 15.0, 17.0, 17.0, 8.0, 10.0, 9.0, 7.0, 7.0, 12.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0], "bins": [-6.22265625, -6.06292724609375, -5.9031982421875, -5.74346923828125, -5.583740234375, -5.42401123046875, -5.2642822265625, -5.10455322265625, -4.94482421875, -4.78509521484375, -4.6253662109375, -4.46563720703125, -4.305908203125, -4.14617919921875, -3.9864501953125, -3.82672119140625, -3.6669921875, -3.50726318359375, -3.3475341796875, -3.18780517578125, -3.028076171875, -2.86834716796875, -2.7086181640625, -2.54888916015625, -2.38916015625, -2.22943115234375, -2.0697021484375, -1.90997314453125, -1.750244140625, -1.59051513671875, -1.4307861328125, -1.27105712890625, -1.111328125, -0.95159912109375, -0.7918701171875, -0.63214111328125, -0.472412109375, -0.31268310546875, -0.1529541015625, 0.00677490234375, 0.16650390625, 0.32623291015625, 0.4859619140625, 0.64569091796875, 0.805419921875, 0.96514892578125, 1.1248779296875, 1.28460693359375, 1.4443359375, 1.60406494140625, 1.7637939453125, 1.92352294921875, 2.083251953125, 2.24298095703125, 2.4027099609375, 2.56243896484375, 2.72216796875, 2.88189697265625, 3.0416259765625, 3.20135498046875, 3.361083984375, 3.52081298828125, 3.6805419921875, 3.84027099609375, 4.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 5.0, 16.0, 24.0, 26.0, 35.0, 72.0, 106.0, 196.0, 453.0, 949.0, 2232.0, 6047.0, 19308.0, 95687.0, 749444.0, 137177.0, 24793.0, 7098.0, 2676.0, 1081.0, 514.0, 248.0, 135.0, 84.0, 36.0, 35.0, 23.0, 12.0, 12.0, 5.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.3874053955078125, -1.346099853515625, -1.3047943115234375, -1.26348876953125, -1.2221832275390625, -1.180877685546875, -1.1395721435546875, -1.0982666015625, -1.0569610595703125, -1.015655517578125, -0.9743499755859375, -0.93304443359375, -0.8917388916015625, -0.850433349609375, -0.8091278076171875, -0.767822265625, -0.7265167236328125, -0.685211181640625, -0.6439056396484375, -0.60260009765625, -0.5612945556640625, -0.519989013671875, -0.4786834716796875, -0.4373779296875, -0.3960723876953125, -0.354766845703125, -0.3134613037109375, -0.27215576171875, -0.2308502197265625, -0.189544677734375, -0.1482391357421875, -0.10693359375, -0.0656280517578125, -0.024322509765625, 0.0169830322265625, 0.05828857421875, 0.0995941162109375, 0.140899658203125, 0.1822052001953125, 0.2235107421875, 0.2648162841796875, 0.306121826171875, 0.3474273681640625, 0.38873291015625, 0.4300384521484375, 0.471343994140625, 0.5126495361328125, 0.553955078125, 0.5952606201171875, 0.636566162109375, 0.6778717041015625, 0.71917724609375, 0.7604827880859375, 0.801788330078125, 0.8430938720703125, 0.8843994140625, 0.9257049560546875, 0.967010498046875, 1.0083160400390625, 1.04962158203125, 1.0909271240234375, 1.132232666015625, 1.1735382080078125, 1.21484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 3.0, 4.0, 8.0, 11.0, 25.0, 31.0, 59.0, 79.0, 112.0, 177.0, 166.0, 106.0, 82.0, 51.0, 26.0, 14.0, 6.0, 11.0, 5.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004391670227050781, -0.00042582303285598755, -0.00041247904300689697, -0.0003991350531578064, -0.0003857910633087158, -0.00037244707345962524, -0.00035910308361053467, -0.0003457590937614441, -0.0003324151039123535, -0.00031907111406326294, -0.00030572712421417236, -0.0002923831343650818, -0.0002790391445159912, -0.00026569515466690063, -0.00025235116481781006, -0.00023900717496871948, -0.0002256631851196289, -0.00021231919527053833, -0.00019897520542144775, -0.00018563121557235718, -0.0001722872257232666, -0.00015894323587417603, -0.00014559924602508545, -0.00013225525617599487, -0.0001189112663269043, -0.00010556727647781372, -9.222328662872314e-05, -7.887929677963257e-05, -6.553530693054199e-05, -5.2191317081451416e-05, -3.884732723236084e-05, -2.5503337383270264e-05, -1.2159347534179688e-05, 1.1846423149108887e-06, 1.4528632164001465e-05, 2.787262201309204e-05, 4.121661186218262e-05, 5.456060171127319e-05, 6.790459156036377e-05, 8.124858140945435e-05, 9.459257125854492e-05, 0.0001079365611076355, 0.00012128055095672607, 0.00013462454080581665, 0.00014796853065490723, 0.0001613125205039978, 0.00017465651035308838, 0.00018800050020217896, 0.00020134449005126953, 0.0002146884799003601, 0.00022803246974945068, 0.00024137645959854126, 0.00025472044944763184, 0.0002680644392967224, 0.000281408429145813, 0.00029475241899490356, 0.00030809640884399414, 0.0003214403986930847, 0.0003347843885421753, 0.00034812837839126587, 0.00036147236824035645, 0.000374816358089447, 0.0003881603479385376, 0.0004015043377876282, 0.00041484832763671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 8.0, 2.0, 5.0, 16.0, 16.0, 25.0, 55.0, 55.0, 95.0, 158.0, 323.0, 675.0, 1469.0, 4007.0, 13112.0, 62115.0, 697826.0, 223955.0, 31967.0, 7934.0, 2608.0, 1083.0, 468.0, 232.0, 104.0, 83.0, 39.0, 41.0, 26.0, 10.0, 13.0, 11.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.474578857421875, -1.42962646484375, -1.384674072265625, -1.3397216796875, -1.294769287109375, -1.24981689453125, -1.204864501953125, -1.159912109375, -1.114959716796875, -1.07000732421875, -1.025054931640625, -0.9801025390625, -0.935150146484375, -0.89019775390625, -0.845245361328125, -0.80029296875, -0.755340576171875, -0.71038818359375, -0.665435791015625, -0.6204833984375, -0.575531005859375, -0.53057861328125, -0.485626220703125, -0.440673828125, -0.395721435546875, -0.35076904296875, -0.305816650390625, -0.2608642578125, -0.215911865234375, -0.17095947265625, -0.126007080078125, -0.0810546875, -0.036102294921875, 0.00885009765625, 0.053802490234375, 0.0987548828125, 0.143707275390625, 0.18865966796875, 0.233612060546875, 0.278564453125, 0.323516845703125, 0.36846923828125, 0.413421630859375, 0.4583740234375, 0.503326416015625, 0.54827880859375, 0.593231201171875, 0.63818359375, 0.683135986328125, 0.72808837890625, 0.773040771484375, 0.8179931640625, 0.862945556640625, 0.90789794921875, 0.952850341796875, 0.997802734375, 1.042755126953125, 1.08770751953125, 1.132659912109375, 1.1776123046875, 1.222564697265625, 1.26751708984375, 1.312469482421875, 1.357421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 2.0, 1.0, 7.0, 7.0, 12.0, 11.0, 14.0, 22.0, 36.0, 35.0, 64.0, 79.0, 79.0, 92.0, 89.0, 80.0, 86.0, 72.0, 49.0, 33.0, 27.0, 18.0, 16.0, 12.0, 8.0, 9.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.28125, -1.2459716796875, -1.210693359375, -1.1754150390625, -1.14013671875, -1.1048583984375, -1.069580078125, -1.0343017578125, -0.9990234375, -0.9637451171875, -0.928466796875, -0.8931884765625, -0.85791015625, -0.8226318359375, -0.787353515625, -0.7520751953125, -0.716796875, -0.6815185546875, -0.646240234375, -0.6109619140625, -0.57568359375, -0.5404052734375, -0.505126953125, -0.4698486328125, -0.4345703125, -0.3992919921875, -0.364013671875, -0.3287353515625, -0.29345703125, -0.2581787109375, -0.222900390625, -0.1876220703125, -0.15234375, -0.1170654296875, -0.081787109375, -0.0465087890625, -0.01123046875, 0.0240478515625, 0.059326171875, 0.0946044921875, 0.1298828125, 0.1651611328125, 0.200439453125, 0.2357177734375, 0.27099609375, 0.3062744140625, 0.341552734375, 0.3768310546875, 0.412109375, 0.4473876953125, 0.482666015625, 0.5179443359375, 0.55322265625, 0.5885009765625, 0.623779296875, 0.6590576171875, 0.6943359375, 0.7296142578125, 0.764892578125, 0.8001708984375, 0.83544921875, 0.8707275390625, 0.906005859375, 0.9412841796875, 0.9765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 17.0, 59.0, 164.0, 426.0, 202.0, 85.0, 24.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.74911880493164, -52.103763580322266, -50.458404541015625, -48.81304931640625, -47.16769027709961, -45.522335052490234, -43.876976013183594, -42.23162078857422, -40.586265563964844, -38.94091033935547, -37.29555130004883, -35.65019607543945, -34.00483703613281, -32.35948181152344, -30.71412467956543, -29.068767547607422, -27.42340850830078, -25.778051376342773, -24.132694244384766, -22.48733901977539, -20.84197998046875, -19.196624755859375, -17.551267623901367, -15.90591049194336, -14.260553359985352, -12.615196228027344, -10.969839096069336, -9.324482917785645, -7.679125785827637, -6.033768653869629, -4.3884124755859375, -2.7430553436279297, -1.0976982116699219, 0.5476586818695068, 2.1930155754089355, 3.838372230529785, 5.483729362487793, 7.129086494445801, 8.774442672729492, 10.4197998046875, 12.065156936645508, 13.710514068603516, 15.355871200561523, 17.00122833251953, 18.646583557128906, 20.291942596435547, 21.937297821044922, 23.58265495300293, 25.228012084960938, 26.873369216918945, 28.518726348876953, 30.164081573486328, 31.80944061279297, 33.454795837402344, 35.10015106201172, 36.74551010131836, 38.390869140625, 40.036224365234375, 41.681583404541016, 43.32693862915039, 44.97229766845703, 46.617652893066406, 48.26300811767578, 49.90836715698242, 51.5537223815918]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 14.0, 10.0, 8.0, 12.0, 13.0, 21.0, 28.0, 18.0, 18.0, 32.0, 35.0, 34.0, 41.0, 59.0, 92.0, 87.0, 87.0, 50.0, 33.0, 42.0, 25.0, 21.0, 22.0, 27.0, 20.0, 30.0, 20.0, 10.0, 11.0, 12.0, 17.0, 7.0, 4.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.671428680419922, -18.113868713378906, -17.55630874633789, -16.998750686645508, -16.441190719604492, -15.883630752563477, -15.326070785522461, -14.768511772155762, -14.210952758789062, -13.653392791748047, -13.095833778381348, -12.538273811340332, -11.980714797973633, -11.423154830932617, -10.865594863891602, -10.308035850524902, -9.750475883483887, -9.192915916442871, -8.635356903076172, -8.077796936035156, -7.520237922668457, -6.962677955627441, -6.405118465423584, -5.847558975219727, -5.289999485015869, -4.732439994812012, -4.174880504608154, -3.6173207759857178, -3.0597612857818604, -2.502201795578003, -1.9446420669555664, -1.387082576751709, -0.8295230865478516, -0.27196353673934937, 0.28559601306915283, 0.8431556224822998, 1.4007151126861572, 1.9582746028900146, 2.515834331512451, 3.0733938217163086, 3.630953311920166, 4.188512802124023, 4.746072292327881, 5.303631782531738, 5.861191749572754, 6.418750762939453, 6.976310729980469, 7.533870220184326, 8.091429710388184, 8.6489896774292, 9.206548690795898, 9.764108657836914, 10.321667671203613, 10.879227638244629, 11.436786651611328, 11.994346618652344, 12.55190658569336, 13.109466552734375, 13.667025566101074, 14.22458553314209, 14.782144546508789, 15.339704513549805, 15.89726448059082, 16.454822540283203, 17.01238250732422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 3.0, 6.0, 12.0, 6.0, 18.0, 29.0, 51.0, 69.0, 102.0, 264.0, 642.0, 2232.0, 12864.0, 257163.0, 3761533.0, 146090.0, 10107.0, 2030.0, 582.0, 221.0, 116.0, 63.0, 29.0, 21.0, 13.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.70703125, -5.56927490234375, -5.4315185546875, -5.29376220703125, -5.156005859375, -5.01824951171875, -4.8804931640625, -4.74273681640625, -4.60498046875, -4.46722412109375, -4.3294677734375, -4.19171142578125, -4.053955078125, -3.91619873046875, -3.7784423828125, -3.64068603515625, -3.5029296875, -3.36517333984375, -3.2274169921875, -3.08966064453125, -2.951904296875, -2.81414794921875, -2.6763916015625, -2.53863525390625, -2.40087890625, -2.26312255859375, -2.1253662109375, -1.98760986328125, -1.849853515625, -1.71209716796875, -1.5743408203125, -1.43658447265625, -1.298828125, -1.16107177734375, -1.0233154296875, -0.88555908203125, -0.747802734375, -0.61004638671875, -0.4722900390625, -0.33453369140625, -0.19677734375, -0.05902099609375, 0.0787353515625, 0.21649169921875, 0.354248046875, 0.49200439453125, 0.6297607421875, 0.76751708984375, 0.9052734375, 1.04302978515625, 1.1807861328125, 1.31854248046875, 1.456298828125, 1.59405517578125, 1.7318115234375, 1.86956787109375, 2.00732421875, 2.14508056640625, 2.2828369140625, 2.42059326171875, 2.558349609375, 2.69610595703125, 2.8338623046875, 2.97161865234375, 3.109375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 3.0, 9.0, 10.0, 15.0, 11.0, 19.0, 20.0, 24.0, 25.0, 27.0, 49.0, 52.0, 45.0, 56.0, 55.0, 55.0, 62.0, 73.0, 47.0, 54.0, 58.0, 34.0, 26.0, 28.0, 34.0, 18.0, 15.0, 16.0, 14.0, 10.0, 12.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0753631591796875, -1.032562255859375, -0.9897613525390625, -0.94696044921875, -0.9041595458984375, -0.861358642578125, -0.8185577392578125, -0.7757568359375, -0.7329559326171875, -0.690155029296875, -0.6473541259765625, -0.60455322265625, -0.5617523193359375, -0.518951416015625, -0.4761505126953125, -0.433349609375, -0.3905487060546875, -0.347747802734375, -0.3049468994140625, -0.26214599609375, -0.2193450927734375, -0.176544189453125, -0.1337432861328125, -0.0909423828125, -0.0481414794921875, -0.005340576171875, 0.0374603271484375, 0.08026123046875, 0.1230621337890625, 0.165863037109375, 0.2086639404296875, 0.25146484375, 0.2942657470703125, 0.337066650390625, 0.3798675537109375, 0.42266845703125, 0.4654693603515625, 0.508270263671875, 0.5510711669921875, 0.5938720703125, 0.6366729736328125, 0.679473876953125, 0.7222747802734375, 0.76507568359375, 0.8078765869140625, 0.850677490234375, 0.8934783935546875, 0.936279296875, 0.9790802001953125, 1.021881103515625, 1.0646820068359375, 1.10748291015625, 1.1502838134765625, 1.193084716796875, 1.2358856201171875, 1.2786865234375, 1.3214874267578125, 1.364288330078125, 1.4070892333984375, 1.44989013671875, 1.4926910400390625, 1.535491943359375, 1.5782928466796875, 1.62109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 12.0, 9.0, 10.0, 16.0, 42.0, 49.0, 118.0, 222.0, 641.0, 1886.0, 9426.0, 144715.0, 3931305.0, 95773.0, 7458.0, 1635.0, 489.0, 216.0, 104.0, 51.0, 36.0, 18.0, 12.0, 8.0, 12.0, 1.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.5078125, -7.30181884765625, -7.0958251953125, -6.88983154296875, -6.683837890625, -6.47784423828125, -6.2718505859375, -6.06585693359375, -5.85986328125, -5.65386962890625, -5.4478759765625, -5.24188232421875, -5.035888671875, -4.82989501953125, -4.6239013671875, -4.41790771484375, -4.2119140625, -4.00592041015625, -3.7999267578125, -3.59393310546875, -3.387939453125, -3.18194580078125, -2.9759521484375, -2.76995849609375, -2.56396484375, -2.35797119140625, -2.1519775390625, -1.94598388671875, -1.739990234375, -1.53399658203125, -1.3280029296875, -1.12200927734375, -0.916015625, -0.71002197265625, -0.5040283203125, -0.29803466796875, -0.092041015625, 0.11395263671875, 0.3199462890625, 0.52593994140625, 0.73193359375, 0.93792724609375, 1.1439208984375, 1.34991455078125, 1.555908203125, 1.76190185546875, 1.9678955078125, 2.17388916015625, 2.3798828125, 2.58587646484375, 2.7918701171875, 2.99786376953125, 3.203857421875, 3.40985107421875, 3.6158447265625, 3.82183837890625, 4.02783203125, 4.23382568359375, 4.4398193359375, 4.64581298828125, 4.851806640625, 5.05780029296875, 5.2637939453125, 5.46978759765625, 5.67578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 11.0, 14.0, 24.0, 23.0, 46.0, 68.0, 87.0, 202.0, 392.0, 894.0, 1122.0, 577.0, 235.0, 144.0, 81.0, 51.0, 28.0, 29.0, 9.0, 6.0, 11.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.865234375, -3.717742919921875, -3.57025146484375, -3.422760009765625, -3.2752685546875, -3.127777099609375, -2.98028564453125, -2.832794189453125, -2.685302734375, -2.537811279296875, -2.39031982421875, -2.242828369140625, -2.0953369140625, -1.947845458984375, -1.80035400390625, -1.652862548828125, -1.50537109375, -1.357879638671875, -1.21038818359375, -1.062896728515625, -0.9154052734375, -0.767913818359375, -0.62042236328125, -0.472930908203125, -0.325439453125, -0.177947998046875, -0.03045654296875, 0.117034912109375, 0.2645263671875, 0.412017822265625, 0.55950927734375, 0.707000732421875, 0.8544921875, 1.001983642578125, 1.14947509765625, 1.296966552734375, 1.4444580078125, 1.591949462890625, 1.73944091796875, 1.886932373046875, 2.034423828125, 2.181915283203125, 2.32940673828125, 2.476898193359375, 2.6243896484375, 2.771881103515625, 2.91937255859375, 3.066864013671875, 3.21435546875, 3.361846923828125, 3.50933837890625, 3.656829833984375, 3.8043212890625, 3.951812744140625, 4.09930419921875, 4.246795654296875, 4.394287109375, 4.541778564453125, 4.68927001953125, 4.836761474609375, 4.9842529296875, 5.131744384765625, 5.27923583984375, 5.426727294921875, 5.57421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 4.0, 4.0, 4.0, 11.0, 14.0, 16.0, 22.0, 33.0, 64.0, 89.0, 118.0, 122.0, 148.0, 133.0, 78.0, 44.0, 27.0, 16.0, 14.0, 10.0, 12.0, 3.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.18642234802246, -24.4731502532959, -23.75988006591797, -23.046607971191406, -22.333335876464844, -21.62006378173828, -20.90679168701172, -20.19352149963379, -19.480249404907227, -18.766977310180664, -18.053707122802734, -17.340435028076172, -16.62716293334961, -15.913890838623047, -15.2006196975708, -14.487348556518555, -13.774076461791992, -13.06080436706543, -12.347533226013184, -11.634262084960938, -10.920989990234375, -10.207717895507812, -9.494446754455566, -8.78117561340332, -8.067903518676758, -7.3546319007873535, -6.641360282897949, -5.928088665008545, -5.214817047119141, -4.501545429229736, -3.788273811340332, -3.0750021934509277, -2.3617286682128906, -1.6484570503234863, -0.935185432434082, -0.22191381454467773, 0.49135780334472656, 1.2046294212341309, 1.9179010391235352, 2.6311726570129395, 3.3444442749023438, 4.057715892791748, 4.770987510681152, 5.484259128570557, 6.197530746459961, 6.910802364349365, 7.6240739822387695, 8.337345123291016, 9.050617218017578, 9.76388931274414, 10.477160453796387, 11.190431594848633, 11.903703689575195, 12.616975784301758, 13.330246925354004, 14.04351806640625, 14.756790161132812, 15.470062255859375, 16.183334350585938, 16.896604537963867, 17.60987663269043, 18.323148727416992, 19.036418914794922, 19.749691009521484, 20.462963104248047]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 8.0, 12.0, 13.0, 14.0, 15.0, 28.0, 27.0, 27.0, 39.0, 46.0, 49.0, 43.0, 56.0, 58.0, 63.0, 43.0, 52.0, 49.0, 39.0, 33.0, 32.0, 40.0, 31.0, 34.0, 27.0, 19.0, 11.0, 13.0, 10.0, 10.0, 9.0, 6.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.882389068603516, -16.36464500427246, -15.846901893615723, -15.329157829284668, -14.81141471862793, -14.293670654296875, -13.77592658996582, -13.258182525634766, -12.740439414978027, -12.222695350646973, -11.704952239990234, -11.18720817565918, -10.669464111328125, -10.151721000671387, -9.633976936340332, -9.116233825683594, -8.598489761352539, -8.080745697021484, -7.563002586364746, -7.045258522033691, -6.527514934539795, -6.009771347045898, -5.492027282714844, -4.974283695220947, -4.456540107727051, -3.9387965202331543, -3.4210526943206787, -2.903308868408203, -2.3855652809143066, -1.8678216934204102, -1.3500778675079346, -0.832334041595459, -0.3145904541015625, 0.20315325260162354, 0.7208969593048096, 1.2386406660079956, 1.7563843727111816, 2.274127960205078, 2.7918717861175537, 3.3096156120300293, 3.827359199523926, 4.345102787017822, 4.862846374511719, 5.380590438842773, 5.89833402633667, 6.416077613830566, 6.933821678161621, 7.451565265655518, 7.969308853149414, 8.487052917480469, 9.004796028137207, 9.522540092468262, 10.040283203125, 10.558027267456055, 11.07577133178711, 11.593515396118164, 12.111258506774902, 12.629002571105957, 13.146745681762695, 13.66448974609375, 14.182233810424805, 14.699976921081543, 15.217720985412598, 15.735464096069336, 16.25320816040039]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 1.0, 7.0, 10.0, 12.0, 27.0, 32.0, 47.0, 97.0, 174.0, 296.0, 571.0, 1116.0, 2541.0, 6736.0, 21124.0, 89565.0, 481625.0, 354047.0, 64608.0, 16128.0, 5500.0, 2149.0, 1074.0, 463.0, 257.0, 131.0, 83.0, 62.0, 26.0, 15.0, 12.0, 4.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.04669189453125, -1.9644775390625, -1.88226318359375, -1.800048828125, -1.71783447265625, -1.6356201171875, -1.55340576171875, -1.47119140625, -1.38897705078125, -1.3067626953125, -1.22454833984375, -1.142333984375, -1.06011962890625, -0.9779052734375, -0.89569091796875, -0.8134765625, -0.73126220703125, -0.6490478515625, -0.56683349609375, -0.484619140625, -0.40240478515625, -0.3201904296875, -0.23797607421875, -0.15576171875, -0.07354736328125, 0.0086669921875, 0.09088134765625, 0.173095703125, 0.25531005859375, 0.3375244140625, 0.41973876953125, 0.501953125, 0.58416748046875, 0.6663818359375, 0.74859619140625, 0.830810546875, 0.91302490234375, 0.9952392578125, 1.07745361328125, 1.15966796875, 1.24188232421875, 1.3240966796875, 1.40631103515625, 1.488525390625, 1.57073974609375, 1.6529541015625, 1.73516845703125, 1.8173828125, 1.89959716796875, 1.9818115234375, 2.06402587890625, 2.146240234375, 2.22845458984375, 2.3106689453125, 2.39288330078125, 2.47509765625, 2.55731201171875, 2.6395263671875, 2.72174072265625, 2.803955078125, 2.88616943359375, 2.9683837890625, 3.05059814453125, 3.1328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 6.0, 11.0, 10.0, 11.0, 14.0, 20.0, 13.0, 22.0, 37.0, 35.0, 40.0, 44.0, 36.0, 56.0, 49.0, 65.0, 51.0, 55.0, 49.0, 51.0, 56.0, 36.0, 35.0, 33.0, 33.0, 20.0, 22.0, 22.0, 14.0, 9.0, 9.0, 3.0, 5.0, 3.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.2169342041015625, -1.167266845703125, -1.1175994873046875, -1.06793212890625, -1.0182647705078125, -0.968597412109375, -0.9189300537109375, -0.8692626953125, -0.8195953369140625, -0.769927978515625, -0.7202606201171875, -0.67059326171875, -0.6209259033203125, -0.571258544921875, -0.5215911865234375, -0.471923828125, -0.4222564697265625, -0.372589111328125, -0.3229217529296875, -0.27325439453125, -0.2235870361328125, -0.173919677734375, -0.1242523193359375, -0.0745849609375, -0.0249176025390625, 0.024749755859375, 0.0744171142578125, 0.12408447265625, 0.1737518310546875, 0.223419189453125, 0.2730865478515625, 0.32275390625, 0.3724212646484375, 0.422088623046875, 0.4717559814453125, 0.52142333984375, 0.5710906982421875, 0.620758056640625, 0.6704254150390625, 0.7200927734375, 0.7697601318359375, 0.819427490234375, 0.8690948486328125, 0.91876220703125, 0.9684295654296875, 1.018096923828125, 1.0677642822265625, 1.117431640625, 1.1670989990234375, 1.216766357421875, 1.2664337158203125, 1.31610107421875, 1.3657684326171875, 1.415435791015625, 1.4651031494140625, 1.5147705078125, 1.5644378662109375, 1.614105224609375, 1.6637725830078125, 1.71343994140625, 1.7631072998046875, 1.812774658203125, 1.8624420166015625, 1.912109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 2.0, 11.0, 8.0, 17.0, 33.0, 50.0, 94.0, 121.0, 231.0, 464.0, 947.0, 2660.0, 11091.0, 122027.0, 859037.0, 42164.0, 6214.0, 1803.0, 760.0, 324.0, 168.0, 120.0, 69.0, 36.0, 30.0, 17.0, 15.0, 8.0, 6.0, 4.0, 5.0, 1.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-5.97265625, -5.8167724609375, -5.660888671875, -5.5050048828125, -5.34912109375, -5.1932373046875, -5.037353515625, -4.8814697265625, -4.7255859375, -4.5697021484375, -4.413818359375, -4.2579345703125, -4.10205078125, -3.9461669921875, -3.790283203125, -3.6343994140625, -3.478515625, -3.3226318359375, -3.166748046875, -3.0108642578125, -2.85498046875, -2.6990966796875, -2.543212890625, -2.3873291015625, -2.2314453125, -2.0755615234375, -1.919677734375, -1.7637939453125, -1.60791015625, -1.4520263671875, -1.296142578125, -1.1402587890625, -0.984375, -0.8284912109375, -0.672607421875, -0.5167236328125, -0.36083984375, -0.2049560546875, -0.049072265625, 0.1068115234375, 0.2626953125, 0.4185791015625, 0.574462890625, 0.7303466796875, 0.88623046875, 1.0421142578125, 1.197998046875, 1.3538818359375, 1.509765625, 1.6656494140625, 1.821533203125, 1.9774169921875, 2.13330078125, 2.2891845703125, 2.445068359375, 2.6009521484375, 2.7568359375, 2.9127197265625, 3.068603515625, 3.2244873046875, 3.38037109375, 3.5362548828125, 3.692138671875, 3.8480224609375, 4.00390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 8.0, 17.0, 27.0, 37.0, 46.0, 74.0, 90.0, 141.0, 135.0, 89.0, 96.0, 65.0, 53.0, 33.0, 26.0, 13.0, 13.0, 16.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.29254150390625, -6.9171142578125, -6.54168701171875, -6.166259765625, -5.79083251953125, -5.4154052734375, -5.03997802734375, -4.66455078125, -4.28912353515625, -3.9136962890625, -3.53826904296875, -3.162841796875, -2.78741455078125, -2.4119873046875, -2.03656005859375, -1.6611328125, -1.28570556640625, -0.9102783203125, -0.53485107421875, -0.159423828125, 0.21600341796875, 0.5914306640625, 0.96685791015625, 1.34228515625, 1.71771240234375, 2.0931396484375, 2.46856689453125, 2.843994140625, 3.21942138671875, 3.5948486328125, 3.97027587890625, 4.345703125, 4.72113037109375, 5.0965576171875, 5.47198486328125, 5.847412109375, 6.22283935546875, 6.5982666015625, 6.97369384765625, 7.34912109375, 7.72454833984375, 8.0999755859375, 8.47540283203125, 8.850830078125, 9.22625732421875, 9.6016845703125, 9.97711181640625, 10.3525390625, 10.72796630859375, 11.1033935546875, 11.47882080078125, 11.854248046875, 12.22967529296875, 12.6051025390625, 12.98052978515625, 13.35595703125, 13.73138427734375, 14.1068115234375, 14.48223876953125, 14.857666015625, 15.23309326171875, 15.6085205078125, 15.98394775390625, 16.359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 15.0, 9.0, 25.0, 40.0, 70.0, 111.0, 216.0, 409.0, 920.0, 2355.0, 7189.0, 28208.0, 180639.0, 736342.0, 70595.0, 14404.0, 4163.0, 1546.0, 620.0, 294.0, 159.0, 82.0, 45.0, 33.0, 12.0, 12.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.971221923828125, -0.93560791015625, -0.899993896484375, -0.8643798828125, -0.828765869140625, -0.79315185546875, -0.757537841796875, -0.721923828125, -0.686309814453125, -0.65069580078125, -0.615081787109375, -0.5794677734375, -0.543853759765625, -0.50823974609375, -0.472625732421875, -0.43701171875, -0.401397705078125, -0.36578369140625, -0.330169677734375, -0.2945556640625, -0.258941650390625, -0.22332763671875, -0.187713623046875, -0.152099609375, -0.116485595703125, -0.08087158203125, -0.045257568359375, -0.0096435546875, 0.025970458984375, 0.06158447265625, 0.097198486328125, 0.1328125, 0.168426513671875, 0.20404052734375, 0.239654541015625, 0.2752685546875, 0.310882568359375, 0.34649658203125, 0.382110595703125, 0.417724609375, 0.453338623046875, 0.48895263671875, 0.524566650390625, 0.5601806640625, 0.595794677734375, 0.63140869140625, 0.667022705078125, 0.70263671875, 0.738250732421875, 0.77386474609375, 0.809478759765625, 0.8450927734375, 0.880706787109375, 0.91632080078125, 0.951934814453125, 0.987548828125, 1.023162841796875, 1.05877685546875, 1.094390869140625, 1.1300048828125, 1.165618896484375, 1.20123291015625, 1.236846923828125, 1.2724609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 9.0, 14.0, 15.0, 13.0, 14.0, 30.0, 31.0, 46.0, 60.0, 94.0, 125.0, 122.0, 101.0, 70.0, 50.0, 42.0, 33.0, 24.0, 18.0, 14.0, 14.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003082752227783203, -0.00029839202761650085, -0.0002885088324546814, -0.00027862563729286194, -0.0002687424421310425, -0.000258859246969223, -0.00024897605180740356, -0.0002390928566455841, -0.00022920966148376465, -0.0002193264663219452, -0.00020944327116012573, -0.00019956007599830627, -0.00018967688083648682, -0.00017979368567466736, -0.0001699104905128479, -0.00016002729535102844, -0.00015014410018920898, -0.00014026090502738953, -0.00013037770986557007, -0.00012049451470375061, -0.00011061131954193115, -0.0001007281243801117, -9.084492921829224e-05, -8.096173405647278e-05, -7.107853889465332e-05, -6.119534373283386e-05, -5.1312148571014404e-05, -4.1428953409194946e-05, -3.154575824737549e-05, -2.166256308555603e-05, -1.1779367923736572e-05, -1.8961727619171143e-06, 7.987022399902344e-06, 1.7870217561721802e-05, 2.775341272354126e-05, 3.763660788536072e-05, 4.7519803047180176e-05, 5.7402998208999634e-05, 6.728619337081909e-05, 7.716938853263855e-05, 8.705258369445801e-05, 9.693577885627747e-05, 0.00010681897401809692, 0.00011670216917991638, 0.00012658536434173584, 0.0001364685595035553, 0.00014635175466537476, 0.00015623494982719421, 0.00016611814498901367, 0.00017600134015083313, 0.0001858845353126526, 0.00019576773047447205, 0.0002056509256362915, 0.00021553412079811096, 0.00022541731595993042, 0.00023530051112174988, 0.00024518370628356934, 0.0002550669014453888, 0.00026495009660720825, 0.0002748332917690277, 0.00028471648693084717, 0.0002945996820926666, 0.0003044828772544861, 0.00031436607241630554, 0.000324249267578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 15.0, 20.0, 33.0, 53.0, 105.0, 179.0, 371.0, 944.0, 2814.0, 13420.0, 149821.0, 824206.0, 47300.0, 6330.0, 1641.0, 656.0, 279.0, 158.0, 75.0, 40.0, 33.0, 10.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.701171875, -1.6484832763671875, -1.595794677734375, -1.5431060791015625, -1.49041748046875, -1.4377288818359375, -1.385040283203125, -1.3323516845703125, -1.2796630859375, -1.2269744873046875, -1.174285888671875, -1.1215972900390625, -1.06890869140625, -1.0162200927734375, -0.963531494140625, -0.9108428955078125, -0.858154296875, -0.8054656982421875, -0.752777099609375, -0.7000885009765625, -0.64739990234375, -0.5947113037109375, -0.542022705078125, -0.4893341064453125, -0.4366455078125, -0.3839569091796875, -0.331268310546875, -0.2785797119140625, -0.22589111328125, -0.1732025146484375, -0.120513916015625, -0.0678253173828125, -0.01513671875, 0.0375518798828125, 0.090240478515625, 0.1429290771484375, 0.19561767578125, 0.2483062744140625, 0.300994873046875, 0.3536834716796875, 0.4063720703125, 0.4590606689453125, 0.511749267578125, 0.5644378662109375, 0.61712646484375, 0.6698150634765625, 0.722503662109375, 0.7751922607421875, 0.827880859375, 0.8805694580078125, 0.933258056640625, 0.9859466552734375, 1.03863525390625, 1.0913238525390625, 1.144012451171875, 1.1967010498046875, 1.2493896484375, 1.3020782470703125, 1.354766845703125, 1.4074554443359375, 1.46014404296875, 1.5128326416015625, 1.565521240234375, 1.6182098388671875, 1.6708984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 4.0, 7.0, 5.0, 13.0, 6.0, 15.0, 13.0, 19.0, 23.0, 41.0, 37.0, 68.0, 69.0, 86.0, 90.0, 96.0, 77.0, 75.0, 54.0, 43.0, 33.0, 34.0, 22.0, 15.0, 13.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1552734375, -1.12139892578125, -1.0875244140625, -1.05364990234375, -1.019775390625, -0.98590087890625, -0.9520263671875, -0.91815185546875, -0.88427734375, -0.85040283203125, -0.8165283203125, -0.78265380859375, -0.748779296875, -0.71490478515625, -0.6810302734375, -0.64715576171875, -0.61328125, -0.57940673828125, -0.5455322265625, -0.51165771484375, -0.477783203125, -0.44390869140625, -0.4100341796875, -0.37615966796875, -0.34228515625, -0.30841064453125, -0.2745361328125, -0.24066162109375, -0.206787109375, -0.17291259765625, -0.1390380859375, -0.10516357421875, -0.0712890625, -0.03741455078125, -0.0035400390625, 0.03033447265625, 0.064208984375, 0.09808349609375, 0.1319580078125, 0.16583251953125, 0.19970703125, 0.23358154296875, 0.2674560546875, 0.30133056640625, 0.335205078125, 0.36907958984375, 0.4029541015625, 0.43682861328125, 0.470703125, 0.50457763671875, 0.5384521484375, 0.57232666015625, 0.606201171875, 0.64007568359375, 0.6739501953125, 0.70782470703125, 0.74169921875, 0.77557373046875, 0.8094482421875, 0.84332275390625, 0.877197265625, 0.91107177734375, 0.9449462890625, 0.97882080078125, 1.0126953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 18.0, 28.0, 39.0, 73.0, 96.0, 255.0, 219.0, 111.0, 52.0, 39.0, 21.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.847827911376953, -19.054201126098633, -18.260574340820312, -17.466947555541992, -16.673320770263672, -15.879694938659668, -15.086069107055664, -14.292442321777344, -13.498815536499023, -12.705188751220703, -11.911561965942383, -11.117936134338379, -10.324309349060059, -9.530682563781738, -8.737056732177734, -7.943429946899414, -7.149803161621094, -6.356176376342773, -5.562550067901611, -4.768923759460449, -3.975296974182129, -3.1816704273223877, -2.3880438804626465, -1.5944175720214844, -0.8007907867431641, -0.0071642398834228516, 0.7864623069763184, 1.5800888538360596, 2.373715400695801, 3.167341947555542, 3.960968494415283, 4.754594802856445, 5.548221588134766, 6.341848373413086, 7.135474681854248, 7.92910099029541, 8.72272777557373, 9.51635456085205, 10.309980392456055, 11.103607177734375, 11.897233963012695, 12.690860748291016, 13.484487533569336, 14.27811336517334, 15.07174015045166, 15.86536693572998, 16.658992767333984, 17.452619552612305, 18.246246337890625, 19.039873123168945, 19.833499908447266, 20.627126693725586, 21.420753479003906, 22.214378356933594, 23.008005142211914, 23.801631927490234, 24.595258712768555, 25.388885498046875, 26.182512283325195, 26.976139068603516, 27.769763946533203, 28.563390731811523, 29.357017517089844, 30.150644302368164, 30.944271087646484]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 7.0, 9.0, 14.0, 14.0, 12.0, 15.0, 24.0, 28.0, 33.0, 38.0, 42.0, 44.0, 68.0, 103.0, 147.0, 78.0, 55.0, 34.0, 26.0, 25.0, 26.0, 23.0, 27.0, 17.0, 13.0, 19.0, 10.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.944660186767578, -24.148767471313477, -23.352874755859375, -22.556982040405273, -21.761089324951172, -20.965194702148438, -20.16930389404297, -19.373409271240234, -18.577516555786133, -17.78162384033203, -16.98573112487793, -16.189838409423828, -15.39394474029541, -14.598052024841309, -13.802159309387207, -13.006265640258789, -12.210373878479004, -11.414481163024902, -10.6185884475708, -9.822694778442383, -9.026802062988281, -8.23090934753418, -7.435016632080078, -6.639123439788818, -5.843230724334717, -5.047338008880615, -4.2514448165893555, -3.455552101135254, -2.6596591472625732, -1.8637661933898926, -1.067873477935791, -0.27198028564453125, 0.5239124298095703, 1.319805383682251, 2.1156983375549316, 2.911591053009033, 3.707484006881714, 4.5033769607543945, 5.299269676208496, 6.095162868499756, 6.891055583953857, 7.686948299407959, 8.482841491699219, 9.27873420715332, 10.074626922607422, 10.870519638061523, 11.666412353515625, 12.462306022644043, 13.258198738098145, 14.054091453552246, 14.849984169006348, 15.645877838134766, 16.441770553588867, 17.23766326904297, 18.03355598449707, 18.829448699951172, 19.625341415405273, 20.421234130859375, 21.217126846313477, 22.013019561767578, 22.80891227722168, 23.60480499267578, 24.400699615478516, 25.196592330932617, 25.99248504638672]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 10.0, 4.0, 6.0, 7.0, 15.0, 32.0, 42.0, 57.0, 83.0, 161.0, 264.0, 422.0, 933.0, 2002.0, 5291.0, 19481.0, 131298.0, 1634387.0, 2191053.0, 174221.0, 23964.0, 6154.0, 2188.0, 991.0, 531.0, 283.0, 136.0, 109.0, 56.0, 34.0, 17.0, 14.0, 10.0, 4.0, 4.0, 4.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.80078125, -4.674652099609375, -4.54852294921875, -4.422393798828125, -4.2962646484375, -4.170135498046875, -4.04400634765625, -3.917877197265625, -3.791748046875, -3.665618896484375, -3.53948974609375, -3.413360595703125, -3.2872314453125, -3.161102294921875, -3.03497314453125, -2.908843994140625, -2.78271484375, -2.656585693359375, -2.53045654296875, -2.404327392578125, -2.2781982421875, -2.152069091796875, -2.02593994140625, -1.899810791015625, -1.773681640625, -1.647552490234375, -1.52142333984375, -1.395294189453125, -1.2691650390625, -1.143035888671875, -1.01690673828125, -0.890777587890625, -0.7646484375, -0.638519287109375, -0.51239013671875, -0.386260986328125, -0.2601318359375, -0.134002685546875, -0.00787353515625, 0.118255615234375, 0.244384765625, 0.370513916015625, 0.49664306640625, 0.622772216796875, 0.7489013671875, 0.875030517578125, 1.00115966796875, 1.127288818359375, 1.25341796875, 1.379547119140625, 1.50567626953125, 1.631805419921875, 1.7579345703125, 1.884063720703125, 2.01019287109375, 2.136322021484375, 2.262451171875, 2.388580322265625, 2.51470947265625, 2.640838623046875, 2.7669677734375, 2.893096923828125, 3.01922607421875, 3.145355224609375, 3.271484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 4.0, 8.0, 11.0, 11.0, 14.0, 15.0, 18.0, 16.0, 25.0, 21.0, 29.0, 33.0, 35.0, 39.0, 35.0, 39.0, 47.0, 54.0, 38.0, 43.0, 40.0, 52.0, 40.0, 34.0, 37.0, 27.0, 31.0, 32.0, 14.0, 26.0, 21.0, 14.0, 10.0, 22.0, 10.0, 4.0, 4.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.083984375, -1.0464324951171875, -1.008880615234375, -0.9713287353515625, -0.93377685546875, -0.8962249755859375, -0.858673095703125, -0.8211212158203125, -0.7835693359375, -0.7460174560546875, -0.708465576171875, -0.6709136962890625, -0.63336181640625, -0.5958099365234375, -0.558258056640625, -0.5207061767578125, -0.483154296875, -0.4456024169921875, -0.408050537109375, -0.3704986572265625, -0.33294677734375, -0.2953948974609375, -0.257843017578125, -0.2202911376953125, -0.1827392578125, -0.1451873779296875, -0.107635498046875, -0.0700836181640625, -0.03253173828125, 0.0050201416015625, 0.042572021484375, 0.0801239013671875, 0.11767578125, 0.1552276611328125, 0.192779541015625, 0.2303314208984375, 0.26788330078125, 0.3054351806640625, 0.342987060546875, 0.3805389404296875, 0.4180908203125, 0.4556427001953125, 0.493194580078125, 0.5307464599609375, 0.56829833984375, 0.6058502197265625, 0.643402099609375, 0.6809539794921875, 0.718505859375, 0.7560577392578125, 0.793609619140625, 0.8311614990234375, 0.86871337890625, 0.9062652587890625, 0.943817138671875, 0.9813690185546875, 1.0189208984375, 1.0564727783203125, 1.094024658203125, 1.1315765380859375, 1.16912841796875, 1.2066802978515625, 1.244232177734375, 1.2817840576171875, 1.3193359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 14.0, 9.0, 20.0, 32.0, 30.0, 67.0, 98.0, 167.0, 314.0, 691.0, 1791.0, 6746.0, 100192.0, 4000769.0, 74044.0, 6204.0, 1630.0, 665.0, 309.0, 183.0, 89.0, 76.0, 40.0, 30.0, 18.0, 16.0, 4.0, 4.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.34375, -12.987548828125, -12.63134765625, -12.275146484375, -11.9189453125, -11.562744140625, -11.20654296875, -10.850341796875, -10.494140625, -10.137939453125, -9.78173828125, -9.425537109375, -9.0693359375, -8.713134765625, -8.35693359375, -8.000732421875, -7.64453125, -7.288330078125, -6.93212890625, -6.575927734375, -6.2197265625, -5.863525390625, -5.50732421875, -5.151123046875, -4.794921875, -4.438720703125, -4.08251953125, -3.726318359375, -3.3701171875, -3.013916015625, -2.65771484375, -2.301513671875, -1.9453125, -1.589111328125, -1.23291015625, -0.876708984375, -0.5205078125, -0.164306640625, 0.19189453125, 0.548095703125, 0.904296875, 1.260498046875, 1.61669921875, 1.972900390625, 2.3291015625, 2.685302734375, 3.04150390625, 3.397705078125, 3.75390625, 4.110107421875, 4.46630859375, 4.822509765625, 5.1787109375, 5.534912109375, 5.89111328125, 6.247314453125, 6.603515625, 6.959716796875, 7.31591796875, 7.672119140625, 8.0283203125, 8.384521484375, 8.74072265625, 9.096923828125, 9.453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 6.0, 12.0, 5.0, 20.0, 22.0, 34.0, 31.0, 71.0, 103.0, 133.0, 184.0, 275.0, 437.0, 615.0, 625.0, 493.0, 314.0, 223.0, 130.0, 99.0, 77.0, 44.0, 31.0, 26.0, 17.0, 18.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.02978515625, -4.8564453125, -4.68310546875, -4.509765625, -4.33642578125, -4.1630859375, -3.98974609375, -3.81640625, -3.64306640625, -3.4697265625, -3.29638671875, -3.123046875, -2.94970703125, -2.7763671875, -2.60302734375, -2.4296875, -2.25634765625, -2.0830078125, -1.90966796875, -1.736328125, -1.56298828125, -1.3896484375, -1.21630859375, -1.04296875, -0.86962890625, -0.6962890625, -0.52294921875, -0.349609375, -0.17626953125, -0.0029296875, 0.17041015625, 0.34375, 0.51708984375, 0.6904296875, 0.86376953125, 1.037109375, 1.21044921875, 1.3837890625, 1.55712890625, 1.73046875, 1.90380859375, 2.0771484375, 2.25048828125, 2.423828125, 2.59716796875, 2.7705078125, 2.94384765625, 3.1171875, 3.29052734375, 3.4638671875, 3.63720703125, 3.810546875, 3.98388671875, 4.1572265625, 4.33056640625, 4.50390625, 4.67724609375, 4.8505859375, 5.02392578125, 5.197265625, 5.37060546875, 5.5439453125, 5.71728515625, 5.890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 20.0, 59.0, 120.0, 282.0, 264.0, 131.0, 67.0, 18.0, 12.0, 13.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.87012481689453, -105.57633972167969, -102.28256225585938, -98.98877716064453, -95.69499206542969, -92.40120697021484, -89.107421875, -85.81364440917969, -82.51985931396484, -79.22607421875, -75.93229675292969, -72.63851165771484, -69.3447265625, -66.05094146728516, -62.75716018676758, -59.46337890625, -56.169593811035156, -52.87580871582031, -49.582027435302734, -46.288246154785156, -42.99446105957031, -39.70067596435547, -36.40689468383789, -33.11311340332031, -29.81932830810547, -26.525545120239258, -23.231761932373047, -19.937978744506836, -16.644195556640625, -13.350412368774414, -10.056629180908203, -6.762845993041992, -3.46905517578125, -0.17527198791503906, 3.118511199951172, 6.412294387817383, 9.706077575683594, 12.999860763549805, 16.293643951416016, 19.587427139282227, 22.881210327148438, 26.17499351501465, 29.46877670288086, 32.76255798339844, 36.05634307861328, 39.350128173828125, 42.6439094543457, 45.93769073486328, 49.231475830078125, 52.52526092529297, 55.81904220581055, 59.112823486328125, 62.40660858154297, 65.70039367675781, 68.99417114257812, 72.28795623779297, 75.58174133300781, 78.87552642822266, 82.1693115234375, 85.46308898925781, 88.75687408447266, 92.0506591796875, 95.34443664550781, 98.63822174072266, 101.9320068359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 5.0, 15.0, 19.0, 16.0, 21.0, 28.0, 27.0, 27.0, 28.0, 41.0, 46.0, 40.0, 46.0, 40.0, 40.0, 52.0, 61.0, 53.0, 40.0, 39.0, 43.0, 37.0, 27.0, 29.0, 17.0, 25.0, 30.0, 19.0, 11.0, 12.0, 12.0, 6.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-31.45941734313965, -30.613887786865234, -29.768360137939453, -28.92283058166504, -28.077302932739258, -27.231773376464844, -26.386245727539062, -25.54071617126465, -24.695186614990234, -23.84965705871582, -23.00412940979004, -22.158599853515625, -21.313072204589844, -20.46754264831543, -19.622013092041016, -18.776485443115234, -17.930957794189453, -17.08542823791504, -16.239900588989258, -15.394371032714844, -14.548842430114746, -13.703313827514648, -12.85778522491455, -12.012256622314453, -11.166727066040039, -10.321198463439941, -9.475669860839844, -8.63014030456543, -7.784611701965332, -6.939083099365234, -6.093554496765137, -5.248025417327881, -4.402496337890625, -3.5569674968719482, -2.7114386558532715, -1.8659100532531738, -1.020381212234497, -0.1748523712158203, 0.6706762313842773, 1.5162053108215332, 2.361733913421631, 3.2072627544403076, 4.052791595458984, 4.898320198059082, 5.74384880065918, 6.5893778800964355, 7.434906482696533, 8.280435562133789, 9.125964164733887, 9.971492767333984, 10.817021369934082, 11.66254997253418, 12.508079528808594, 13.353608131408691, 14.199136734008789, 15.044666290283203, 15.890193939208984, 16.7357234954834, 17.58125114440918, 18.426780700683594, 19.272308349609375, 20.11783790588379, 20.963367462158203, 21.808895111083984, 22.6544246673584]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 9.0, 3.0, 13.0, 11.0, 16.0, 24.0, 36.0, 58.0, 101.0, 148.0, 297.0, 606.0, 1301.0, 3353.0, 9883.0, 42071.0, 311279.0, 591706.0, 65585.0, 14516.0, 4399.0, 1629.0, 711.0, 313.0, 207.0, 92.0, 51.0, 39.0, 27.0, 18.0, 20.0, 7.0, 9.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.291168212890625, -3.18194580078125, -3.072723388671875, -2.9635009765625, -2.854278564453125, -2.74505615234375, -2.635833740234375, -2.526611328125, -2.417388916015625, -2.30816650390625, -2.198944091796875, -2.0897216796875, -1.980499267578125, -1.87127685546875, -1.762054443359375, -1.65283203125, -1.543609619140625, -1.43438720703125, -1.325164794921875, -1.2159423828125, -1.106719970703125, -0.99749755859375, -0.888275146484375, -0.779052734375, -0.669830322265625, -0.56060791015625, -0.451385498046875, -0.3421630859375, -0.232940673828125, -0.12371826171875, -0.014495849609375, 0.0947265625, 0.203948974609375, 0.31317138671875, 0.422393798828125, 0.5316162109375, 0.640838623046875, 0.75006103515625, 0.859283447265625, 0.968505859375, 1.077728271484375, 1.18695068359375, 1.296173095703125, 1.4053955078125, 1.514617919921875, 1.62384033203125, 1.733062744140625, 1.84228515625, 1.951507568359375, 2.06072998046875, 2.169952392578125, 2.2791748046875, 2.388397216796875, 2.49761962890625, 2.606842041015625, 2.716064453125, 2.825286865234375, 2.93450927734375, 3.043731689453125, 3.1529541015625, 3.262176513671875, 3.37139892578125, 3.480621337890625, 3.58984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 14.0, 25.0, 43.0, 42.0, 61.0, 75.0, 92.0, 96.0, 75.0, 79.0, 73.0, 59.0, 66.0, 50.0, 41.0, 21.0, 27.0, 17.0, 11.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.557952880859375, -3.44207763671875, -3.326202392578125, -3.2103271484375, -3.094451904296875, -2.97857666015625, -2.862701416015625, -2.746826171875, -2.630950927734375, -2.51507568359375, -2.399200439453125, -2.2833251953125, -2.167449951171875, -2.05157470703125, -1.935699462890625, -1.81982421875, -1.703948974609375, -1.58807373046875, -1.472198486328125, -1.3563232421875, -1.240447998046875, -1.12457275390625, -1.008697509765625, -0.892822265625, -0.776947021484375, -0.66107177734375, -0.545196533203125, -0.4293212890625, -0.313446044921875, -0.19757080078125, -0.081695556640625, 0.0341796875, 0.150054931640625, 0.26593017578125, 0.381805419921875, 0.4976806640625, 0.613555908203125, 0.72943115234375, 0.845306396484375, 0.961181640625, 1.077056884765625, 1.19293212890625, 1.308807373046875, 1.4246826171875, 1.540557861328125, 1.65643310546875, 1.772308349609375, 1.88818359375, 2.004058837890625, 2.11993408203125, 2.235809326171875, 2.3516845703125, 2.467559814453125, 2.58343505859375, 2.699310302734375, 2.815185546875, 2.931060791015625, 3.04693603515625, 3.162811279296875, 3.2786865234375, 3.394561767578125, 3.51043701171875, 3.626312255859375, 3.7421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 14.0, 12.0, 16.0, 31.0, 56.0, 88.0, 97.0, 168.0, 316.0, 613.0, 1280.0, 3484.0, 11788.0, 75187.0, 882519.0, 57417.0, 10070.0, 2954.0, 1104.0, 513.0, 301.0, 169.0, 90.0, 71.0, 32.0, 41.0, 23.0, 19.0, 17.0, 12.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.096405029296875, -3.97015380859375, -3.843902587890625, -3.7176513671875, -3.591400146484375, -3.46514892578125, -3.338897705078125, -3.212646484375, -3.086395263671875, -2.96014404296875, -2.833892822265625, -2.7076416015625, -2.581390380859375, -2.45513916015625, -2.328887939453125, -2.20263671875, -2.076385498046875, -1.95013427734375, -1.823883056640625, -1.6976318359375, -1.571380615234375, -1.44512939453125, -1.318878173828125, -1.192626953125, -1.066375732421875, -0.94012451171875, -0.813873291015625, -0.6876220703125, -0.561370849609375, -0.43511962890625, -0.308868408203125, -0.1826171875, -0.056365966796875, 0.06988525390625, 0.196136474609375, 0.3223876953125, 0.448638916015625, 0.57489013671875, 0.701141357421875, 0.827392578125, 0.953643798828125, 1.07989501953125, 1.206146240234375, 1.3323974609375, 1.458648681640625, 1.58489990234375, 1.711151123046875, 1.83740234375, 1.963653564453125, 2.08990478515625, 2.216156005859375, 2.3424072265625, 2.468658447265625, 2.59490966796875, 2.721160888671875, 2.847412109375, 2.973663330078125, 3.09991455078125, 3.226165771484375, 3.3524169921875, 3.478668212890625, 3.60491943359375, 3.731170654296875, 3.857421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 5.0, 11.0, 8.0, 13.0, 14.0, 8.0, 16.0, 25.0, 35.0, 25.0, 35.0, 64.0, 54.0, 72.0, 75.0, 97.0, 79.0, 64.0, 52.0, 46.0, 35.0, 30.0, 17.0, 17.0, 18.0, 14.0, 12.0, 14.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.367919921875, -10.04833984375, -9.728759765625, -9.4091796875, -9.089599609375, -8.77001953125, -8.450439453125, -8.130859375, -7.811279296875, -7.49169921875, -7.172119140625, -6.8525390625, -6.532958984375, -6.21337890625, -5.893798828125, -5.57421875, -5.254638671875, -4.93505859375, -4.615478515625, -4.2958984375, -3.976318359375, -3.65673828125, -3.337158203125, -3.017578125, -2.697998046875, -2.37841796875, -2.058837890625, -1.7392578125, -1.419677734375, -1.10009765625, -0.780517578125, -0.4609375, -0.141357421875, 0.17822265625, 0.497802734375, 0.8173828125, 1.136962890625, 1.45654296875, 1.776123046875, 2.095703125, 2.415283203125, 2.73486328125, 3.054443359375, 3.3740234375, 3.693603515625, 4.01318359375, 4.332763671875, 4.65234375, 4.971923828125, 5.29150390625, 5.611083984375, 5.9306640625, 6.250244140625, 6.56982421875, 6.889404296875, 7.208984375, 7.528564453125, 7.84814453125, 8.167724609375, 8.4873046875, 8.806884765625, 9.12646484375, 9.446044921875, 9.765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 9.0, 8.0, 15.0, 22.0, 31.0, 57.0, 77.0, 128.0, 227.0, 447.0, 894.0, 2249.0, 6950.0, 31422.0, 835181.0, 145874.0, 17224.0, 4519.0, 1611.0, 733.0, 371.0, 182.0, 100.0, 68.0, 51.0, 24.0, 22.0, 12.0, 10.0, 5.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0234375, -0.9891204833984375, -0.954803466796875, -0.9204864501953125, -0.88616943359375, -0.8518524169921875, -0.817535400390625, -0.7832183837890625, -0.7489013671875, -0.7145843505859375, -0.680267333984375, -0.6459503173828125, -0.61163330078125, -0.5773162841796875, -0.542999267578125, -0.5086822509765625, -0.474365234375, -0.4400482177734375, -0.405731201171875, -0.3714141845703125, -0.33709716796875, -0.3027801513671875, -0.268463134765625, -0.2341461181640625, -0.1998291015625, -0.1655120849609375, -0.131195068359375, -0.0968780517578125, -0.06256103515625, -0.0282440185546875, 0.006072998046875, 0.0403900146484375, 0.07470703125, 0.1090240478515625, 0.143341064453125, 0.1776580810546875, 0.21197509765625, 0.2462921142578125, 0.280609130859375, 0.3149261474609375, 0.3492431640625, 0.3835601806640625, 0.417877197265625, 0.4521942138671875, 0.48651123046875, 0.5208282470703125, 0.555145263671875, 0.5894622802734375, 0.623779296875, 0.6580963134765625, 0.692413330078125, 0.7267303466796875, 0.76104736328125, 0.7953643798828125, 0.829681396484375, 0.8639984130859375, 0.8983154296875, 0.9326324462890625, 0.966949462890625, 1.0012664794921875, 1.03558349609375, 1.0699005126953125, 1.104217529296875, 1.1385345458984375, 1.1728515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 11.0, 15.0, 22.0, 27.0, 37.0, 54.0, 104.0, 140.0, 186.0, 128.0, 94.0, 57.0, 28.0, 21.0, 16.0, 7.0, 6.0, 8.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.00023480132222175598, -0.00022546201944351196, -0.00021612271666526794, -0.00020678341388702393, -0.0001974441111087799, -0.0001881048083305359, -0.00017876550555229187, -0.00016942620277404785, -0.00016008689999580383, -0.00015074759721755981, -0.0001414082944393158, -0.00013206899166107178, -0.00012272968888282776, -0.00011339038610458374, -0.00010405108332633972, -9.47117805480957e-05, -8.537247776985168e-05, -7.603317499160767e-05, -6.669387221336365e-05, -5.735456943511963e-05, -4.801526665687561e-05, -3.867596387863159e-05, -2.9336661100387573e-05, -1.9997358322143555e-05, -1.0658055543899536e-05, -1.3187527656555176e-06, 8.020550012588501e-06, 1.735985279083252e-05, 2.6699155569076538e-05, 3.603845834732056e-05, 4.5377761125564575e-05, 5.4717063903808594e-05, 6.405636668205261e-05, 7.339566946029663e-05, 8.273497223854065e-05, 9.207427501678467e-05, 0.00010141357779502869, 0.0001107528805732727, 0.00012009218335151672, 0.00012943148612976074, 0.00013877078890800476, 0.00014811009168624878, 0.0001574493944644928, 0.00016678869724273682, 0.00017612800002098083, 0.00018546730279922485, 0.00019480660557746887, 0.0002041459083557129, 0.0002134852111339569, 0.00022282451391220093, 0.00023216381669044495, 0.00024150311946868896, 0.000250842422246933, 0.000260181725025177, 0.000269521027803421, 0.00027886033058166504, 0.00028819963335990906, 0.0002975389361381531, 0.0003068782389163971, 0.0003162175416946411, 0.00032555684447288513, 0.00033489614725112915, 0.00034423545002937317, 0.0003535747528076172]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 12.0, 17.0, 31.0, 55.0, 74.0, 151.0, 403.0, 932.0, 2632.0, 9486.0, 67768.0, 913784.0, 42507.0, 7189.0, 2044.0, 739.0, 323.0, 148.0, 92.0, 50.0, 26.0, 13.0, 13.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.1425323486328125, -1.097564697265625, -1.0525970458984375, -1.00762939453125, -0.9626617431640625, -0.917694091796875, -0.8727264404296875, -0.8277587890625, -0.7827911376953125, -0.737823486328125, -0.6928558349609375, -0.64788818359375, -0.6029205322265625, -0.557952880859375, -0.5129852294921875, -0.468017578125, -0.4230499267578125, -0.378082275390625, -0.3331146240234375, -0.28814697265625, -0.2431793212890625, -0.198211669921875, -0.1532440185546875, -0.1082763671875, -0.0633087158203125, -0.018341064453125, 0.0266265869140625, 0.07159423828125, 0.1165618896484375, 0.161529541015625, 0.2064971923828125, 0.25146484375, 0.2964324951171875, 0.341400146484375, 0.3863677978515625, 0.43133544921875, 0.4763031005859375, 0.521270751953125, 0.5662384033203125, 0.6112060546875, 0.6561737060546875, 0.701141357421875, 0.7461090087890625, 0.79107666015625, 0.8360443115234375, 0.881011962890625, 0.9259796142578125, 0.970947265625, 1.0159149169921875, 1.060882568359375, 1.1058502197265625, 1.15081787109375, 1.1957855224609375, 1.240753173828125, 1.2857208251953125, 1.3306884765625, 1.3756561279296875, 1.420623779296875, 1.4655914306640625, 1.51055908203125, 1.5555267333984375, 1.600494384765625, 1.6454620361328125, 1.6904296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 16.0, 17.0, 20.0, 16.0, 23.0, 39.0, 55.0, 90.0, 110.0, 139.0, 128.0, 78.0, 60.0, 47.0, 27.0, 26.0, 18.0, 16.0, 8.0, 8.0, 9.0, 5.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.33172607421875, -1.2943115234375, -1.25689697265625, -1.219482421875, -1.18206787109375, -1.1446533203125, -1.10723876953125, -1.06982421875, -1.03240966796875, -0.9949951171875, -0.95758056640625, -0.920166015625, -0.88275146484375, -0.8453369140625, -0.80792236328125, -0.7705078125, -0.73309326171875, -0.6956787109375, -0.65826416015625, -0.620849609375, -0.58343505859375, -0.5460205078125, -0.50860595703125, -0.47119140625, -0.43377685546875, -0.3963623046875, -0.35894775390625, -0.321533203125, -0.28411865234375, -0.2467041015625, -0.20928955078125, -0.171875, -0.13446044921875, -0.0970458984375, -0.05963134765625, -0.022216796875, 0.01519775390625, 0.0526123046875, 0.09002685546875, 0.12744140625, 0.16485595703125, 0.2022705078125, 0.23968505859375, 0.277099609375, 0.31451416015625, 0.3519287109375, 0.38934326171875, 0.4267578125, 0.46417236328125, 0.5015869140625, 0.53900146484375, 0.576416015625, 0.61383056640625, 0.6512451171875, 0.68865966796875, 0.72607421875, 0.76348876953125, 0.8009033203125, 0.83831787109375, 0.875732421875, 0.91314697265625, 0.9505615234375, 0.98797607421875, 1.025390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 0.0, 5.0, 8.0, 23.0, 27.0, 74.0, 154.0, 362.0, 196.0, 70.0, 36.0, 16.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-63.461448669433594, -62.18071365356445, -60.89997482299805, -59.619239807128906, -58.3385009765625, -57.05776596069336, -55.77702713012695, -54.49629211425781, -53.215553283691406, -51.934818267822266, -50.65407943725586, -49.37334442138672, -48.09260559082031, -46.81187057495117, -45.531131744384766, -44.250396728515625, -42.969661712646484, -41.688926696777344, -40.40818786621094, -39.1274528503418, -37.84671401977539, -36.56597900390625, -35.285240173339844, -34.0045051574707, -32.72377014160156, -31.44303321838379, -30.162296295166016, -28.881559371948242, -27.60082244873047, -26.320087432861328, -25.039350509643555, -23.75861358642578, -22.47787857055664, -21.197141647338867, -19.916404724121094, -18.63566780090332, -17.354930877685547, -16.074195861816406, -14.793458938598633, -13.51272201538086, -12.231985092163086, -10.951248168945312, -9.670511245727539, -8.389775276184082, -7.109038352966309, -5.828301429748535, -4.54756498336792, -3.2668285369873047, -1.9860916137695312, -0.7053549289703369, 0.5753817558288574, 1.8561184406280518, 3.136855125427246, 4.4175920486450195, 5.698328495025635, 6.97906494140625, 8.259801864624023, 9.540538787841797, 10.82127571105957, 12.102011680603027, 13.3827486038208, 14.663485527038574, 15.944221496582031, 17.224958419799805, 18.505695343017578]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 8.0, 7.0, 13.0, 13.0, 9.0, 9.0, 16.0, 25.0, 25.0, 49.0, 61.0, 104.0, 68.0, 95.0, 95.0, 84.0, 80.0, 44.0, 24.0, 20.0, 16.0, 20.0, 16.0, 12.0, 15.0, 5.0, 13.0, 10.0, 3.0, 4.0, 7.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.855684280395508, -22.028165817260742, -21.200647354125977, -20.37312889099121, -19.545610427856445, -18.71809196472168, -17.890573501586914, -17.06305503845215, -16.235536575317383, -15.408018112182617, -14.580499649047852, -13.752981185913086, -12.92546272277832, -12.097944259643555, -11.270425796508789, -10.442907333374023, -9.615389823913574, -8.787871360778809, -7.960352897644043, -7.132834434509277, -6.305315971374512, -5.477797985076904, -4.650279521942139, -3.822761058807373, -2.9952425956726074, -2.167724132537842, -1.3402057886123657, -0.5126874446868896, 0.314831018447876, 1.1423492431640625, 1.9698677062988281, 2.7973861694335938, 3.6249046325683594, 4.452423095703125, 5.279941558837891, 6.107460021972656, 6.934978485107422, 7.762496471405029, 8.590015411376953, 9.417533874511719, 10.245052337646484, 11.07257080078125, 11.900089263916016, 12.727607727050781, 13.555126190185547, 14.382644653320312, 15.210163116455078, 16.037681579589844, 16.86520004272461, 17.692718505859375, 18.52023696899414, 19.347755432128906, 20.175273895263672, 21.002792358398438, 21.830310821533203, 22.65782928466797, 23.4853458404541, 24.312864303588867, 25.140382766723633, 25.9679012298584, 26.795419692993164, 27.62293815612793, 28.450456619262695, 29.27797508239746, 30.105493545532227]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 2.0, 11.0, 6.0, 11.0, 8.0, 17.0, 16.0, 25.0, 26.0, 38.0, 38.0, 44.0, 66.0, 147.0, 217.0, 73.0, 66.0, 39.0, 24.0, 27.0, 25.0, 21.0, 15.0, 7.0, 10.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7958984375, -1.6970367431640625, -1.598175048828125, -1.4993133544921875, -1.40045166015625, -1.3015899658203125, -1.202728271484375, -1.1038665771484375, -1.0050048828125, -0.9061431884765625, -0.807281494140625, -0.7084197998046875, -0.60955810546875, -0.5106964111328125, -0.411834716796875, -0.3129730224609375, -0.214111328125, -0.1152496337890625, -0.016387939453125, 0.0824737548828125, 0.18133544921875, 0.2801971435546875, 0.379058837890625, 0.4779205322265625, 0.5767822265625, 0.6756439208984375, 0.774505615234375, 0.8733673095703125, 0.97222900390625, 1.0710906982421875, 1.169952392578125, 1.2688140869140625, 1.36767578125, 1.4665374755859375, 1.565399169921875, 1.6642608642578125, 1.76312255859375, 1.8619842529296875, 1.960845947265625, 2.0597076416015625, 2.1585693359375, 2.2574310302734375, 2.356292724609375, 2.4551544189453125, 2.55401611328125, 2.6528778076171875, 2.751739501953125, 2.8506011962890625, 2.949462890625, 3.0483245849609375, 3.147186279296875, 3.2460479736328125, 3.34490966796875, 3.4437713623046875, 3.542633056640625, 3.6414947509765625, 3.7403564453125, 3.8392181396484375, 3.938079833984375, 4.0369415283203125, 4.13580322265625, 4.2346649169921875, 4.333526611328125, 4.4323883056640625, 4.53125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 5.0, 7.0, 7.0, 11.0, 13.0, 10.0, 18.0, 16.0, 20.0, 34.0, 50.0, 79.0, 115.0, 224.0, 551.0, 1277.0, 3865.0, 18351.0, 8312719.0, 42330.0, 5700.0, 1719.0, 692.0, 322.0, 160.0, 85.0, 64.0, 41.0, 18.0, 18.0, 12.0, 15.0, 6.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-12.786225318908691, -12.417206764221191, -12.048187255859375, -11.679168701171875, -11.310150146484375, -10.941130638122559, -10.572112083435059, -10.203092575073242, -9.834074020385742, -9.465055465698242, -9.096035957336426, -8.727017402648926, -8.35799789428711, -7.988979339599609, -7.619960784912109, -7.250941753387451, -6.881922721862793, -6.512903690338135, -6.143884658813477, -5.774866104125977, -5.405847072601318, -5.03682804107666, -4.66780948638916, -4.298790454864502, -3.9297714233398438, -3.5607523918151855, -3.1917335987091064, -2.8227148056030273, -2.453695774078369, -2.084676742553711, -1.7156579494476318, -1.3466391563415527, -0.9776201248168945, -0.6086012125015259, -0.23958230018615723, 0.12943661212921143, 0.4984555244445801, 0.8674744367599487, 1.2364933490753174, 1.6055121421813965, 1.9745311737060547, 2.343550205230713, 2.712568998336792, 3.081587791442871, 3.4506068229675293, 3.8196258544921875, 4.1886444091796875, 4.557663440704346, 4.926682472229004, 5.295701503753662, 5.66472053527832, 6.03373908996582, 6.4027581214904785, 6.771777153015137, 7.140795707702637, 7.509814739227295, 7.878833770751953, 8.247852325439453, 8.61687183380127, 8.98589038848877, 9.354909896850586, 9.723928451538086, 10.092947006225586, 10.461965560913086, 10.830985069274902]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 4.0, 7.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.76610565185547, -21.13652992248535, -20.506954193115234, -19.877378463745117, -19.247802734375, -18.61822509765625, -17.988651275634766, -17.359073638916016, -16.7294979095459, -16.09992218017578, -15.470346450805664, -14.840770721435547, -14.211194038391113, -13.581618309020996, -12.952042579650879, -12.322465896606445, -11.692891120910645, -11.063315391540527, -10.43373966217041, -9.804162979125977, -9.17458724975586, -8.545011520385742, -7.915435791015625, -7.28585958480835, -6.656283855438232, -6.026708126068115, -5.39713191986084, -4.767556190490723, -4.1379804611206055, -3.50840425491333, -2.878828525543213, -2.2492523193359375, -1.6196765899658203, -0.9901006817817688, -0.3605247735977173, 0.26905107498168945, 0.8986270427703857, 1.528203010559082, 2.157778739929199, 2.7873549461364746, 3.416930675506592, 4.046506404876709, 4.676082611083984, 5.305658340454102, 5.935234069824219, 6.564810276031494, 7.194386005401611, 7.823962211608887, 8.453537940979004, 9.083113670349121, 9.712689399719238, 10.342266082763672, 10.971841812133789, 11.601417541503906, 12.230993270874023, 12.86056900024414, 13.490144729614258, 14.119720458984375, 14.749296188354492, 15.37887191772461, 16.008447647094727, 16.638023376464844, 17.267601013183594, 17.89717674255371, 18.526752471923828]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 6.0, 12.0, 10.0, 11.0, 16.0, 35.0, 46.0, 40.0, 55.0, 71.0, 79.0, 88.0, 67.0, 78.0, 70.0, 66.0, 41.0, 49.0, 35.0, 34.0, 27.0, 14.0, 15.0, 4.0, 9.0, 7.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.7890777587890625, -1.711944580078125, -1.6348114013671875, -1.55767822265625, -1.4805450439453125, -1.403411865234375, -1.3262786865234375, -1.2491455078125, -1.1720123291015625, -1.094879150390625, -1.0177459716796875, -0.94061279296875, -0.8634796142578125, -0.786346435546875, -0.7092132568359375, -0.632080078125, -0.5549468994140625, -0.477813720703125, -0.4006805419921875, -0.32354736328125, -0.2464141845703125, -0.169281005859375, -0.0921478271484375, -0.0150146484375, 0.0621185302734375, 0.139251708984375, 0.2163848876953125, 0.29351806640625, 0.3706512451171875, 0.447784423828125, 0.5249176025390625, 0.60205078125, 0.6791839599609375, 0.756317138671875, 0.8334503173828125, 0.91058349609375, 0.9877166748046875, 1.064849853515625, 1.1419830322265625, 1.2191162109375, 1.2962493896484375, 1.373382568359375, 1.4505157470703125, 1.52764892578125, 1.6047821044921875, 1.681915283203125, 1.7590484619140625, 1.836181640625, 1.9133148193359375, 1.990447998046875, 2.0675811767578125, 2.14471435546875, 2.2218475341796875, 2.298980712890625, 2.3761138916015625, 2.4532470703125, 2.5303802490234375, 2.607513427734375, 2.6846466064453125, 2.76177978515625, 2.8389129638671875, 2.916046142578125, 2.9931793212890625, 3.0703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 17.0, 22.0, 28.0, 53.0, 58.0, 84.0, 117.0, 161.0, 268.0, 435.0, 809.0, 1509.0, 3135.0, 7925.0, 24797.0, 99216.0, 248116.0, 97696.0, 25416.0, 7807.0, 3092.0, 1459.0, 762.0, 467.0, 254.0, 176.0, 94.0, 64.0, 46.0, 36.0, 31.0, 25.0, 17.0, 12.0, 7.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0], "bins": [-20.59375, -20.0587158203125, -19.523681640625, -18.9886474609375, -18.45361328125, -17.9185791015625, -17.383544921875, -16.8485107421875, -16.3134765625, -15.7784423828125, -15.243408203125, -14.7083740234375, -14.17333984375, -13.6383056640625, -13.103271484375, -12.5682373046875, -12.033203125, -11.4981689453125, -10.963134765625, -10.4281005859375, -9.89306640625, -9.3580322265625, -8.822998046875, -8.2879638671875, -7.7529296875, -7.2178955078125, -6.682861328125, -6.1478271484375, -5.61279296875, -5.0777587890625, -4.542724609375, -4.0076904296875, -3.47265625, -2.9376220703125, -2.402587890625, -1.8675537109375, -1.33251953125, -0.7974853515625, -0.262451171875, 0.2725830078125, 0.8076171875, 1.3426513671875, 1.877685546875, 2.4127197265625, 2.94775390625, 3.4827880859375, 4.017822265625, 4.5528564453125, 5.087890625, 5.6229248046875, 6.157958984375, 6.6929931640625, 7.22802734375, 7.7630615234375, 8.298095703125, 8.8331298828125, 9.3681640625, 9.9031982421875, 10.438232421875, 10.9732666015625, 11.50830078125, 12.0433349609375, 12.578369140625, 13.1134033203125, 13.6484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 12.0, 18.0, 9.0, 25.0, 25.0, 33.0, 37.0, 56.0, 60.0, 70.0, 77.0, 79.0, 91.0, 65.0, 68.0, 60.0, 49.0, 44.0, 35.0, 15.0, 18.0, 14.0, 10.0, 5.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-3.609375, -3.520599365234375, -3.43182373046875, -3.343048095703125, -3.2542724609375, -3.165496826171875, -3.07672119140625, -2.987945556640625, -2.899169921875, -2.810394287109375, -2.72161865234375, -2.632843017578125, -2.5440673828125, -2.455291748046875, -2.36651611328125, -2.277740478515625, -2.18896484375, -2.100189208984375, -2.01141357421875, -1.922637939453125, -1.8338623046875, -1.745086669921875, -1.65631103515625, -1.567535400390625, -1.478759765625, -1.389984130859375, -1.30120849609375, -1.212432861328125, -1.1236572265625, -1.034881591796875, -0.94610595703125, -0.857330322265625, -0.7685546875, -0.679779052734375, -0.59100341796875, -0.502227783203125, -0.4134521484375, -0.324676513671875, -0.23590087890625, -0.147125244140625, -0.058349609375, 0.030426025390625, 0.11920166015625, 0.207977294921875, 0.2967529296875, 0.385528564453125, 0.47430419921875, 0.563079833984375, 0.65185546875, 0.740631103515625, 0.82940673828125, 0.918182373046875, 1.0069580078125, 1.095733642578125, 1.18450927734375, 1.273284912109375, 1.362060546875, 1.450836181640625, 1.53961181640625, 1.628387451171875, 1.7171630859375, 1.805938720703125, 1.89471435546875, 1.983489990234375, 2.072265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 11.0, 11.0, 12.0, 33.0, 82.0, 133.0, 92.0, 54.0, 9.0, 15.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.769437789916992, -11.139138221740723, -10.508838653564453, -9.878539085388184, -9.248239517211914, -8.617939949035645, -7.987639904022217, -7.357340335845947, -6.727040767669678, -6.096741199493408, -5.466441631317139, -4.836141586303711, -4.205842018127441, -3.575542688369751, -2.9452428817749023, -2.314943313598633, -1.6846437454223633, -1.0543441772460938, -0.42404448986053467, 0.20625519752502441, 0.836554765701294, 1.4668543338775635, 2.097154140472412, 2.7274537086486816, 3.357753276824951, 3.9880528450012207, 4.61835241317749, 5.248652458190918, 5.8789520263671875, 6.509251594543457, 7.139551162719727, 7.769850730895996, 8.400150299072266, 9.030449867248535, 9.660749435424805, 10.291049003601074, 10.921348571777344, 11.551648139953613, 12.181947708129883, 12.812248229980469, 13.442546844482422, 14.072846412658691, 14.703145980834961, 15.33344554901123, 15.9637451171875, 16.594045639038086, 17.22434425354004, 17.854644775390625, 18.484943389892578, 19.115243911743164, 19.745542526245117, 20.375843048095703, 21.006141662597656, 21.636442184448242, 22.266740798950195, 22.89704132080078, 23.527341842651367, 24.157642364501953, 24.787940979003906, 25.418241500854492, 26.048540115356445, 26.67884063720703, 27.309139251708984, 27.93943977355957, 28.569738388061523]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 23.0, 58.0, 121.0, 122.0, 50.0, 21.0, 12.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.337013244628906, -19.70686149597168, -19.076711654663086, -18.44655990600586, -17.816410064697266, -17.18625831604004, -16.556106567382812, -15.925955772399902, -15.295804977416992, -14.665654182434082, -14.035503387451172, -13.405351638793945, -12.775200843811035, -12.145050048828125, -11.514898300170898, -10.884747505187988, -10.254596710205078, -9.624445915222168, -8.994295120239258, -8.364143371582031, -7.733992576599121, -7.103841781616211, -6.473690509796143, -5.843539237976074, -5.213388442993164, -4.583237648010254, -3.9530863761901855, -3.3229353427886963, -2.692784309387207, -2.0626332759857178, -1.4324822425842285, -0.8023309707641602, -0.17218017578125, 0.45797085762023926, 1.0881218910217285, 1.7182729244232178, 2.348423957824707, 2.9785749912261963, 3.6087260246276855, 4.238877296447754, 4.869028091430664, 5.499178886413574, 6.129330158233643, 6.759481430053711, 7.389632225036621, 8.019783020019531, 8.649934768676758, 9.280085563659668, 9.910236358642578, 10.540387153625488, 11.170537948608398, 11.800689697265625, 12.430840492248535, 13.060991287231445, 13.691143035888672, 14.321293830871582, 14.951444625854492, 15.581595420837402, 16.211746215820312, 16.84189796447754, 17.472049713134766, 18.10219955444336, 18.732351303100586, 19.362503051757812, 19.992652893066406]}}