diff --git "a/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" "b/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" --- "a/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" +++ "b/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.003, "train/learning_rate": 4.659144893111639e-05, "train/epoch": 11.21, "train/global_step": 10000, "_runtime": 63253, "_timestamp": 1647161023, "_step": 10003, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 23.0, 27.0, 53.0, 85.0, 156.0, 208.0, 183.0, 103.0, 61.0, 42.0, 24.0, 15.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.404080390930176, -9.215886116027832, -9.027691841125488, -8.839497566223145, -8.6513032913208, -8.463109016418457, -8.274914741516113, -8.08672046661377, -7.898525714874268, -7.710331439971924, -7.52213716506958, -7.333942890167236, -7.145748615264893, -6.957553863525391, -6.769359588623047, -6.581165313720703, -6.392971038818359, -6.204776763916016, -6.016582489013672, -5.828388214111328, -5.640193939208984, -5.451999664306641, -5.263805389404297, -5.075610637664795, -4.887416839599609, -4.699222564697266, -4.511028289794922, -4.322834014892578, -4.134639739990234, -3.9464452266693115, -3.7582509517669678, -3.570056438446045, -3.3818624019622803, -3.1936681270599365, -3.0054738521575928, -2.81727933883667, -2.629085063934326, -2.4408907890319824, -2.2526965141296387, -2.064502239227295, -1.8763078451156616, -1.6881135702133179, -1.4999191761016846, -1.3117249011993408, -1.123530626296997, -0.9353362321853638, -0.74714195728302, -0.5589475631713867, -0.37075328826904297, -0.18255896866321564, 0.005635350942611694, 0.19382965564727783, 0.38202399015426636, 0.5702183246612549, 0.7584125995635986, 0.9466069936752319, 1.1348012685775757, 1.3229955434799194, 1.5111899375915527, 1.6993842124938965, 1.8875784873962402, 2.075772762298584, 2.2639670372009277, 2.4521615505218506, 2.6403558254241943]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 3.0, 5.0, 10.0, 8.0, 6.0, 20.0, 14.0, 16.0, 23.0, 23.0, 28.0, 24.0, 23.0, 24.0, 26.0, 25.0, 45.0, 36.0, 36.0, 39.0, 43.0, 36.0, 38.0, 35.0, 23.0, 40.0, 41.0, 35.0, 22.0, 30.0, 25.0, 26.0, 26.0, 21.0, 19.0, 18.0, 12.0, 13.0, 8.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6241624355316162, -1.5738426446914673, -1.5235228538513184, -1.4732030630111694, -1.4228832721710205, -1.3725634813308716, -1.3222436904907227, -1.2719240188598633, -1.2216041088104248, -1.1712843179702759, -1.120964527130127, -1.070644736289978, -1.020324945449829, -0.9700051546096802, -0.919685423374176, -0.8693656325340271, -0.819045901298523, -0.768726110458374, -0.7184063196182251, -0.6680865287780762, -0.6177667379379272, -0.5674469470977783, -0.5171272158622742, -0.46680742502212524, -0.4164876341819763, -0.3661678433418274, -0.31584805250167847, -0.26552829146385193, -0.215208500623703, -0.16488870978355408, -0.11456894874572754, -0.06424915790557861, -0.013929247856140137, 0.03639053553342819, 0.08671031892299652, 0.13703009486198425, 0.18734988570213318, 0.2376696765422821, 0.28798943758010864, 0.33830922842025757, 0.3886290192604065, 0.4389488101005554, 0.48926860094070435, 0.5395883321762085, 0.5899081230163574, 0.6402279138565063, 0.6905477046966553, 0.7408674955368042, 0.7911872863769531, 0.841507077217102, 0.891826868057251, 0.9421466588973999, 0.9924664497375488, 1.0427862405776978, 1.0931060314178467, 1.143425703048706, 1.1937456130981445, 1.2440654039382935, 1.2943851947784424, 1.3447049856185913, 1.3950247764587402, 1.4453445672988892, 1.495664358139038, 1.5459840297698975, 1.5963038206100464]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 12.0, 8.0, 8.0, 18.0, 15.0, 29.0, 33.0, 29.0, 40.0, 34.0, 35.0, 41.0, 49.0, 42.0, 62.0, 58.0, 50.0, 59.0, 39.0, 40.0, 40.0, 49.0, 27.0, 37.0, 33.0, 24.0, 19.0, 19.0, 11.0, 12.0, 7.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1806640625, -0.17270278930664062, -0.16474151611328125, -0.15678024291992188, -0.1488189697265625, -0.14085769653320312, -0.13289642333984375, -0.12493515014648438, -0.116973876953125, -0.10901260375976562, -0.10105133056640625, -0.09309005737304688, -0.0851287841796875, -0.07716751098632812, -0.06920623779296875, -0.061244964599609375, -0.05328369140625, -0.045322418212890625, -0.03736114501953125, -0.029399871826171875, -0.0214385986328125, -0.013477325439453125, -0.00551605224609375, 0.002445220947265625, 0.010406494140625, 0.018367767333984375, 0.02632904052734375, 0.034290313720703125, 0.0422515869140625, 0.050212860107421875, 0.05817413330078125, 0.06613540649414062, 0.0740966796875, 0.08205795288085938, 0.09001922607421875, 0.09798049926757812, 0.1059417724609375, 0.11390304565429688, 0.12186431884765625, 0.12982559204101562, 0.137786865234375, 0.14574813842773438, 0.15370941162109375, 0.16167068481445312, 0.1696319580078125, 0.17759323120117188, 0.18555450439453125, 0.19351577758789062, 0.20147705078125, 0.20943832397460938, 0.21739959716796875, 0.22536087036132812, 0.2333221435546875, 0.24128341674804688, 0.24924468994140625, 0.2572059631347656, 0.265167236328125, 0.2731285095214844, 0.28108978271484375, 0.2890510559082031, 0.2970123291015625, 0.3049736022949219, 0.31293487548828125, 0.3208961486816406, 0.328857421875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 10.0, 8.0, 1.0, 12.0, 18.0, 16.0, 37.0, 32.0, 42.0, 64.0, 75.0, 114.0, 139.0, 185.0, 257.0, 348.0, 579.0, 1052.0, 2577.0, 8858.0, 50597.0, 3474878.0, 611254.0, 31915.0, 6437.0, 2058.0, 973.0, 519.0, 311.0, 206.0, 188.0, 136.0, 103.0, 80.0, 49.0, 44.0, 31.0, 22.0, 21.0, 17.0, 5.0, 10.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.1220703125, -2.033203125, -1.9443359375, -1.85546875, -1.7666015625, -1.677734375, -1.5888671875, -1.5, -1.4111328125, -1.322265625, -1.2333984375, -1.14453125, -1.0556640625, -0.966796875, -0.8779296875, -0.7890625, -0.7001953125, -0.611328125, -0.5224609375, -0.43359375, -0.3447265625, -0.255859375, -0.1669921875, -0.078125, 0.0107421875, 0.099609375, 0.1884765625, 0.27734375, 0.3662109375, 0.455078125, 0.5439453125, 0.6328125, 0.7216796875, 0.810546875, 0.8994140625, 0.98828125, 1.0771484375, 1.166015625, 1.2548828125, 1.34375, 1.4326171875, 1.521484375, 1.6103515625, 1.69921875, 1.7880859375, 1.876953125, 1.9658203125, 2.0546875, 2.1435546875, 2.232421875, 2.3212890625, 2.41015625, 2.4990234375, 2.587890625, 2.6767578125, 2.765625, 2.8544921875, 2.943359375, 3.0322265625, 3.12109375, 3.2099609375, 3.298828125, 3.3876953125, 3.4765625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 6.0, 14.0, 17.0, 16.0, 30.0, 48.0, 56.0, 77.0, 113.0, 201.0, 351.0, 825.0, 1170.0, 489.0, 228.0, 135.0, 81.0, 52.0, 37.0, 29.0, 20.0, 22.0, 11.0, 8.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.50390625, -1.4690933227539062, -1.4342803955078125, -1.3994674682617188, -1.364654541015625, -1.3298416137695312, -1.2950286865234375, -1.2602157592773438, -1.22540283203125, -1.1905899047851562, -1.1557769775390625, -1.1209640502929688, -1.086151123046875, -1.0513381958007812, -1.0165252685546875, -0.9817123413085938, -0.9468994140625, -0.9120864868164062, -0.8772735595703125, -0.8424606323242188, -0.807647705078125, -0.7728347778320312, -0.7380218505859375, -0.7032089233398438, -0.66839599609375, -0.6335830688476562, -0.5987701416015625, -0.5639572143554688, -0.529144287109375, -0.49433135986328125, -0.4595184326171875, -0.42470550537109375, -0.389892578125, -0.35507965087890625, -0.3202667236328125, -0.28545379638671875, -0.250640869140625, -0.21582794189453125, -0.1810150146484375, -0.14620208740234375, -0.11138916015625, -0.07657623291015625, -0.0417633056640625, -0.00695037841796875, 0.027862548828125, 0.06267547607421875, 0.0974884033203125, 0.13230133056640625, 0.1671142578125, 0.20192718505859375, 0.2367401123046875, 0.27155303955078125, 0.306365966796875, 0.34117889404296875, 0.3759918212890625, 0.41080474853515625, 0.44561767578125, 0.48043060302734375, 0.5152435302734375, 0.5500564575195312, 0.584869384765625, 0.6196823120117188, 0.6544952392578125, 0.6893081665039062, 0.72412109375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 16.0, 21.0, 41.0, 50.0, 112.0, 165.0, 346.0, 867.0, 2796.0, 10793.0, 53662.0, 872018.0, 3143401.0, 88497.0, 15717.0, 3800.0, 1113.0, 377.0, 194.0, 112.0, 70.0, 36.0, 29.0, 20.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.529632568359375, -4.41082763671875, -4.292022705078125, -4.1732177734375, -4.054412841796875, -3.93560791015625, -3.816802978515625, -3.697998046875, -3.579193115234375, -3.46038818359375, -3.341583251953125, -3.2227783203125, -3.103973388671875, -2.98516845703125, -2.866363525390625, -2.74755859375, -2.628753662109375, -2.50994873046875, -2.391143798828125, -2.2723388671875, -2.153533935546875, -2.03472900390625, -1.915924072265625, -1.797119140625, -1.678314208984375, -1.55950927734375, -1.440704345703125, -1.3218994140625, -1.203094482421875, -1.08428955078125, -0.965484619140625, -0.8466796875, -0.727874755859375, -0.60906982421875, -0.490264892578125, -0.3714599609375, -0.252655029296875, -0.13385009765625, -0.015045166015625, 0.103759765625, 0.222564697265625, 0.34136962890625, 0.460174560546875, 0.5789794921875, 0.697784423828125, 0.81658935546875, 0.935394287109375, 1.05419921875, 1.173004150390625, 1.29180908203125, 1.410614013671875, 1.5294189453125, 1.648223876953125, 1.76702880859375, 1.885833740234375, 2.004638671875, 2.123443603515625, 2.24224853515625, 2.361053466796875, 2.4798583984375, 2.598663330078125, 2.71746826171875, 2.836273193359375, 2.955078125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 22.0, 16.0, 36.0, 46.0, 77.0, 105.0, 138.0, 134.0, 138.0, 106.0, 65.0, 47.0, 24.0, 19.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.948432207107544, -2.7967147827148438, -2.6449973583221436, -2.4932799339294434, -2.341562271118164, -2.189845085144043, -2.0381274223327637, -1.8864099979400635, -1.7346925735473633, -1.582975149154663, -1.431257724761963, -1.2795401811599731, -1.127822756767273, -0.9761053323745728, -0.8243878483772278, -0.6726703643798828, -0.5209529399871826, -0.36923548579216003, -0.21751803159713745, -0.06580057740211487, 0.08591687679290771, 0.2376343011856079, 0.3893517851829529, 0.5410692691802979, 0.692786693572998, 0.8445041179656982, 0.9962216019630432, 1.1479390859603882, 1.2996565103530884, 1.4513739347457886, 1.6030914783477783, 1.7548089027404785, 1.9065265655517578, 2.058243989944458, 2.209961414337158, 2.3616788387298584, 2.5133962631225586, 2.665113925933838, 2.816831350326538, 2.9685487747192383, 3.1202661991119385, 3.2719836235046387, 3.423701047897339, 3.575418472290039, 3.7271361351013184, 3.8788533210754395, 4.030570983886719, 4.18228816986084, 4.334005832672119, 4.485723495483398, 4.6374406814575195, 4.789158344268799, 4.94087553024292, 5.092593193054199, 5.24431037902832, 5.3960280418396, 5.547745704650879, 5.699463367462158, 5.851180553436279, 6.002898216247559, 6.15461540222168, 6.306333065032959, 6.45805025100708, 6.609767913818359, 6.7614850997924805]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 3.0, 5.0, 5.0, 8.0, 10.0, 11.0, 10.0, 6.0, 17.0, 23.0, 15.0, 20.0, 14.0, 31.0, 26.0, 29.0, 27.0, 35.0, 34.0, 32.0, 45.0, 37.0, 35.0, 43.0, 42.0, 43.0, 31.0, 38.0, 25.0, 34.0, 20.0, 27.0, 32.0, 24.0, 26.0, 21.0, 24.0, 23.0, 12.0, 13.0, 6.0, 10.0, 8.0, 3.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.29062557220459, -2.2169036865234375, -2.143181800842285, -2.069460153579712, -1.9957382678985596, -1.9220163822174072, -1.8482946157455444, -1.7745728492736816, -1.7008509635925293, -1.627129077911377, -1.5534073114395142, -1.4796855449676514, -1.405963659286499, -1.3322417736053467, -1.2585200071334839, -1.184798240661621, -1.1110763549804688, -1.0373544692993164, -0.9636327028274536, -0.889910876750946, -0.8161890506744385, -0.7424672245979309, -0.6687453985214233, -0.5950235724449158, -0.5213017463684082, -0.44757992029190063, -0.37385809421539307, -0.3001362681388855, -0.22641444206237793, -0.15269261598587036, -0.07897078990936279, -0.005248963832855225, 0.06847262382507324, 0.1421944499015808, 0.21591627597808838, 0.28963810205459595, 0.3633599281311035, 0.4370817542076111, 0.5108035802841187, 0.5845254063606262, 0.6582472324371338, 0.7319690585136414, 0.8056908845901489, 0.8794127106666565, 0.9531345367431641, 1.0268564224243164, 1.1005781888961792, 1.174299955368042, 1.2480218410491943, 1.3217437267303467, 1.3954654932022095, 1.4691872596740723, 1.5429091453552246, 1.616631031036377, 1.6903527975082397, 1.7640745639801025, 1.8377964496612549, 1.9115183353424072, 1.98524010181427, 2.058961868286133, 2.132683753967285, 2.2064056396484375, 2.28012752532959, 2.353849172592163, 2.4275710582733154]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 9.0, 11.0, 12.0, 12.0, 25.0, 33.0, 35.0, 37.0, 37.0, 37.0, 47.0, 35.0, 47.0, 51.0, 54.0, 54.0, 60.0, 51.0, 51.0, 35.0, 40.0, 43.0, 26.0, 22.0, 22.0, 28.0, 17.0, 18.0, 14.0, 7.0, 7.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2218017578125, -0.21328163146972656, -0.20476150512695312, -0.1962413787841797, -0.18772125244140625, -0.1792011260986328, -0.17068099975585938, -0.16216087341308594, -0.1536407470703125, -0.14512062072753906, -0.13660049438476562, -0.1280803680419922, -0.11956024169921875, -0.11104011535644531, -0.10251998901367188, -0.09399986267089844, -0.085479736328125, -0.07695960998535156, -0.06843948364257812, -0.05991935729980469, -0.05139923095703125, -0.04287910461425781, -0.034358978271484375, -0.025838851928710938, -0.0173187255859375, -0.008798599243164062, -0.000278472900390625, 0.008241653442382812, 0.01676177978515625, 0.025281906127929688, 0.033802032470703125, 0.04232215881347656, 0.05084228515625, 0.05936241149902344, 0.06788253784179688, 0.07640266418457031, 0.08492279052734375, 0.09344291687011719, 0.10196304321289062, 0.11048316955566406, 0.1190032958984375, 0.12752342224121094, 0.13604354858398438, 0.1445636749267578, 0.15308380126953125, 0.1616039276123047, 0.17012405395507812, 0.17864418029785156, 0.187164306640625, 0.19568443298339844, 0.20420455932617188, 0.2127246856689453, 0.22124481201171875, 0.2297649383544922, 0.23828506469726562, 0.24680519104003906, 0.2553253173828125, 0.26384544372558594, 0.2723655700683594, 0.2808856964111328, 0.28940582275390625, 0.2979259490966797, 0.3064460754394531, 0.31496620178222656, 0.323486328125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 8.0, 19.0, 19.0, 28.0, 51.0, 62.0, 121.0, 159.0, 266.0, 443.0, 702.0, 1178.0, 2020.0, 3680.0, 6727.0, 13303.0, 26460.0, 53833.0, 114082.0, 230489.0, 285669.0, 158456.0, 76148.0, 36297.0, 17884.0, 9103.0, 4909.0, 2576.0, 1590.0, 846.0, 523.0, 316.0, 195.0, 141.0, 93.0, 47.0, 34.0, 22.0, 19.0, 10.0, 4.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.30419921875, -0.29531097412109375, -0.2864227294921875, -0.27753448486328125, -0.268646240234375, -0.25975799560546875, -0.2508697509765625, -0.24198150634765625, -0.23309326171875, -0.22420501708984375, -0.2153167724609375, -0.20642852783203125, -0.197540283203125, -0.18865203857421875, -0.1797637939453125, -0.17087554931640625, -0.1619873046875, -0.15309906005859375, -0.1442108154296875, -0.13532257080078125, -0.126434326171875, -0.11754608154296875, -0.1086578369140625, -0.09976959228515625, -0.09088134765625, -0.08199310302734375, -0.0731048583984375, -0.06421661376953125, -0.055328369140625, -0.04644012451171875, -0.0375518798828125, -0.02866363525390625, -0.019775390625, -0.01088714599609375, -0.0019989013671875, 0.00688934326171875, 0.015777587890625, 0.02466583251953125, 0.0335540771484375, 0.04244232177734375, 0.05133056640625, 0.06021881103515625, 0.0691070556640625, 0.07799530029296875, 0.086883544921875, 0.09577178955078125, 0.1046600341796875, 0.11354827880859375, 0.1224365234375, 0.13132476806640625, 0.1402130126953125, 0.14910125732421875, 0.157989501953125, 0.16687774658203125, 0.1757659912109375, 0.18465423583984375, 0.19354248046875, 0.20243072509765625, 0.2113189697265625, 0.22020721435546875, 0.229095458984375, 0.23798370361328125, 0.2468719482421875, 0.25576019287109375, 0.2646484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 7.0, 8.0, 4.0, 6.0, 8.0, 10.0, 12.0, 10.0, 17.0, 25.0, 24.0, 23.0, 21.0, 19.0, 31.0, 30.0, 37.0, 33.0, 33.0, 46.0, 38.0, 34.0, 1065.0, 36.0, 40.0, 38.0, 25.0, 32.0, 39.0, 25.0, 35.0, 28.0, 26.0, 21.0, 21.0, 21.0, 22.0, 14.0, 7.0, 11.0, 15.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20263671875, -0.1958179473876953, -0.18899917602539062, -0.18218040466308594, -0.17536163330078125, -0.16854286193847656, -0.16172409057617188, -0.1549053192138672, -0.1480865478515625, -0.1412677764892578, -0.13444900512695312, -0.12763023376464844, -0.12081146240234375, -0.11399269104003906, -0.10717391967773438, -0.10035514831542969, -0.093536376953125, -0.08671760559082031, -0.07989883422851562, -0.07308006286621094, -0.06626129150390625, -0.05944252014160156, -0.052623748779296875, -0.04580497741699219, -0.0389862060546875, -0.03216743469238281, -0.025348663330078125, -0.018529891967773438, -0.01171112060546875, -0.0048923492431640625, 0.001926422119140625, 0.008745193481445312, 0.01556396484375, 0.022382736206054688, 0.029201507568359375, 0.03602027893066406, 0.04283905029296875, 0.04965782165527344, 0.056476593017578125, 0.06329536437988281, 0.0701141357421875, 0.07693290710449219, 0.08375167846679688, 0.09057044982910156, 0.09738922119140625, 0.10420799255371094, 0.11102676391601562, 0.11784553527832031, 0.124664306640625, 0.1314830780029297, 0.13830184936523438, 0.14512062072753906, 0.15193939208984375, 0.15875816345214844, 0.16557693481445312, 0.1723957061767578, 0.1792144775390625, 0.1860332489013672, 0.19285202026367188, 0.19967079162597656, 0.20648956298828125, 0.21330833435058594, 0.22012710571289062, 0.2269458770751953, 0.2337646484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 11.0, 6.0, 20.0, 33.0, 29.0, 55.0, 75.0, 102.0, 188.0, 262.0, 408.0, 649.0, 1019.0, 1616.0, 2798.0, 4695.0, 8785.0, 17000.0, 39103.0, 181898.0, 1692312.0, 87235.0, 28425.0, 13197.0, 7052.0, 3915.0, 2425.0, 1380.0, 842.0, 538.0, 358.0, 215.0, 146.0, 100.0, 81.0, 38.0, 33.0, 23.0, 18.0, 14.0, 5.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.2935905456542969, -0.28322601318359375, -0.2728614807128906, -0.2624969482421875, -0.2521324157714844, -0.24176788330078125, -0.23140335083007812, -0.221038818359375, -0.21067428588867188, -0.20030975341796875, -0.18994522094726562, -0.1795806884765625, -0.16921615600585938, -0.15885162353515625, -0.14848709106445312, -0.13812255859375, -0.12775802612304688, -0.11739349365234375, -0.10702896118164062, -0.0966644287109375, -0.08629989624023438, -0.07593536376953125, -0.06557083129882812, -0.055206298828125, -0.044841766357421875, -0.03447723388671875, -0.024112701416015625, -0.0137481689453125, -0.003383636474609375, 0.00698089599609375, 0.017345428466796875, 0.0277099609375, 0.038074493408203125, 0.04843902587890625, 0.058803558349609375, 0.0691680908203125, 0.07953262329101562, 0.08989715576171875, 0.10026168823242188, 0.110626220703125, 0.12099075317382812, 0.13135528564453125, 0.14171981811523438, 0.1520843505859375, 0.16244888305664062, 0.17281341552734375, 0.18317794799804688, 0.19354248046875, 0.20390701293945312, 0.21427154541015625, 0.22463607788085938, 0.2350006103515625, 0.24536514282226562, 0.25572967529296875, 0.2660942077636719, 0.276458740234375, 0.2868232727050781, 0.29718780517578125, 0.3075523376464844, 0.3179168701171875, 0.3282814025878906, 0.33864593505859375, 0.3490104675292969, 0.359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 8.0, 10.0, 17.0, 17.0, 10.0, 16.0, 34.0, 42.0, 45.0, 51.0, 71.0, 78.0, 80.0, 75.0, 75.0, 71.0, 66.0, 44.0, 26.0, 28.0, 22.0, 17.0, 14.0, 12.0, 12.0, 10.0, 9.0, 6.0, 6.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0604248046875, -0.05865001678466797, -0.05687522888183594, -0.055100440979003906, -0.053325653076171875, -0.051550865173339844, -0.04977607727050781, -0.04800128936767578, -0.04622650146484375, -0.04445171356201172, -0.04267692565917969, -0.040902137756347656, -0.039127349853515625, -0.037352561950683594, -0.03557777404785156, -0.03380298614501953, -0.0320281982421875, -0.03025341033935547, -0.028478622436523438, -0.026703834533691406, -0.024929046630859375, -0.023154258728027344, -0.021379470825195312, -0.01960468292236328, -0.01782989501953125, -0.01605510711669922, -0.014280319213867188, -0.012505531311035156, -0.010730743408203125, -0.008955955505371094, -0.0071811676025390625, -0.005406379699707031, -0.003631591796875, -0.0018568038940429688, -8.20159912109375e-05, 0.0016927719116210938, 0.003467559814453125, 0.005242347717285156, 0.0070171356201171875, 0.008791923522949219, 0.01056671142578125, 0.012341499328613281, 0.014116287231445312, 0.015891075134277344, 0.017665863037109375, 0.019440650939941406, 0.021215438842773438, 0.02299022674560547, 0.0247650146484375, 0.02653980255126953, 0.028314590454101562, 0.030089378356933594, 0.031864166259765625, 0.033638954162597656, 0.03541374206542969, 0.03718852996826172, 0.03896331787109375, 0.04073810577392578, 0.04251289367675781, 0.044287681579589844, 0.046062469482421875, 0.047837257385253906, 0.04961204528808594, 0.05138683319091797, 0.05316162109375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 9.0, 15.0, 18.0, 21.0, 19.0, 42.0, 37.0, 53.0, 67.0, 102.0, 141.0, 233.0, 358.0, 848.0, 8195.0, 654463.0, 376220.0, 5800.0, 811.0, 373.0, 189.0, 124.0, 108.0, 63.0, 43.0, 36.0, 25.0, 33.0, 27.0, 17.0, 9.0, 5.0, 5.0, 9.0, 5.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.904296875, -0.877655029296875, -0.85101318359375, -0.824371337890625, -0.7977294921875, -0.771087646484375, -0.74444580078125, -0.717803955078125, -0.691162109375, -0.664520263671875, -0.63787841796875, -0.611236572265625, -0.5845947265625, -0.557952880859375, -0.53131103515625, -0.504669189453125, -0.47802734375, -0.451385498046875, -0.42474365234375, -0.398101806640625, -0.3714599609375, -0.344818115234375, -0.31817626953125, -0.291534423828125, -0.264892578125, -0.238250732421875, -0.21160888671875, -0.184967041015625, -0.1583251953125, -0.131683349609375, -0.10504150390625, -0.078399658203125, -0.0517578125, -0.025115966796875, 0.00152587890625, 0.028167724609375, 0.0548095703125, 0.081451416015625, 0.10809326171875, 0.134735107421875, 0.161376953125, 0.188018798828125, 0.21466064453125, 0.241302490234375, 0.2679443359375, 0.294586181640625, 0.32122802734375, 0.347869873046875, 0.37451171875, 0.401153564453125, 0.42779541015625, 0.454437255859375, 0.4810791015625, 0.507720947265625, 0.53436279296875, 0.561004638671875, 0.587646484375, 0.614288330078125, 0.64093017578125, 0.667572021484375, 0.6942138671875, 0.720855712890625, 0.74749755859375, 0.774139404296875, 0.80078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 16.0, 40.0, 47.0, 109.0, 188.0, 227.0, 161.0, 90.0, 48.0, 27.0, 18.0, 11.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2659870982170105, -0.25503435730934143, -0.24408164620399475, -0.23312890529632568, -0.2221761792898178, -0.21122345328330994, -0.20027071237564087, -0.189317986369133, -0.17836526036262512, -0.16741253435611725, -0.15645980834960938, -0.1455070674419403, -0.13455434143543243, -0.12360161542892456, -0.11264888197183609, -0.10169614851474762, -0.09074342250823975, -0.07979069650173187, -0.0688379630446434, -0.05788523331284523, -0.04693250358104706, -0.035979773849248886, -0.025027044117450714, -0.014074310660362244, -0.00312158465385437, 0.007831145077943802, 0.018783874809741974, 0.029736604541540146, 0.04068933427333832, 0.05164206400513649, 0.06259479373693466, 0.07354752719402313, 0.084500253200531, 0.09545297920703888, 0.10640571266412735, 0.11735844612121582, 0.1283111721277237, 0.13926389813423157, 0.15021663904190063, 0.1611693650484085, 0.17212209105491638, 0.18307481706142426, 0.19402754306793213, 0.2049802839756012, 0.21593300998210907, 0.22688573598861694, 0.237838476896286, 0.24879120290279388, 0.25974392890930176, 0.2706966698169708, 0.2816493809223175, 0.2926021218299866, 0.30355483293533325, 0.3145075738430023, 0.3254603147506714, 0.33641302585601807, 0.34736576676368713, 0.3583185076713562, 0.3692712187767029, 0.38022395968437195, 0.391176700592041, 0.4021294116973877, 0.41308215260505676, 0.42403489351272583, 0.4349876046180725]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 4.0, 7.0, 9.0, 19.0, 15.0, 17.0, 20.0, 17.0, 28.0, 21.0, 26.0, 26.0, 36.0, 26.0, 36.0, 32.0, 30.0, 47.0, 51.0, 39.0, 36.0, 48.0, 40.0, 35.0, 33.0, 33.0, 28.0, 22.0, 27.0, 22.0, 25.0, 21.0, 18.0, 14.0, 13.0, 6.0, 11.0, 5.0, 7.0, 9.0, 12.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.13494855165481567, -0.1309211552143097, -0.1268937587738037, -0.12286636233329773, -0.11883896589279175, -0.11481156945228577, -0.11078417301177979, -0.1067567765712738, -0.10272938013076782, -0.09870198369026184, -0.09467458724975586, -0.09064719080924988, -0.0866197943687439, -0.08259239792823792, -0.07856500148773193, -0.07453760504722595, -0.07051020860671997, -0.06648281216621399, -0.06245541572570801, -0.058428019285202026, -0.054400622844696045, -0.050373226404190063, -0.04634582996368408, -0.0423184335231781, -0.03829103708267212, -0.03426364064216614, -0.030236244201660156, -0.026208847761154175, -0.022181451320648193, -0.018154054880142212, -0.01412665843963623, -0.010099261999130249, -0.006071865558624268, -0.002044469118118286, 0.0019829273223876953, 0.006010323762893677, 0.010037720203399658, 0.01406511664390564, 0.01809251308441162, 0.022119909524917603, 0.026147305965423584, 0.030174702405929565, 0.03420209884643555, 0.03822949528694153, 0.04225689172744751, 0.04628428816795349, 0.05031168460845947, 0.054339081048965454, 0.058366477489471436, 0.06239387392997742, 0.0664212703704834, 0.07044866681098938, 0.07447606325149536, 0.07850345969200134, 0.08253085613250732, 0.0865582525730133, 0.09058564901351929, 0.09461304545402527, 0.09864044189453125, 0.10266783833503723, 0.10669523477554321, 0.1107226312160492, 0.11475002765655518, 0.11877742409706116, 0.12280482053756714]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 7.0, 10.0, 10.0, 15.0, 17.0, 24.0, 39.0, 30.0, 41.0, 35.0, 40.0, 43.0, 32.0, 52.0, 51.0, 50.0, 64.0, 56.0, 49.0, 46.0, 39.0, 46.0, 31.0, 26.0, 18.0, 22.0, 30.0, 15.0, 18.0, 12.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2188720703125, -0.2103748321533203, -0.20187759399414062, -0.19338035583496094, -0.18488311767578125, -0.17638587951660156, -0.16788864135742188, -0.1593914031982422, -0.1508941650390625, -0.1423969268798828, -0.13389968872070312, -0.12540245056152344, -0.11690521240234375, -0.10840797424316406, -0.09991073608398438, -0.09141349792480469, -0.082916259765625, -0.07441902160644531, -0.06592178344726562, -0.05742454528808594, -0.04892730712890625, -0.04043006896972656, -0.031932830810546875, -0.023435592651367188, -0.0149383544921875, -0.0064411163330078125, 0.002056121826171875, 0.010553359985351562, 0.01905059814453125, 0.027547836303710938, 0.036045074462890625, 0.04454231262207031, 0.05303955078125, 0.06153678894042969, 0.07003402709960938, 0.07853126525878906, 0.08702850341796875, 0.09552574157714844, 0.10402297973632812, 0.11252021789550781, 0.1210174560546875, 0.1295146942138672, 0.13801193237304688, 0.14650917053222656, 0.15500640869140625, 0.16350364685058594, 0.17200088500976562, 0.1804981231689453, 0.188995361328125, 0.1974925994873047, 0.20598983764648438, 0.21448707580566406, 0.22298431396484375, 0.23148155212402344, 0.23997879028320312, 0.2484760284423828, 0.2569732666015625, 0.2654705047607422, 0.2739677429199219, 0.28246498107910156, 0.29096221923828125, 0.29945945739746094, 0.3079566955566406, 0.3164539337158203, 0.324951171875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 6.0, 14.0, 14.0, 22.0, 41.0, 52.0, 108.0, 182.0, 277.0, 494.0, 936.0, 1509.0, 2919.0, 5561.0, 11211.0, 23645.0, 56084.0, 159016.0, 429185.0, 224895.0, 73801.0, 29964.0, 13891.0, 6888.0, 3452.0, 1925.0, 1043.0, 567.0, 348.0, 209.0, 112.0, 61.0, 43.0, 19.0, 23.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8515625, -0.8246536254882812, -0.7977447509765625, -0.7708358764648438, -0.743927001953125, -0.7170181274414062, -0.6901092529296875, -0.6632003784179688, -0.63629150390625, -0.6093826293945312, -0.5824737548828125, -0.5555648803710938, -0.528656005859375, -0.5017471313476562, -0.4748382568359375, -0.44792938232421875, -0.4210205078125, -0.39411163330078125, -0.3672027587890625, -0.34029388427734375, -0.313385009765625, -0.28647613525390625, -0.2595672607421875, -0.23265838623046875, -0.20574951171875, -0.17884063720703125, -0.1519317626953125, -0.12502288818359375, -0.098114013671875, -0.07120513916015625, -0.0442962646484375, -0.01738739013671875, 0.009521484375, 0.03643035888671875, 0.0633392333984375, 0.09024810791015625, 0.117156982421875, 0.14406585693359375, 0.1709747314453125, 0.19788360595703125, 0.22479248046875, 0.25170135498046875, 0.2786102294921875, 0.30551910400390625, 0.332427978515625, 0.35933685302734375, 0.3862457275390625, 0.41315460205078125, 0.4400634765625, 0.46697235107421875, 0.4938812255859375, 0.5207901000976562, 0.547698974609375, 0.5746078491210938, 0.6015167236328125, 0.6284255981445312, 0.65533447265625, 0.6822433471679688, 0.7091522216796875, 0.7360610961914062, 0.762969970703125, 0.7898788452148438, 0.8167877197265625, 0.8436965942382812, 0.87060546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 11.0, 14.0, 19.0, 16.0, 21.0, 18.0, 40.0, 30.0, 22.0, 41.0, 57.0, 47.0, 63.0, 91.0, 100.0, 147.0, 253.0, 1300.0, 151.0, 103.0, 76.0, 55.0, 63.0, 46.0, 40.0, 44.0, 21.0, 22.0, 31.0, 19.0, 16.0, 12.0, 13.0, 4.0, 13.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.93115234375, -0.9045562744140625, -0.877960205078125, -0.8513641357421875, -0.82476806640625, -0.7981719970703125, -0.771575927734375, -0.7449798583984375, -0.7183837890625, -0.6917877197265625, -0.665191650390625, -0.6385955810546875, -0.61199951171875, -0.5854034423828125, -0.558807373046875, -0.5322113037109375, -0.505615234375, -0.4790191650390625, -0.452423095703125, -0.4258270263671875, -0.39923095703125, -0.3726348876953125, -0.346038818359375, -0.3194427490234375, -0.2928466796875, -0.2662506103515625, -0.239654541015625, -0.2130584716796875, -0.18646240234375, -0.1598663330078125, -0.133270263671875, -0.1066741943359375, -0.080078125, -0.0534820556640625, -0.026885986328125, -0.0002899169921875, 0.02630615234375, 0.0529022216796875, 0.079498291015625, 0.1060943603515625, 0.1326904296875, 0.1592864990234375, 0.185882568359375, 0.2124786376953125, 0.23907470703125, 0.2656707763671875, 0.292266845703125, 0.3188629150390625, 0.345458984375, 0.3720550537109375, 0.398651123046875, 0.4252471923828125, 0.45184326171875, 0.4784393310546875, 0.505035400390625, 0.5316314697265625, 0.5582275390625, 0.5848236083984375, 0.611419677734375, 0.6380157470703125, 0.66461181640625, 0.6912078857421875, 0.717803955078125, 0.7444000244140625, 0.77099609375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 5.0, 10.0, 11.0, 9.0, 15.0, 14.0, 7.0, 16.0, 22.0, 27.0, 27.0, 42.0, 59.0, 96.0, 206.0, 643.0, 2584.0, 17197.0, 276265.0, 2727890.0, 108560.0, 9465.0, 1591.0, 409.0, 154.0, 84.0, 59.0, 36.0, 32.0, 24.0, 21.0, 16.0, 11.0, 17.0, 9.0, 10.0, 11.0, 7.0, 8.0, 5.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.685546875, -2.590850830078125, -2.49615478515625, -2.401458740234375, -2.3067626953125, -2.212066650390625, -2.11737060546875, -2.022674560546875, -1.927978515625, -1.833282470703125, -1.73858642578125, -1.643890380859375, -1.5491943359375, -1.454498291015625, -1.35980224609375, -1.265106201171875, -1.17041015625, -1.075714111328125, -0.98101806640625, -0.886322021484375, -0.7916259765625, -0.696929931640625, -0.60223388671875, -0.507537841796875, -0.412841796875, -0.318145751953125, -0.22344970703125, -0.128753662109375, -0.0340576171875, 0.060638427734375, 0.15533447265625, 0.250030517578125, 0.3447265625, 0.439422607421875, 0.53411865234375, 0.628814697265625, 0.7235107421875, 0.818206787109375, 0.91290283203125, 1.007598876953125, 1.102294921875, 1.196990966796875, 1.29168701171875, 1.386383056640625, 1.4810791015625, 1.575775146484375, 1.67047119140625, 1.765167236328125, 1.85986328125, 1.954559326171875, 2.04925537109375, 2.143951416015625, 2.2386474609375, 2.333343505859375, 2.42803955078125, 2.522735595703125, 2.617431640625, 2.712127685546875, 2.80682373046875, 2.901519775390625, 2.9962158203125, 3.090911865234375, 3.18560791015625, 3.280303955078125, 3.375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 356.0, 592.0, 43.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.9511775970459, -18.341232299804688, -17.731287002563477, -17.121339797973633, -16.511394500732422, -15.901449203491211, -15.29150390625, -14.681558609008789, -14.071612358093262, -13.46166706085205, -12.851720809936523, -12.241775512695312, -11.631830215454102, -11.021883964538574, -10.411938667297363, -9.801992416381836, -9.192047119140625, -8.582101821899414, -7.972155570983887, -7.362210273742676, -6.752264499664307, -6.1423187255859375, -5.532373428344727, -4.922427654266357, -4.312481880187988, -3.702536106109619, -3.092590570449829, -2.482645034790039, -1.87269926071167, -1.2627534866333008, -0.6528079509735107, -0.0428624153137207, 0.5670814514160156, 1.1770271062850952, 1.7869727611541748, 2.396918296813965, 3.006864070892334, 3.616809844970703, 4.226755142211914, 4.836700916290283, 5.446646690368652, 6.0565924644470215, 6.666538238525391, 7.276483535766602, 7.886429309844971, 8.49637508392334, 9.10632038116455, 9.716266632080078, 10.326211929321289, 10.9361572265625, 11.546103477478027, 12.156048774719238, 12.765995025634766, 13.375940322875977, 13.985885620117188, 14.595830917358398, 15.205777168273926, 15.815722465515137, 16.425668716430664, 17.035614013671875, 17.645559310913086, 18.255504608154297, 18.86545181274414, 19.47539710998535, 20.085342407226562]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 9.0, 11.0, 16.0, 14.0, 17.0, 12.0, 11.0, 17.0, 23.0, 15.0, 18.0, 28.0, 35.0, 39.0, 27.0, 27.0, 28.0, 36.0, 45.0, 41.0, 42.0, 43.0, 40.0, 36.0, 33.0, 35.0, 33.0, 26.0, 23.0, 34.0, 27.0, 20.0, 22.0, 12.0, 13.0, 18.0, 6.0, 18.0, 9.0, 2.0, 3.0, 5.0, 9.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8336727619171143, -2.7472383975982666, -2.660804033279419, -2.5743696689605713, -2.4879350662231445, -2.401500701904297, -2.315066337585449, -2.2286319732666016, -2.142197608947754, -2.0557632446289062, -1.9693288803100586, -1.8828943967819214, -1.7964600324630737, -1.710025668144226, -1.6235911846160889, -1.5371568202972412, -1.4507224559783936, -1.364288091659546, -1.2778537273406982, -1.191419243812561, -1.1049848794937134, -1.0185505151748657, -0.9321160912513733, -0.8456816673278809, -0.7592473030090332, -0.6728129386901855, -0.5863785147666931, -0.49994412064552307, -0.413509726524353, -0.327075332403183, -0.24064093828201294, -0.1542065143585205, -0.06777215003967285, 0.018662244081497192, 0.10509663820266724, 0.19153103232383728, 0.2779654264450073, 0.36439982056617737, 0.4508342146873474, 0.5372686386108398, 0.6237030029296875, 0.7101373672485352, 0.7965717911720276, 0.88300621509552, 0.9694405794143677, 1.0558749437332153, 1.1423094272613525, 1.2287437915802002, 1.3151781558990479, 1.4016125202178955, 1.4880468845367432, 1.5744813680648804, 1.660915732383728, 1.7473500967025757, 1.833784580230713, 1.9202189445495605, 2.006653308868408, 2.093087673187256, 2.1795220375061035, 2.265956401824951, 2.352390766143799, 2.4388253688812256, 2.5252597332000732, 2.611694097518921, 2.6981284618377686]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 10.0, 6.0, 10.0, 14.0, 14.0, 19.0, 26.0, 32.0, 30.0, 27.0, 30.0, 40.0, 45.0, 37.0, 45.0, 46.0, 42.0, 33.0, 51.0, 45.0, 45.0, 43.0, 43.0, 42.0, 28.0, 34.0, 29.0, 19.0, 23.0, 19.0, 15.0, 16.0, 14.0, 11.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2408447265625, -0.23212623596191406, -0.22340774536132812, -0.2146892547607422, -0.20597076416015625, -0.1972522735595703, -0.18853378295898438, -0.17981529235839844, -0.1710968017578125, -0.16237831115722656, -0.15365982055664062, -0.1449413299560547, -0.13622283935546875, -0.1275043487548828, -0.11878585815429688, -0.11006736755371094, -0.101348876953125, -0.09263038635253906, -0.08391189575195312, -0.07519340515136719, -0.06647491455078125, -0.05775642395019531, -0.049037933349609375, -0.04031944274902344, -0.0316009521484375, -0.022882461547851562, -0.014163970947265625, -0.0054454803466796875, 0.00327301025390625, 0.011991500854492188, 0.020709991455078125, 0.029428482055664062, 0.03814697265625, 0.04686546325683594, 0.055583953857421875, 0.06430244445800781, 0.07302093505859375, 0.08173942565917969, 0.09045791625976562, 0.09917640686035156, 0.1078948974609375, 0.11661338806152344, 0.12533187866210938, 0.1340503692626953, 0.14276885986328125, 0.1514873504638672, 0.16020584106445312, 0.16892433166503906, 0.177642822265625, 0.18636131286621094, 0.19507980346679688, 0.2037982940673828, 0.21251678466796875, 0.2212352752685547, 0.22995376586914062, 0.23867225646972656, 0.2473907470703125, 0.25610923767089844, 0.2648277282714844, 0.2735462188720703, 0.28226470947265625, 0.2909832000732422, 0.2997016906738281, 0.30842018127441406, 0.317138671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 9.0, 19.0, 9.0, 38.0, 30.0, 73.0, 93.0, 186.0, 274.0, 513.0, 931.0, 1769.0, 3663.0, 7649.0, 17354.0, 47213.0, 213112.0, 3171365.0, 607168.0, 76882.0, 25400.0, 10466.0, 4880.0, 2383.0, 1243.0, 638.0, 333.0, 200.0, 146.0, 74.0, 52.0, 34.0, 28.0, 26.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0754241943359375, -1.036590576171875, -0.9977569580078125, -0.95892333984375, -0.9200897216796875, -0.881256103515625, -0.8424224853515625, -0.8035888671875, -0.7647552490234375, -0.725921630859375, -0.6870880126953125, -0.64825439453125, -0.6094207763671875, -0.570587158203125, -0.5317535400390625, -0.492919921875, -0.4540863037109375, -0.415252685546875, -0.3764190673828125, -0.33758544921875, -0.2987518310546875, -0.259918212890625, -0.2210845947265625, -0.1822509765625, -0.1434173583984375, -0.104583740234375, -0.0657501220703125, -0.02691650390625, 0.0119171142578125, 0.050750732421875, 0.0895843505859375, 0.12841796875, 0.1672515869140625, 0.206085205078125, 0.2449188232421875, 0.28375244140625, 0.3225860595703125, 0.361419677734375, 0.4002532958984375, 0.4390869140625, 0.4779205322265625, 0.516754150390625, 0.5555877685546875, 0.59442138671875, 0.6332550048828125, 0.672088623046875, 0.7109222412109375, 0.749755859375, 0.7885894775390625, 0.827423095703125, 0.8662567138671875, 0.90509033203125, 0.9439239501953125, 0.982757568359375, 1.0215911865234375, 1.0604248046875, 1.0992584228515625, 1.138092041015625, 1.1769256591796875, 1.21575927734375, 1.2545928955078125, 1.293426513671875, 1.3322601318359375, 1.37109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 13.0, 13.0, 14.0, 21.0, 35.0, 38.0, 62.0, 95.0, 126.0, 228.0, 423.0, 806.0, 868.0, 505.0, 287.0, 162.0, 109.0, 74.0, 48.0, 35.0, 27.0, 21.0, 16.0, 8.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.217193603515625, -1.18048095703125, -1.143768310546875, -1.1070556640625, -1.070343017578125, -1.03363037109375, -0.996917724609375, -0.960205078125, -0.923492431640625, -0.88677978515625, -0.850067138671875, -0.8133544921875, -0.776641845703125, -0.73992919921875, -0.703216552734375, -0.66650390625, -0.629791259765625, -0.59307861328125, -0.556365966796875, -0.5196533203125, -0.482940673828125, -0.44622802734375, -0.409515380859375, -0.372802734375, -0.336090087890625, -0.29937744140625, -0.262664794921875, -0.2259521484375, -0.189239501953125, -0.15252685546875, -0.115814208984375, -0.0791015625, -0.042388916015625, -0.00567626953125, 0.031036376953125, 0.0677490234375, 0.104461669921875, 0.14117431640625, 0.177886962890625, 0.214599609375, 0.251312255859375, 0.28802490234375, 0.324737548828125, 0.3614501953125, 0.398162841796875, 0.43487548828125, 0.471588134765625, 0.50830078125, 0.545013427734375, 0.58172607421875, 0.618438720703125, 0.6551513671875, 0.691864013671875, 0.72857666015625, 0.765289306640625, 0.802001953125, 0.838714599609375, 0.87542724609375, 0.912139892578125, 0.9488525390625, 0.985565185546875, 1.02227783203125, 1.058990478515625, 1.095703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 11.0, 14.0, 19.0, 25.0, 34.0, 50.0, 97.0, 113.0, 196.0, 300.0, 462.0, 819.0, 1370.0, 2345.0, 4305.0, 8531.0, 17383.0, 39956.0, 114399.0, 598554.0, 2808195.0, 434261.0, 95813.0, 34817.0, 15213.0, 7563.0, 3844.0, 2181.0, 1264.0, 786.0, 492.0, 302.0, 181.0, 124.0, 78.0, 46.0, 37.0, 17.0, 20.0, 8.0, 12.0, 10.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.796875, -1.7475433349609375, -1.698211669921875, -1.6488800048828125, -1.59954833984375, -1.5502166748046875, -1.500885009765625, -1.4515533447265625, -1.4022216796875, -1.3528900146484375, -1.303558349609375, -1.2542266845703125, -1.20489501953125, -1.1555633544921875, -1.106231689453125, -1.0569000244140625, -1.007568359375, -0.9582366943359375, -0.908905029296875, -0.8595733642578125, -0.81024169921875, -0.7609100341796875, -0.711578369140625, -0.6622467041015625, -0.6129150390625, -0.5635833740234375, -0.514251708984375, -0.4649200439453125, -0.41558837890625, -0.3662567138671875, -0.316925048828125, -0.2675933837890625, -0.21826171875, -0.1689300537109375, -0.119598388671875, -0.0702667236328125, -0.02093505859375, 0.0283966064453125, 0.077728271484375, 0.1270599365234375, 0.1763916015625, 0.2257232666015625, 0.275054931640625, 0.3243865966796875, 0.37371826171875, 0.4230499267578125, 0.472381591796875, 0.5217132568359375, 0.571044921875, 0.6203765869140625, 0.669708251953125, 0.7190399169921875, 0.76837158203125, 0.8177032470703125, 0.867034912109375, 0.9163665771484375, 0.9656982421875, 1.0150299072265625, 1.064361572265625, 1.1136932373046875, 1.16302490234375, 1.2123565673828125, 1.261688232421875, 1.3110198974609375, 1.3603515625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 23.0, 38.0, 63.0, 90.0, 167.0, 198.0, 182.0, 102.0, 54.0, 34.0, 21.0, 11.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.590128898620605, -9.369579315185547, -9.149030685424805, -8.928481101989746, -8.707932472229004, -8.487382888793945, -8.266834259033203, -8.046284675598145, -7.825736045837402, -7.605186939239502, -7.384637832641602, -7.164088726043701, -6.943539619445801, -6.7229905128479, -6.50244140625, -6.281891822814941, -6.061342716217041, -5.840793609619141, -5.62024450302124, -5.39969539642334, -5.1791462898254395, -4.958597183227539, -4.7380475997924805, -4.517498970031738, -4.29694938659668, -4.076400279998779, -3.855851173400879, -3.6353020668029785, -3.414752960205078, -3.1942038536071777, -2.9736545085906982, -2.753105401992798, -2.5325565338134766, -2.312007427215576, -2.091458320617676, -1.8709090948104858, -1.6503599882125854, -1.429810881614685, -1.2092616558074951, -0.9887125492095947, -0.7681634426116943, -0.547614336013794, -0.3270651698112488, -0.10651600360870361, 0.11403310298919678, 0.33458220958709717, 0.5551314353942871, 0.7756805419921875, 0.9962296485900879, 1.2167787551879883, 1.4373278617858887, 1.6578770875930786, 1.878426194190979, 2.09897518157959, 2.3195245265960693, 2.5400736331939697, 2.76062273979187, 2.9811718463897705, 3.201720952987671, 3.4222702980041504, 3.642819404602051, 3.863368511199951, 4.083917617797852, 4.304466724395752, 4.525015830993652]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 10.0, 8.0, 12.0, 8.0, 15.0, 10.0, 14.0, 16.0, 21.0, 27.0, 25.0, 32.0, 41.0, 36.0, 39.0, 36.0, 43.0, 37.0, 26.0, 42.0, 45.0, 49.0, 35.0, 44.0, 30.0, 36.0, 33.0, 28.0, 32.0, 21.0, 25.0, 27.0, 12.0, 19.0, 8.0, 14.0, 11.0, 6.0, 7.0, 11.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0], "bins": [-3.2392160892486572, -3.150736093521118, -3.062256097793579, -2.973776340484619, -2.88529634475708, -2.796816349029541, -2.708336353302002, -2.619856357574463, -2.531376361846924, -2.4428963661193848, -2.3544163703918457, -2.2659363746643066, -2.1774566173553467, -2.0889766216278076, -2.0004966259002686, -1.9120166301727295, -1.8235368728637695, -1.7350568771362305, -1.646577000617981, -1.558097004890442, -1.4696171283721924, -1.3811371326446533, -1.2926571369171143, -1.2041771411895752, -1.1156972646713257, -1.0272172689437866, -0.9387373924255371, -0.850257396697998, -0.7617774605751038, -0.6732975244522095, -0.5848175287246704, -0.4963375926017761, -0.40785741806030273, -0.31937748193740845, -0.23089751601219177, -0.1424175500869751, -0.05393761396408081, 0.03454232215881348, 0.12302231788635254, 0.21150225400924683, 0.2999821901321411, 0.3884621262550354, 0.4769420921802521, 0.5654220581054688, 0.653901994228363, 0.7423819303512573, 0.8308619260787964, 0.9193418622016907, 1.007821798324585, 1.096301794052124, 1.1847816705703735, 1.2732616662979126, 1.361741542816162, 1.4502215385437012, 1.5387015342712402, 1.6271815299987793, 1.7156614065170288, 1.8041414022445679, 1.8926212787628174, 1.9811012744903564, 2.0695812702178955, 2.1580610275268555, 2.2465410232543945, 2.3350210189819336, 2.4235010147094727]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 11.0, 4.0, 12.0, 20.0, 15.0, 22.0, 26.0, 30.0, 35.0, 31.0, 31.0, 40.0, 28.0, 45.0, 32.0, 48.0, 40.0, 34.0, 55.0, 36.0, 33.0, 34.0, 45.0, 33.0, 29.0, 21.0, 34.0, 20.0, 23.0, 15.0, 21.0, 19.0, 10.0, 17.0, 4.0, 8.0, 4.0, 0.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.22080039978027344, -0.21271896362304688, -0.2046375274658203, -0.19655609130859375, -0.1884746551513672, -0.18039321899414062, -0.17231178283691406, -0.1642303466796875, -0.15614891052246094, -0.14806747436523438, -0.1399860382080078, -0.13190460205078125, -0.12382316589355469, -0.11574172973632812, -0.10766029357910156, -0.099578857421875, -0.09149742126464844, -0.08341598510742188, -0.07533454895019531, -0.06725311279296875, -0.05917167663574219, -0.051090240478515625, -0.04300880432128906, -0.0349273681640625, -0.026845932006835938, -0.018764495849609375, -0.010683059692382812, -0.00260162353515625, 0.0054798126220703125, 0.013561248779296875, 0.021642684936523438, 0.02972412109375, 0.03780555725097656, 0.045886993408203125, 0.05396842956542969, 0.06204986572265625, 0.07013130187988281, 0.07821273803710938, 0.08629417419433594, 0.0943756103515625, 0.10245704650878906, 0.11053848266601562, 0.11861991882324219, 0.12670135498046875, 0.1347827911376953, 0.14286422729492188, 0.15094566345214844, 0.159027099609375, 0.16710853576660156, 0.17518997192382812, 0.1832714080810547, 0.19135284423828125, 0.1994342803955078, 0.20751571655273438, 0.21559715270996094, 0.2236785888671875, 0.23176002502441406, 0.23984146118164062, 0.2479228973388672, 0.25600433349609375, 0.2640857696533203, 0.2721672058105469, 0.28024864196777344, 0.288330078125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 17.0, 21.0, 37.0, 44.0, 92.0, 116.0, 193.0, 280.0, 438.0, 703.0, 1070.0, 1740.0, 2940.0, 4755.0, 8268.0, 14853.0, 27118.0, 50638.0, 93742.0, 162238.0, 221049.0, 191283.0, 120825.0, 65840.0, 35299.0, 19031.0, 10518.0, 6117.0, 3572.0, 2168.0, 1271.0, 773.0, 511.0, 337.0, 224.0, 120.0, 103.0, 66.0, 46.0, 31.0, 13.0, 11.0, 9.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279052734375, -0.26996612548828125, -0.2608795166015625, -0.25179290771484375, -0.242706298828125, -0.23361968994140625, -0.2245330810546875, -0.21544647216796875, -0.20635986328125, -0.19727325439453125, -0.1881866455078125, -0.17910003662109375, -0.170013427734375, -0.16092681884765625, -0.1518402099609375, -0.14275360107421875, -0.1336669921875, -0.12458038330078125, -0.1154937744140625, -0.10640716552734375, -0.097320556640625, -0.08823394775390625, -0.0791473388671875, -0.07006072998046875, -0.06097412109375, -0.05188751220703125, -0.0428009033203125, -0.03371429443359375, -0.024627685546875, -0.01554107666015625, -0.0064544677734375, 0.00263214111328125, 0.01171875, 0.02080535888671875, 0.0298919677734375, 0.03897857666015625, 0.048065185546875, 0.05715179443359375, 0.0662384033203125, 0.07532501220703125, 0.08441162109375, 0.09349822998046875, 0.1025848388671875, 0.11167144775390625, 0.120758056640625, 0.12984466552734375, 0.1389312744140625, 0.14801788330078125, 0.1571044921875, 0.16619110107421875, 0.1752777099609375, 0.18436431884765625, 0.193450927734375, 0.20253753662109375, 0.2116241455078125, 0.22071075439453125, 0.22979736328125, 0.23888397216796875, 0.2479705810546875, 0.25705718994140625, 0.266143798828125, 0.27523040771484375, 0.2843170166015625, 0.29340362548828125, 0.302490234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 7.0, 9.0, 13.0, 6.0, 11.0, 19.0, 17.0, 18.0, 21.0, 21.0, 23.0, 26.0, 31.0, 30.0, 36.0, 26.0, 39.0, 32.0, 40.0, 1062.0, 38.0, 52.0, 36.0, 37.0, 36.0, 37.0, 28.0, 39.0, 26.0, 28.0, 21.0, 31.0, 12.0, 25.0, 16.0, 7.0, 10.0, 8.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.228515625, -0.22111892700195312, -0.21372222900390625, -0.20632553100585938, -0.1989288330078125, -0.19153213500976562, -0.18413543701171875, -0.17673873901367188, -0.169342041015625, -0.16194534301757812, -0.15454864501953125, -0.14715194702148438, -0.1397552490234375, -0.13235855102539062, -0.12496185302734375, -0.11756515502929688, -0.11016845703125, -0.10277175903320312, -0.09537506103515625, -0.08797836303710938, -0.0805816650390625, -0.07318496704101562, -0.06578826904296875, -0.058391571044921875, -0.050994873046875, -0.043598175048828125, -0.03620147705078125, -0.028804779052734375, -0.0214080810546875, -0.014011383056640625, -0.00661468505859375, 0.000782012939453125, 0.0081787109375, 0.015575408935546875, 0.02297210693359375, 0.030368804931640625, 0.0377655029296875, 0.045162200927734375, 0.05255889892578125, 0.059955596923828125, 0.067352294921875, 0.07474899291992188, 0.08214569091796875, 0.08954238891601562, 0.0969390869140625, 0.10433578491210938, 0.11173248291015625, 0.11912918090820312, 0.12652587890625, 0.13392257690429688, 0.14131927490234375, 0.14871597290039062, 0.1561126708984375, 0.16350936889648438, 0.17090606689453125, 0.17830276489257812, 0.185699462890625, 0.19309616088867188, 0.20049285888671875, 0.20788955688476562, 0.2152862548828125, 0.22268295288085938, 0.23007965087890625, 0.23747634887695312, 0.244873046875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 3.0, 11.0, 16.0, 10.0, 26.0, 41.0, 52.0, 76.0, 104.0, 166.0, 234.0, 325.0, 531.0, 806.0, 1218.0, 2022.0, 3274.0, 5354.0, 9580.0, 17898.0, 37160.0, 134011.0, 1676651.0, 129292.0, 36863.0, 17611.0, 9530.0, 5500.0, 3240.0, 1923.0, 1215.0, 772.0, 531.0, 345.0, 233.0, 144.0, 112.0, 73.0, 50.0, 41.0, 21.0, 17.0, 6.0, 12.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.390869140625, -0.3798561096191406, -0.36884307861328125, -0.3578300476074219, -0.3468170166015625, -0.3358039855957031, -0.32479095458984375, -0.3137779235839844, -0.302764892578125, -0.2917518615722656, -0.28073883056640625, -0.2697257995605469, -0.2587127685546875, -0.24769973754882812, -0.23668670654296875, -0.22567367553710938, -0.21466064453125, -0.20364761352539062, -0.19263458251953125, -0.18162155151367188, -0.1706085205078125, -0.15959548950195312, -0.14858245849609375, -0.13756942749023438, -0.126556396484375, -0.11554336547851562, -0.10453033447265625, -0.09351730346679688, -0.0825042724609375, -0.07149124145507812, -0.06047821044921875, -0.049465179443359375, -0.0384521484375, -0.027439117431640625, -0.01642608642578125, -0.005413055419921875, 0.0055999755859375, 0.016613006591796875, 0.02762603759765625, 0.038639068603515625, 0.049652099609375, 0.060665130615234375, 0.07167816162109375, 0.08269119262695312, 0.0937042236328125, 0.10471725463867188, 0.11573028564453125, 0.12674331665039062, 0.13775634765625, 0.14876937866210938, 0.15978240966796875, 0.17079544067382812, 0.1818084716796875, 0.19282150268554688, 0.20383453369140625, 0.21484756469726562, 0.225860595703125, 0.23687362670898438, 0.24788665771484375, 0.2588996887207031, 0.2699127197265625, 0.2809257507324219, 0.29193878173828125, 0.3029518127441406, 0.31396484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 14.0, 14.0, 19.0, 19.0, 28.0, 24.0, 39.0, 34.0, 58.0, 79.0, 97.0, 83.0, 83.0, 78.0, 47.0, 47.0, 29.0, 40.0, 21.0, 20.0, 16.0, 16.0, 14.0, 8.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059967041015625, -0.05798959732055664, -0.05601215362548828, -0.05403470993041992, -0.05205726623535156, -0.0500798225402832, -0.048102378845214844, -0.046124935150146484, -0.044147491455078125, -0.042170047760009766, -0.040192604064941406, -0.03821516036987305, -0.03623771667480469, -0.03426027297973633, -0.03228282928466797, -0.03030538558959961, -0.02832794189453125, -0.02635049819946289, -0.02437305450439453, -0.022395610809326172, -0.020418167114257812, -0.018440723419189453, -0.016463279724121094, -0.014485836029052734, -0.012508392333984375, -0.010530948638916016, -0.008553504943847656, -0.006576061248779297, -0.0045986175537109375, -0.002621173858642578, -0.0006437301635742188, 0.0013337135314941406, 0.0033111572265625, 0.005288600921630859, 0.007266044616699219, 0.009243488311767578, 0.011220932006835938, 0.013198375701904297, 0.015175819396972656, 0.017153263092041016, 0.019130706787109375, 0.021108150482177734, 0.023085594177246094, 0.025063037872314453, 0.027040481567382812, 0.029017925262451172, 0.03099536895751953, 0.03297281265258789, 0.03495025634765625, 0.03692770004272461, 0.03890514373779297, 0.04088258743286133, 0.04286003112792969, 0.04483747482299805, 0.046814918518066406, 0.048792362213134766, 0.050769805908203125, 0.052747249603271484, 0.054724693298339844, 0.0567021369934082, 0.05867958068847656, 0.06065702438354492, 0.06263446807861328, 0.06461191177368164, 0.06658935546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 9.0, 6.0, 5.0, 15.0, 23.0, 35.0, 38.0, 36.0, 60.0, 49.0, 95.0, 100.0, 150.0, 195.0, 535.0, 2869.0, 45346.0, 949178.0, 45687.0, 2698.0, 508.0, 221.0, 150.0, 120.0, 81.0, 66.0, 64.0, 37.0, 38.0, 25.0, 22.0, 22.0, 13.0, 8.0, 7.0, 9.0, 5.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9091796875, -0.8793716430664062, -0.8495635986328125, -0.8197555541992188, -0.789947509765625, -0.7601394653320312, -0.7303314208984375, -0.7005233764648438, -0.67071533203125, -0.6409072875976562, -0.6110992431640625, -0.5812911987304688, -0.551483154296875, -0.5216751098632812, -0.4918670654296875, -0.46205902099609375, -0.4322509765625, -0.40244293212890625, -0.3726348876953125, -0.34282684326171875, -0.313018798828125, -0.28321075439453125, -0.2534027099609375, -0.22359466552734375, -0.19378662109375, -0.16397857666015625, -0.1341705322265625, -0.10436248779296875, -0.074554443359375, -0.04474639892578125, -0.0149383544921875, 0.01486968994140625, 0.044677734375, 0.07448577880859375, 0.1042938232421875, 0.13410186767578125, 0.163909912109375, 0.19371795654296875, 0.2235260009765625, 0.25333404541015625, 0.28314208984375, 0.31295013427734375, 0.3427581787109375, 0.37256622314453125, 0.402374267578125, 0.43218231201171875, 0.4619903564453125, 0.49179840087890625, 0.5216064453125, 0.5514144897460938, 0.5812225341796875, 0.6110305786132812, 0.640838623046875, 0.6706466674804688, 0.7004547119140625, 0.7302627563476562, 0.76007080078125, 0.7898788452148438, 0.8196868896484375, 0.8494949340820312, 0.879302978515625, 0.9091110229492188, 0.9389190673828125, 0.9687271118164062, 0.99853515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 21.0, 39.0, 196.0, 525.0, 162.0, 47.0, 15.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6840139627456665, -0.6425625085830688, -0.601111114025116, -0.5596597194671631, -0.5182082653045654, -0.47675684094429016, -0.4353054165840149, -0.3938539922237396, -0.35240256786346436, -0.3109511435031891, -0.2694997191429138, -0.22804829478263855, -0.18659687042236328, -0.145145446062088, -0.10369402170181274, -0.062242597341537476, -0.020791172981262207, 0.02066025137901306, 0.06211167573928833, 0.1035631000995636, 0.14501452445983887, 0.18646594882011414, 0.2279173731803894, 0.2693687975406647, 0.31082022190093994, 0.3522716462612152, 0.3937230706214905, 0.43517449498176575, 0.476625919342041, 0.5180773735046387, 0.5595287680625916, 0.6009801626205444, 0.6424314975738525, 0.6838829517364502, 0.7253343462944031, 0.766785740852356, 0.8082371950149536, 0.8496886491775513, 0.8911400437355042, 0.932591438293457, 0.9740428924560547, 1.0154943466186523, 1.05694580078125, 1.098397135734558, 1.1398485898971558, 1.1813000440597534, 1.2227513790130615, 1.2642028331756592, 1.3056542873382568, 1.3471057415008545, 1.3885571956634521, 1.4300085306167603, 1.471459984779358, 1.5129114389419556, 1.5543627738952637, 1.5958142280578613, 1.637265682220459, 1.6787171363830566, 1.7201685905456543, 1.7616199254989624, 1.80307137966156, 1.8445228338241577, 1.8859741687774658, 1.9274256229400635, 1.9688770771026611]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 8.0, 3.0, 3.0, 13.0, 12.0, 12.0, 17.0, 17.0, 19.0, 24.0, 25.0, 20.0, 26.0, 28.0, 34.0, 29.0, 34.0, 44.0, 42.0, 37.0, 46.0, 47.0, 46.0, 46.0, 54.0, 42.0, 39.0, 30.0, 32.0, 26.0, 29.0, 18.0, 24.0, 11.0, 16.0, 14.0, 8.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21779298782348633, -0.21111373603343964, -0.20443449914455414, -0.19775524735450745, -0.19107599556446075, -0.18439674377441406, -0.17771750688552856, -0.17103825509548187, -0.16435900330543518, -0.1576797515153885, -0.151000514626503, -0.1443212628364563, -0.1376420110464096, -0.13096275925636292, -0.12428352236747742, -0.11760427057743073, -0.11092503368854523, -0.10424578934907913, -0.09756653755903244, -0.09088729321956635, -0.08420804142951965, -0.07752879709005356, -0.07084955275058746, -0.06417030096054077, -0.057491056621074677, -0.05081180855631828, -0.04413256049156189, -0.037453316152095795, -0.0307740680873394, -0.024094820022583008, -0.017415575683116913, -0.01073632761836052, -0.004057079553604126, 0.002622167579829693, 0.009301414713263512, 0.015980660915374756, 0.02265990898013115, 0.029339157044887543, 0.03601840138435364, 0.04269764944911003, 0.049376897513866425, 0.05605614557862282, 0.06273539364337921, 0.0694146379828453, 0.0760938823223114, 0.0827731341123581, 0.08945237845182419, 0.09613162279129028, 0.10281087458133698, 0.10949011892080307, 0.11616937071084976, 0.12284861505031586, 0.12952786684036255, 0.13620710372924805, 0.14288635551929474, 0.14956560730934143, 0.15624484419822693, 0.16292409598827362, 0.16960333287715912, 0.1762825846672058, 0.1829618364572525, 0.1896410882472992, 0.1963203251361847, 0.20299957692623138, 0.20967882871627808]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 6.0, 7.0, 9.0, 7.0, 9.0, 7.0, 14.0, 20.0, 18.0, 31.0, 21.0, 35.0, 33.0, 29.0, 36.0, 33.0, 38.0, 45.0, 36.0, 37.0, 40.0, 46.0, 51.0, 30.0, 30.0, 36.0, 44.0, 28.0, 30.0, 34.0, 22.0, 22.0, 18.0, 19.0, 18.0, 12.0, 12.0, 11.0, 7.0, 7.0, 0.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22599411010742188, -0.21785736083984375, -0.20972061157226562, -0.2015838623046875, -0.19344711303710938, -0.18531036376953125, -0.17717361450195312, -0.169036865234375, -0.16090011596679688, -0.15276336669921875, -0.14462661743164062, -0.1364898681640625, -0.12835311889648438, -0.12021636962890625, -0.11207962036132812, -0.10394287109375, -0.09580612182617188, -0.08766937255859375, -0.07953262329101562, -0.0713958740234375, -0.06325912475585938, -0.05512237548828125, -0.046985626220703125, -0.038848876953125, -0.030712127685546875, -0.02257537841796875, -0.014438629150390625, -0.0063018798828125, 0.001834869384765625, 0.00997161865234375, 0.018108367919921875, 0.0262451171875, 0.034381866455078125, 0.04251861572265625, 0.050655364990234375, 0.0587921142578125, 0.06692886352539062, 0.07506561279296875, 0.08320236206054688, 0.091339111328125, 0.09947586059570312, 0.10761260986328125, 0.11574935913085938, 0.1238861083984375, 0.13202285766601562, 0.14015960693359375, 0.14829635620117188, 0.15643310546875, 0.16456985473632812, 0.17270660400390625, 0.18084335327148438, 0.1889801025390625, 0.19711685180664062, 0.20525360107421875, 0.21339035034179688, 0.221527099609375, 0.22966384887695312, 0.23780059814453125, 0.24593734741210938, 0.2540740966796875, 0.2622108459472656, 0.27034759521484375, 0.2784843444824219, 0.28662109375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 9.0, 20.0, 19.0, 37.0, 31.0, 52.0, 94.0, 112.0, 159.0, 189.0, 278.0, 407.0, 616.0, 901.0, 1400.0, 2526.0, 4654.0, 9317.0, 22700.0, 73809.0, 389227.0, 418228.0, 78721.0, 23520.0, 9588.0, 4728.0, 2676.0, 1497.0, 967.0, 590.0, 429.0, 284.0, 216.0, 150.0, 119.0, 64.0, 66.0, 33.0, 29.0, 32.0, 18.0, 10.0, 8.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.681640625, -0.6621780395507812, -0.6427154541015625, -0.6232528686523438, -0.603790283203125, -0.5843276977539062, -0.5648651123046875, -0.5454025268554688, -0.52593994140625, -0.5064773559570312, -0.4870147705078125, -0.46755218505859375, -0.448089599609375, -0.42862701416015625, -0.4091644287109375, -0.38970184326171875, -0.3702392578125, -0.35077667236328125, -0.3313140869140625, -0.31185150146484375, -0.292388916015625, -0.27292633056640625, -0.2534637451171875, -0.23400115966796875, -0.21453857421875, -0.19507598876953125, -0.1756134033203125, -0.15615081787109375, -0.136688232421875, -0.11722564697265625, -0.0977630615234375, -0.07830047607421875, -0.058837890625, -0.03937530517578125, -0.0199127197265625, -0.00045013427734375, 0.019012451171875, 0.03847503662109375, 0.0579376220703125, 0.07740020751953125, 0.09686279296875, 0.11632537841796875, 0.1357879638671875, 0.15525054931640625, 0.174713134765625, 0.19417572021484375, 0.2136383056640625, 0.23310089111328125, 0.2525634765625, 0.27202606201171875, 0.2914886474609375, 0.31095123291015625, 0.330413818359375, 0.34987640380859375, 0.3693389892578125, 0.38880157470703125, 0.40826416015625, 0.42772674560546875, 0.4471893310546875, 0.46665191650390625, 0.486114501953125, 0.5055770874023438, 0.5250396728515625, 0.5445022583007812, 0.56396484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 10.0, 5.0, 6.0, 5.0, 10.0, 12.0, 13.0, 14.0, 23.0, 29.0, 33.0, 39.0, 29.0, 50.0, 43.0, 34.0, 55.0, 62.0, 97.0, 240.0, 1453.0, 222.0, 105.0, 66.0, 60.0, 65.0, 38.0, 31.0, 30.0, 31.0, 20.0, 19.0, 15.0, 13.0, 14.0, 12.0, 8.0, 6.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0733184814453125, -1.039215087890625, -1.0051116943359375, -0.97100830078125, -0.9369049072265625, -0.902801513671875, -0.8686981201171875, -0.8345947265625, -0.8004913330078125, -0.766387939453125, -0.7322845458984375, -0.69818115234375, -0.6640777587890625, -0.629974365234375, -0.5958709716796875, -0.561767578125, -0.5276641845703125, -0.493560791015625, -0.4594573974609375, -0.42535400390625, -0.3912506103515625, -0.357147216796875, -0.3230438232421875, -0.2889404296875, -0.2548370361328125, -0.220733642578125, -0.1866302490234375, -0.15252685546875, -0.1184234619140625, -0.084320068359375, -0.0502166748046875, -0.01611328125, 0.0179901123046875, 0.052093505859375, 0.0861968994140625, 0.12030029296875, 0.1544036865234375, 0.188507080078125, 0.2226104736328125, 0.2567138671875, 0.2908172607421875, 0.324920654296875, 0.3590240478515625, 0.39312744140625, 0.4272308349609375, 0.461334228515625, 0.4954376220703125, 0.529541015625, 0.5636444091796875, 0.597747802734375, 0.6318511962890625, 0.66595458984375, 0.7000579833984375, 0.734161376953125, 0.7682647705078125, 0.8023681640625, 0.8364715576171875, 0.870574951171875, 0.9046783447265625, 0.93878173828125, 0.9728851318359375, 1.006988525390625, 1.0410919189453125, 1.0751953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 11.0, 14.0, 32.0, 32.0, 51.0, 43.0, 103.0, 149.0, 261.0, 479.0, 882.0, 1856.0, 4057.0, 10802.0, 37741.0, 401006.0, 2555118.0, 100587.0, 19923.0, 6721.0, 2843.0, 1347.0, 644.0, 345.0, 219.0, 127.0, 102.0, 68.0, 40.0, 18.0, 17.0, 9.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.79583740234375, -1.7322998046875, -1.66876220703125, -1.605224609375, -1.54168701171875, -1.4781494140625, -1.41461181640625, -1.35107421875, -1.28753662109375, -1.2239990234375, -1.16046142578125, -1.096923828125, -1.03338623046875, -0.9698486328125, -0.90631103515625, -0.8427734375, -0.77923583984375, -0.7156982421875, -0.65216064453125, -0.588623046875, -0.52508544921875, -0.4615478515625, -0.39801025390625, -0.33447265625, -0.27093505859375, -0.2073974609375, -0.14385986328125, -0.080322265625, -0.01678466796875, 0.0467529296875, 0.11029052734375, 0.173828125, 0.23736572265625, 0.3009033203125, 0.36444091796875, 0.427978515625, 0.49151611328125, 0.5550537109375, 0.61859130859375, 0.68212890625, 0.74566650390625, 0.8092041015625, 0.87274169921875, 0.936279296875, 0.99981689453125, 1.0633544921875, 1.12689208984375, 1.1904296875, 1.25396728515625, 1.3175048828125, 1.38104248046875, 1.444580078125, 1.50811767578125, 1.5716552734375, 1.63519287109375, 1.69873046875, 1.76226806640625, 1.8258056640625, 1.88934326171875, 1.952880859375, 2.01641845703125, 2.0799560546875, 2.14349365234375, 2.20703125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 36.0, 609.0, 361.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.606966495513916, -3.8221938610076904, -3.037421226501465, -2.25264835357666, -1.4678757190704346, -0.683103084564209, 0.1016697883605957, 0.8864421844482422, 1.6712150573730469, 2.4559876918792725, 3.240760326385498, 4.025533199310303, 4.810305595397949, 5.595078468322754, 6.379851341247559, 7.164623737335205, 7.94939661026001, 8.734169006347656, 9.518941879272461, 10.303714752197266, 11.08848762512207, 11.873260498046875, 12.65803337097168, 13.442805290222168, 14.227578163146973, 15.012351036071777, 15.797123908996582, 16.58189582824707, 17.366668701171875, 18.15144157409668, 18.936214447021484, 19.72098731994629, 20.50575828552246, 21.290531158447266, 22.07530403137207, 22.860076904296875, 23.64484977722168, 24.429622650146484, 25.214393615722656, 25.99916648864746, 26.783939361572266, 27.56871223449707, 28.353485107421875, 29.13825798034668, 29.923030853271484, 30.707801818847656, 31.492576599121094, 32.277347564697266, 33.0621223449707, 33.846893310546875, 34.63166809082031, 35.416439056396484, 36.20121383666992, 36.985984802246094, 37.77075958251953, 38.5555305480957, 39.340301513671875, 40.12507247924805, 40.909847259521484, 41.694618225097656, 42.479393005371094, 43.264163970947266, 44.0489387512207, 44.833709716796875, 45.61848449707031]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 8.0, 5.0, 13.0, 13.0, 22.0, 16.0, 17.0, 20.0, 29.0, 36.0, 34.0, 28.0, 33.0, 40.0, 49.0, 48.0, 60.0, 51.0, 59.0, 51.0, 36.0, 38.0, 35.0, 25.0, 32.0, 27.0, 23.0, 26.0, 20.0, 23.0, 13.0, 19.0, 14.0, 6.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.193919658660889, -4.078916072845459, -3.963912010192871, -3.8489081859588623, -3.7339043617248535, -3.618900775909424, -3.503896713256836, -3.3888931274414062, -3.2738893032073975, -3.1588854789733887, -3.04388165473938, -2.928877830505371, -2.8138740062713623, -2.6988701820373535, -2.583866596221924, -2.468862771987915, -2.3538589477539062, -2.2388551235198975, -2.1238512992858887, -2.00884747505188, -1.8938437700271606, -1.7788399457931519, -1.663836121559143, -1.5488324165344238, -1.433828353881836, -1.3188245296478271, -1.2038207054138184, -1.0888168811798096, -0.9738131761550903, -0.8588093519210815, -0.7438055276870728, -0.6288017630577087, -0.5137979984283447, -0.3987942039966583, -0.2837904095649719, -0.16878658533096313, -0.05378279089927673, 0.06122100353240967, 0.17622482776641846, 0.29122859239578247, 0.40623241662979126, 0.5212362408638, 0.6362400054931641, 0.7512438297271729, 0.8662476539611816, 0.9812514185905457, 1.0962553024291992, 1.2112590074539185, 1.3262628316879272, 1.441266655921936, 1.5562704801559448, 1.671274185180664, 1.7862780094146729, 1.9012818336486816, 2.0162856578826904, 2.131289482116699, 2.246293306350708, 2.361297130584717, 2.4763009548187256, 2.5913047790527344, 2.706308603286743, 2.821312427520752, 2.9363160133361816, 3.0513198375701904, 3.166323661804199]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 7.0, 6.0, 5.0, 9.0, 15.0, 14.0, 15.0, 24.0, 24.0, 19.0, 24.0, 43.0, 30.0, 42.0, 31.0, 32.0, 37.0, 33.0, 35.0, 37.0, 48.0, 50.0, 26.0, 33.0, 25.0, 33.0, 30.0, 27.0, 31.0, 25.0, 27.0, 22.0, 27.0, 17.0, 20.0, 9.0, 12.0, 3.0, 4.0, 9.0, 6.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.239990234375, -0.23199462890625, -0.2239990234375, -0.21600341796875, -0.2080078125, -0.20001220703125, -0.1920166015625, -0.18402099609375, -0.176025390625, -0.16802978515625, -0.1600341796875, -0.15203857421875, -0.14404296875, -0.13604736328125, -0.1280517578125, -0.12005615234375, -0.112060546875, -0.10406494140625, -0.0960693359375, -0.08807373046875, -0.080078125, -0.07208251953125, -0.0640869140625, -0.05609130859375, -0.048095703125, -0.04010009765625, -0.0321044921875, -0.02410888671875, -0.01611328125, -0.00811767578125, -0.0001220703125, 0.00787353515625, 0.015869140625, 0.02386474609375, 0.0318603515625, 0.03985595703125, 0.0478515625, 0.05584716796875, 0.0638427734375, 0.07183837890625, 0.079833984375, 0.08782958984375, 0.0958251953125, 0.10382080078125, 0.11181640625, 0.11981201171875, 0.1278076171875, 0.13580322265625, 0.143798828125, 0.15179443359375, 0.1597900390625, 0.16778564453125, 0.17578125, 0.18377685546875, 0.1917724609375, 0.19976806640625, 0.207763671875, 0.21575927734375, 0.2237548828125, 0.23175048828125, 0.23974609375, 0.24774169921875, 0.2557373046875, 0.26373291015625, 0.271728515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 14.0, 13.0, 18.0, 22.0, 30.0, 41.0, 50.0, 69.0, 111.0, 178.0, 290.0, 539.0, 998.0, 1812.0, 3692.0, 7664.0, 18611.0, 56630.0, 332789.0, 2960354.0, 681884.0, 83668.0, 25129.0, 10218.0, 4657.0, 2165.0, 1159.0, 569.0, 338.0, 177.0, 105.0, 69.0, 52.0, 48.0, 22.0, 15.0, 22.0, 9.0, 9.0, 10.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.888671875, -0.8586883544921875, -0.828704833984375, -0.7987213134765625, -0.76873779296875, -0.7387542724609375, -0.708770751953125, -0.6787872314453125, -0.6488037109375, -0.6188201904296875, -0.588836669921875, -0.5588531494140625, -0.52886962890625, -0.4988861083984375, -0.468902587890625, -0.4389190673828125, -0.408935546875, -0.3789520263671875, -0.348968505859375, -0.3189849853515625, -0.28900146484375, -0.2590179443359375, -0.229034423828125, -0.1990509033203125, -0.1690673828125, -0.1390838623046875, -0.109100341796875, -0.0791168212890625, -0.04913330078125, -0.0191497802734375, 0.010833740234375, 0.0408172607421875, 0.07080078125, 0.1007843017578125, 0.130767822265625, 0.1607513427734375, 0.19073486328125, 0.2207183837890625, 0.250701904296875, 0.2806854248046875, 0.3106689453125, 0.3406524658203125, 0.370635986328125, 0.4006195068359375, 0.43060302734375, 0.4605865478515625, 0.490570068359375, 0.5205535888671875, 0.550537109375, 0.5805206298828125, 0.610504150390625, 0.6404876708984375, 0.67047119140625, 0.7004547119140625, 0.730438232421875, 0.7604217529296875, 0.7904052734375, 0.8203887939453125, 0.850372314453125, 0.8803558349609375, 0.91033935546875, 0.9403228759765625, 0.970306396484375, 1.0002899169921875, 1.0302734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 13.0, 14.0, 32.0, 47.0, 83.0, 95.0, 198.0, 359.0, 806.0, 982.0, 657.0, 305.0, 157.0, 98.0, 71.0, 45.0, 37.0, 24.0, 8.0, 10.0, 9.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9506378173828125, -0.908111572265625, -0.8655853271484375, -0.82305908203125, -0.7805328369140625, -0.738006591796875, -0.6954803466796875, -0.6529541015625, -0.6104278564453125, -0.567901611328125, -0.5253753662109375, -0.48284912109375, -0.4403228759765625, -0.397796630859375, -0.3552703857421875, -0.312744140625, -0.2702178955078125, -0.227691650390625, -0.1851654052734375, -0.14263916015625, -0.1001129150390625, -0.057586669921875, -0.0150604248046875, 0.0274658203125, 0.0699920654296875, 0.112518310546875, 0.1550445556640625, 0.19757080078125, 0.2400970458984375, 0.282623291015625, 0.3251495361328125, 0.36767578125, 0.4102020263671875, 0.452728271484375, 0.4952545166015625, 0.53778076171875, 0.5803070068359375, 0.622833251953125, 0.6653594970703125, 0.7078857421875, 0.7504119873046875, 0.792938232421875, 0.8354644775390625, 0.87799072265625, 0.9205169677734375, 0.963043212890625, 1.0055694580078125, 1.048095703125, 1.0906219482421875, 1.133148193359375, 1.1756744384765625, 1.21820068359375, 1.2607269287109375, 1.303253173828125, 1.3457794189453125, 1.3883056640625, 1.4308319091796875, 1.473358154296875, 1.5158843994140625, 1.55841064453125, 1.6009368896484375, 1.643463134765625, 1.6859893798828125, 1.728515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 13.0, 13.0, 24.0, 31.0, 40.0, 59.0, 109.0, 165.0, 335.0, 753.0, 1715.0, 4633.0, 16354.0, 77402.0, 1049046.0, 2861455.0, 145369.0, 25689.0, 6846.0, 2336.0, 909.0, 416.0, 235.0, 115.0, 74.0, 41.0, 27.0, 28.0, 12.0, 8.0, 12.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.6160125732421875, -1.539642333984375, -1.4632720947265625, -1.38690185546875, -1.3105316162109375, -1.234161376953125, -1.1577911376953125, -1.0814208984375, -1.0050506591796875, -0.928680419921875, -0.8523101806640625, -0.77593994140625, -0.6995697021484375, -0.623199462890625, -0.5468292236328125, -0.470458984375, -0.3940887451171875, -0.317718505859375, -0.2413482666015625, -0.16497802734375, -0.0886077880859375, -0.012237548828125, 0.0641326904296875, 0.1405029296875, 0.2168731689453125, 0.293243408203125, 0.3696136474609375, 0.44598388671875, 0.5223541259765625, 0.598724365234375, 0.6750946044921875, 0.75146484375, 0.8278350830078125, 0.904205322265625, 0.9805755615234375, 1.05694580078125, 1.1333160400390625, 1.209686279296875, 1.2860565185546875, 1.3624267578125, 1.4387969970703125, 1.515167236328125, 1.5915374755859375, 1.66790771484375, 1.7442779541015625, 1.820648193359375, 1.8970184326171875, 1.973388671875, 2.0497589111328125, 2.126129150390625, 2.2024993896484375, 2.27886962890625, 2.3552398681640625, 2.431610107421875, 2.5079803466796875, 2.5843505859375, 2.6607208251953125, 2.737091064453125, 2.8134613037109375, 2.88983154296875, 2.9662017822265625, 3.042572021484375, 3.1189422607421875, 3.1953125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 6.0, 4.0, 6.0, 9.0, 4.0, 20.0, 14.0, 23.0, 24.0, 25.0, 46.0, 50.0, 69.0, 78.0, 85.0, 80.0, 101.0, 77.0, 58.0, 50.0, 37.0, 29.0, 16.0, 23.0, 13.0, 18.0, 6.0, 7.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.330406665802002, -3.2305705547332764, -3.1307342052459717, -3.030898094177246, -2.9310617446899414, -2.831225633621216, -2.7313895225524902, -2.6315531730651855, -2.531716823577881, -2.4318807125091553, -2.3320443630218506, -2.232208251953125, -2.1323719024658203, -2.0325357913970947, -1.9326995611190796, -1.8328633308410645, -1.7330272197723389, -1.6331909894943237, -1.5333547592163086, -1.433518648147583, -1.3336822986602783, -1.2338461875915527, -1.1340099573135376, -1.0341737270355225, -0.9343374967575073, -0.8345012664794922, -0.734665036201477, -0.6348288655281067, -0.5349926352500916, -0.4351564049720764, -0.33532023429870605, -0.23548400402069092, -0.13564753532409668, -0.03581131994724274, 0.0640248954296112, 0.16386109590530396, 0.2636973261833191, 0.36353355646133423, 0.4633697271347046, 0.5632059574127197, 0.6630421876907349, 0.76287841796875, 0.8627146482467651, 0.9625508189201355, 1.0623869895935059, 1.1622233390808105, 1.2620594501495361, 1.3618956804275513, 1.4617319107055664, 1.5615681409835815, 1.6614043712615967, 1.7612404823303223, 1.861076831817627, 1.9609129428863525, 2.060749053955078, 2.160585403442383, 2.2604217529296875, 2.360257863998413, 2.4600942134857178, 2.5599303245544434, 2.659766674041748, 2.7596027851104736, 2.859438896179199, 2.959275245666504, 3.0591113567352295]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 6.0, 10.0, 5.0, 11.0, 9.0, 17.0, 15.0, 14.0, 17.0, 21.0, 24.0, 26.0, 22.0, 23.0, 26.0, 37.0, 25.0, 27.0, 36.0, 37.0, 38.0, 39.0, 35.0, 38.0, 31.0, 38.0, 32.0, 38.0, 27.0, 37.0, 22.0, 19.0, 19.0, 21.0, 21.0, 17.0, 20.0, 15.0, 18.0, 6.0, 4.0, 10.0, 8.0, 8.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.440983772277832, -2.362919807434082, -2.284855604171753, -2.206791400909424, -2.128727436065674, -2.050663471221924, -1.9725992679595947, -1.8945351839065552, -1.8164710998535156, -1.738407015800476, -1.6603429317474365, -1.582278847694397, -1.5042147636413574, -1.4261506795883179, -1.3480865955352783, -1.2700225114822388, -1.1919584274291992, -1.1138943433761597, -1.0358302593231201, -0.9577661752700806, -0.879702091217041, -0.8016380071640015, -0.7235739231109619, -0.6455098390579224, -0.5674457550048828, -0.48938167095184326, -0.4113175868988037, -0.33325350284576416, -0.2551894187927246, -0.17712533473968506, -0.09906125068664551, -0.020997166633605957, 0.057067155838012695, 0.13513123989105225, 0.2131953239440918, 0.29125940799713135, 0.3693234920501709, 0.44738757610321045, 0.52545166015625, 0.6035157442092896, 0.6815798282623291, 0.7596439123153687, 0.8377079963684082, 0.9157720804214478, 0.9938361644744873, 1.0719002485275269, 1.1499643325805664, 1.228028416633606, 1.3060925006866455, 1.384156584739685, 1.4622206687927246, 1.5402847528457642, 1.6183488368988037, 1.6964129209518433, 1.7744770050048828, 1.8525410890579224, 1.930605173110962, 2.008669376373291, 2.086733341217041, 2.164797306060791, 2.24286150932312, 2.320925712585449, 2.398989677429199, 2.477053642272949, 2.5551178455352783]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 13.0, 19.0, 18.0, 17.0, 17.0, 13.0, 27.0, 26.0, 25.0, 27.0, 36.0, 33.0, 32.0, 30.0, 39.0, 44.0, 31.0, 39.0, 36.0, 28.0, 36.0, 34.0, 49.0, 28.0, 33.0, 31.0, 25.0, 33.0, 28.0, 19.0, 15.0, 19.0, 14.0, 15.0, 6.0, 4.0, 5.0, 7.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24105072021484375, -0.2328338623046875, -0.22461700439453125, -0.216400146484375, -0.20818328857421875, -0.1999664306640625, -0.19174957275390625, -0.18353271484375, -0.17531585693359375, -0.1670989990234375, -0.15888214111328125, -0.150665283203125, -0.14244842529296875, -0.1342315673828125, -0.12601470947265625, -0.1177978515625, -0.10958099365234375, -0.1013641357421875, -0.09314727783203125, -0.084930419921875, -0.07671356201171875, -0.0684967041015625, -0.06027984619140625, -0.05206298828125, -0.04384613037109375, -0.0356292724609375, -0.02741241455078125, -0.019195556640625, -0.01097869873046875, -0.0027618408203125, 0.00545501708984375, 0.013671875, 0.02188873291015625, 0.0301055908203125, 0.03832244873046875, 0.046539306640625, 0.05475616455078125, 0.0629730224609375, 0.07118988037109375, 0.07940673828125, 0.08762359619140625, 0.0958404541015625, 0.10405731201171875, 0.112274169921875, 0.12049102783203125, 0.1287078857421875, 0.13692474365234375, 0.1451416015625, 0.15335845947265625, 0.1615753173828125, 0.16979217529296875, 0.178009033203125, 0.18622589111328125, 0.1944427490234375, 0.20265960693359375, 0.21087646484375, 0.21909332275390625, 0.2273101806640625, 0.23552703857421875, 0.243743896484375, 0.25196075439453125, 0.2601776123046875, 0.26839447021484375, 0.276611328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 10.0, 11.0, 22.0, 25.0, 33.0, 56.0, 68.0, 104.0, 155.0, 224.0, 326.0, 471.0, 726.0, 995.0, 1407.0, 2032.0, 3000.0, 4453.0, 6640.0, 10096.0, 15723.0, 23776.0, 36741.0, 56725.0, 83140.0, 116967.0, 166687.0, 162745.0, 114703.0, 81536.0, 54662.0, 35615.0, 23429.0, 15086.0, 9751.0, 6504.0, 4346.0, 2994.0, 2040.0, 1383.0, 998.0, 717.0, 451.0, 344.0, 214.0, 135.0, 96.0, 67.0, 45.0, 25.0, 18.0, 21.0, 15.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.24072265625, -0.23319244384765625, -0.2256622314453125, -0.21813201904296875, -0.210601806640625, -0.20307159423828125, -0.1955413818359375, -0.18801116943359375, -0.18048095703125, -0.17295074462890625, -0.1654205322265625, -0.15789031982421875, -0.150360107421875, -0.14282989501953125, -0.1352996826171875, -0.12776947021484375, -0.1202392578125, -0.11270904541015625, -0.1051788330078125, -0.09764862060546875, -0.090118408203125, -0.08258819580078125, -0.0750579833984375, -0.06752777099609375, -0.05999755859375, -0.05246734619140625, -0.0449371337890625, -0.03740692138671875, -0.029876708984375, -0.02234649658203125, -0.0148162841796875, -0.00728607177734375, 0.000244140625, 0.00777435302734375, 0.0153045654296875, 0.02283477783203125, 0.030364990234375, 0.03789520263671875, 0.0454254150390625, 0.05295562744140625, 0.06048583984375, 0.06801605224609375, 0.0755462646484375, 0.08307647705078125, 0.090606689453125, 0.09813690185546875, 0.1056671142578125, 0.11319732666015625, 0.1207275390625, 0.12825775146484375, 0.1357879638671875, 0.14331817626953125, 0.150848388671875, 0.15837860107421875, 0.1659088134765625, 0.17343902587890625, 0.18096923828125, 0.18849945068359375, 0.1960296630859375, 0.20355987548828125, 0.211090087890625, 0.21862030029296875, 0.2261505126953125, 0.23368072509765625, 0.2412109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 4.0, 9.0, 10.0, 13.0, 7.0, 11.0, 27.0, 21.0, 21.0, 23.0, 26.0, 39.0, 27.0, 37.0, 35.0, 34.0, 31.0, 41.0, 35.0, 32.0, 1058.0, 36.0, 48.0, 38.0, 39.0, 31.0, 35.0, 36.0, 31.0, 35.0, 19.0, 10.0, 13.0, 11.0, 16.0, 15.0, 15.0, 5.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.23848915100097656, -0.23027420043945312, -0.2220592498779297, -0.21384429931640625, -0.2056293487548828, -0.19741439819335938, -0.18919944763183594, -0.1809844970703125, -0.17276954650878906, -0.16455459594726562, -0.1563396453857422, -0.14812469482421875, -0.1399097442626953, -0.13169479370117188, -0.12347984313964844, -0.115264892578125, -0.10704994201660156, -0.09883499145507812, -0.09062004089355469, -0.08240509033203125, -0.07419013977050781, -0.06597518920898438, -0.05776023864746094, -0.0495452880859375, -0.04133033752441406, -0.033115386962890625, -0.024900436401367188, -0.01668548583984375, -0.008470535278320312, -0.000255584716796875, 0.007959365844726562, 0.01617431640625, 0.024389266967773438, 0.032604217529296875, 0.04081916809082031, 0.04903411865234375, 0.05724906921386719, 0.06546401977539062, 0.07367897033691406, 0.0818939208984375, 0.09010887145996094, 0.09832382202148438, 0.10653877258300781, 0.11475372314453125, 0.12296867370605469, 0.13118362426757812, 0.13939857482910156, 0.147613525390625, 0.15582847595214844, 0.16404342651367188, 0.1722583770751953, 0.18047332763671875, 0.1886882781982422, 0.19690322875976562, 0.20511817932128906, 0.2133331298828125, 0.22154808044433594, 0.22976303100585938, 0.2379779815673828, 0.24619293212890625, 0.2544078826904297, 0.2626228332519531, 0.27083778381347656, 0.279052734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 8.0, 8.0, 13.0, 19.0, 27.0, 21.0, 44.0, 59.0, 82.0, 117.0, 196.0, 289.0, 391.0, 590.0, 819.0, 1235.0, 1834.0, 2823.0, 4390.0, 7028.0, 11690.0, 20538.0, 42608.0, 187819.0, 1629029.0, 105776.0, 34437.0, 17385.0, 10064.0, 6217.0, 3878.0, 2501.0, 1592.0, 1163.0, 750.0, 517.0, 336.0, 239.0, 168.0, 125.0, 88.0, 63.0, 41.0, 33.0, 23.0, 21.0, 9.0, 5.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0], "bins": [-0.400146484375, -0.3885040283203125, -0.376861572265625, -0.3652191162109375, -0.35357666015625, -0.3419342041015625, -0.330291748046875, -0.3186492919921875, -0.3070068359375, -0.2953643798828125, -0.283721923828125, -0.2720794677734375, -0.26043701171875, -0.2487945556640625, -0.237152099609375, -0.2255096435546875, -0.2138671875, -0.2022247314453125, -0.190582275390625, -0.1789398193359375, -0.16729736328125, -0.1556549072265625, -0.144012451171875, -0.1323699951171875, -0.1207275390625, -0.1090850830078125, -0.097442626953125, -0.0858001708984375, -0.07415771484375, -0.0625152587890625, -0.050872802734375, -0.0392303466796875, -0.027587890625, -0.0159454345703125, -0.004302978515625, 0.0073394775390625, 0.01898193359375, 0.0306243896484375, 0.042266845703125, 0.0539093017578125, 0.0655517578125, 0.0771942138671875, 0.088836669921875, 0.1004791259765625, 0.11212158203125, 0.1237640380859375, 0.135406494140625, 0.1470489501953125, 0.15869140625, 0.1703338623046875, 0.181976318359375, 0.1936187744140625, 0.20526123046875, 0.2169036865234375, 0.228546142578125, 0.2401885986328125, 0.2518310546875, 0.2634735107421875, 0.275115966796875, 0.2867584228515625, 0.29840087890625, 0.3100433349609375, 0.321685791015625, 0.3333282470703125, 0.344970703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 9.0, 3.0, 2.0, 6.0, 6.0, 15.0, 12.0, 17.0, 17.0, 19.0, 36.0, 39.0, 32.0, 43.0, 47.0, 59.0, 81.0, 99.0, 86.0, 50.0, 52.0, 58.0, 29.0, 29.0, 31.0, 20.0, 14.0, 18.0, 9.0, 12.0, 11.0, 9.0, 8.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0540771484375, -0.05225706100463867, -0.050436973571777344, -0.048616886138916016, -0.04679679870605469, -0.04497671127319336, -0.04315662384033203, -0.0413365364074707, -0.039516448974609375, -0.03769636154174805, -0.03587627410888672, -0.03405618667602539, -0.03223609924316406, -0.030416011810302734, -0.028595924377441406, -0.026775836944580078, -0.02495574951171875, -0.023135662078857422, -0.021315574645996094, -0.019495487213134766, -0.017675399780273438, -0.01585531234741211, -0.014035224914550781, -0.012215137481689453, -0.010395050048828125, -0.008574962615966797, -0.006754875183105469, -0.004934787750244141, -0.0031147003173828125, -0.0012946128845214844, 0.0005254745483398438, 0.002345561981201172, 0.0041656494140625, 0.005985736846923828, 0.007805824279785156, 0.009625911712646484, 0.011445999145507812, 0.01326608657836914, 0.015086174011230469, 0.016906261444091797, 0.018726348876953125, 0.020546436309814453, 0.02236652374267578, 0.02418661117553711, 0.026006698608398438, 0.027826786041259766, 0.029646873474121094, 0.03146696090698242, 0.03328704833984375, 0.03510713577270508, 0.036927223205566406, 0.038747310638427734, 0.04056739807128906, 0.04238748550415039, 0.04420757293701172, 0.04602766036987305, 0.047847747802734375, 0.0496678352355957, 0.05148792266845703, 0.05330801010131836, 0.05512809753417969, 0.056948184967041016, 0.058768272399902344, 0.06058835983276367, 0.062408447265625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 6.0, 4.0, 7.0, 5.0, 8.0, 6.0, 11.0, 13.0, 21.0, 20.0, 23.0, 26.0, 48.0, 61.0, 88.0, 120.0, 132.0, 199.0, 367.0, 943.0, 4686.0, 47579.0, 853802.0, 128760.0, 8967.0, 1399.0, 411.0, 201.0, 161.0, 114.0, 67.0, 71.0, 47.0, 42.0, 24.0, 27.0, 12.0, 21.0, 9.0, 9.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.78759765625, -0.7627182006835938, -0.7378387451171875, -0.7129592895507812, -0.688079833984375, -0.6632003784179688, -0.6383209228515625, -0.6134414672851562, -0.58856201171875, -0.5636825561523438, -0.5388031005859375, -0.5139236450195312, -0.489044189453125, -0.46416473388671875, -0.4392852783203125, -0.41440582275390625, -0.3895263671875, -0.36464691162109375, -0.3397674560546875, -0.31488800048828125, -0.290008544921875, -0.26512908935546875, -0.2402496337890625, -0.21537017822265625, -0.19049072265625, -0.16561126708984375, -0.1407318115234375, -0.11585235595703125, -0.090972900390625, -0.06609344482421875, -0.0412139892578125, -0.01633453369140625, 0.008544921875, 0.03342437744140625, 0.0583038330078125, 0.08318328857421875, 0.108062744140625, 0.13294219970703125, 0.1578216552734375, 0.18270111083984375, 0.20758056640625, 0.23246002197265625, 0.2573394775390625, 0.28221893310546875, 0.307098388671875, 0.33197784423828125, 0.3568572998046875, 0.38173675537109375, 0.4066162109375, 0.43149566650390625, 0.4563751220703125, 0.48125457763671875, 0.506134033203125, 0.5310134887695312, 0.5558929443359375, 0.5807723999023438, 0.60565185546875, 0.6305313110351562, 0.6554107666015625, 0.6802902221679688, 0.705169677734375, 0.7300491333007812, 0.7549285888671875, 0.7798080444335938, 0.8046875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 31.0, 141.0, 430.0, 285.0, 76.0, 34.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7189536094665527, -0.6761913895606995, -0.6334291696548462, -0.5906668901443481, -0.5479046702384949, -0.5051424503326416, -0.46238023042678833, -0.41961798071861267, -0.3768557608127594, -0.33409354090690613, -0.29133129119873047, -0.2485690712928772, -0.20580683648586273, -0.16304460167884827, -0.120282381772995, -0.07752013206481934, -0.034757912158966064, 0.008004318922758102, 0.05076655000448227, 0.09352877736091614, 0.1362910121679306, 0.17905324697494507, 0.22181546688079834, 0.264577716588974, 0.30733993649482727, 0.35010215640068054, 0.3928644061088562, 0.4356266260147095, 0.47838884592056274, 0.521151065826416, 0.5639133453369141, 0.6066755652427673, 0.6494377851486206, 0.6922000050544739, 0.7349622249603271, 0.7777245044708252, 0.8204867243766785, 0.8632489442825317, 0.906011164188385, 0.9487733840942383, 0.9915356636047363, 1.0342979431152344, 1.0770601034164429, 1.119822382926941, 1.1625845432281494, 1.2053468227386475, 1.2481091022491455, 1.290871262550354, 1.3336334228515625, 1.3763957023620605, 1.419157862663269, 1.461920142173767, 1.5046823024749756, 1.5474445819854736, 1.5902068614959717, 1.6329690217971802, 1.6757313013076782, 1.7184935808181763, 1.7612557411193848, 1.8040180206298828, 1.8467801809310913, 1.8895424604415894, 1.9323046207427979, 1.975066900253296, 2.017829179763794]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 6.0, 8.0, 10.0, 8.0, 10.0, 16.0, 20.0, 18.0, 23.0, 26.0, 15.0, 27.0, 19.0, 30.0, 30.0, 33.0, 34.0, 46.0, 36.0, 44.0, 49.0, 31.0, 38.0, 31.0, 43.0, 34.0, 36.0, 28.0, 41.0, 27.0, 28.0, 27.0, 17.0, 21.0, 14.0, 17.0, 11.0, 8.0, 8.0, 4.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.20906317234039307, -0.20200622081756592, -0.19494926929473877, -0.18789231777191162, -0.18083536624908447, -0.17377841472625732, -0.16672144830226898, -0.15966449677944183, -0.15260754525661469, -0.14555059373378754, -0.1384936422109604, -0.13143669068813324, -0.1243797317147255, -0.11732278019189835, -0.1102658212184906, -0.10320886969566345, -0.0961519181728363, -0.08909496665000916, -0.082038015127182, -0.07498105615377426, -0.06792410463094711, -0.060867153108119965, -0.05381019786000252, -0.04675324261188507, -0.03969629108905792, -0.032639339566230774, -0.025582384318113327, -0.01852543093264103, -0.011468477547168732, -0.004411526024341583, 0.0026454292237758636, 0.00970238447189331, 0.01675933599472046, 0.023816289380192757, 0.030873242765665054, 0.0379301980137825, 0.04498714953660965, 0.0520441010594368, 0.059101056307554245, 0.06615801155567169, 0.07321496307849884, 0.08027191460132599, 0.08732886612415314, 0.09438582509756088, 0.10144277662038803, 0.10849972814321518, 0.11555668711662292, 0.12261363863945007, 0.12967059016227722, 0.13672754168510437, 0.14378449320793152, 0.15084144473075867, 0.15789839625358582, 0.16495534777641296, 0.1720123142004013, 0.17906926572322845, 0.1861262172460556, 0.19318316876888275, 0.2002401202917099, 0.20729707181453705, 0.2143540382385254, 0.22141098976135254, 0.2284679412841797, 0.23552489280700684, 0.24258184432983398]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 6.0, 11.0, 18.0, 15.0, 16.0, 22.0, 12.0, 17.0, 28.0, 26.0, 25.0, 28.0, 36.0, 35.0, 36.0, 27.0, 33.0, 42.0, 36.0, 31.0, 40.0, 35.0, 36.0, 30.0, 37.0, 36.0, 32.0, 31.0, 23.0, 38.0, 19.0, 18.0, 18.0, 14.0, 19.0, 11.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.2370929718017578, -0.22894668579101562, -0.22080039978027344, -0.21265411376953125, -0.20450782775878906, -0.19636154174804688, -0.1882152557373047, -0.1800689697265625, -0.1719226837158203, -0.16377639770507812, -0.15563011169433594, -0.14748382568359375, -0.13933753967285156, -0.13119125366210938, -0.12304496765136719, -0.114898681640625, -0.10675239562988281, -0.09860610961914062, -0.09045982360839844, -0.08231353759765625, -0.07416725158691406, -0.06602096557617188, -0.05787467956542969, -0.0497283935546875, -0.04158210754394531, -0.033435821533203125, -0.025289535522460938, -0.01714324951171875, -0.008996963500976562, -0.000850677490234375, 0.0072956085205078125, 0.01544189453125, 0.023588180541992188, 0.031734466552734375, 0.03988075256347656, 0.04802703857421875, 0.05617332458496094, 0.06431961059570312, 0.07246589660644531, 0.0806121826171875, 0.08875846862792969, 0.09690475463867188, 0.10505104064941406, 0.11319732666015625, 0.12134361267089844, 0.12948989868164062, 0.1376361846923828, 0.145782470703125, 0.1539287567138672, 0.16207504272460938, 0.17022132873535156, 0.17836761474609375, 0.18651390075683594, 0.19466018676757812, 0.2028064727783203, 0.2109527587890625, 0.2190990447998047, 0.22724533081054688, 0.23539161682128906, 0.24353790283203125, 0.25168418884277344, 0.2598304748535156, 0.2679767608642578, 0.276123046875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 11.0, 16.0, 19.0, 32.0, 29.0, 47.0, 58.0, 74.0, 105.0, 145.0, 222.0, 336.0, 415.0, 668.0, 940.0, 1387.0, 2143.0, 3445.0, 5903.0, 10973.0, 24118.0, 69348.0, 276747.0, 457612.0, 122197.0, 36659.0, 15036.0, 7548.0, 4340.0, 2588.0, 1663.0, 1153.0, 775.0, 527.0, 347.0, 250.0, 180.0, 142.0, 105.0, 63.0, 54.0, 40.0, 25.0, 30.0, 16.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.76904296875, -0.7465667724609375, -0.724090576171875, -0.7016143798828125, -0.67913818359375, -0.6566619873046875, -0.634185791015625, -0.6117095947265625, -0.5892333984375, -0.5667572021484375, -0.544281005859375, -0.5218048095703125, -0.49932861328125, -0.4768524169921875, -0.454376220703125, -0.4319000244140625, -0.409423828125, -0.3869476318359375, -0.364471435546875, -0.3419952392578125, -0.31951904296875, -0.2970428466796875, -0.274566650390625, -0.2520904541015625, -0.2296142578125, -0.2071380615234375, -0.184661865234375, -0.1621856689453125, -0.13970947265625, -0.1172332763671875, -0.094757080078125, -0.0722808837890625, -0.0498046875, -0.0273284912109375, -0.004852294921875, 0.0176239013671875, 0.04010009765625, 0.0625762939453125, 0.085052490234375, 0.1075286865234375, 0.1300048828125, 0.1524810791015625, 0.174957275390625, 0.1974334716796875, 0.21990966796875, 0.2423858642578125, 0.264862060546875, 0.2873382568359375, 0.309814453125, 0.3322906494140625, 0.354766845703125, 0.3772430419921875, 0.39971923828125, 0.4221954345703125, 0.444671630859375, 0.4671478271484375, 0.4896240234375, 0.5121002197265625, 0.534576416015625, 0.5570526123046875, 0.57952880859375, 0.6020050048828125, 0.624481201171875, 0.6469573974609375, 0.66943359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 10.0, 8.0, 8.0, 14.0, 23.0, 24.0, 30.0, 33.0, 25.0, 34.0, 66.0, 68.0, 79.0, 107.0, 206.0, 1328.0, 291.0, 148.0, 105.0, 80.0, 55.0, 46.0, 34.0, 38.0, 33.0, 31.0, 19.0, 24.0, 16.0, 10.0, 11.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.4677734375, -1.4278717041015625, -1.387969970703125, -1.3480682373046875, -1.30816650390625, -1.2682647705078125, -1.228363037109375, -1.1884613037109375, -1.1485595703125, -1.1086578369140625, -1.068756103515625, -1.0288543701171875, -0.98895263671875, -0.9490509033203125, -0.909149169921875, -0.8692474365234375, -0.829345703125, -0.7894439697265625, -0.749542236328125, -0.7096405029296875, -0.66973876953125, -0.6298370361328125, -0.589935302734375, -0.5500335693359375, -0.5101318359375, -0.4702301025390625, -0.430328369140625, -0.3904266357421875, -0.35052490234375, -0.3106231689453125, -0.270721435546875, -0.2308197021484375, -0.19091796875, -0.1510162353515625, -0.111114501953125, -0.0712127685546875, -0.03131103515625, 0.0085906982421875, 0.048492431640625, 0.0883941650390625, 0.1282958984375, 0.1681976318359375, 0.208099365234375, 0.2480010986328125, 0.28790283203125, 0.3278045654296875, 0.367706298828125, 0.4076080322265625, 0.447509765625, 0.4874114990234375, 0.527313232421875, 0.5672149658203125, 0.60711669921875, 0.6470184326171875, 0.686920166015625, 0.7268218994140625, 0.7667236328125, 0.8066253662109375, 0.846527099609375, 0.8864288330078125, 0.92633056640625, 0.9662322998046875, 1.006134033203125, 1.0460357666015625, 1.0859375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 2.0, 15.0, 15.0, 36.0, 64.0, 116.0, 195.0, 343.0, 706.0, 1669.0, 4400.0, 14894.0, 114948.0, 2879539.0, 106852.0, 14550.0, 4280.0, 1674.0, 687.0, 318.0, 152.0, 69.0, 52.0, 33.0, 20.0, 24.0, 8.0, 14.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.60546875, -4.485809326171875, -4.36614990234375, -4.246490478515625, -4.1268310546875, -4.007171630859375, -3.88751220703125, -3.767852783203125, -3.648193359375, -3.528533935546875, -3.40887451171875, -3.289215087890625, -3.1695556640625, -3.049896240234375, -2.93023681640625, -2.810577392578125, -2.69091796875, -2.571258544921875, -2.45159912109375, -2.331939697265625, -2.2122802734375, -2.092620849609375, -1.97296142578125, -1.853302001953125, -1.733642578125, -1.613983154296875, -1.49432373046875, -1.374664306640625, -1.2550048828125, -1.135345458984375, -1.01568603515625, -0.896026611328125, -0.7763671875, -0.656707763671875, -0.53704833984375, -0.417388916015625, -0.2977294921875, -0.178070068359375, -0.05841064453125, 0.061248779296875, 0.180908203125, 0.300567626953125, 0.42022705078125, 0.539886474609375, 0.6595458984375, 0.779205322265625, 0.89886474609375, 1.018524169921875, 1.13818359375, 1.257843017578125, 1.37750244140625, 1.497161865234375, 1.6168212890625, 1.736480712890625, 1.85614013671875, 1.975799560546875, 2.095458984375, 2.215118408203125, 2.33477783203125, 2.454437255859375, 2.5740966796875, 2.693756103515625, 2.81341552734375, 2.933074951171875, 3.052734375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 25.0, 122.0, 491.0, 306.0, 55.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.91695785522461, -19.343774795532227, -18.77058982849121, -18.197406768798828, -17.624221801757812, -17.05103874206543, -16.477853775024414, -15.904670715332031, -15.331486701965332, -14.758302688598633, -14.185118675231934, -13.611934661865234, -13.038751602172852, -12.465566635131836, -11.892383575439453, -11.319199562072754, -10.746015548706055, -10.172831535339355, -9.599647521972656, -9.026463508605957, -8.453279495239258, -7.880095958709717, -7.306912422180176, -6.733728408813477, -6.160544395446777, -5.587360382080078, -5.014176368713379, -4.440992832183838, -3.8678088188171387, -3.2946248054504395, -2.7214410305023193, -2.148257255554199, -1.5750713348388672, -1.0018874406814575, -0.42870354652404785, 0.14448034763336182, 0.7176642417907715, 1.2908482551574707, 1.8640320301055908, 2.437215805053711, 3.01039981842041, 3.5835838317871094, 4.156767845153809, 4.72995138168335, 5.303135395050049, 5.876319408416748, 6.449502944946289, 7.022686958312988, 7.5958709716796875, 8.169054985046387, 8.742238998413086, 9.315423011779785, 9.888607025146484, 10.461790084838867, 11.034974098205566, 11.608158111572266, 12.181342124938965, 12.754526138305664, 13.327710151672363, 13.900894165039062, 14.474077224731445, 15.047262191772461, 15.620445251464844, 16.19363021850586, 16.766813278198242]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 15.0, 13.0, 22.0, 25.0, 17.0, 27.0, 29.0, 38.0, 42.0, 27.0, 43.0, 40.0, 43.0, 36.0, 48.0, 54.0, 39.0, 43.0, 39.0, 36.0, 37.0, 31.0, 32.0, 33.0, 9.0, 28.0, 19.0, 17.0, 13.0, 12.0, 12.0, 13.0, 7.0, 3.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6301040649414062, -3.50264835357666, -3.375192642211914, -3.247736930847168, -3.120281457901001, -2.992825746536255, -2.865370035171509, -2.7379143238067627, -2.6104588508605957, -2.4830031394958496, -2.3555474281311035, -2.2280917167663574, -2.1006362438201904, -1.9731805324554443, -1.8457248210906982, -1.7182691097259521, -1.590813398361206, -1.46335768699646, -1.3359020948410034, -1.2084463834762573, -1.0809907913208008, -0.9535350799560547, -0.8260793685913086, -0.6986237168312073, -0.571168065071106, -0.44371241331100464, -0.31625673174858093, -0.18880105018615723, -0.06134539842605591, 0.06611025333404541, 0.1935659646987915, 0.3210216164588928, 0.44847726821899414, 0.5759329199790955, 0.7033885717391968, 0.8308442831039429, 0.9582999348640442, 1.0857555866241455, 1.2132112979888916, 1.3406670093536377, 1.4681226015090942, 1.5955783128738403, 1.7230339050292969, 1.850489616394043, 1.977945327758789, 2.105401039123535, 2.2328567504882812, 2.3603122234344482, 2.4877679347991943, 2.6152236461639404, 2.7426793575286865, 2.8701348304748535, 2.9975905418395996, 3.1250462532043457, 3.252501964569092, 3.379957675933838, 3.507413387298584, 3.63486909866333, 3.762324810028076, 3.8897805213928223, 4.017236232757568, 4.144691467285156, 4.272147178649902, 4.399602890014648, 4.5270586013793945]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 1.0, 8.0, 4.0, 12.0, 7.0, 14.0, 14.0, 17.0, 15.0, 17.0, 17.0, 30.0, 32.0, 27.0, 25.0, 30.0, 41.0, 29.0, 38.0, 33.0, 32.0, 38.0, 46.0, 35.0, 37.0, 40.0, 26.0, 42.0, 27.0, 36.0, 25.0, 35.0, 27.0, 22.0, 10.0, 22.0, 15.0, 14.0, 18.0, 8.0, 12.0, 6.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.28527069091796875, -0.2758636474609375, -0.26645660400390625, -0.257049560546875, -0.24764251708984375, -0.2382354736328125, -0.22882843017578125, -0.21942138671875, -0.21001434326171875, -0.2006072998046875, -0.19120025634765625, -0.181793212890625, -0.17238616943359375, -0.1629791259765625, -0.15357208251953125, -0.1441650390625, -0.13475799560546875, -0.1253509521484375, -0.11594390869140625, -0.106536865234375, -0.09712982177734375, -0.0877227783203125, -0.07831573486328125, -0.06890869140625, -0.05950164794921875, -0.0500946044921875, -0.04068756103515625, -0.031280517578125, -0.02187347412109375, -0.0124664306640625, -0.00305938720703125, 0.00634765625, 0.01575469970703125, 0.0251617431640625, 0.03456878662109375, 0.043975830078125, 0.05338287353515625, 0.0627899169921875, 0.07219696044921875, 0.08160400390625, 0.09101104736328125, 0.1004180908203125, 0.10982513427734375, 0.119232177734375, 0.12863922119140625, 0.1380462646484375, 0.14745330810546875, 0.1568603515625, 0.16626739501953125, 0.1756744384765625, 0.18508148193359375, 0.194488525390625, 0.20389556884765625, 0.2133026123046875, 0.22270965576171875, 0.23211669921875, 0.24152374267578125, 0.2509307861328125, 0.26033782958984375, 0.269744873046875, 0.27915191650390625, 0.2885589599609375, 0.29796600341796875, 0.307373046875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 12.0, 11.0, 12.0, 12.0, 23.0, 28.0, 47.0, 59.0, 83.0, 132.0, 227.0, 435.0, 622.0, 1204.0, 2381.0, 4919.0, 10654.0, 25722.0, 86264.0, 775455.0, 2907940.0, 291468.0, 52813.0, 18143.0, 7887.0, 3717.0, 1777.0, 864.0, 522.0, 304.0, 168.0, 109.0, 65.0, 50.0, 35.0, 23.0, 22.0, 15.0, 14.0, 15.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.927734375, -0.896087646484375, -0.86444091796875, -0.832794189453125, -0.8011474609375, -0.769500732421875, -0.73785400390625, -0.706207275390625, -0.674560546875, -0.642913818359375, -0.61126708984375, -0.579620361328125, -0.5479736328125, -0.516326904296875, -0.48468017578125, -0.453033447265625, -0.42138671875, -0.389739990234375, -0.35809326171875, -0.326446533203125, -0.2947998046875, -0.263153076171875, -0.23150634765625, -0.199859619140625, -0.168212890625, -0.136566162109375, -0.10491943359375, -0.073272705078125, -0.0416259765625, -0.009979248046875, 0.02166748046875, 0.053314208984375, 0.0849609375, 0.116607666015625, 0.14825439453125, 0.179901123046875, 0.2115478515625, 0.243194580078125, 0.27484130859375, 0.306488037109375, 0.338134765625, 0.369781494140625, 0.40142822265625, 0.433074951171875, 0.4647216796875, 0.496368408203125, 0.52801513671875, 0.559661865234375, 0.59130859375, 0.622955322265625, 0.65460205078125, 0.686248779296875, 0.7178955078125, 0.749542236328125, 0.78118896484375, 0.812835693359375, 0.844482421875, 0.876129150390625, 0.90777587890625, 0.939422607421875, 0.9710693359375, 1.002716064453125, 1.03436279296875, 1.066009521484375, 1.09765625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 5.0, 7.0, 11.0, 16.0, 17.0, 17.0, 28.0, 50.0, 58.0, 81.0, 118.0, 173.0, 324.0, 674.0, 868.0, 654.0, 352.0, 234.0, 124.0, 71.0, 56.0, 36.0, 26.0, 22.0, 15.0, 11.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.857421875, -0.8210296630859375, -0.784637451171875, -0.7482452392578125, -0.71185302734375, -0.6754608154296875, -0.639068603515625, -0.6026763916015625, -0.5662841796875, -0.5298919677734375, -0.493499755859375, -0.4571075439453125, -0.42071533203125, -0.3843231201171875, -0.347930908203125, -0.3115386962890625, -0.275146484375, -0.2387542724609375, -0.202362060546875, -0.1659698486328125, -0.12957763671875, -0.0931854248046875, -0.056793212890625, -0.0204010009765625, 0.0159912109375, 0.0523834228515625, 0.088775634765625, 0.1251678466796875, 0.16156005859375, 0.1979522705078125, 0.234344482421875, 0.2707366943359375, 0.30712890625, 0.3435211181640625, 0.379913330078125, 0.4163055419921875, 0.45269775390625, 0.4890899658203125, 0.525482177734375, 0.5618743896484375, 0.5982666015625, 0.6346588134765625, 0.671051025390625, 0.7074432373046875, 0.74383544921875, 0.7802276611328125, 0.816619873046875, 0.8530120849609375, 0.889404296875, 0.9257965087890625, 0.962188720703125, 0.9985809326171875, 1.03497314453125, 1.0713653564453125, 1.107757568359375, 1.1441497802734375, 1.1805419921875, 1.2169342041015625, 1.253326416015625, 1.2897186279296875, 1.32611083984375, 1.3625030517578125, 1.398895263671875, 1.4352874755859375, 1.4716796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 10.0, 12.0, 12.0, 20.0, 46.0, 55.0, 109.0, 198.0, 437.0, 1004.0, 2684.0, 7439.0, 24694.0, 127025.0, 2683545.0, 1236757.0, 81896.0, 18481.0, 5762.0, 2247.0, 988.0, 439.0, 196.0, 90.0, 47.0, 43.0, 23.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.87652587890625, -1.7979736328125, -1.71942138671875, -1.640869140625, -1.56231689453125, -1.4837646484375, -1.40521240234375, -1.32666015625, -1.24810791015625, -1.1695556640625, -1.09100341796875, -1.012451171875, -0.93389892578125, -0.8553466796875, -0.77679443359375, -0.6982421875, -0.61968994140625, -0.5411376953125, -0.46258544921875, -0.384033203125, -0.30548095703125, -0.2269287109375, -0.14837646484375, -0.06982421875, 0.00872802734375, 0.0872802734375, 0.16583251953125, 0.244384765625, 0.32293701171875, 0.4014892578125, 0.48004150390625, 0.55859375, 0.63714599609375, 0.7156982421875, 0.79425048828125, 0.872802734375, 0.95135498046875, 1.0299072265625, 1.10845947265625, 1.18701171875, 1.26556396484375, 1.3441162109375, 1.42266845703125, 1.501220703125, 1.57977294921875, 1.6583251953125, 1.73687744140625, 1.8154296875, 1.89398193359375, 1.9725341796875, 2.05108642578125, 2.129638671875, 2.20819091796875, 2.2867431640625, 2.36529541015625, 2.44384765625, 2.52239990234375, 2.6009521484375, 2.67950439453125, 2.758056640625, 2.83660888671875, 2.9151611328125, 2.99371337890625, 3.072265625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 8.0, 11.0, 8.0, 18.0, 17.0, 32.0, 49.0, 59.0, 78.0, 104.0, 101.0, 98.0, 103.0, 77.0, 67.0, 52.0, 36.0, 22.0, 16.0, 9.0, 11.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0999505519866943, -2.9526960849761963, -2.8054416179656982, -2.6581873893737793, -2.5109329223632812, -2.363678455352783, -2.216423988342285, -2.069169521331787, -1.9219151735305786, -1.7746607065200806, -1.627406358718872, -1.480151891708374, -1.332897424697876, -1.1856430768966675, -1.0383886098861694, -0.8911342620849609, -0.7438797950744629, -0.5966253876686096, -0.44937095046043396, -0.3021165132522583, -0.15486210584640503, -0.007607698440551758, 0.1396467685699463, 0.2869011163711548, 0.43415558338165283, 0.5814099907875061, 0.7286643981933594, 0.8759188652038574, 1.0231733322143555, 1.170427680015564, 1.317682147026062, 1.4649364948272705, 1.6121907234191895, 1.7594451904296875, 1.906699538230896, 2.0539541244506836, 2.2012083530426025, 2.3484628200531006, 2.4957172870635986, 2.6429715156555176, 2.7902259826660156, 2.9374804496765137, 3.0847349166870117, 3.2319893836975098, 3.3792436122894287, 3.5264980792999268, 3.673752546310425, 3.8210067749023438, 3.968261480331421, 4.11551570892334, 4.262770175933838, 4.410024642944336, 4.557279109954834, 4.704533576965332, 4.85178804397583, 4.999042510986328, 5.146296977996826, 5.293551445007324, 5.440805912017822, 5.58806037902832, 5.735314846038818, 5.882569313049316, 6.029823303222656, 6.177077770233154, 6.324332237243652]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 14.0, 13.0, 9.0, 14.0, 11.0, 15.0, 25.0, 22.0, 28.0, 30.0, 31.0, 35.0, 33.0, 32.0, 37.0, 34.0, 41.0, 37.0, 38.0, 36.0, 48.0, 45.0, 45.0, 34.0, 34.0, 25.0, 33.0, 23.0, 25.0, 27.0, 15.0, 17.0, 17.0, 16.0, 14.0, 10.0, 7.0, 8.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-3.317847967147827, -3.227163076400757, -3.1364781856536865, -3.0457935333251953, -2.955108642578125, -2.8644237518310547, -2.7737388610839844, -2.683053970336914, -2.592369318008423, -2.5016844272613525, -2.4109995365142822, -2.320314884185791, -2.2296299934387207, -2.1389451026916504, -2.04826021194458, -1.9575754404067993, -1.866890549659729, -1.7762056589126587, -1.685520887374878, -1.5948359966278076, -1.5041512250900269, -1.4134663343429565, -1.3227815628051758, -1.2320966720581055, -1.1414117813110352, -1.0507268905639648, -0.9600421190261841, -0.8693572282791138, -0.778672456741333, -0.6879875659942627, -0.5973027348518372, -0.5066179037094116, -0.41593313217163086, -0.3252483010292053, -0.2345634549856186, -0.14387860894203186, -0.05319377779960632, 0.037491053342819214, 0.12817591428756714, 0.21886074542999268, 0.3095455765724182, 0.40023040771484375, 0.4909152388572693, 0.5816000699996948, 0.6722849607467651, 0.7629697322845459, 0.8536546230316162, 0.9443394541740417, 1.0350242853164673, 1.1257091760635376, 1.2163939476013184, 1.3070788383483887, 1.3977636098861694, 1.4884485006332397, 1.5791332721710205, 1.6698181629180908, 1.7605030536651611, 1.8511879444122314, 1.9418727159500122, 2.032557487487793, 2.1232423782348633, 2.2139272689819336, 2.304612159729004, 2.395297050476074, 2.4859817028045654]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 14.0, 7.0, 5.0, 8.0, 15.0, 13.0, 15.0, 22.0, 13.0, 13.0, 24.0, 24.0, 29.0, 30.0, 35.0, 18.0, 31.0, 43.0, 35.0, 26.0, 23.0, 30.0, 29.0, 31.0, 48.0, 31.0, 34.0, 25.0, 35.0, 18.0, 30.0, 25.0, 27.0, 23.0, 23.0, 23.0, 15.0, 17.0, 14.0, 16.0, 9.0, 10.0, 5.0, 8.0, 6.0, 8.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.268798828125, -0.2601776123046875, -0.251556396484375, -0.2429351806640625, -0.23431396484375, -0.2256927490234375, -0.217071533203125, -0.2084503173828125, -0.1998291015625, -0.1912078857421875, -0.182586669921875, -0.1739654541015625, -0.16534423828125, -0.1567230224609375, -0.148101806640625, -0.1394805908203125, -0.130859375, -0.1222381591796875, -0.113616943359375, -0.1049957275390625, -0.09637451171875, -0.0877532958984375, -0.079132080078125, -0.0705108642578125, -0.0618896484375, -0.0532684326171875, -0.044647216796875, -0.0360260009765625, -0.02740478515625, -0.0187835693359375, -0.010162353515625, -0.0015411376953125, 0.007080078125, 0.0157012939453125, 0.024322509765625, 0.0329437255859375, 0.04156494140625, 0.0501861572265625, 0.058807373046875, 0.0674285888671875, 0.0760498046875, 0.0846710205078125, 0.093292236328125, 0.1019134521484375, 0.11053466796875, 0.1191558837890625, 0.127777099609375, 0.1363983154296875, 0.14501953125, 0.1536407470703125, 0.162261962890625, 0.1708831787109375, 0.17950439453125, 0.1881256103515625, 0.196746826171875, 0.2053680419921875, 0.2139892578125, 0.2226104736328125, 0.231231689453125, 0.2398529052734375, 0.24847412109375, 0.2570953369140625, 0.265716552734375, 0.2743377685546875, 0.282958984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 5.0, 10.0, 15.0, 27.0, 51.0, 78.0, 130.0, 203.0, 272.0, 429.0, 730.0, 1142.0, 1857.0, 2960.0, 5111.0, 8848.0, 16006.0, 28964.0, 53971.0, 100881.0, 169980.0, 217614.0, 185379.0, 114507.0, 62793.0, 33542.0, 18223.0, 10120.0, 5788.0, 3472.0, 2028.0, 1226.0, 792.0, 518.0, 310.0, 214.0, 125.0, 86.0, 61.0, 31.0, 23.0, 13.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3762550354003906, -0.36310577392578125, -0.3499565124511719, -0.3368072509765625, -0.3236579895019531, -0.31050872802734375, -0.2973594665527344, -0.284210205078125, -0.2710609436035156, -0.25791168212890625, -0.24476242065429688, -0.2316131591796875, -0.21846389770507812, -0.20531463623046875, -0.19216537475585938, -0.17901611328125, -0.16586685180664062, -0.15271759033203125, -0.13956832885742188, -0.1264190673828125, -0.11326980590820312, -0.10012054443359375, -0.08697128295898438, -0.073822021484375, -0.060672760009765625, -0.04752349853515625, -0.034374237060546875, -0.0212249755859375, -0.008075714111328125, 0.00507354736328125, 0.018222808837890625, 0.0313720703125, 0.044521331787109375, 0.05767059326171875, 0.07081985473632812, 0.0839691162109375, 0.09711837768554688, 0.11026763916015625, 0.12341690063476562, 0.136566162109375, 0.14971542358398438, 0.16286468505859375, 0.17601394653320312, 0.1891632080078125, 0.20231246948242188, 0.21546173095703125, 0.22861099243164062, 0.24176025390625, 0.2549095153808594, 0.26805877685546875, 0.2812080383300781, 0.2943572998046875, 0.3075065612792969, 0.32065582275390625, 0.3338050842285156, 0.346954345703125, 0.3601036071777344, 0.37325286865234375, 0.3864021301269531, 0.3995513916015625, 0.4127006530761719, 0.42584991455078125, 0.4389991760253906, 0.4521484375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 8.0, 9.0, 9.0, 13.0, 17.0, 23.0, 22.0, 19.0, 17.0, 27.0, 28.0, 35.0, 32.0, 31.0, 22.0, 39.0, 52.0, 36.0, 1066.0, 35.0, 45.0, 41.0, 35.0, 44.0, 32.0, 42.0, 20.0, 20.0, 25.0, 21.0, 31.0, 16.0, 13.0, 17.0, 8.0, 5.0, 13.0, 7.0, 8.0, 11.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3250007629394531, -0.31479644775390625, -0.3045921325683594, -0.2943878173828125, -0.2841835021972656, -0.27397918701171875, -0.2637748718261719, -0.253570556640625, -0.24336624145507812, -0.23316192626953125, -0.22295761108398438, -0.2127532958984375, -0.20254898071289062, -0.19234466552734375, -0.18214035034179688, -0.17193603515625, -0.16173171997070312, -0.15152740478515625, -0.14132308959960938, -0.1311187744140625, -0.12091445922851562, -0.11071014404296875, -0.10050582885742188, -0.090301513671875, -0.08009719848632812, -0.06989288330078125, -0.059688568115234375, -0.0494842529296875, -0.039279937744140625, -0.02907562255859375, -0.018871307373046875, -0.0086669921875, 0.001537322998046875, 0.01174163818359375, 0.021945953369140625, 0.0321502685546875, 0.042354583740234375, 0.05255889892578125, 0.06276321411132812, 0.072967529296875, 0.08317184448242188, 0.09337615966796875, 0.10358047485351562, 0.1137847900390625, 0.12398910522460938, 0.13419342041015625, 0.14439773559570312, 0.15460205078125, 0.16480636596679688, 0.17501068115234375, 0.18521499633789062, 0.1954193115234375, 0.20562362670898438, 0.21582794189453125, 0.22603225708007812, 0.236236572265625, 0.24644088745117188, 0.25664520263671875, 0.2668495178222656, 0.2770538330078125, 0.2872581481933594, 0.29746246337890625, 0.3076667785644531, 0.31787109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 2.0, 14.0, 19.0, 28.0, 30.0, 43.0, 64.0, 78.0, 151.0, 194.0, 265.0, 433.0, 651.0, 1024.0, 1532.0, 2426.0, 3742.0, 6310.0, 10452.0, 19059.0, 39400.0, 164099.0, 1662602.0, 108912.0, 33691.0, 16633.0, 9534.0, 5723.0, 3548.0, 2246.0, 1394.0, 1005.0, 586.0, 388.0, 274.0, 190.0, 117.0, 84.0, 54.0, 36.0, 29.0, 21.0, 8.0, 9.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.495361328125, -0.4800758361816406, -0.46479034423828125, -0.4495048522949219, -0.4342193603515625, -0.4189338684082031, -0.40364837646484375, -0.3883628845214844, -0.373077392578125, -0.3577919006347656, -0.34250640869140625, -0.3272209167480469, -0.3119354248046875, -0.2966499328613281, -0.28136444091796875, -0.2660789489746094, -0.25079345703125, -0.23550796508789062, -0.22022247314453125, -0.20493698120117188, -0.1896514892578125, -0.17436599731445312, -0.15908050537109375, -0.14379501342773438, -0.128509521484375, -0.11322402954101562, -0.09793853759765625, -0.08265304565429688, -0.0673675537109375, -0.052082061767578125, -0.03679656982421875, -0.021511077880859375, -0.0062255859375, 0.009059906005859375, 0.02434539794921875, 0.039630889892578125, 0.0549163818359375, 0.07020187377929688, 0.08548736572265625, 0.10077285766601562, 0.116058349609375, 0.13134384155273438, 0.14662933349609375, 0.16191482543945312, 0.1772003173828125, 0.19248580932617188, 0.20777130126953125, 0.22305679321289062, 0.23834228515625, 0.2536277770996094, 0.26891326904296875, 0.2841987609863281, 0.2994842529296875, 0.3147697448730469, 0.33005523681640625, 0.3453407287597656, 0.360626220703125, 0.3759117126464844, 0.39119720458984375, 0.4064826965332031, 0.4217681884765625, 0.4370536804199219, 0.45233917236328125, 0.4676246643066406, 0.48291015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 10.0, 7.0, 4.0, 10.0, 9.0, 15.0, 17.0, 15.0, 31.0, 34.0, 37.0, 50.0, 54.0, 67.0, 60.0, 79.0, 87.0, 79.0, 62.0, 61.0, 34.0, 30.0, 30.0, 20.0, 18.0, 22.0, 8.0, 13.0, 6.0, 4.0, 1.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05601835250854492, -0.054083824157714844, -0.052149295806884766, -0.05021476745605469, -0.04828023910522461, -0.04634571075439453, -0.04441118240356445, -0.042476654052734375, -0.0405421257019043, -0.03860759735107422, -0.03667306900024414, -0.03473854064941406, -0.032804012298583984, -0.030869483947753906, -0.028934955596923828, -0.02700042724609375, -0.025065898895263672, -0.023131370544433594, -0.021196842193603516, -0.019262313842773438, -0.01732778549194336, -0.015393257141113281, -0.013458728790283203, -0.011524200439453125, -0.009589672088623047, -0.007655143737792969, -0.005720615386962891, -0.0037860870361328125, -0.0018515586853027344, 8.296966552734375e-05, 0.002017498016357422, 0.0039520263671875, 0.005886554718017578, 0.007821083068847656, 0.009755611419677734, 0.011690139770507812, 0.01362466812133789, 0.015559196472167969, 0.017493724822998047, 0.019428253173828125, 0.021362781524658203, 0.02329730987548828, 0.02523183822631836, 0.027166366577148438, 0.029100894927978516, 0.031035423278808594, 0.03296995162963867, 0.03490447998046875, 0.03683900833129883, 0.038773536682128906, 0.040708065032958984, 0.04264259338378906, 0.04457712173461914, 0.04651165008544922, 0.0484461784362793, 0.050380706787109375, 0.05231523513793945, 0.05424976348876953, 0.05618429183959961, 0.05811882019042969, 0.060053348541259766, 0.061987876892089844, 0.06392240524291992, 0.06585693359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 3.0, 5.0, 22.0, 6.0, 24.0, 22.0, 29.0, 35.0, 60.0, 72.0, 95.0, 111.0, 178.0, 255.0, 557.0, 2140.0, 15341.0, 246713.0, 741433.0, 35241.0, 4344.0, 841.0, 326.0, 181.0, 132.0, 85.0, 64.0, 63.0, 36.0, 35.0, 23.0, 17.0, 19.0, 11.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.79345703125, -0.768798828125, -0.744140625, -0.719482421875, -0.69482421875, -0.670166015625, -0.6455078125, -0.620849609375, -0.59619140625, -0.571533203125, -0.546875, -0.522216796875, -0.49755859375, -0.472900390625, -0.4482421875, -0.423583984375, -0.39892578125, -0.374267578125, -0.349609375, -0.324951171875, -0.30029296875, -0.275634765625, -0.2509765625, -0.226318359375, -0.20166015625, -0.177001953125, -0.15234375, -0.127685546875, -0.10302734375, -0.078369140625, -0.0537109375, -0.029052734375, -0.00439453125, 0.020263671875, 0.044921875, 0.069580078125, 0.09423828125, 0.118896484375, 0.1435546875, 0.168212890625, 0.19287109375, 0.217529296875, 0.2421875, 0.266845703125, 0.29150390625, 0.316162109375, 0.3408203125, 0.365478515625, 0.39013671875, 0.414794921875, 0.439453125, 0.464111328125, 0.48876953125, 0.513427734375, 0.5380859375, 0.562744140625, 0.58740234375, 0.612060546875, 0.63671875, 0.661376953125, 0.68603515625, 0.710693359375, 0.7353515625, 0.760009765625, 0.78466796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 30.0, 113.0, 339.0, 362.0, 111.0, 33.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8144052624702454, -0.7775145769119263, -0.7406238913536072, -0.7037332057952881, -0.6668424606323242, -0.6299518346786499, -0.593061089515686, -0.5561704039573669, -0.5192797183990479, -0.48238903284072876, -0.44549834728240967, -0.4086076319217682, -0.3717169463634491, -0.33482626080513, -0.2979355454444885, -0.26104485988616943, -0.22415417432785034, -0.18726348876953125, -0.15037278831005096, -0.11348209530115128, -0.07659140229225159, -0.039700716733932495, -0.0028100162744522095, 0.034080684185028076, 0.07097136974334717, 0.10786206275224686, 0.14475275576114655, 0.18164345622062683, 0.21853414177894592, 0.255424827337265, 0.2923155426979065, 0.3292062282562256, 0.3660968542098999, 0.402987539768219, 0.4398782253265381, 0.47676894068717957, 0.5136595964431763, 0.5505503416061401, 0.5874410271644592, 0.6243317127227783, 0.6612223982810974, 0.6981130838394165, 0.7350037693977356, 0.7718944549560547, 0.8087852001190186, 0.8456758260726929, 0.8825665712356567, 0.9194572567939758, 0.9563479423522949, 0.993238627910614, 1.030129313468933, 1.067020058631897, 1.1039106845855713, 1.1408014297485352, 1.1776920557022095, 1.2145828008651733, 1.2514734268188477, 1.2883641719818115, 1.3252547979354858, 1.3621455430984497, 1.399036169052124, 1.435926914215088, 1.4728175401687622, 1.509708285331726, 1.54659903049469]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 14.0, 16.0, 17.0, 20.0, 25.0, 29.0, 36.0, 25.0, 34.0, 35.0, 46.0, 50.0, 51.0, 47.0, 53.0, 51.0, 52.0, 55.0, 47.0, 42.0, 42.0, 26.0, 36.0, 24.0, 36.0, 18.0, 19.0, 14.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20259404182434082, -0.19539883732795715, -0.1882036328315735, -0.18100842833518982, -0.17381322383880615, -0.16661801934242249, -0.15942281484603882, -0.15222761034965515, -0.14503240585327148, -0.13783720135688782, -0.13064199686050415, -0.12344679236412048, -0.11625158786773682, -0.10905638337135315, -0.10186118632555008, -0.09466598182916641, -0.08747078478336334, -0.08027558028697968, -0.07308037579059601, -0.06588517129421234, -0.05868997052311897, -0.051494766026735306, -0.04429956525564194, -0.03710436075925827, -0.029909156262874603, -0.022713951766490936, -0.015518749132752419, -0.0083235464990139, -0.0011283420026302338, 0.006066862493753433, 0.013262063264846802, 0.02045726776123047, 0.027652472257614136, 0.0348476767539978, 0.04204288125038147, 0.04923808202147484, 0.056433286517858505, 0.06362849473953247, 0.07082369178533554, 0.07801889628171921, 0.08521410077810287, 0.09240930527448654, 0.09960450977087021, 0.10679970681667328, 0.11399491131305695, 0.12119011580944061, 0.12838532030582428, 0.13558052480220795, 0.1427757292985916, 0.14997093379497528, 0.15716613829135895, 0.16436134278774261, 0.17155654728412628, 0.17875175178050995, 0.18594694137573242, 0.1931421458721161, 0.20033735036849976, 0.20753255486488342, 0.2147277593612671, 0.22192296385765076, 0.22911816835403442, 0.2363133728504181, 0.24350857734680176, 0.2507037818431854, 0.2578989863395691]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 14.0, 6.0, 7.0, 11.0, 14.0, 17.0, 13.0, 21.0, 13.0, 18.0, 23.0, 22.0, 33.0, 24.0, 35.0, 29.0, 43.0, 34.0, 29.0, 21.0, 28.0, 29.0, 34.0, 38.0, 39.0, 30.0, 29.0, 28.0, 26.0, 18.0, 37.0, 26.0, 23.0, 17.0, 28.0, 20.0, 14.0, 14.0, 13.0, 15.0, 9.0, 12.0, 7.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.261474609375, -0.2529487609863281, -0.24442291259765625, -0.23589706420898438, -0.2273712158203125, -0.21884536743164062, -0.21031951904296875, -0.20179367065429688, -0.193267822265625, -0.18474197387695312, -0.17621612548828125, -0.16769027709960938, -0.1591644287109375, -0.15063858032226562, -0.14211273193359375, -0.13358688354492188, -0.12506103515625, -0.11653518676757812, -0.10800933837890625, -0.09948348999023438, -0.0909576416015625, -0.08243179321289062, -0.07390594482421875, -0.06538009643554688, -0.056854248046875, -0.048328399658203125, -0.03980255126953125, -0.031276702880859375, -0.0227508544921875, -0.014225006103515625, -0.00569915771484375, 0.002826690673828125, 0.0113525390625, 0.019878387451171875, 0.02840423583984375, 0.036930084228515625, 0.0454559326171875, 0.053981781005859375, 0.06250762939453125, 0.07103347778320312, 0.079559326171875, 0.08808517456054688, 0.09661102294921875, 0.10513687133789062, 0.1136627197265625, 0.12218856811523438, 0.13071441650390625, 0.13924026489257812, 0.14776611328125, 0.15629196166992188, 0.16481781005859375, 0.17334365844726562, 0.1818695068359375, 0.19039535522460938, 0.19892120361328125, 0.20744705200195312, 0.215972900390625, 0.22449874877929688, 0.23302459716796875, 0.24155044555664062, 0.2500762939453125, 0.2586021423339844, 0.26712799072265625, 0.2756538391113281, 0.2841796875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 8.0, 8.0, 15.0, 14.0, 29.0, 40.0, 63.0, 75.0, 102.0, 131.0, 209.0, 280.0, 358.0, 534.0, 746.0, 1061.0, 1463.0, 1981.0, 2767.0, 4104.0, 5965.0, 9059.0, 15066.0, 26120.0, 54688.0, 129784.0, 309327.0, 267494.0, 107712.0, 46356.0, 22968.0, 13157.0, 8283.0, 5468.0, 3810.0, 2623.0, 1842.0, 1337.0, 934.0, 717.0, 511.0, 388.0, 256.0, 211.0, 138.0, 115.0, 64.0, 52.0, 42.0, 22.0, 27.0, 14.0, 8.0, 5.0, 7.0, 1.0, 3.0, 1.0], "bins": [-0.322509765625, -0.31270599365234375, -0.3029022216796875, -0.29309844970703125, -0.283294677734375, -0.27349090576171875, -0.2636871337890625, -0.25388336181640625, -0.24407958984375, -0.23427581787109375, -0.2244720458984375, -0.21466827392578125, -0.204864501953125, -0.19506072998046875, -0.1852569580078125, -0.17545318603515625, -0.1656494140625, -0.15584564208984375, -0.1460418701171875, -0.13623809814453125, -0.126434326171875, -0.11663055419921875, -0.1068267822265625, -0.09702301025390625, -0.08721923828125, -0.07741546630859375, -0.0676116943359375, -0.05780792236328125, -0.048004150390625, -0.03820037841796875, -0.0283966064453125, -0.01859283447265625, -0.0087890625, 0.00101470947265625, 0.0108184814453125, 0.02062225341796875, 0.030426025390625, 0.04022979736328125, 0.0500335693359375, 0.05983734130859375, 0.06964111328125, 0.07944488525390625, 0.0892486572265625, 0.09905242919921875, 0.108856201171875, 0.11865997314453125, 0.1284637451171875, 0.13826751708984375, 0.1480712890625, 0.15787506103515625, 0.1676788330078125, 0.17748260498046875, 0.187286376953125, 0.19709014892578125, 0.2068939208984375, 0.21669769287109375, 0.22650146484375, 0.23630523681640625, 0.2461090087890625, 0.25591278076171875, 0.265716552734375, 0.27552032470703125, 0.2853240966796875, 0.29512786865234375, 0.304931640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 13.0, 11.0, 10.0, 7.0, 19.0, 22.0, 17.0, 27.0, 17.0, 32.0, 37.0, 42.0, 40.0, 62.0, 68.0, 105.0, 191.0, 1420.0, 304.0, 127.0, 74.0, 47.0, 37.0, 36.0, 42.0, 35.0, 30.0, 31.0, 20.0, 17.0, 18.0, 10.0, 10.0, 15.0, 10.0, 9.0, 5.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.048828125, -1.012359619140625, -0.97589111328125, -0.939422607421875, -0.9029541015625, -0.866485595703125, -0.83001708984375, -0.793548583984375, -0.757080078125, -0.720611572265625, -0.68414306640625, -0.647674560546875, -0.6112060546875, -0.574737548828125, -0.53826904296875, -0.501800537109375, -0.46533203125, -0.428863525390625, -0.39239501953125, -0.355926513671875, -0.3194580078125, -0.282989501953125, -0.24652099609375, -0.210052490234375, -0.173583984375, -0.137115478515625, -0.10064697265625, -0.064178466796875, -0.0277099609375, 0.008758544921875, 0.04522705078125, 0.081695556640625, 0.1181640625, 0.154632568359375, 0.19110107421875, 0.227569580078125, 0.2640380859375, 0.300506591796875, 0.33697509765625, 0.373443603515625, 0.409912109375, 0.446380615234375, 0.48284912109375, 0.519317626953125, 0.5557861328125, 0.592254638671875, 0.62872314453125, 0.665191650390625, 0.70166015625, 0.738128662109375, 0.77459716796875, 0.811065673828125, 0.8475341796875, 0.884002685546875, 0.92047119140625, 0.956939697265625, 0.993408203125, 1.029876708984375, 1.06634521484375, 1.102813720703125, 1.1392822265625, 1.175750732421875, 1.21221923828125, 1.248687744140625, 1.28515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 4.0, 14.0, 14.0, 15.0, 21.0, 26.0, 33.0, 42.0, 78.0, 107.0, 154.0, 300.0, 614.0, 1192.0, 2791.0, 7854.0, 31118.0, 249959.0, 2556653.0, 249792.0, 31428.0, 7911.0, 2886.0, 1262.0, 615.0, 295.0, 172.0, 95.0, 78.0, 46.0, 27.0, 20.0, 14.0, 22.0, 9.0, 7.0, 10.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3515625, -1.30865478515625, -1.2657470703125, -1.22283935546875, -1.179931640625, -1.13702392578125, -1.0941162109375, -1.05120849609375, -1.00830078125, -0.96539306640625, -0.9224853515625, -0.87957763671875, -0.836669921875, -0.79376220703125, -0.7508544921875, -0.70794677734375, -0.6650390625, -0.62213134765625, -0.5792236328125, -0.53631591796875, -0.493408203125, -0.45050048828125, -0.4075927734375, -0.36468505859375, -0.32177734375, -0.27886962890625, -0.2359619140625, -0.19305419921875, -0.150146484375, -0.10723876953125, -0.0643310546875, -0.02142333984375, 0.021484375, 0.06439208984375, 0.1072998046875, 0.15020751953125, 0.193115234375, 0.23602294921875, 0.2789306640625, 0.32183837890625, 0.36474609375, 0.40765380859375, 0.4505615234375, 0.49346923828125, 0.536376953125, 0.57928466796875, 0.6221923828125, 0.66510009765625, 0.7080078125, 0.75091552734375, 0.7938232421875, 0.83673095703125, 0.879638671875, 0.92254638671875, 0.9654541015625, 1.00836181640625, 1.05126953125, 1.09417724609375, 1.1370849609375, 1.17999267578125, 1.222900390625, 1.26580810546875, 1.3087158203125, 1.35162353515625, 1.39453125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [330.0, 682.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1897190809249878, -0.1721806526184082, 0.8453577756881714, 1.8628960847854614, 2.880434513092041, 3.89797306060791, 4.915511131286621, 5.93304967880249, 6.950588226318359, 7.9681267738342285, 8.985665321350098, 10.003203392028809, 11.020742416381836, 12.038280487060547, 13.055818557739258, 14.073356628417969, 15.090895652770996, 16.108434677124023, 17.125972747802734, 18.143510818481445, 19.161048889160156, 20.1785888671875, 21.196125030517578, 22.213665008544922, 23.231203079223633, 24.248741149902344, 25.266279220581055, 26.283817291259766, 27.30135726928711, 28.31889533996582, 29.33643341064453, 30.353971481323242, 31.371509552001953, 32.3890495300293, 33.406585693359375, 34.42412567138672, 35.4416618347168, 36.45920181274414, 37.47673797607422, 38.49427795410156, 39.511817932128906, 40.52935791015625, 41.54689407348633, 42.56443405151367, 43.58197021484375, 44.599510192871094, 45.61705017089844, 46.634586334228516, 47.652122497558594, 48.66966247558594, 49.687198638916016, 50.70473861694336, 51.72227478027344, 52.73981475830078, 53.757354736328125, 54.7748908996582, 55.79243087768555, 56.80997085571289, 57.82750701904297, 58.84504699707031, 59.86258316040039, 60.880123138427734, 61.89765930175781, 62.915199279785156, 63.9327392578125]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 2.0, 5.0, 6.0, 19.0, 9.0, 12.0, 12.0, 18.0, 20.0, 21.0, 28.0, 31.0, 21.0, 34.0, 36.0, 45.0, 44.0, 26.0, 41.0, 52.0, 44.0, 42.0, 45.0, 36.0, 27.0, 40.0, 33.0, 26.0, 27.0, 28.0, 20.0, 20.0, 29.0, 17.0, 12.0, 16.0, 7.0, 12.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.03659200668335, -3.9120683670043945, -3.7875449657440186, -3.6630215644836426, -3.5384979248046875, -3.4139742851257324, -3.2894508838653564, -3.1649274826049805, -3.0404038429260254, -2.9158802032470703, -2.7913568019866943, -2.6668334007263184, -2.5423097610473633, -2.417786121368408, -2.2932627201080322, -2.1687393188476562, -2.044215679168701, -1.9196921586990356, -1.7951686382293701, -1.6706451177597046, -1.546121597290039, -1.4215980768203735, -1.297074556350708, -1.1725510358810425, -1.048027515411377, -0.9235039949417114, -0.7989804744720459, -0.6744569540023804, -0.5499334335327148, -0.4254099130630493, -0.3008863925933838, -0.17636287212371826, -0.051839590072631836, 0.07268393039703369, 0.19720745086669922, 0.32173097133636475, 0.4462544918060303, 0.5707780122756958, 0.6953015327453613, 0.8198250532150269, 0.9443485736846924, 1.068872094154358, 1.1933956146240234, 1.317919135093689, 1.4424426555633545, 1.56696617603302, 1.6914896965026855, 1.816013216972351, 1.9405367374420166, 2.0650601387023926, 2.1895837783813477, 2.3141074180603027, 2.4386308193206787, 2.5631542205810547, 2.6876778602600098, 2.812201499938965, 2.936724901199341, 3.061248302459717, 3.185771942138672, 3.310295581817627, 3.434818983078003, 3.559342384338379, 3.683866024017334, 3.808389663696289, 3.932913064956665]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 13.0, 10.0, 9.0, 16.0, 13.0, 16.0, 18.0, 17.0, 21.0, 20.0, 26.0, 31.0, 31.0, 24.0, 34.0, 39.0, 30.0, 34.0, 33.0, 35.0, 43.0, 25.0, 37.0, 41.0, 25.0, 33.0, 28.0, 30.0, 23.0, 32.0, 30.0, 22.0, 16.0, 24.0, 17.0, 15.0, 17.0, 17.0, 11.0, 6.0, 5.0, 3.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29248046875, -0.2831382751464844, -0.27379608154296875, -0.2644538879394531, -0.2551116943359375, -0.24576950073242188, -0.23642730712890625, -0.22708511352539062, -0.217742919921875, -0.20840072631835938, -0.19905853271484375, -0.18971633911132812, -0.1803741455078125, -0.17103195190429688, -0.16168975830078125, -0.15234756469726562, -0.14300537109375, -0.13366317749023438, -0.12432098388671875, -0.11497879028320312, -0.1056365966796875, -0.09629440307617188, -0.08695220947265625, -0.07761001586914062, -0.068267822265625, -0.058925628662109375, -0.04958343505859375, -0.040241241455078125, -0.0308990478515625, -0.021556854248046875, -0.01221466064453125, -0.002872467041015625, 0.0064697265625, 0.015811920166015625, 0.02515411376953125, 0.034496307373046875, 0.0438385009765625, 0.053180694580078125, 0.06252288818359375, 0.07186508178710938, 0.081207275390625, 0.09054946899414062, 0.09989166259765625, 0.10923385620117188, 0.1185760498046875, 0.12791824340820312, 0.13726043701171875, 0.14660263061523438, 0.15594482421875, 0.16528701782226562, 0.17462921142578125, 0.18397140502929688, 0.1933135986328125, 0.20265579223632812, 0.21199798583984375, 0.22134017944335938, 0.230682373046875, 0.24002456665039062, 0.24936676025390625, 0.2587089538574219, 0.2680511474609375, 0.2773933410644531, 0.28673553466796875, 0.2960777282714844, 0.305419921875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 3.0, 8.0, 15.0, 12.0, 17.0, 33.0, 50.0, 62.0, 112.0, 152.0, 207.0, 363.0, 518.0, 774.0, 1193.0, 1914.0, 3146.0, 5039.0, 8406.0, 15101.0, 29852.0, 76293.0, 348059.0, 2021222.0, 1352518.0, 216241.0, 56034.0, 24857.0, 12821.0, 7304.0, 4486.0, 2657.0, 1688.0, 1148.0, 691.0, 425.0, 282.0, 179.0, 120.0, 76.0, 67.0, 38.0, 22.0, 17.0, 20.0, 11.0, 5.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6220703125, -0.6019134521484375, -0.581756591796875, -0.5615997314453125, -0.54144287109375, -0.5212860107421875, -0.501129150390625, -0.4809722900390625, -0.4608154296875, -0.4406585693359375, -0.420501708984375, -0.4003448486328125, -0.38018798828125, -0.3600311279296875, -0.339874267578125, -0.3197174072265625, -0.299560546875, -0.2794036865234375, -0.259246826171875, -0.2390899658203125, -0.21893310546875, -0.1987762451171875, -0.178619384765625, -0.1584625244140625, -0.1383056640625, -0.1181488037109375, -0.097991943359375, -0.0778350830078125, -0.05767822265625, -0.0375213623046875, -0.017364501953125, 0.0027923583984375, 0.02294921875, 0.0431060791015625, 0.063262939453125, 0.0834197998046875, 0.10357666015625, 0.1237335205078125, 0.143890380859375, 0.1640472412109375, 0.1842041015625, 0.2043609619140625, 0.224517822265625, 0.2446746826171875, 0.26483154296875, 0.2849884033203125, 0.305145263671875, 0.3253021240234375, 0.345458984375, 0.3656158447265625, 0.385772705078125, 0.4059295654296875, 0.42608642578125, 0.4462432861328125, 0.466400146484375, 0.4865570068359375, 0.5067138671875, 0.5268707275390625, 0.547027587890625, 0.5671844482421875, 0.58734130859375, 0.6074981689453125, 0.627655029296875, 0.6478118896484375, 0.66796875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 8.0, 13.0, 27.0, 25.0, 28.0, 41.0, 65.0, 92.0, 148.0, 229.0, 414.0, 671.0, 808.0, 555.0, 319.0, 183.0, 120.0, 75.0, 56.0, 44.0, 33.0, 21.0, 21.0, 12.0, 6.0, 14.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.02734375, -0.9944915771484375, -0.961639404296875, -0.9287872314453125, -0.89593505859375, -0.8630828857421875, -0.830230712890625, -0.7973785400390625, -0.7645263671875, -0.7316741943359375, -0.698822021484375, -0.6659698486328125, -0.63311767578125, -0.6002655029296875, -0.567413330078125, -0.5345611572265625, -0.501708984375, -0.4688568115234375, -0.436004638671875, -0.4031524658203125, -0.37030029296875, -0.3374481201171875, -0.304595947265625, -0.2717437744140625, -0.2388916015625, -0.2060394287109375, -0.173187255859375, -0.1403350830078125, -0.10748291015625, -0.0746307373046875, -0.041778564453125, -0.0089263916015625, 0.02392578125, 0.0567779541015625, 0.089630126953125, 0.1224822998046875, 0.15533447265625, 0.1881866455078125, 0.221038818359375, 0.2538909912109375, 0.2867431640625, 0.3195953369140625, 0.352447509765625, 0.3852996826171875, 0.41815185546875, 0.4510040283203125, 0.483856201171875, 0.5167083740234375, 0.549560546875, 0.5824127197265625, 0.615264892578125, 0.6481170654296875, 0.68096923828125, 0.7138214111328125, 0.746673583984375, 0.7795257568359375, 0.8123779296875, 0.8452301025390625, 0.878082275390625, 0.9109344482421875, 0.94378662109375, 0.9766387939453125, 1.009490966796875, 1.0423431396484375, 1.0751953125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 6.0, 16.0, 31.0, 28.0, 54.0, 54.0, 91.0, 107.0, 139.0, 178.0, 268.0, 356.0, 509.0, 684.0, 1091.0, 1588.0, 2473.0, 4001.0, 6589.0, 11701.0, 22058.0, 47746.0, 129988.0, 590772.0, 2479241.0, 652456.0, 138312.0, 50337.0, 23000.0, 11957.0, 6592.0, 3929.0, 2523.0, 1665.0, 1056.0, 717.0, 566.0, 349.0, 298.0, 207.0, 149.0, 113.0, 79.0, 57.0, 36.0, 32.0, 24.0, 16.0, 4.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.126953125, -1.0933380126953125, -1.059722900390625, -1.0261077880859375, -0.99249267578125, -0.9588775634765625, -0.925262451171875, -0.8916473388671875, -0.8580322265625, -0.8244171142578125, -0.790802001953125, -0.7571868896484375, -0.72357177734375, -0.6899566650390625, -0.656341552734375, -0.6227264404296875, -0.589111328125, -0.5554962158203125, -0.521881103515625, -0.4882659912109375, -0.45465087890625, -0.4210357666015625, -0.387420654296875, -0.3538055419921875, -0.3201904296875, -0.2865753173828125, -0.252960205078125, -0.2193450927734375, -0.18572998046875, -0.1521148681640625, -0.118499755859375, -0.0848846435546875, -0.05126953125, -0.0176544189453125, 0.015960693359375, 0.0495758056640625, 0.08319091796875, 0.1168060302734375, 0.150421142578125, 0.1840362548828125, 0.2176513671875, 0.2512664794921875, 0.284881591796875, 0.3184967041015625, 0.35211181640625, 0.3857269287109375, 0.419342041015625, 0.4529571533203125, 0.486572265625, 0.5201873779296875, 0.553802490234375, 0.5874176025390625, 0.62103271484375, 0.6546478271484375, 0.688262939453125, 0.7218780517578125, 0.7554931640625, 0.7891082763671875, 0.822723388671875, 0.8563385009765625, 0.88995361328125, 0.9235687255859375, 0.957183837890625, 0.9907989501953125, 1.0244140625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 17.0, 65.0, 161.0, 234.0, 258.0, 163.0, 56.0, 29.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.227615356445312, -16.82706069946289, -16.42650604248047, -16.025951385498047, -15.625397682189941, -15.224843978881836, -14.824289321899414, -14.423734664916992, -14.02318000793457, -13.622625350952148, -13.222071647644043, -12.821516990661621, -12.4209623336792, -12.020408630371094, -11.619853973388672, -11.21929931640625, -10.818745613098145, -10.418190956115723, -10.017637252807617, -9.617082595825195, -9.216527938842773, -8.815973281860352, -8.415419578552246, -8.014864921569824, -7.6143107414245605, -7.213756561279297, -6.813201904296875, -6.412647724151611, -6.012093544006348, -5.611538887023926, -5.210984706878662, -4.810430526733398, -4.409876823425293, -4.009322643280029, -3.6087679862976074, -3.2082138061523438, -2.807659387588501, -2.407104969024658, -2.0065507888793945, -1.6059963703155518, -1.205441951751709, -0.804887592792511, -0.404333233833313, -0.0037789344787597656, 0.396775484085083, 0.7973299026489258, 1.1978840827941895, 1.5984385013580322, 1.998992919921875, 2.3995473384857178, 2.8001017570495605, 3.200655937194824, 3.601210355758667, 4.00176477432251, 4.402318954467773, 4.802873611450195, 5.203427791595459, 5.603981971740723, 6.0045366287231445, 6.405090808868408, 6.805644989013672, 7.206199645996094, 7.606753826141357, 8.007308006286621, 8.407862663269043]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 8.0, 7.0, 10.0, 10.0, 18.0, 18.0, 17.0, 19.0, 22.0, 31.0, 29.0, 34.0, 36.0, 32.0, 35.0, 45.0, 47.0, 40.0, 41.0, 44.0, 46.0, 45.0, 47.0, 47.0, 40.0, 40.0, 26.0, 33.0, 22.0, 20.0, 15.0, 14.0, 12.0, 9.0, 9.0, 8.0, 10.0, 0.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.915860891342163, -2.8189809322357178, -2.7221007347106934, -2.625220775604248, -2.5283405780792236, -2.4314606189727783, -2.334580421447754, -2.2377004623413086, -2.140820264816284, -2.043940305709839, -1.9470601081848145, -1.8501800298690796, -1.7532999515533447, -1.6564198732376099, -1.559539794921875, -1.4626598358154297, -1.3657797574996948, -1.26889967918396, -1.172019600868225, -1.0751395225524902, -0.9782594442367554, -0.8813793659210205, -0.7844993472099304, -0.6876192688941956, -0.5907391905784607, -0.49385911226272583, -0.39697903394699097, -0.3000989854335785, -0.20321890711784363, -0.10633882880210876, -0.009458780288696289, 0.08742129802703857, 0.18430137634277344, 0.2811814546585083, 0.37806153297424316, 0.47494158148765564, 0.5718216896057129, 0.6687017679214478, 0.7655817866325378, 0.8624618649482727, 0.9593419432640076, 1.0562219619750977, 1.1531020402908325, 1.2499821186065674, 1.3468621969223022, 1.443742275238037, 1.540622353553772, 1.6375024318695068, 1.7343825101852417, 1.8312625885009766, 1.9281426668167114, 2.0250227451324463, 2.1219027042388916, 2.218782901763916, 2.3156628608703613, 2.4125430583953857, 2.509423017501831, 2.6063029766082764, 2.703183174133301, 2.800063133239746, 2.8969433307647705, 2.993823289871216, 3.0907034873962402, 3.1875834465026855, 3.28446364402771]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 11.0, 16.0, 9.0, 10.0, 21.0, 21.0, 15.0, 15.0, 19.0, 27.0, 29.0, 27.0, 28.0, 29.0, 33.0, 30.0, 42.0, 36.0, 37.0, 33.0, 39.0, 34.0, 34.0, 33.0, 32.0, 34.0, 30.0, 29.0, 21.0, 29.0, 25.0, 23.0, 24.0, 20.0, 12.0, 12.0, 14.0, 9.0, 12.0, 9.0, 4.0, 3.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30126953125, -0.2918434143066406, -0.28241729736328125, -0.2729911804199219, -0.2635650634765625, -0.2541389465332031, -0.24471282958984375, -0.23528671264648438, -0.225860595703125, -0.21643447875976562, -0.20700836181640625, -0.19758224487304688, -0.1881561279296875, -0.17873001098632812, -0.16930389404296875, -0.15987777709960938, -0.15045166015625, -0.14102554321289062, -0.13159942626953125, -0.12217330932617188, -0.1127471923828125, -0.10332107543945312, -0.09389495849609375, -0.08446884155273438, -0.075042724609375, -0.06561660766601562, -0.05619049072265625, -0.046764373779296875, -0.0373382568359375, -0.027912139892578125, -0.01848602294921875, -0.009059906005859375, 0.0003662109375, 0.009792327880859375, 0.01921844482421875, 0.028644561767578125, 0.0380706787109375, 0.047496795654296875, 0.05692291259765625, 0.06634902954101562, 0.075775146484375, 0.08520126342773438, 0.09462738037109375, 0.10405349731445312, 0.1134796142578125, 0.12290573120117188, 0.13233184814453125, 0.14175796508789062, 0.15118408203125, 0.16061019897460938, 0.17003631591796875, 0.17946243286132812, 0.1888885498046875, 0.19831466674804688, 0.20774078369140625, 0.21716690063476562, 0.226593017578125, 0.23601913452148438, 0.24544525146484375, 0.2548713684082031, 0.2642974853515625, 0.2737236022949219, 0.28314971923828125, 0.2925758361816406, 0.302001953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 7.0, 12.0, 14.0, 25.0, 29.0, 36.0, 63.0, 90.0, 124.0, 188.0, 260.0, 393.0, 549.0, 745.0, 1063.0, 1568.0, 2116.0, 3113.0, 4557.0, 6682.0, 10027.0, 15035.0, 22354.0, 33405.0, 50514.0, 72749.0, 100728.0, 126606.0, 138415.0, 127386.0, 101134.0, 73714.0, 50539.0, 34014.0, 22831.0, 15198.0, 10126.0, 6952.0, 4726.0, 3205.0, 2140.0, 1477.0, 1053.0, 789.0, 536.0, 375.0, 268.0, 184.0, 130.0, 110.0, 63.0, 42.0, 30.0, 23.0, 23.0, 12.0, 12.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.238525390625, -0.23095703125, -0.223388671875, -0.2158203125, -0.208251953125, -0.20068359375, -0.193115234375, -0.185546875, -0.177978515625, -0.17041015625, -0.162841796875, -0.1552734375, -0.147705078125, -0.14013671875, -0.132568359375, -0.125, -0.117431640625, -0.10986328125, -0.102294921875, -0.0947265625, -0.087158203125, -0.07958984375, -0.072021484375, -0.064453125, -0.056884765625, -0.04931640625, -0.041748046875, -0.0341796875, -0.026611328125, -0.01904296875, -0.011474609375, -0.00390625, 0.003662109375, 0.01123046875, 0.018798828125, 0.0263671875, 0.033935546875, 0.04150390625, 0.049072265625, 0.056640625, 0.064208984375, 0.07177734375, 0.079345703125, 0.0869140625, 0.094482421875, 0.10205078125, 0.109619140625, 0.1171875, 0.124755859375, 0.13232421875, 0.139892578125, 0.1474609375, 0.155029296875, 0.16259765625, 0.170166015625, 0.177734375, 0.185302734375, 0.19287109375, 0.200439453125, 0.2080078125, 0.215576171875, 0.22314453125, 0.230712890625, 0.23828125, 0.245849609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 6.0, 6.0, 5.0, 8.0, 7.0, 8.0, 11.0, 19.0, 12.0, 14.0, 11.0, 22.0, 21.0, 25.0, 31.0, 45.0, 26.0, 29.0, 28.0, 39.0, 38.0, 46.0, 1060.0, 36.0, 38.0, 31.0, 40.0, 36.0, 30.0, 28.0, 36.0, 30.0, 26.0, 20.0, 21.0, 14.0, 12.0, 19.0, 14.0, 7.0, 7.0, 12.0, 10.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309326171875, -0.2999420166015625, -0.290557861328125, -0.2811737060546875, -0.27178955078125, -0.2624053955078125, -0.253021240234375, -0.2436370849609375, -0.2342529296875, -0.2248687744140625, -0.215484619140625, -0.2061004638671875, -0.19671630859375, -0.1873321533203125, -0.177947998046875, -0.1685638427734375, -0.1591796875, -0.1497955322265625, -0.140411376953125, -0.1310272216796875, -0.12164306640625, -0.1122589111328125, -0.102874755859375, -0.0934906005859375, -0.0841064453125, -0.0747222900390625, -0.065338134765625, -0.0559539794921875, -0.04656982421875, -0.0371856689453125, -0.027801513671875, -0.0184173583984375, -0.009033203125, 0.0003509521484375, 0.009735107421875, 0.0191192626953125, 0.02850341796875, 0.0378875732421875, 0.047271728515625, 0.0566558837890625, 0.0660400390625, 0.0754241943359375, 0.084808349609375, 0.0941925048828125, 0.10357666015625, 0.1129608154296875, 0.122344970703125, 0.1317291259765625, 0.14111328125, 0.1504974365234375, 0.159881591796875, 0.1692657470703125, 0.17864990234375, 0.1880340576171875, 0.197418212890625, 0.2068023681640625, 0.2161865234375, 0.2255706787109375, 0.234954833984375, 0.2443389892578125, 0.25372314453125, 0.2631072998046875, 0.272491455078125, 0.2818756103515625, 0.291259765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 20.0, 20.0, 30.0, 27.0, 60.0, 95.0, 118.0, 177.0, 285.0, 413.0, 702.0, 1092.0, 1828.0, 2920.0, 4772.0, 8288.0, 15164.0, 29183.0, 75217.0, 1488933.0, 363072.0, 51815.0, 22866.0, 12329.0, 6908.0, 4203.0, 2448.0, 1468.0, 969.0, 591.0, 386.0, 245.0, 161.0, 97.0, 56.0, 56.0, 29.0, 28.0, 8.0, 14.0, 12.0, 6.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.478515625, -0.4634857177734375, -0.448455810546875, -0.4334259033203125, -0.41839599609375, -0.4033660888671875, -0.388336181640625, -0.3733062744140625, -0.3582763671875, -0.3432464599609375, -0.328216552734375, -0.3131866455078125, -0.29815673828125, -0.2831268310546875, -0.268096923828125, -0.2530670166015625, -0.238037109375, -0.2230072021484375, -0.207977294921875, -0.1929473876953125, -0.17791748046875, -0.1628875732421875, -0.147857666015625, -0.1328277587890625, -0.1177978515625, -0.1027679443359375, -0.087738037109375, -0.0727081298828125, -0.05767822265625, -0.0426483154296875, -0.027618408203125, -0.0125885009765625, 0.00244140625, 0.0174713134765625, 0.032501220703125, 0.0475311279296875, 0.06256103515625, 0.0775909423828125, 0.092620849609375, 0.1076507568359375, 0.1226806640625, 0.1377105712890625, 0.152740478515625, 0.1677703857421875, 0.18280029296875, 0.1978302001953125, 0.212860107421875, 0.2278900146484375, 0.242919921875, 0.2579498291015625, 0.272979736328125, 0.2880096435546875, 0.30303955078125, 0.3180694580078125, 0.333099365234375, 0.3481292724609375, 0.3631591796875, 0.3781890869140625, 0.393218994140625, 0.4082489013671875, 0.42327880859375, 0.4383087158203125, 0.453338623046875, 0.4683685302734375, 0.4833984375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 8.0, 12.0, 11.0, 20.0, 21.0, 35.0, 45.0, 54.0, 69.0, 110.0, 117.0, 104.0, 97.0, 78.0, 56.0, 37.0, 22.0, 26.0, 14.0, 11.0, 10.0, 7.0, 2.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10145187377929688, -0.09792327880859375, -0.09439468383789062, -0.0908660888671875, -0.08733749389648438, -0.08380889892578125, -0.08028030395507812, -0.076751708984375, -0.07322311401367188, -0.06969451904296875, -0.06616592407226562, -0.0626373291015625, -0.059108734130859375, -0.05558013916015625, -0.052051544189453125, -0.04852294921875, -0.044994354248046875, -0.04146575927734375, -0.037937164306640625, -0.0344085693359375, -0.030879974365234375, -0.02735137939453125, -0.023822784423828125, -0.020294189453125, -0.016765594482421875, -0.01323699951171875, -0.009708404541015625, -0.0061798095703125, -0.002651214599609375, 0.00087738037109375, 0.004405975341796875, 0.0079345703125, 0.011463165283203125, 0.01499176025390625, 0.018520355224609375, 0.0220489501953125, 0.025577545166015625, 0.02910614013671875, 0.032634735107421875, 0.036163330078125, 0.039691925048828125, 0.04322052001953125, 0.046749114990234375, 0.0502777099609375, 0.053806304931640625, 0.05733489990234375, 0.060863494873046875, 0.06439208984375, 0.06792068481445312, 0.07144927978515625, 0.07497787475585938, 0.0785064697265625, 0.08203506469726562, 0.08556365966796875, 0.08909225463867188, 0.092620849609375, 0.09614944458007812, 0.09967803955078125, 0.10320663452148438, 0.1067352294921875, 0.11026382446289062, 0.11379241943359375, 0.11732101440429688, 0.120849609375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 2.0, 3.0, 8.0, 11.0, 5.0, 14.0, 14.0, 20.0, 24.0, 52.0, 72.0, 106.0, 205.0, 438.0, 1333.0, 5133.0, 49250.0, 941996.0, 42856.0, 4799.0, 1228.0, 451.0, 184.0, 108.0, 65.0, 40.0, 34.0, 20.0, 13.0, 17.0, 5.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4102783203125, -1.365478515625, -1.3206787109375, -1.27587890625, -1.2310791015625, -1.186279296875, -1.1414794921875, -1.0966796875, -1.0518798828125, -1.007080078125, -0.9622802734375, -0.91748046875, -0.8726806640625, -0.827880859375, -0.7830810546875, -0.73828125, -0.6934814453125, -0.648681640625, -0.6038818359375, -0.55908203125, -0.5142822265625, -0.469482421875, -0.4246826171875, -0.3798828125, -0.3350830078125, -0.290283203125, -0.2454833984375, -0.20068359375, -0.1558837890625, -0.111083984375, -0.0662841796875, -0.021484375, 0.0233154296875, 0.068115234375, 0.1129150390625, 0.15771484375, 0.2025146484375, 0.247314453125, 0.2921142578125, 0.3369140625, 0.3817138671875, 0.426513671875, 0.4713134765625, 0.51611328125, 0.5609130859375, 0.605712890625, 0.6505126953125, 0.6953125, 0.7401123046875, 0.784912109375, 0.8297119140625, 0.87451171875, 0.9193115234375, 0.964111328125, 1.0089111328125, 1.0537109375, 1.0985107421875, 1.143310546875, 1.1881103515625, 1.23291015625, 1.2777099609375, 1.322509765625, 1.3673095703125, 1.412109375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 15.0, 37.0, 126.0, 467.0, 252.0, 76.0, 25.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3591125011444092, -1.2867894172668457, -1.2144663333892822, -1.1421432495117188, -1.0698201656341553, -0.9974971413612366, -0.9251741170883179, -0.8528510332107544, -0.7805279493331909, -0.7082048654556274, -0.635881781578064, -0.5635587573051453, -0.4912356734275818, -0.4189125895500183, -0.3465895354747772, -0.27426648139953613, -0.20194339752197266, -0.12962032854557037, -0.05729725956916809, 0.015025809407234192, 0.08734887838363647, 0.15967196226119995, 0.23199501633644104, 0.30431807041168213, 0.3766411542892456, 0.4489642381668091, 0.5212873220443726, 0.5936103463172913, 0.6659334301948547, 0.7382565140724182, 0.8105795383453369, 0.8829026222229004, 0.9552257061004639, 1.0275487899780273, 1.0998718738555908, 1.1721949577331543, 1.2445180416107178, 1.3168411254882812, 1.3891640901565552, 1.4614871740341187, 1.5338102579116821, 1.6061333417892456, 1.678456425666809, 1.7507795095443726, 1.8231024742126465, 1.89542555809021, 1.9677486419677734, 2.040071725845337, 2.1123948097229004, 2.184717893600464, 2.2570409774780273, 2.329364061355591, 2.4016871452331543, 2.4740102291107178, 2.5463333129882812, 2.6186561584472656, 2.690979480743408, 2.7633025646209717, 2.835625648498535, 2.9079487323760986, 2.980271816253662, 3.0525949001312256, 3.124917984008789, 3.1972408294677734, 3.269563913345337]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 10.0, 6.0, 7.0, 12.0, 9.0, 13.0, 23.0, 13.0, 28.0, 15.0, 24.0, 36.0, 35.0, 47.0, 45.0, 41.0, 43.0, 34.0, 38.0, 42.0, 51.0, 37.0, 40.0, 39.0, 44.0, 29.0, 32.0, 21.0, 33.0, 16.0, 10.0, 25.0, 17.0, 21.0, 10.0, 13.0, 9.0, 5.0, 2.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3313283324241638, -0.32105985283851624, -0.31079137325286865, -0.3005228638648987, -0.2902543842792511, -0.2799859046936035, -0.26971739530563354, -0.25944891571998596, -0.24918043613433838, -0.2389119565486908, -0.22864346206188202, -0.21837496757507324, -0.20810648798942566, -0.19783800840377808, -0.1875695139169693, -0.17730101943016052, -0.16703253984451294, -0.15676406025886536, -0.14649556577205658, -0.1362270712852478, -0.12595859169960022, -0.11569010466337204, -0.10542161762714386, -0.09515313059091568, -0.0848846435546875, -0.07461615651845932, -0.06434766948223114, -0.05407918244600296, -0.04381069540977478, -0.0335422083735466, -0.02327372133731842, -0.01300523430109024, -0.0027367472648620605, 0.007531739771366119, 0.0178002268075943, 0.02806871384382248, 0.03833720088005066, 0.04860568791627884, 0.05887417495250702, 0.0691426619887352, 0.07941114902496338, 0.08967963606119156, 0.09994812309741974, 0.11021661013364792, 0.1204850971698761, 0.13075357675552368, 0.14102207124233246, 0.15129056572914124, 0.16155904531478882, 0.1718275249004364, 0.18209601938724518, 0.19236451387405396, 0.20263299345970154, 0.21290147304534912, 0.2231699675321579, 0.23343846201896667, 0.24370694160461426, 0.25397542119026184, 0.2642439007759094, 0.2745124101638794, 0.284780889749527, 0.29504936933517456, 0.30531787872314453, 0.3155863583087921, 0.3258548378944397]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 12.0, 12.0, 6.0, 11.0, 18.0, 23.0, 19.0, 18.0, 23.0, 19.0, 30.0, 29.0, 30.0, 28.0, 33.0, 36.0, 30.0, 39.0, 41.0, 33.0, 38.0, 37.0, 34.0, 28.0, 33.0, 27.0, 28.0, 33.0, 28.0, 16.0, 30.0, 22.0, 24.0, 16.0, 15.0, 19.0, 9.0, 6.0, 9.0, 13.0, 5.0, 7.0, 6.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.310546875, -0.3010597229003906, -0.29157257080078125, -0.2820854187011719, -0.2725982666015625, -0.2631111145019531, -0.25362396240234375, -0.24413681030273438, -0.234649658203125, -0.22516250610351562, -0.21567535400390625, -0.20618820190429688, -0.1967010498046875, -0.18721389770507812, -0.17772674560546875, -0.16823959350585938, -0.15875244140625, -0.14926528930664062, -0.13977813720703125, -0.13029098510742188, -0.1208038330078125, -0.11131668090820312, -0.10182952880859375, -0.09234237670898438, -0.082855224609375, -0.07336807250976562, -0.06388092041015625, -0.054393768310546875, -0.0449066162109375, -0.035419464111328125, -0.02593231201171875, -0.016445159912109375, -0.0069580078125, 0.002529144287109375, 0.01201629638671875, 0.021503448486328125, 0.0309906005859375, 0.040477752685546875, 0.04996490478515625, 0.059452056884765625, 0.068939208984375, 0.07842636108398438, 0.08791351318359375, 0.09740066528320312, 0.1068878173828125, 0.11637496948242188, 0.12586212158203125, 0.13534927368164062, 0.14483642578125, 0.15432357788085938, 0.16381072998046875, 0.17329788208007812, 0.1827850341796875, 0.19227218627929688, 0.20175933837890625, 0.21124649047851562, 0.220733642578125, 0.23022079467773438, 0.23970794677734375, 0.24919509887695312, 0.2586822509765625, 0.2681694030761719, 0.27765655517578125, 0.2871437072753906, 0.296630859375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 23.0, 10.0, 31.0, 39.0, 46.0, 68.0, 94.0, 110.0, 156.0, 211.0, 277.0, 393.0, 605.0, 900.0, 1302.0, 1950.0, 3174.0, 5511.0, 10693.0, 23714.0, 62998.0, 249895.0, 494759.0, 118178.0, 38043.0, 15843.0, 7559.0, 4228.0, 2566.0, 1638.0, 1029.0, 691.0, 495.0, 354.0, 272.0, 190.0, 119.0, 96.0, 68.0, 50.0, 45.0, 40.0, 23.0, 19.0, 12.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6073684692382812, -0.5872955322265625, -0.5672225952148438, -0.547149658203125, -0.5270767211914062, -0.5070037841796875, -0.48693084716796875, -0.46685791015625, -0.44678497314453125, -0.4267120361328125, -0.40663909912109375, -0.386566162109375, -0.36649322509765625, -0.3464202880859375, -0.32634735107421875, -0.3062744140625, -0.28620147705078125, -0.2661285400390625, -0.24605560302734375, -0.225982666015625, -0.20590972900390625, -0.1858367919921875, -0.16576385498046875, -0.14569091796875, -0.12561798095703125, -0.1055450439453125, -0.08547210693359375, -0.065399169921875, -0.04532623291015625, -0.0252532958984375, -0.00518035888671875, 0.014892578125, 0.03496551513671875, 0.0550384521484375, 0.07511138916015625, 0.095184326171875, 0.11525726318359375, 0.1353302001953125, 0.15540313720703125, 0.17547607421875, 0.19554901123046875, 0.2156219482421875, 0.23569488525390625, 0.255767822265625, 0.27584075927734375, 0.2959136962890625, 0.31598663330078125, 0.3360595703125, 0.35613250732421875, 0.3762054443359375, 0.39627838134765625, 0.416351318359375, 0.43642425537109375, 0.4564971923828125, 0.47657012939453125, 0.49664306640625, 0.5167160034179688, 0.5367889404296875, 0.5568618774414062, 0.576934814453125, 0.5970077514648438, 0.6170806884765625, 0.6371536254882812, 0.6572265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 7.0, 7.0, 10.0, 6.0, 12.0, 19.0, 12.0, 17.0, 31.0, 25.0, 19.0, 37.0, 37.0, 60.0, 48.0, 69.0, 78.0, 153.0, 331.0, 1363.0, 154.0, 92.0, 71.0, 55.0, 47.0, 48.0, 27.0, 33.0, 29.0, 18.0, 17.0, 20.0, 14.0, 11.0, 13.0, 10.0, 8.0, 11.0, 0.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2763671875, -1.23651123046875, -1.1966552734375, -1.15679931640625, -1.116943359375, -1.07708740234375, -1.0372314453125, -0.99737548828125, -0.95751953125, -0.91766357421875, -0.8778076171875, -0.83795166015625, -0.798095703125, -0.75823974609375, -0.7183837890625, -0.67852783203125, -0.638671875, -0.59881591796875, -0.5589599609375, -0.51910400390625, -0.479248046875, -0.43939208984375, -0.3995361328125, -0.35968017578125, -0.31982421875, -0.27996826171875, -0.2401123046875, -0.20025634765625, -0.160400390625, -0.12054443359375, -0.0806884765625, -0.04083251953125, -0.0009765625, 0.03887939453125, 0.0787353515625, 0.11859130859375, 0.158447265625, 0.19830322265625, 0.2381591796875, 0.27801513671875, 0.31787109375, 0.35772705078125, 0.3975830078125, 0.43743896484375, 0.477294921875, 0.51715087890625, 0.5570068359375, 0.59686279296875, 0.63671875, 0.67657470703125, 0.7164306640625, 0.75628662109375, 0.796142578125, 0.83599853515625, 0.8758544921875, 0.91571044921875, 0.95556640625, 0.99542236328125, 1.0352783203125, 1.07513427734375, 1.114990234375, 1.15484619140625, 1.1947021484375, 1.23455810546875, 1.2744140625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 4.0, 15.0, 10.0, 18.0, 22.0, 24.0, 39.0, 59.0, 75.0, 118.0, 191.0, 317.0, 563.0, 1054.0, 2005.0, 4598.0, 11761.0, 38292.0, 197510.0, 2332721.0, 462574.0, 63967.0, 17555.0, 6301.0, 2744.0, 1316.0, 714.0, 406.0, 244.0, 146.0, 85.0, 55.0, 49.0, 34.0, 19.0, 20.0, 12.0, 6.0, 17.0, 13.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0], "bins": [-1.69921875, -1.65289306640625, -1.6065673828125, -1.56024169921875, -1.513916015625, -1.46759033203125, -1.4212646484375, -1.37493896484375, -1.32861328125, -1.28228759765625, -1.2359619140625, -1.18963623046875, -1.143310546875, -1.09698486328125, -1.0506591796875, -1.00433349609375, -0.9580078125, -0.91168212890625, -0.8653564453125, -0.81903076171875, -0.772705078125, -0.72637939453125, -0.6800537109375, -0.63372802734375, -0.58740234375, -0.54107666015625, -0.4947509765625, -0.44842529296875, -0.402099609375, -0.35577392578125, -0.3094482421875, -0.26312255859375, -0.216796875, -0.17047119140625, -0.1241455078125, -0.07781982421875, -0.031494140625, 0.01483154296875, 0.0611572265625, 0.10748291015625, 0.15380859375, 0.20013427734375, 0.2464599609375, 0.29278564453125, 0.339111328125, 0.38543701171875, 0.4317626953125, 0.47808837890625, 0.5244140625, 0.57073974609375, 0.6170654296875, 0.66339111328125, 0.709716796875, 0.75604248046875, 0.8023681640625, 0.84869384765625, 0.89501953125, 0.94134521484375, 0.9876708984375, 1.03399658203125, 1.080322265625, 1.12664794921875, 1.1729736328125, 1.21929931640625, 1.265625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 21.0, 96.0, 237.0, 325.0, 221.0, 80.0, 20.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.742377281188965, -3.441192150115967, -3.1400067806243896, -2.8388214111328125, -2.5376362800598145, -2.2364511489868164, -1.9352657794952393, -1.634080410003662, -1.332895278930664, -1.0317100286483765, -0.7305247783660889, -0.42933952808380127, -0.12815427780151367, 0.17303097248077393, 0.4742162227630615, 0.7754015922546387, 1.0765867233276367, 1.3777719736099243, 1.678957223892212, 1.9801424741744995, 2.281327724456787, 2.582512855529785, 2.8836982250213623, 3.1848835945129395, 3.4860687255859375, 3.7872538566589355, 4.088438987731934, 4.38962459564209, 4.690809726715088, 4.991994857788086, 5.293180465698242, 5.59436559677124, 5.895550727844238, 6.196735858917236, 6.497920989990234, 6.799106597900391, 7.100291728973389, 7.401476860046387, 7.702662467956543, 8.003847122192383, 8.305032730102539, 8.606218338012695, 8.907402992248535, 9.208588600158691, 9.509773254394531, 9.810958862304688, 10.112144470214844, 10.413330078125, 10.71451473236084, 11.015700340270996, 11.316884994506836, 11.618070602416992, 11.919256210327148, 12.220440864562988, 12.521626472473145, 12.822811126708984, 13.12399673461914, 13.425182342529297, 13.726366996765137, 14.027552604675293, 14.328737258911133, 14.629922866821289, 14.931108474731445, 15.232294082641602, 15.533478736877441]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 10.0, 10.0, 12.0, 20.0, 23.0, 25.0, 24.0, 28.0, 45.0, 43.0, 46.0, 45.0, 36.0, 57.0, 44.0, 53.0, 37.0, 50.0, 54.0, 39.0, 36.0, 39.0, 31.0, 30.0, 26.0, 15.0, 22.0, 22.0, 14.0, 12.0, 12.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234470367431641, -4.096039295196533, -3.957608222961426, -3.8191771507263184, -3.680746078491211, -3.5423150062561035, -3.403883934020996, -3.2654528617858887, -3.1270217895507812, -2.988590717315674, -2.8501596450805664, -2.711728572845459, -2.5732975006103516, -2.434866428375244, -2.2964353561401367, -2.1580042839050293, -2.019573211669922, -1.8811421394348145, -1.742711067199707, -1.6042799949645996, -1.4658489227294922, -1.3274178504943848, -1.1889867782592773, -1.05055570602417, -0.9121246337890625, -0.7736935615539551, -0.6352624893188477, -0.49683141708374023, -0.3584003448486328, -0.2199692726135254, -0.08153820037841797, 0.05689287185668945, 0.19532346725463867, 0.3337545394897461, 0.4721856117248535, 0.6106166839599609, 0.7490477561950684, 0.8874788284301758, 1.0259099006652832, 1.1643409729003906, 1.302772045135498, 1.4412031173706055, 1.579634189605713, 1.7180652618408203, 1.8564963340759277, 1.9949274063110352, 2.1333584785461426, 2.27178955078125, 2.4102206230163574, 2.548651695251465, 2.6870827674865723, 2.8255138397216797, 2.963944911956787, 3.1023759841918945, 3.240807056427002, 3.3792381286621094, 3.517669200897217, 3.656100273132324, 3.7945313453674316, 3.932962417602539, 4.0713934898376465, 4.209824562072754, 4.348255634307861, 4.486686706542969, 4.625117778778076]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 1.0, 7.0, 2.0, 8.0, 17.0, 15.0, 18.0, 17.0, 16.0, 19.0, 21.0, 27.0, 25.0, 30.0, 28.0, 29.0, 33.0, 22.0, 40.0, 45.0, 32.0, 28.0, 33.0, 36.0, 48.0, 36.0, 30.0, 33.0, 20.0, 27.0, 30.0, 31.0, 27.0, 21.0, 22.0, 20.0, 13.0, 21.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-0.327392578125, -0.31749725341796875, -0.3076019287109375, -0.29770660400390625, -0.287811279296875, -0.27791595458984375, -0.2680206298828125, -0.25812530517578125, -0.24822998046875, -0.23833465576171875, -0.2284393310546875, -0.21854400634765625, -0.208648681640625, -0.19875335693359375, -0.1888580322265625, -0.17896270751953125, -0.1690673828125, -0.15917205810546875, -0.1492767333984375, -0.13938140869140625, -0.129486083984375, -0.11959075927734375, -0.1096954345703125, -0.09980010986328125, -0.08990478515625, -0.08000946044921875, -0.0701141357421875, -0.06021881103515625, -0.050323486328125, -0.04042816162109375, -0.0305328369140625, -0.02063751220703125, -0.0107421875, -0.00084686279296875, 0.0090484619140625, 0.01894378662109375, 0.028839111328125, 0.03873443603515625, 0.0486297607421875, 0.05852508544921875, 0.06842041015625, 0.07831573486328125, 0.0882110595703125, 0.09810638427734375, 0.108001708984375, 0.11789703369140625, 0.1277923583984375, 0.13768768310546875, 0.1475830078125, 0.15747833251953125, 0.1673736572265625, 0.17726898193359375, 0.187164306640625, 0.19705963134765625, 0.2069549560546875, 0.21685028076171875, 0.22674560546875, 0.23664093017578125, 0.2465362548828125, 0.25643157958984375, 0.266326904296875, 0.27622222900390625, 0.2861175537109375, 0.29601287841796875, 0.305908203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 13.0, 19.0, 27.0, 41.0, 56.0, 72.0, 92.0, 131.0, 180.0, 217.0, 318.0, 452.0, 640.0, 862.0, 1366.0, 2053.0, 3305.0, 5368.0, 9995.0, 21002.0, 54836.0, 235327.0, 1435943.0, 1940591.0, 353007.0, 73429.0, 26089.0, 11946.0, 6157.0, 3675.0, 2318.0, 1433.0, 991.0, 671.0, 500.0, 325.0, 197.0, 163.0, 112.0, 99.0, 67.0, 54.0, 37.0, 29.0, 21.0, 16.0, 10.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.69677734375, -0.6757354736328125, -0.654693603515625, -0.6336517333984375, -0.61260986328125, -0.5915679931640625, -0.570526123046875, -0.5494842529296875, -0.5284423828125, -0.5074005126953125, -0.486358642578125, -0.4653167724609375, -0.44427490234375, -0.4232330322265625, -0.402191162109375, -0.3811492919921875, -0.360107421875, -0.3390655517578125, -0.318023681640625, -0.2969818115234375, -0.27593994140625, -0.2548980712890625, -0.233856201171875, -0.2128143310546875, -0.1917724609375, -0.1707305908203125, -0.149688720703125, -0.1286468505859375, -0.10760498046875, -0.0865631103515625, -0.065521240234375, -0.0444793701171875, -0.0234375, -0.0023956298828125, 0.018646240234375, 0.0396881103515625, 0.06072998046875, 0.0817718505859375, 0.102813720703125, 0.1238555908203125, 0.1448974609375, 0.1659393310546875, 0.186981201171875, 0.2080230712890625, 0.22906494140625, 0.2501068115234375, 0.271148681640625, 0.2921905517578125, 0.313232421875, 0.3342742919921875, 0.355316162109375, 0.3763580322265625, 0.39739990234375, 0.4184417724609375, 0.439483642578125, 0.4605255126953125, 0.4815673828125, 0.5026092529296875, 0.523651123046875, 0.5446929931640625, 0.56573486328125, 0.5867767333984375, 0.607818603515625, 0.6288604736328125, 0.64990234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 7.0, 11.0, 8.0, 18.0, 21.0, 31.0, 28.0, 46.0, 49.0, 82.0, 111.0, 150.0, 230.0, 330.0, 457.0, 585.0, 551.0, 382.0, 268.0, 173.0, 122.0, 74.0, 67.0, 55.0, 41.0, 28.0, 24.0, 25.0, 15.0, 17.0, 5.0, 12.0, 9.0, 2.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.86962890625, -0.84527587890625, -0.8209228515625, -0.79656982421875, -0.772216796875, -0.74786376953125, -0.7235107421875, -0.69915771484375, -0.6748046875, -0.65045166015625, -0.6260986328125, -0.60174560546875, -0.577392578125, -0.55303955078125, -0.5286865234375, -0.50433349609375, -0.47998046875, -0.45562744140625, -0.4312744140625, -0.40692138671875, -0.382568359375, -0.35821533203125, -0.3338623046875, -0.30950927734375, -0.28515625, -0.26080322265625, -0.2364501953125, -0.21209716796875, -0.187744140625, -0.16339111328125, -0.1390380859375, -0.11468505859375, -0.09033203125, -0.06597900390625, -0.0416259765625, -0.01727294921875, 0.007080078125, 0.03143310546875, 0.0557861328125, 0.08013916015625, 0.1044921875, 0.12884521484375, 0.1531982421875, 0.17755126953125, 0.201904296875, 0.22625732421875, 0.2506103515625, 0.27496337890625, 0.29931640625, 0.32366943359375, 0.3480224609375, 0.37237548828125, 0.396728515625, 0.42108154296875, 0.4454345703125, 0.46978759765625, 0.494140625, 0.51849365234375, 0.5428466796875, 0.56719970703125, 0.591552734375, 0.61590576171875, 0.6402587890625, 0.66461181640625, 0.68896484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 21.0, 24.0, 39.0, 49.0, 58.0, 103.0, 137.0, 200.0, 276.0, 406.0, 594.0, 911.0, 1344.0, 2066.0, 3277.0, 5264.0, 9092.0, 16748.0, 34620.0, 84422.0, 268794.0, 1336688.0, 1857087.0, 375580.0, 107580.0, 42294.0, 19854.0, 10538.0, 5929.0, 3593.0, 2211.0, 1477.0, 881.0, 603.0, 437.0, 274.0, 223.0, 150.0, 119.0, 87.0, 61.0, 41.0, 33.0, 25.0, 13.0, 12.0, 8.0, 11.0, 6.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.802734375, -0.7741851806640625, -0.745635986328125, -0.7170867919921875, -0.68853759765625, -0.6599884033203125, -0.631439208984375, -0.6028900146484375, -0.5743408203125, -0.5457916259765625, -0.517242431640625, -0.4886932373046875, -0.46014404296875, -0.4315948486328125, -0.403045654296875, -0.3744964599609375, -0.345947265625, -0.3173980712890625, -0.288848876953125, -0.2602996826171875, -0.23175048828125, -0.2032012939453125, -0.174652099609375, -0.1461029052734375, -0.1175537109375, -0.0890045166015625, -0.060455322265625, -0.0319061279296875, -0.00335693359375, 0.0251922607421875, 0.053741455078125, 0.0822906494140625, 0.11083984375, 0.1393890380859375, 0.167938232421875, 0.1964874267578125, 0.22503662109375, 0.2535858154296875, 0.282135009765625, 0.3106842041015625, 0.3392333984375, 0.3677825927734375, 0.396331787109375, 0.4248809814453125, 0.45343017578125, 0.4819793701171875, 0.510528564453125, 0.5390777587890625, 0.567626953125, 0.5961761474609375, 0.624725341796875, 0.6532745361328125, 0.68182373046875, 0.7103729248046875, 0.738922119140625, 0.7674713134765625, 0.7960205078125, 0.8245697021484375, 0.853118896484375, 0.8816680908203125, 0.91021728515625, 0.9387664794921875, 0.967315673828125, 0.9958648681640625, 1.0244140625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 4.0, 8.0, 7.0, 14.0, 18.0, 17.0, 21.0, 27.0, 28.0, 38.0, 54.0, 61.0, 75.0, 82.0, 94.0, 80.0, 65.0, 61.0, 62.0, 43.0, 38.0, 19.0, 20.0, 15.0, 10.0, 11.0, 7.0, 9.0, 4.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8044469356536865, -3.6986217498779297, -3.5927963256835938, -3.486971139907837, -3.381145715713501, -3.275320529937744, -3.169495105743408, -3.0636699199676514, -2.9578447341918945, -2.8520195484161377, -2.7461941242218018, -2.640368938446045, -2.534543514251709, -2.428718328475952, -2.3228931427001953, -2.2170677185058594, -2.1112422943115234, -2.0054171085357666, -1.8995916843414307, -1.7937664985656738, -1.687941074371338, -1.582115888595581, -1.4762905836105347, -1.3704652786254883, -1.264639973640442, -1.1588146686553955, -1.0529893636703491, -0.9471641182899475, -0.8413388133049011, -0.7355135083198547, -0.6296882629394531, -0.5238629579544067, -0.41803741455078125, -0.31221210956573486, -0.20638683438301086, -0.10056155920028687, 0.0052637457847595215, 0.11108905076980591, 0.21691429615020752, 0.3227396011352539, 0.4285649061203003, 0.5343902111053467, 0.6402155160903931, 0.7460407614707947, 0.8518660664558411, 0.9576913714408875, 1.063516616821289, 1.1693419218063354, 1.2751672267913818, 1.3809925317764282, 1.4868178367614746, 1.5926430225372314, 1.6984684467315674, 1.8042936325073242, 1.9101189374923706, 2.015944242477417, 2.121769428253174, 2.2275946140289307, 2.3334200382232666, 2.4392452239990234, 2.5450706481933594, 2.650895833969116, 2.756721019744873, 2.862546443939209, 2.968371868133545]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 8.0, 9.0, 9.0, 17.0, 9.0, 16.0, 26.0, 20.0, 27.0, 24.0, 32.0, 43.0, 28.0, 50.0, 38.0, 44.0, 53.0, 42.0, 46.0, 38.0, 39.0, 41.0, 42.0, 36.0, 34.0, 36.0, 26.0, 32.0, 22.0, 21.0, 23.0, 11.0, 10.0, 10.0, 9.0, 10.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8374063968658447, -2.7450225353240967, -2.6526386737823486, -2.5602550506591797, -2.4678711891174316, -2.3754873275756836, -2.2831034660339355, -2.1907196044921875, -2.0983357429504395, -2.0059518814086914, -1.913568139076233, -1.8211842775344849, -1.7288005352020264, -1.6364166736602783, -1.5440328121185303, -1.4516489505767822, -1.3592653274536133, -1.2668814659118652, -1.1744977235794067, -1.0821138620376587, -0.9897300601005554, -0.8973462581634521, -0.8049623966217041, -0.7125785946846008, -0.6201947927474976, -0.5278109908103943, -0.43542715907096863, -0.34304332733154297, -0.2506595253944397, -0.15827572345733643, -0.06589186191558838, 0.026491940021514893, 0.11887550354003906, 0.21125932037830353, 0.303643137216568, 0.39602696895599365, 0.4884107708930969, 0.5807945728302002, 0.6731784343719482, 0.7655622363090515, 0.8579460382461548, 0.9503298401832581, 1.0427136421203613, 1.1350975036621094, 1.2274813652038574, 1.319865107536316, 1.412248969078064, 1.5046327114105225, 1.5970165729522705, 1.6894004344940186, 1.781784176826477, 1.874168038368225, 1.9665517807006836, 2.0589356422424316, 2.1513195037841797, 2.2437033653259277, 2.336087226867676, 2.428471088409424, 2.520854949951172, 2.61323881149292, 2.705622434616089, 2.798006296157837, 2.890390157699585, 2.982774019241333, 3.075157642364502]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 9.0, 12.0, 17.0, 25.0, 28.0, 20.0, 22.0, 24.0, 16.0, 29.0, 47.0, 35.0, 45.0, 35.0, 46.0, 33.0, 31.0, 46.0, 39.0, 31.0, 38.0, 35.0, 33.0, 33.0, 20.0, 32.0, 34.0, 21.0, 19.0, 20.0, 21.0, 21.0, 16.0, 8.0, 11.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.32958984375, -0.31854248046875, -0.3074951171875, -0.29644775390625, -0.285400390625, -0.27435302734375, -0.2633056640625, -0.25225830078125, -0.2412109375, -0.23016357421875, -0.2191162109375, -0.20806884765625, -0.197021484375, -0.18597412109375, -0.1749267578125, -0.16387939453125, -0.15283203125, -0.14178466796875, -0.1307373046875, -0.11968994140625, -0.108642578125, -0.09759521484375, -0.0865478515625, -0.07550048828125, -0.064453125, -0.05340576171875, -0.0423583984375, -0.03131103515625, -0.020263671875, -0.00921630859375, 0.0018310546875, 0.01287841796875, 0.02392578125, 0.03497314453125, 0.0460205078125, 0.05706787109375, 0.068115234375, 0.07916259765625, 0.0902099609375, 0.10125732421875, 0.1123046875, 0.12335205078125, 0.1343994140625, 0.14544677734375, 0.156494140625, 0.16754150390625, 0.1785888671875, 0.18963623046875, 0.20068359375, 0.21173095703125, 0.2227783203125, 0.23382568359375, 0.244873046875, 0.25592041015625, 0.2669677734375, 0.27801513671875, 0.2890625, 0.30010986328125, 0.3111572265625, 0.32220458984375, 0.333251953125, 0.34429931640625, 0.3553466796875, 0.36639404296875, 0.37744140625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 9.0, 10.0, 11.0, 18.0, 30.0, 30.0, 41.0, 76.0, 109.0, 124.0, 216.0, 320.0, 457.0, 661.0, 984.0, 1459.0, 2131.0, 3024.0, 4611.0, 6871.0, 10243.0, 15330.0, 22498.0, 33574.0, 49568.0, 70942.0, 96445.0, 120810.0, 133352.0, 126026.0, 103016.0, 76659.0, 54849.0, 37310.0, 25006.0, 16970.0, 11381.0, 7587.0, 5101.0, 3318.0, 2291.0, 1625.0, 1107.0, 740.0, 485.0, 362.0, 237.0, 163.0, 118.0, 86.0, 55.0, 34.0, 30.0, 25.0, 16.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.260498046875, -0.2522621154785156, -0.24402618408203125, -0.23579025268554688, -0.2275543212890625, -0.21931838989257812, -0.21108245849609375, -0.20284652709960938, -0.194610595703125, -0.18637466430664062, -0.17813873291015625, -0.16990280151367188, -0.1616668701171875, -0.15343093872070312, -0.14519500732421875, -0.13695907592773438, -0.12872314453125, -0.12048721313476562, -0.11225128173828125, -0.10401535034179688, -0.0957794189453125, -0.08754348754882812, -0.07930755615234375, -0.07107162475585938, -0.062835693359375, -0.054599761962890625, -0.04636383056640625, -0.038127899169921875, -0.0298919677734375, -0.021656036376953125, -0.01342010498046875, -0.005184173583984375, 0.0030517578125, 0.011287689208984375, 0.01952362060546875, 0.027759552001953125, 0.0359954833984375, 0.044231414794921875, 0.05246734619140625, 0.060703277587890625, 0.068939208984375, 0.07717514038085938, 0.08541107177734375, 0.09364700317382812, 0.1018829345703125, 0.11011886596679688, 0.11835479736328125, 0.12659072875976562, 0.13482666015625, 0.14306259155273438, 0.15129852294921875, 0.15953445434570312, 0.1677703857421875, 0.17600631713867188, 0.18424224853515625, 0.19247817993164062, 0.200714111328125, 0.20895004272460938, 0.21718597412109375, 0.22542190551757812, 0.2336578369140625, 0.24189376831054688, 0.25012969970703125, 0.2583656311035156, 0.2666015625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 12.0, 13.0, 3.0, 11.0, 15.0, 23.0, 14.0, 22.0, 16.0, 28.0, 30.0, 32.0, 28.0, 36.0, 38.0, 32.0, 30.0, 25.0, 41.0, 1072.0, 29.0, 36.0, 35.0, 34.0, 43.0, 33.0, 26.0, 33.0, 25.0, 21.0, 36.0, 28.0, 16.0, 19.0, 17.0, 8.0, 12.0, 4.0, 12.0, 4.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.330078125, -0.3206024169921875, -0.311126708984375, -0.3016510009765625, -0.29217529296875, -0.2826995849609375, -0.273223876953125, -0.2637481689453125, -0.2542724609375, -0.2447967529296875, -0.235321044921875, -0.2258453369140625, -0.21636962890625, -0.2068939208984375, -0.197418212890625, -0.1879425048828125, -0.178466796875, -0.1689910888671875, -0.159515380859375, -0.1500396728515625, -0.14056396484375, -0.1310882568359375, -0.121612548828125, -0.1121368408203125, -0.1026611328125, -0.0931854248046875, -0.083709716796875, -0.0742340087890625, -0.06475830078125, -0.0552825927734375, -0.045806884765625, -0.0363311767578125, -0.02685546875, -0.0173797607421875, -0.007904052734375, 0.0015716552734375, 0.01104736328125, 0.0205230712890625, 0.029998779296875, 0.0394744873046875, 0.0489501953125, 0.0584259033203125, 0.067901611328125, 0.0773773193359375, 0.08685302734375, 0.0963287353515625, 0.105804443359375, 0.1152801513671875, 0.124755859375, 0.1342315673828125, 0.143707275390625, 0.1531829833984375, 0.16265869140625, 0.1721343994140625, 0.181610107421875, 0.1910858154296875, 0.2005615234375, 0.2100372314453125, 0.219512939453125, 0.2289886474609375, 0.23846435546875, 0.2479400634765625, 0.257415771484375, 0.2668914794921875, 0.2763671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 13.0, 10.0, 11.0, 28.0, 29.0, 56.0, 70.0, 121.0, 218.0, 296.0, 523.0, 825.0, 1396.0, 2226.0, 3833.0, 6785.0, 12353.0, 24304.0, 62333.0, 1447408.0, 439103.0, 48804.0, 20980.0, 10806.0, 6010.0, 3474.0, 1961.0, 1230.0, 689.0, 458.0, 289.0, 155.0, 105.0, 81.0, 61.0, 28.0, 20.0, 10.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58984375, -0.5729408264160156, -0.5560379028320312, -0.5391349792480469, -0.5222320556640625, -0.5053291320800781, -0.48842620849609375, -0.4715232849121094, -0.454620361328125, -0.4377174377441406, -0.42081451416015625, -0.4039115905761719, -0.3870086669921875, -0.3701057434082031, -0.35320281982421875, -0.3362998962402344, -0.31939697265625, -0.3024940490722656, -0.28559112548828125, -0.2686882019042969, -0.2517852783203125, -0.23488235473632812, -0.21797943115234375, -0.20107650756835938, -0.184173583984375, -0.16727066040039062, -0.15036773681640625, -0.13346481323242188, -0.1165618896484375, -0.09965896606445312, -0.08275604248046875, -0.06585311889648438, -0.0489501953125, -0.032047271728515625, -0.01514434814453125, 0.001758575439453125, 0.0186614990234375, 0.035564422607421875, 0.05246734619140625, 0.06937026977539062, 0.086273193359375, 0.10317611694335938, 0.12007904052734375, 0.13698196411132812, 0.1538848876953125, 0.17078781127929688, 0.18769073486328125, 0.20459365844726562, 0.22149658203125, 0.23839950561523438, 0.25530242919921875, 0.2722053527832031, 0.2891082763671875, 0.3060111999511719, 0.32291412353515625, 0.3398170471191406, 0.356719970703125, 0.3736228942871094, 0.39052581787109375, 0.4074287414550781, 0.4243316650390625, 0.4412345886230469, 0.45813751220703125, 0.4750404357910156, 0.491943359375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 4.0, 13.0, 8.0, 16.0, 28.0, 19.0, 40.0, 58.0, 56.0, 77.0, 96.0, 112.0, 87.0, 78.0, 61.0, 47.0, 30.0, 30.0, 19.0, 16.0, 19.0, 20.0, 13.0, 3.0, 7.0, 5.0, 1.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07561397552490234, -0.07334709167480469, -0.07108020782470703, -0.06881332397460938, -0.06654644012451172, -0.06427955627441406, -0.062012672424316406, -0.05974578857421875, -0.057478904724121094, -0.05521202087402344, -0.05294513702392578, -0.050678253173828125, -0.04841136932373047, -0.04614448547363281, -0.043877601623535156, -0.0416107177734375, -0.039343833923339844, -0.03707695007324219, -0.03481006622314453, -0.032543182373046875, -0.03027629852294922, -0.028009414672851562, -0.025742530822753906, -0.02347564697265625, -0.021208763122558594, -0.018941879272460938, -0.01667499542236328, -0.014408111572265625, -0.012141227722167969, -0.009874343872070312, -0.007607460021972656, -0.005340576171875, -0.0030736923217773438, -0.0008068084716796875, 0.0014600753784179688, 0.003726959228515625, 0.005993843078613281, 0.008260726928710938, 0.010527610778808594, 0.01279449462890625, 0.015061378479003906, 0.017328262329101562, 0.01959514617919922, 0.021862030029296875, 0.02412891387939453, 0.026395797729492188, 0.028662681579589844, 0.0309295654296875, 0.033196449279785156, 0.03546333312988281, 0.03773021697998047, 0.039997100830078125, 0.04226398468017578, 0.04453086853027344, 0.046797752380371094, 0.04906463623046875, 0.051331520080566406, 0.05359840393066406, 0.05586528778076172, 0.058132171630859375, 0.06039905548095703, 0.06266593933105469, 0.06493282318115234, 0.06719970703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 10.0, 2.0, 7.0, 5.0, 12.0, 8.0, 17.0, 37.0, 40.0, 45.0, 62.0, 83.0, 161.0, 270.0, 728.0, 1899.0, 7547.0, 71734.0, 866903.0, 87135.0, 8283.0, 1976.0, 711.0, 323.0, 164.0, 80.0, 89.0, 57.0, 35.0, 26.0, 15.0, 20.0, 19.0, 13.0, 8.0, 5.0, 2.0, 5.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78564453125, -0.7590408325195312, -0.7324371337890625, -0.7058334350585938, -0.679229736328125, -0.6526260375976562, -0.6260223388671875, -0.5994186401367188, -0.57281494140625, -0.5462112426757812, -0.5196075439453125, -0.49300384521484375, -0.466400146484375, -0.43979644775390625, -0.4131927490234375, -0.38658905029296875, -0.3599853515625, -0.33338165283203125, -0.3067779541015625, -0.28017425537109375, -0.253570556640625, -0.22696685791015625, -0.2003631591796875, -0.17375946044921875, -0.14715576171875, -0.12055206298828125, -0.0939483642578125, -0.06734466552734375, -0.040740966796875, -0.01413726806640625, 0.0124664306640625, 0.03907012939453125, 0.065673828125, 0.09227752685546875, 0.1188812255859375, 0.14548492431640625, 0.172088623046875, 0.19869232177734375, 0.2252960205078125, 0.25189971923828125, 0.27850341796875, 0.30510711669921875, 0.3317108154296875, 0.35831451416015625, 0.384918212890625, 0.41152191162109375, 0.4381256103515625, 0.46472930908203125, 0.4913330078125, 0.5179367065429688, 0.5445404052734375, 0.5711441040039062, 0.597747802734375, 0.6243515014648438, 0.6509552001953125, 0.6775588989257812, 0.70416259765625, 0.7307662963867188, 0.7573699951171875, 0.7839736938476562, 0.810577392578125, 0.8371810913085938, 0.8637847900390625, 0.8903884887695312, 0.9169921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 42.0, 156.0, 485.0, 226.0, 69.0, 17.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1127192974090576, -1.0562002658843994, -0.999681293964386, -0.9431622624397278, -0.8866432905197144, -0.8301242589950562, -0.773605227470398, -0.7170861959457397, -0.6605672240257263, -0.6040481925010681, -0.5475292205810547, -0.4910101890563965, -0.43449118733406067, -0.37797218561172485, -0.32145315408706665, -0.26493415236473083, -0.20841515064239502, -0.1518961489200592, -0.0953771322965622, -0.038858115673065186, 0.01766088604927063, 0.07417988777160645, 0.13069891929626465, 0.18721792101860046, 0.24373692274093628, 0.3002559244632721, 0.3567749261856079, 0.4132939577102661, 0.46981295943260193, 0.5263319611549377, 0.582850992679596, 0.6393699645996094, 0.6958889961242676, 0.7524080276489258, 0.8089269995689392, 0.8654460310935974, 0.9219650030136108, 0.978484034538269, 1.0350030660629272, 1.0915220975875854, 1.148041009902954, 1.2045600414276123, 1.2610790729522705, 1.3175981044769287, 1.3741170167922974, 1.4306360483169556, 1.4871550798416138, 1.543674111366272, 1.6001931428909302, 1.6567121744155884, 1.7132312059402466, 1.7697501182556152, 1.8262691497802734, 1.8827881813049316, 1.9393072128295898, 1.995826244354248, 2.0523452758789062, 2.1088643074035645, 2.1653833389282227, 2.221902370452881, 2.278421401977539, 2.3349404335021973, 2.3914594650268555, 2.4479782581329346, 2.5044972896575928]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 12.0, 6.0, 6.0, 14.0, 12.0, 22.0, 19.0, 23.0, 22.0, 39.0, 33.0, 37.0, 29.0, 42.0, 48.0, 47.0, 43.0, 41.0, 43.0, 49.0, 54.0, 48.0, 41.0, 33.0, 30.0, 27.0, 27.0, 29.0, 20.0, 18.0, 15.0, 17.0, 8.0, 15.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26642632484436035, -0.2575271427631378, -0.24862797558307648, -0.23972879350185394, -0.2308296114206314, -0.22193044424057007, -0.21303126215934753, -0.204132080078125, -0.19523289799690247, -0.18633371591567993, -0.1774345487356186, -0.16853536665439606, -0.15963618457317352, -0.15073701739311218, -0.14183783531188965, -0.13293865323066711, -0.12403948605060577, -0.11514031141996384, -0.1062411293387413, -0.09734195470809937, -0.08844277262687683, -0.0795435979962349, -0.07064442336559296, -0.06174524500966072, -0.052846066653728485, -0.04394688829779625, -0.035047709941864014, -0.026148535311222076, -0.01724935695528984, -0.008350178599357605, 0.0005489960312843323, 0.009448174387216568, 0.018347352743148804, 0.02724653109908104, 0.036145709455013275, 0.04504488408565521, 0.05394406244158745, 0.06284324079751968, 0.07174241542816162, 0.08064159750938416, 0.08954077214002609, 0.09843994677066803, 0.10733912885189056, 0.1162383034825325, 0.12513747811317444, 0.13403666019439697, 0.1429358422756195, 0.15183500945568085, 0.16073419153690338, 0.16963337361812592, 0.17853254079818726, 0.1874317228794098, 0.19633090496063232, 0.20523008704185486, 0.2141292542219162, 0.22302843630313873, 0.23192760348320007, 0.2408267855644226, 0.24972595274448395, 0.2586251497268677, 0.2675243020057678, 0.27642348408699036, 0.2853226661682129, 0.2942218482494354, 0.30312103033065796]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 14.0, 9.0, 18.0, 26.0, 27.0, 18.0, 25.0, 19.0, 25.0, 31.0, 37.0, 42.0, 33.0, 49.0, 52.0, 26.0, 37.0, 42.0, 45.0, 37.0, 32.0, 32.0, 29.0, 36.0, 32.0, 31.0, 21.0, 16.0, 28.0, 11.0, 26.0, 19.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3486328125, -0.33722686767578125, -0.3258209228515625, -0.31441497802734375, -0.303009033203125, -0.29160308837890625, -0.2801971435546875, -0.26879119873046875, -0.25738525390625, -0.24597930908203125, -0.2345733642578125, -0.22316741943359375, -0.211761474609375, -0.20035552978515625, -0.1889495849609375, -0.17754364013671875, -0.1661376953125, -0.15473175048828125, -0.1433258056640625, -0.13191986083984375, -0.120513916015625, -0.10910797119140625, -0.0977020263671875, -0.08629608154296875, -0.07489013671875, -0.06348419189453125, -0.0520782470703125, -0.04067230224609375, -0.029266357421875, -0.01786041259765625, -0.0064544677734375, 0.00495147705078125, 0.016357421875, 0.02776336669921875, 0.0391693115234375, 0.05057525634765625, 0.061981201171875, 0.07338714599609375, 0.0847930908203125, 0.09619903564453125, 0.10760498046875, 0.11901092529296875, 0.1304168701171875, 0.14182281494140625, 0.153228759765625, 0.16463470458984375, 0.1760406494140625, 0.18744659423828125, 0.1988525390625, 0.21025848388671875, 0.2216644287109375, 0.23307037353515625, 0.244476318359375, 0.25588226318359375, 0.2672882080078125, 0.27869415283203125, 0.29010009765625, 0.30150604248046875, 0.3129119873046875, 0.32431793212890625, 0.335723876953125, 0.34712982177734375, 0.3585357666015625, 0.36994171142578125, 0.38134765625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 5.0, 8.0, 20.0, 21.0, 37.0, 59.0, 68.0, 95.0, 134.0, 201.0, 343.0, 513.0, 768.0, 1183.0, 2079.0, 3439.0, 6335.0, 11980.0, 23686.0, 51480.0, 130078.0, 487120.0, 195220.0, 69525.0, 30680.0, 14872.0, 7773.0, 4239.0, 2523.0, 1449.0, 858.0, 585.0, 378.0, 252.0, 191.0, 116.0, 74.0, 47.0, 39.0, 26.0, 22.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.712890625, -0.691070556640625, -0.66925048828125, -0.647430419921875, -0.6256103515625, -0.603790283203125, -0.58197021484375, -0.560150146484375, -0.538330078125, -0.516510009765625, -0.49468994140625, -0.472869873046875, -0.4510498046875, -0.429229736328125, -0.40740966796875, -0.385589599609375, -0.36376953125, -0.341949462890625, -0.32012939453125, -0.298309326171875, -0.2764892578125, -0.254669189453125, -0.23284912109375, -0.211029052734375, -0.189208984375, -0.167388916015625, -0.14556884765625, -0.123748779296875, -0.1019287109375, -0.080108642578125, -0.05828857421875, -0.036468505859375, -0.0146484375, 0.007171630859375, 0.02899169921875, 0.050811767578125, 0.0726318359375, 0.094451904296875, 0.11627197265625, 0.138092041015625, 0.159912109375, 0.181732177734375, 0.20355224609375, 0.225372314453125, 0.2471923828125, 0.269012451171875, 0.29083251953125, 0.312652587890625, 0.33447265625, 0.356292724609375, 0.37811279296875, 0.399932861328125, 0.4217529296875, 0.443572998046875, 0.46539306640625, 0.487213134765625, 0.509033203125, 0.530853271484375, 0.55267333984375, 0.574493408203125, 0.5963134765625, 0.618133544921875, 0.63995361328125, 0.661773681640625, 0.68359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 4.0, 3.0, 11.0, 10.0, 13.0, 24.0, 18.0, 19.0, 23.0, 29.0, 34.0, 34.0, 36.0, 41.0, 47.0, 61.0, 89.0, 131.0, 1418.0, 346.0, 153.0, 76.0, 50.0, 46.0, 45.0, 37.0, 42.0, 26.0, 27.0, 28.0, 17.0, 21.0, 15.0, 14.0, 10.0, 10.0, 8.0, 8.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.48828125, -1.445709228515625, -1.40313720703125, -1.360565185546875, -1.3179931640625, -1.275421142578125, -1.23284912109375, -1.190277099609375, -1.147705078125, -1.105133056640625, -1.06256103515625, -1.019989013671875, -0.9774169921875, -0.934844970703125, -0.89227294921875, -0.849700927734375, -0.80712890625, -0.764556884765625, -0.72198486328125, -0.679412841796875, -0.6368408203125, -0.594268798828125, -0.55169677734375, -0.509124755859375, -0.466552734375, -0.423980712890625, -0.38140869140625, -0.338836669921875, -0.2962646484375, -0.253692626953125, -0.21112060546875, -0.168548583984375, -0.1259765625, -0.083404541015625, -0.04083251953125, 0.001739501953125, 0.0443115234375, 0.086883544921875, 0.12945556640625, 0.172027587890625, 0.214599609375, 0.257171630859375, 0.29974365234375, 0.342315673828125, 0.3848876953125, 0.427459716796875, 0.47003173828125, 0.512603759765625, 0.55517578125, 0.597747802734375, 0.64031982421875, 0.682891845703125, 0.7254638671875, 0.768035888671875, 0.81060791015625, 0.853179931640625, 0.895751953125, 0.938323974609375, 0.98089599609375, 1.023468017578125, 1.0660400390625, 1.108612060546875, 1.15118408203125, 1.193756103515625, 1.236328125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 7.0, 11.0, 19.0, 24.0, 34.0, 58.0, 107.0, 207.0, 356.0, 859.0, 2934.0, 18481.0, 428938.0, 2640898.0, 45308.0, 5162.0, 1258.0, 486.0, 209.0, 127.0, 68.0, 53.0, 38.0, 22.0, 10.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0, -2.897186279296875, -2.79437255859375, -2.691558837890625, -2.5887451171875, -2.485931396484375, -2.38311767578125, -2.280303955078125, -2.177490234375, -2.074676513671875, -1.97186279296875, -1.869049072265625, -1.7662353515625, -1.663421630859375, -1.56060791015625, -1.457794189453125, -1.35498046875, -1.252166748046875, -1.14935302734375, -1.046539306640625, -0.9437255859375, -0.840911865234375, -0.73809814453125, -0.635284423828125, -0.532470703125, -0.429656982421875, -0.32684326171875, -0.224029541015625, -0.1212158203125, -0.018402099609375, 0.08441162109375, 0.187225341796875, 0.2900390625, 0.392852783203125, 0.49566650390625, 0.598480224609375, 0.7012939453125, 0.804107666015625, 0.90692138671875, 1.009735107421875, 1.112548828125, 1.215362548828125, 1.31817626953125, 1.420989990234375, 1.5238037109375, 1.626617431640625, 1.72943115234375, 1.832244873046875, 1.93505859375, 2.037872314453125, 2.14068603515625, 2.243499755859375, 2.3463134765625, 2.449127197265625, 2.55194091796875, 2.654754638671875, 2.757568359375, 2.860382080078125, 2.96319580078125, 3.066009521484375, 3.1688232421875, 3.271636962890625, 3.37445068359375, 3.477264404296875, 3.580078125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [228.0, 791.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8141976594924927, -0.2801560163497925, 1.2538856267929077, 2.7879276275634766, 4.321969032287598, 5.856010437011719, 7.390052795410156, 8.924094200134277, 10.458135604858398, 11.99217700958252, 13.52621841430664, 15.060260772705078, 16.594303131103516, 18.12834358215332, 19.662385940551758, 21.196426391601562, 22.73046875, 24.264511108398438, 25.798551559448242, 27.33259391784668, 28.866634368896484, 30.400676727294922, 31.93471908569336, 33.4687614440918, 35.00279998779297, 36.536842346191406, 38.070884704589844, 39.60492706298828, 41.13896560668945, 42.67300796508789, 44.20705032348633, 45.741092681884766, 47.27513122558594, 48.809173583984375, 50.34321594238281, 51.87725830078125, 53.41129684448242, 54.94533920288086, 56.4793815612793, 58.013423919677734, 59.547462463378906, 61.081504821777344, 62.61554718017578, 64.14958953857422, 65.68363189697266, 67.21766662597656, 68.751708984375, 70.28575134277344, 71.81979370117188, 73.35383605957031, 74.88787841796875, 76.42192077636719, 77.95596313476562, 79.49000549316406, 81.0240478515625, 82.5580825805664, 84.09213256835938, 85.62617492675781, 87.16021728515625, 88.69425964355469, 90.22830200195312, 91.76234436035156, 93.29638671875, 94.8304214477539, 96.36446380615234]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 10.0, 10.0, 7.0, 8.0, 15.0, 7.0, 14.0, 25.0, 17.0, 15.0, 38.0, 31.0, 26.0, 61.0, 38.0, 31.0, 44.0, 35.0, 41.0, 51.0, 43.0, 51.0, 48.0, 37.0, 32.0, 38.0, 36.0, 29.0, 28.0, 24.0, 17.0, 24.0, 15.0, 12.0, 12.0, 10.0, 6.0, 2.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.199450969696045, -4.0646586418151855, -3.929866075515747, -3.7950735092163086, -3.660281181335449, -3.52548885345459, -3.3906962871551514, -3.255903720855713, -3.1211113929748535, -2.986319065093994, -2.8515264987945557, -2.716733932495117, -2.581941604614258, -2.4471492767333984, -2.31235671043396, -2.1775641441345215, -2.042771816253662, -1.9079793691635132, -1.7731869220733643, -1.6383944749832153, -1.5036020278930664, -1.3688095808029175, -1.2340171337127686, -1.0992246866226196, -0.9644322395324707, -0.8296397924423218, -0.6948473453521729, -0.5600548982620239, -0.425262451171875, -0.2904700040817261, -0.15567755699157715, -0.020885109901428223, 0.1139073371887207, 0.24869978427886963, 0.38349223136901855, 0.5182846784591675, 0.6530771255493164, 0.7878695726394653, 0.9226620197296143, 1.0574544668197632, 1.192246913909912, 1.327039361000061, 1.46183180809021, 1.5966242551803589, 1.7314167022705078, 1.8662091493606567, 2.0010015964508057, 2.135794162750244, 2.2705864906311035, 2.405378818511963, 2.5401713848114014, 2.67496395111084, 2.809756278991699, 2.9445486068725586, 3.079341173171997, 3.2141337394714355, 3.348926067352295, 3.4837183952331543, 3.6185109615325928, 3.7533035278320312, 3.8880958557128906, 4.02288818359375, 4.157680511474609, 4.292473316192627, 4.427265644073486]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 3.0, 5.0, 5.0, 8.0, 16.0, 13.0, 13.0, 16.0, 18.0, 18.0, 11.0, 30.0, 28.0, 29.0, 48.0, 27.0, 40.0, 38.0, 45.0, 32.0, 41.0, 39.0, 43.0, 43.0, 35.0, 36.0, 26.0, 37.0, 32.0, 28.0, 17.0, 18.0, 21.0, 21.0, 31.0, 23.0, 11.0, 8.0, 10.0, 9.0, 6.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35107421875, -0.33951568603515625, -0.3279571533203125, -0.31639862060546875, -0.304840087890625, -0.29328155517578125, -0.2817230224609375, -0.27016448974609375, -0.25860595703125, -0.24704742431640625, -0.2354888916015625, -0.22393035888671875, -0.212371826171875, -0.20081329345703125, -0.1892547607421875, -0.17769622802734375, -0.1661376953125, -0.15457916259765625, -0.1430206298828125, -0.13146209716796875, -0.119903564453125, -0.10834503173828125, -0.0967864990234375, -0.08522796630859375, -0.07366943359375, -0.06211090087890625, -0.0505523681640625, -0.03899383544921875, -0.027435302734375, -0.01587677001953125, -0.0043182373046875, 0.00724029541015625, 0.018798828125, 0.03035736083984375, 0.0419158935546875, 0.05347442626953125, 0.065032958984375, 0.07659149169921875, 0.0881500244140625, 0.09970855712890625, 0.11126708984375, 0.12282562255859375, 0.1343841552734375, 0.14594268798828125, 0.157501220703125, 0.16905975341796875, 0.1806182861328125, 0.19217681884765625, 0.2037353515625, 0.21529388427734375, 0.2268524169921875, 0.23841094970703125, 0.249969482421875, 0.26152801513671875, 0.2730865478515625, 0.28464508056640625, 0.29620361328125, 0.30776214599609375, 0.3193206787109375, 0.33087921142578125, 0.342437744140625, 0.35399627685546875, 0.3655548095703125, 0.37711334228515625, 0.388671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 11.0, 12.0, 28.0, 33.0, 41.0, 68.0, 89.0, 130.0, 158.0, 247.0, 348.0, 519.0, 668.0, 1006.0, 1484.0, 2357.0, 3826.0, 6762.0, 13905.0, 32563.0, 108249.0, 641166.0, 2389845.0, 790839.0, 128098.0, 36934.0, 15504.0, 7613.0, 4181.0, 2522.0, 1596.0, 1060.0, 693.0, 542.0, 319.0, 239.0, 177.0, 121.0, 93.0, 65.0, 54.0, 31.0, 17.0, 19.0, 14.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7724609375, -0.7487335205078125, -0.725006103515625, -0.7012786865234375, -0.67755126953125, -0.6538238525390625, -0.630096435546875, -0.6063690185546875, -0.5826416015625, -0.5589141845703125, -0.535186767578125, -0.5114593505859375, -0.48773193359375, -0.4640045166015625, -0.440277099609375, -0.4165496826171875, -0.392822265625, -0.3690948486328125, -0.345367431640625, -0.3216400146484375, -0.29791259765625, -0.2741851806640625, -0.250457763671875, -0.2267303466796875, -0.2030029296875, -0.1792755126953125, -0.155548095703125, -0.1318206787109375, -0.10809326171875, -0.0843658447265625, -0.060638427734375, -0.0369110107421875, -0.01318359375, 0.0105438232421875, 0.034271240234375, 0.0579986572265625, 0.08172607421875, 0.1054534912109375, 0.129180908203125, 0.1529083251953125, 0.1766357421875, 0.2003631591796875, 0.224090576171875, 0.2478179931640625, 0.27154541015625, 0.2952728271484375, 0.319000244140625, 0.3427276611328125, 0.366455078125, 0.3901824951171875, 0.413909912109375, 0.4376373291015625, 0.46136474609375, 0.4850921630859375, 0.508819580078125, 0.5325469970703125, 0.5562744140625, 0.5800018310546875, 0.603729248046875, 0.6274566650390625, 0.65118408203125, 0.6749114990234375, 0.698638916015625, 0.7223663330078125, 0.74609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 10.0, 7.0, 9.0, 24.0, 26.0, 35.0, 38.0, 62.0, 77.0, 133.0, 194.0, 304.0, 502.0, 645.0, 626.0, 475.0, 278.0, 176.0, 112.0, 79.0, 69.0, 49.0, 29.0, 17.0, 23.0, 12.0, 11.0, 7.0, 10.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9867095947265625, -0.954864501953125, -0.9230194091796875, -0.89117431640625, -0.8593292236328125, -0.827484130859375, -0.7956390380859375, -0.7637939453125, -0.7319488525390625, -0.700103759765625, -0.6682586669921875, -0.63641357421875, -0.6045684814453125, -0.572723388671875, -0.5408782958984375, -0.509033203125, -0.4771881103515625, -0.445343017578125, -0.4134979248046875, -0.38165283203125, -0.3498077392578125, -0.317962646484375, -0.2861175537109375, -0.2542724609375, -0.2224273681640625, -0.190582275390625, -0.1587371826171875, -0.12689208984375, -0.0950469970703125, -0.063201904296875, -0.0313568115234375, 0.00048828125, 0.0323333740234375, 0.064178466796875, 0.0960235595703125, 0.12786865234375, 0.1597137451171875, 0.191558837890625, 0.2234039306640625, 0.2552490234375, 0.2870941162109375, 0.318939208984375, 0.3507843017578125, 0.38262939453125, 0.4144744873046875, 0.446319580078125, 0.4781646728515625, 0.510009765625, 0.5418548583984375, 0.573699951171875, 0.6055450439453125, 0.63739013671875, 0.6692352294921875, 0.701080322265625, 0.7329254150390625, 0.7647705078125, 0.7966156005859375, 0.828460693359375, 0.8603057861328125, 0.89215087890625, 0.9239959716796875, 0.955841064453125, 0.9876861572265625, 1.01953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 5.0, 14.0, 21.0, 30.0, 43.0, 65.0, 91.0, 114.0, 155.0, 226.0, 364.0, 514.0, 750.0, 1088.0, 1570.0, 2504.0, 3868.0, 6303.0, 10985.0, 20908.0, 45435.0, 119831.0, 458335.0, 2124661.0, 1046342.0, 213895.0, 69599.0, 29756.0, 14719.0, 8048.0, 4802.0, 3103.0, 1913.0, 1285.0, 872.0, 617.0, 452.0, 304.0, 202.0, 157.0, 104.0, 66.0, 51.0, 30.0, 24.0, 18.0, 12.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.9775390625, -0.9467391967773438, -0.9159393310546875, -0.8851394653320312, -0.854339599609375, -0.8235397338867188, -0.7927398681640625, -0.7619400024414062, -0.73114013671875, -0.7003402709960938, -0.6695404052734375, -0.6387405395507812, -0.607940673828125, -0.5771408081054688, -0.5463409423828125, -0.5155410766601562, -0.4847412109375, -0.45394134521484375, -0.4231414794921875, -0.39234161376953125, -0.361541748046875, -0.33074188232421875, -0.2999420166015625, -0.26914215087890625, -0.23834228515625, -0.20754241943359375, -0.1767425537109375, -0.14594268798828125, -0.115142822265625, -0.08434295654296875, -0.0535430908203125, -0.02274322509765625, 0.008056640625, 0.03885650634765625, 0.0696563720703125, 0.10045623779296875, 0.131256103515625, 0.16205596923828125, 0.1928558349609375, 0.22365570068359375, 0.25445556640625, 0.28525543212890625, 0.3160552978515625, 0.34685516357421875, 0.377655029296875, 0.40845489501953125, 0.4392547607421875, 0.47005462646484375, 0.5008544921875, 0.5316543579101562, 0.5624542236328125, 0.5932540893554688, 0.624053955078125, 0.6548538208007812, 0.6856536865234375, 0.7164535522460938, 0.74725341796875, 0.7780532836914062, 0.8088531494140625, 0.8396530151367188, 0.870452880859375, 0.9012527465820312, 0.9320526123046875, 0.9628524780273438, 0.99365234375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 19.0, 60.0, 115.0, 224.0, 270.0, 160.0, 83.0, 48.0, 17.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.587477207183838, -6.205594062805176, -5.823710918426514, -5.441827774047852, -5.0599446296691895, -4.678061485290527, -4.296178817749023, -3.9142954349517822, -3.53241229057312, -3.150529146194458, -2.768646001815796, -2.386763095855713, -2.004879951477051, -1.6229966878890991, -1.2411136627197266, -0.8592305183410645, -0.47734737396240234, -0.09546425938606262, 0.2864188551902771, 0.6683019399642944, 1.0501850843429565, 1.4320682287216187, 1.8139512538909912, 2.1958343982696533, 2.5777175426483154, 2.9596006870269775, 3.3414838314056396, 3.7233667373657227, 4.105249881744385, 4.487133026123047, 4.869016170501709, 5.250899314880371, 5.632782936096191, 6.0146660804748535, 6.396549224853516, 6.778432369232178, 7.16031551361084, 7.542198657989502, 7.924081802368164, 8.305964469909668, 8.687848091125488, 9.069730758666992, 9.451614379882812, 9.833497047424316, 10.215380668640137, 10.59726333618164, 10.979146957397461, 11.361029624938965, 11.742912292480469, 12.124794960021973, 12.506678581237793, 12.888561248779297, 13.270444869995117, 13.652327537536621, 14.034211158752441, 14.416093826293945, 14.797977447509766, 15.17986011505127, 15.56174373626709, 15.943626403808594, 16.325510025024414, 16.707393646240234, 17.089275360107422, 17.471158981323242, 17.853042602539062]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 9.0, 13.0, 6.0, 12.0, 21.0, 26.0, 20.0, 29.0, 28.0, 25.0, 31.0, 40.0, 46.0, 48.0, 43.0, 45.0, 49.0, 46.0, 51.0, 42.0, 45.0, 39.0, 35.0, 26.0, 32.0, 26.0, 21.0, 30.0, 22.0, 14.0, 17.0, 12.0, 13.0, 5.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.582629680633545, -3.478682041168213, -3.3747341632843018, -3.2707865238189697, -3.1668388843536377, -3.0628910064697266, -2.9589433670043945, -2.8549957275390625, -2.7510480880737305, -2.6471004486083984, -2.5431525707244873, -2.4392049312591553, -2.3352572917938232, -2.231309413909912, -2.12736177444458, -2.023414134979248, -1.919466257095337, -1.8155184984207153, -1.7115708589553833, -1.6076231002807617, -1.5036754608154297, -1.399727702140808, -1.2957799434661865, -1.1918323040008545, -1.087884545326233, -0.9839368462562561, -0.8799891471862793, -0.7760413885116577, -0.6720936894416809, -0.5681459903717041, -0.4641982316970825, -0.3602505326271057, -0.2563028335571289, -0.1523551195859909, -0.048407405614852905, 0.05554032325744629, 0.1594880223274231, 0.2634357213973999, 0.3673834800720215, 0.4713311791419983, 0.5752788782119751, 0.6792265772819519, 0.7831742763519287, 0.8871220350265503, 0.9910697340965271, 1.095017433166504, 1.1989651918411255, 1.302912950515747, 1.406860589981079, 1.5108083486557007, 1.6147559881210327, 1.7187037467956543, 1.8226513862609863, 1.926599144935608, 2.0305469036102295, 2.1344945430755615, 2.2384424209594727, 2.3423900604248047, 2.446337938308716, 2.550285577774048, 2.65423321723938, 2.758181095123291, 2.862128734588623, 2.966076374053955, 3.070024013519287]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 13.0, 14.0, 10.0, 11.0, 21.0, 19.0, 31.0, 20.0, 27.0, 22.0, 28.0, 32.0, 33.0, 39.0, 40.0, 31.0, 33.0, 29.0, 42.0, 45.0, 46.0, 33.0, 40.0, 36.0, 38.0, 15.0, 29.0, 19.0, 21.0, 23.0, 25.0, 23.0, 14.0, 12.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.331787109375, -0.32073211669921875, -0.3096771240234375, -0.29862213134765625, -0.287567138671875, -0.27651214599609375, -0.2654571533203125, -0.25440216064453125, -0.24334716796875, -0.23229217529296875, -0.2212371826171875, -0.21018218994140625, -0.199127197265625, -0.18807220458984375, -0.1770172119140625, -0.16596221923828125, -0.1549072265625, -0.14385223388671875, -0.1327972412109375, -0.12174224853515625, -0.110687255859375, -0.09963226318359375, -0.0885772705078125, -0.07752227783203125, -0.06646728515625, -0.05541229248046875, -0.0443572998046875, -0.03330230712890625, -0.022247314453125, -0.01119232177734375, -0.0001373291015625, 0.01091766357421875, 0.02197265625, 0.03302764892578125, 0.0440826416015625, 0.05513763427734375, 0.066192626953125, 0.07724761962890625, 0.0883026123046875, 0.09935760498046875, 0.11041259765625, 0.12146759033203125, 0.1325225830078125, 0.14357757568359375, 0.154632568359375, 0.16568756103515625, 0.1767425537109375, 0.18779754638671875, 0.1988525390625, 0.20990753173828125, 0.2209625244140625, 0.23201751708984375, 0.243072509765625, 0.25412750244140625, 0.2651824951171875, 0.27623748779296875, 0.28729248046875, 0.29834747314453125, 0.3094024658203125, 0.32045745849609375, 0.331512451171875, 0.34256744384765625, 0.3536224365234375, 0.36467742919921875, 0.375732421875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 10.0, 22.0, 40.0, 50.0, 56.0, 80.0, 115.0, 199.0, 252.0, 336.0, 542.0, 744.0, 1129.0, 1661.0, 2477.0, 3761.0, 5654.0, 9078.0, 14296.0, 22156.0, 35114.0, 54580.0, 81154.0, 113068.0, 140635.0, 147783.0, 127956.0, 96787.0, 66791.0, 43933.0, 27935.0, 17646.0, 11298.0, 7079.0, 4581.0, 3149.0, 2020.0, 1388.0, 898.0, 677.0, 451.0, 276.0, 176.0, 163.0, 113.0, 71.0, 62.0, 42.0, 24.0, 17.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0], "bins": [-0.34130859375, -0.3310432434082031, -0.32077789306640625, -0.3105125427246094, -0.3002471923828125, -0.2899818420410156, -0.27971649169921875, -0.2694511413574219, -0.259185791015625, -0.24892044067382812, -0.23865509033203125, -0.22838973999023438, -0.2181243896484375, -0.20785903930664062, -0.19759368896484375, -0.18732833862304688, -0.17706298828125, -0.16679763793945312, -0.15653228759765625, -0.14626693725585938, -0.1360015869140625, -0.12573623657226562, -0.11547088623046875, -0.10520553588867188, -0.094940185546875, -0.08467483520507812, -0.07440948486328125, -0.06414413452148438, -0.0538787841796875, -0.043613433837890625, -0.03334808349609375, -0.023082733154296875, -0.0128173828125, -0.002552032470703125, 0.00771331787109375, 0.017978668212890625, 0.0282440185546875, 0.038509368896484375, 0.04877471923828125, 0.059040069580078125, 0.069305419921875, 0.07957077026367188, 0.08983612060546875, 0.10010147094726562, 0.1103668212890625, 0.12063217163085938, 0.13089752197265625, 0.14116287231445312, 0.15142822265625, 0.16169357299804688, 0.17195892333984375, 0.18222427368164062, 0.1924896240234375, 0.20275497436523438, 0.21302032470703125, 0.22328567504882812, 0.233551025390625, 0.24381637573242188, 0.25408172607421875, 0.2643470764160156, 0.2746124267578125, 0.2848777770996094, 0.29514312744140625, 0.3054084777832031, 0.315673828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 7.0, 8.0, 8.0, 12.0, 18.0, 19.0, 17.0, 31.0, 24.0, 19.0, 24.0, 36.0, 48.0, 34.0, 41.0, 40.0, 41.0, 1068.0, 55.0, 33.0, 41.0, 39.0, 31.0, 32.0, 29.0, 34.0, 37.0, 35.0, 23.0, 26.0, 16.0, 15.0, 17.0, 15.0, 6.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.4228515625, -0.41101837158203125, -0.3991851806640625, -0.38735198974609375, -0.375518798828125, -0.36368560791015625, -0.3518524169921875, -0.34001922607421875, -0.32818603515625, -0.31635284423828125, -0.3045196533203125, -0.29268646240234375, -0.280853271484375, -0.26902008056640625, -0.2571868896484375, -0.24535369873046875, -0.2335205078125, -0.22168731689453125, -0.2098541259765625, -0.19802093505859375, -0.186187744140625, -0.17435455322265625, -0.1625213623046875, -0.15068817138671875, -0.13885498046875, -0.12702178955078125, -0.1151885986328125, -0.10335540771484375, -0.091522216796875, -0.07968902587890625, -0.0678558349609375, -0.05602264404296875, -0.044189453125, -0.03235626220703125, -0.0205230712890625, -0.00868988037109375, 0.003143310546875, 0.01497650146484375, 0.0268096923828125, 0.03864288330078125, 0.05047607421875, 0.06230926513671875, 0.0741424560546875, 0.08597564697265625, 0.097808837890625, 0.10964202880859375, 0.1214752197265625, 0.13330841064453125, 0.1451416015625, 0.15697479248046875, 0.1688079833984375, 0.18064117431640625, 0.192474365234375, 0.20430755615234375, 0.2161407470703125, 0.22797393798828125, 0.23980712890625, 0.25164031982421875, 0.2634735107421875, 0.27530670166015625, 0.287139892578125, 0.29897308349609375, 0.3108062744140625, 0.32263946533203125, 0.33447265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 6.0, 8.0, 12.0, 17.0, 29.0, 45.0, 65.0, 117.0, 176.0, 258.0, 431.0, 700.0, 1171.0, 1937.0, 3349.0, 5889.0, 10721.0, 22113.0, 55039.0, 1093067.0, 802047.0, 53370.0, 21582.0, 10790.0, 5934.0, 3281.0, 1956.0, 1187.0, 689.0, 412.0, 273.0, 174.0, 105.0, 65.0, 33.0, 23.0, 23.0, 9.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5810546875, -0.5628890991210938, -0.5447235107421875, -0.5265579223632812, -0.508392333984375, -0.49022674560546875, -0.4720611572265625, -0.45389556884765625, -0.43572998046875, -0.41756439208984375, -0.3993988037109375, -0.38123321533203125, -0.363067626953125, -0.34490203857421875, -0.3267364501953125, -0.30857086181640625, -0.2904052734375, -0.27223968505859375, -0.2540740966796875, -0.23590850830078125, -0.217742919921875, -0.19957733154296875, -0.1814117431640625, -0.16324615478515625, -0.14508056640625, -0.12691497802734375, -0.1087493896484375, -0.09058380126953125, -0.072418212890625, -0.05425262451171875, -0.0360870361328125, -0.01792144775390625, 0.000244140625, 0.01840972900390625, 0.0365753173828125, 0.05474090576171875, 0.072906494140625, 0.09107208251953125, 0.1092376708984375, 0.12740325927734375, 0.14556884765625, 0.16373443603515625, 0.1819000244140625, 0.20006561279296875, 0.218231201171875, 0.23639678955078125, 0.2545623779296875, 0.27272796630859375, 0.2908935546875, 0.30905914306640625, 0.3272247314453125, 0.34539031982421875, 0.363555908203125, 0.38172149658203125, 0.3998870849609375, 0.41805267333984375, 0.43621826171875, 0.45438385009765625, 0.4725494384765625, 0.49071502685546875, 0.508880615234375, 0.5270462036132812, 0.5452117919921875, 0.5633773803710938, 0.58154296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 11.0, 13.0, 17.0, 15.0, 20.0, 37.0, 42.0, 37.0, 54.0, 46.0, 70.0, 62.0, 68.0, 74.0, 70.0, 62.0, 61.0, 35.0, 54.0, 26.0, 29.0, 14.0, 18.0, 16.0, 7.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.0632028579711914, -0.06115913391113281, -0.05911540985107422, -0.057071685791015625, -0.05502796173095703, -0.05298423767089844, -0.050940513610839844, -0.04889678955078125, -0.046853065490722656, -0.04480934143066406, -0.04276561737060547, -0.040721893310546875, -0.03867816925048828, -0.03663444519042969, -0.034590721130371094, -0.0325469970703125, -0.030503273010253906, -0.028459548950195312, -0.02641582489013672, -0.024372100830078125, -0.02232837677001953, -0.020284652709960938, -0.018240928649902344, -0.01619720458984375, -0.014153480529785156, -0.012109756469726562, -0.010066032409667969, -0.008022308349609375, -0.005978584289550781, -0.0039348602294921875, -0.0018911361694335938, 0.000152587890625, 0.0021963119506835938, 0.0042400360107421875, 0.006283760070800781, 0.008327484130859375, 0.010371208190917969, 0.012414932250976562, 0.014458656311035156, 0.01650238037109375, 0.018546104431152344, 0.020589828491210938, 0.02263355255126953, 0.024677276611328125, 0.02672100067138672, 0.028764724731445312, 0.030808448791503906, 0.0328521728515625, 0.034895896911621094, 0.03693962097167969, 0.03898334503173828, 0.041027069091796875, 0.04307079315185547, 0.04511451721191406, 0.047158241271972656, 0.04920196533203125, 0.051245689392089844, 0.05328941345214844, 0.05533313751220703, 0.057376861572265625, 0.05942058563232422, 0.06146430969238281, 0.0635080337524414, 0.0655517578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 12.0, 10.0, 22.0, 26.0, 31.0, 43.0, 64.0, 91.0, 149.0, 227.0, 583.0, 1724.0, 9984.0, 241125.0, 765603.0, 24271.0, 2959.0, 719.0, 346.0, 159.0, 103.0, 93.0, 49.0, 32.0, 36.0, 17.0, 21.0, 9.0, 7.0, 3.0, 10.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8586883544921875, -0.831146240234375, -0.8036041259765625, -0.77606201171875, -0.7485198974609375, -0.720977783203125, -0.6934356689453125, -0.6658935546875, -0.6383514404296875, -0.610809326171875, -0.5832672119140625, -0.55572509765625, -0.5281829833984375, -0.500640869140625, -0.4730987548828125, -0.445556640625, -0.4180145263671875, -0.390472412109375, -0.3629302978515625, -0.33538818359375, -0.3078460693359375, -0.280303955078125, -0.2527618408203125, -0.2252197265625, -0.1976776123046875, -0.170135498046875, -0.1425933837890625, -0.11505126953125, -0.0875091552734375, -0.059967041015625, -0.0324249267578125, -0.0048828125, 0.0226593017578125, 0.050201416015625, 0.0777435302734375, 0.10528564453125, 0.1328277587890625, 0.160369873046875, 0.1879119873046875, 0.2154541015625, 0.2429962158203125, 0.270538330078125, 0.2980804443359375, 0.32562255859375, 0.3531646728515625, 0.380706787109375, 0.4082489013671875, 0.435791015625, 0.4633331298828125, 0.490875244140625, 0.5184173583984375, 0.54595947265625, 0.5735015869140625, 0.601043701171875, 0.6285858154296875, 0.6561279296875, 0.6836700439453125, 0.711212158203125, 0.7387542724609375, 0.76629638671875, 0.7938385009765625, 0.821380615234375, 0.8489227294921875, 0.87646484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 30.0, 177.0, 538.0, 209.0, 41.0, 11.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9457941651344299, -0.8921672701835632, -0.8385403156280518, -0.7849134206771851, -0.7312864661216736, -0.6776595711708069, -0.6240326166152954, -0.5704057216644287, -0.516778826713562, -0.4631519019603729, -0.40952497720718384, -0.35589808225631714, -0.30227112770080566, -0.24864423274993896, -0.19501730799674988, -0.1413903832435608, -0.08776342868804932, -0.03413650766015053, 0.01949041336774826, 0.07311733067035675, 0.12674425542354584, 0.18037116527557373, 0.23399809002876282, 0.2876250147819519, 0.341251939535141, 0.3948788642883301, 0.44850578904151917, 0.5021327137947083, 0.555759608745575, 0.6093865633010864, 0.6630134582519531, 0.7166403532028198, 0.7702673673629761, 0.8238942623138428, 0.8775212168693542, 0.931148111820221, 0.9847750663757324, 1.0384019613265991, 1.0920288562774658, 1.145655870437622, 1.1992827653884888, 1.2529096603393555, 1.3065365552902222, 1.3601635694503784, 1.4137904644012451, 1.4674173593521118, 1.5210442543029785, 1.5746712684631348, 1.628298044204712, 1.6819249391555786, 1.7355518341064453, 1.7891788482666016, 1.8428057432174683, 1.896432638168335, 1.9500595331192017, 2.0036864280700684, 2.0573134422302246, 2.110940456390381, 2.164567232131958, 2.2181942462921143, 2.2718210220336914, 2.3254480361938477, 2.379075050354004, 2.432701826095581, 2.4863288402557373]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 14.0, 12.0, 18.0, 20.0, 21.0, 31.0, 30.0, 43.0, 51.0, 45.0, 67.0, 59.0, 53.0, 54.0, 52.0, 51.0, 51.0, 51.0, 51.0, 37.0, 45.0, 26.0, 27.0, 21.0, 19.0, 15.0, 9.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32801324129104614, -0.3177160918712616, -0.30741891264915466, -0.2971217632293701, -0.2868245840072632, -0.27652743458747864, -0.2662302553653717, -0.25593310594558716, -0.24563592672348022, -0.23533876240253448, -0.22504159808158875, -0.214744433760643, -0.20444726943969727, -0.19415010511875153, -0.1838529407978058, -0.17355579137802124, -0.1632586270570755, -0.15296146273612976, -0.14266429841518402, -0.13236713409423828, -0.12206996977329254, -0.1117728054523468, -0.10147564858198166, -0.09117848426103592, -0.08088131994009018, -0.07058415561914444, -0.0602869912981987, -0.04998983070254326, -0.03969266638159752, -0.02939550206065178, -0.019098341464996338, -0.008801177144050598, 0.0014959871768951416, 0.011793150566518307, 0.022090313956141472, 0.03238747641444206, 0.0426846407353878, 0.05298180505633354, 0.06327896565198898, 0.07357612997293472, 0.08387329429388046, 0.0941704586148262, 0.10446762293577194, 0.11476477980613708, 0.12506194412708282, 0.13535910844802856, 0.1456562727689743, 0.15595343708992004, 0.16625060141086578, 0.17654776573181152, 0.18684493005275726, 0.197142094373703, 0.20743925869464874, 0.21773642301559448, 0.22803357243537903, 0.23833075165748596, 0.2486279010772705, 0.25892505049705505, 0.269222229719162, 0.27951937913894653, 0.28981655836105347, 0.300113707780838, 0.31041088700294495, 0.3207080364227295, 0.3310052156448364]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 14.0, 16.0, 10.0, 13.0, 17.0, 26.0, 17.0, 35.0, 17.0, 35.0, 23.0, 35.0, 31.0, 34.0, 41.0, 38.0, 35.0, 32.0, 37.0, 56.0, 35.0, 34.0, 47.0, 35.0, 26.0, 24.0, 24.0, 14.0, 21.0, 25.0, 20.0, 20.0, 21.0, 7.0, 11.0, 9.0, 8.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.333740234375, -0.3224601745605469, -0.31118011474609375, -0.2999000549316406, -0.2886199951171875, -0.2773399353027344, -0.26605987548828125, -0.2547798156738281, -0.243499755859375, -0.23221969604492188, -0.22093963623046875, -0.20965957641601562, -0.1983795166015625, -0.18709945678710938, -0.17581939697265625, -0.16453933715820312, -0.15325927734375, -0.14197921752929688, -0.13069915771484375, -0.11941909790039062, -0.1081390380859375, -0.09685897827148438, -0.08557891845703125, -0.07429885864257812, -0.063018798828125, -0.051738739013671875, -0.04045867919921875, -0.029178619384765625, -0.0178985595703125, -0.006618499755859375, 0.00466156005859375, 0.015941619873046875, 0.0272216796875, 0.038501739501953125, 0.04978179931640625, 0.061061859130859375, 0.0723419189453125, 0.08362197875976562, 0.09490203857421875, 0.10618209838867188, 0.117462158203125, 0.12874221801757812, 0.14002227783203125, 0.15130233764648438, 0.1625823974609375, 0.17386245727539062, 0.18514251708984375, 0.19642257690429688, 0.20770263671875, 0.21898269653320312, 0.23026275634765625, 0.24154281616210938, 0.2528228759765625, 0.2641029357910156, 0.27538299560546875, 0.2866630554199219, 0.297943115234375, 0.3092231750488281, 0.32050323486328125, 0.3317832946777344, 0.3430633544921875, 0.3543434143066406, 0.36562347412109375, 0.3769035339355469, 0.38818359375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 15.0, 15.0, 13.0, 16.0, 30.0, 40.0, 40.0, 66.0, 124.0, 146.0, 198.0, 300.0, 417.0, 658.0, 1103.0, 1789.0, 3055.0, 5448.0, 10476.0, 22005.0, 56302.0, 233024.0, 513727.0, 125819.0, 38306.0, 16228.0, 8164.0, 4376.0, 2433.0, 1466.0, 892.0, 591.0, 391.0, 257.0, 163.0, 116.0, 84.0, 71.0, 42.0, 32.0, 27.0, 17.0, 19.0, 8.0, 6.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.70947265625, -0.6868133544921875, -0.664154052734375, -0.6414947509765625, -0.61883544921875, -0.5961761474609375, -0.573516845703125, -0.5508575439453125, -0.5281982421875, -0.5055389404296875, -0.482879638671875, -0.4602203369140625, -0.43756103515625, -0.4149017333984375, -0.392242431640625, -0.3695831298828125, -0.346923828125, -0.3242645263671875, -0.301605224609375, -0.2789459228515625, -0.25628662109375, -0.2336273193359375, -0.210968017578125, -0.1883087158203125, -0.1656494140625, -0.1429901123046875, -0.120330810546875, -0.0976715087890625, -0.07501220703125, -0.0523529052734375, -0.029693603515625, -0.0070343017578125, 0.015625, 0.0382843017578125, 0.060943603515625, 0.0836029052734375, 0.10626220703125, 0.1289215087890625, 0.151580810546875, 0.1742401123046875, 0.1968994140625, 0.2195587158203125, 0.242218017578125, 0.2648773193359375, 0.28753662109375, 0.3101959228515625, 0.332855224609375, 0.3555145263671875, 0.378173828125, 0.4008331298828125, 0.423492431640625, 0.4461517333984375, 0.46881103515625, 0.4914703369140625, 0.514129638671875, 0.5367889404296875, 0.5594482421875, 0.5821075439453125, 0.604766845703125, 0.6274261474609375, 0.65008544921875, 0.6727447509765625, 0.695404052734375, 0.7180633544921875, 0.74072265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 3.0, 9.0, 16.0, 15.0, 20.0, 15.0, 30.0, 37.0, 36.0, 25.0, 42.0, 49.0, 65.0, 92.0, 175.0, 1469.0, 344.0, 153.0, 72.0, 64.0, 45.0, 38.0, 47.0, 33.0, 36.0, 17.0, 14.0, 14.0, 17.0, 7.0, 9.0, 9.0, 5.0, 8.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.457244873046875, -1.40667724609375, -1.356109619140625, -1.3055419921875, -1.254974365234375, -1.20440673828125, -1.153839111328125, -1.103271484375, -1.052703857421875, -1.00213623046875, -0.951568603515625, -0.9010009765625, -0.850433349609375, -0.79986572265625, -0.749298095703125, -0.69873046875, -0.648162841796875, -0.59759521484375, -0.547027587890625, -0.4964599609375, -0.445892333984375, -0.39532470703125, -0.344757080078125, -0.294189453125, -0.243621826171875, -0.19305419921875, -0.142486572265625, -0.0919189453125, -0.041351318359375, 0.00921630859375, 0.059783935546875, 0.1103515625, 0.160919189453125, 0.21148681640625, 0.262054443359375, 0.3126220703125, 0.363189697265625, 0.41375732421875, 0.464324951171875, 0.514892578125, 0.565460205078125, 0.61602783203125, 0.666595458984375, 0.7171630859375, 0.767730712890625, 0.81829833984375, 0.868865966796875, 0.91943359375, 0.970001220703125, 1.02056884765625, 1.071136474609375, 1.1217041015625, 1.172271728515625, 1.22283935546875, 1.273406982421875, 1.323974609375, 1.374542236328125, 1.42510986328125, 1.475677490234375, 1.5262451171875, 1.576812744140625, 1.62738037109375, 1.677947998046875, 1.728515625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 6.0, 11.0, 7.0, 11.0, 18.0, 16.0, 16.0, 27.0, 37.0, 59.0, 86.0, 131.0, 209.0, 374.0, 644.0, 1543.0, 6345.0, 68721.0, 2680537.0, 365023.0, 17163.0, 2608.0, 878.0, 449.0, 238.0, 145.0, 120.0, 77.0, 54.0, 40.0, 27.0, 27.0, 11.0, 9.0, 14.0, 4.0, 2.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.7578125, -2.6827392578125, -2.607666015625, -2.5325927734375, -2.45751953125, -2.3824462890625, -2.307373046875, -2.2322998046875, -2.1572265625, -2.0821533203125, -2.007080078125, -1.9320068359375, -1.85693359375, -1.7818603515625, -1.706787109375, -1.6317138671875, -1.556640625, -1.4815673828125, -1.406494140625, -1.3314208984375, -1.25634765625, -1.1812744140625, -1.106201171875, -1.0311279296875, -0.9560546875, -0.8809814453125, -0.805908203125, -0.7308349609375, -0.65576171875, -0.5806884765625, -0.505615234375, -0.4305419921875, -0.35546875, -0.2803955078125, -0.205322265625, -0.1302490234375, -0.05517578125, 0.0198974609375, 0.094970703125, 0.1700439453125, 0.2451171875, 0.3201904296875, 0.395263671875, 0.4703369140625, 0.54541015625, 0.6204833984375, 0.695556640625, 0.7706298828125, 0.845703125, 0.9207763671875, 0.995849609375, 1.0709228515625, 1.14599609375, 1.2210693359375, 1.296142578125, 1.3712158203125, 1.4462890625, 1.5213623046875, 1.596435546875, 1.6715087890625, 1.74658203125, 1.8216552734375, 1.896728515625, 1.9718017578125, 2.046875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 15.0, 40.0, 80.0, 157.0, 219.0, 219.0, 150.0, 77.0, 26.0, 20.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.498206615447998, -4.310431480407715, -4.12265682220459, -3.9348816871643066, -3.7471070289611816, -3.5593318939208984, -3.3715569972991943, -3.1837821006774902, -2.996007204055786, -2.808232307434082, -2.620457410812378, -2.432682514190674, -2.2449073791503906, -2.0571327209472656, -1.8693575859069824, -1.6815826892852783, -1.4938077926635742, -1.3060328960418701, -1.118257999420166, -0.9304829835891724, -0.7427080869674683, -0.5549331903457642, -0.3671581745147705, -0.1793832778930664, 0.008391618728637695, 0.19616654515266418, 0.3839414715766907, 0.5717164278030396, 0.7594913244247437, 0.9472662210464478, 1.1350412368774414, 1.3228161334991455, 1.5105905532836914, 1.6983654499053955, 1.8861403465270996, 2.073915481567383, 2.261690139770508, 2.449465274810791, 2.637240171432495, 2.825015068054199, 3.0127899646759033, 3.2005648612976074, 3.3883397579193115, 3.5761146545410156, 3.763889789581299, 3.951664447784424, 4.139439582824707, 4.327214241027832, 4.514989376068115, 4.702764511108398, 4.890539169311523, 5.078314304351807, 5.266088962554932, 5.453864097595215, 5.64163875579834, 5.829413890838623, 6.017189025878906, 6.2049641609191895, 6.3927388191223145, 6.580513954162598, 6.768288612365723, 6.956063747406006, 7.143838882446289, 7.331613540649414, 7.519388198852539]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 11.0, 12.0, 11.0, 17.0, 19.0, 32.0, 23.0, 14.0, 25.0, 28.0, 29.0, 35.0, 28.0, 33.0, 40.0, 34.0, 40.0, 31.0, 34.0, 43.0, 47.0, 24.0, 31.0, 32.0, 31.0, 29.0, 32.0, 29.0, 23.0, 32.0, 15.0, 13.0, 24.0, 12.0, 12.0, 11.0, 13.0, 7.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.1307461261749268, -3.0235543251037598, -2.9163625240325928, -2.809170722961426, -2.7019786834716797, -2.594787120819092, -2.4875950813293457, -2.3804032802581787, -2.2732114791870117, -2.1660196781158447, -2.0588278770446777, -1.9516359567642212, -1.8444441556930542, -1.7372523546218872, -1.6300604343414307, -1.5228686332702637, -1.4156768321990967, -1.3084850311279297, -1.2012932300567627, -1.0941013097763062, -0.9869095087051392, -0.8797177076339722, -0.7725258469581604, -0.6653339862823486, -0.5581421852111816, -0.45095035433769226, -0.3437585234642029, -0.2365666925907135, -0.12937486171722412, -0.02218306064605713, 0.08500880002975464, 0.1922006607055664, 0.2993924617767334, 0.4065842926502228, 0.5137761235237122, 0.6209679841995239, 0.7281597852706909, 0.8353515863418579, 0.9425434470176697, 1.0497353076934814, 1.1569271087646484, 1.2641189098358154, 1.3713107109069824, 1.478502631187439, 1.585694432258606, 1.692886233329773, 1.8000781536102295, 1.9072699546813965, 2.0144617557525635, 2.1216535568237305, 2.2288453578948975, 2.3360371589660645, 2.4432291984558105, 2.5504207611083984, 2.6576128005981445, 2.7648046016693115, 2.8719964027404785, 2.9791882038116455, 3.0863800048828125, 3.1935718059539795, 3.3007636070251465, 3.4079556465148926, 3.5151474475860596, 3.6223392486572266, 3.7295310497283936]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 7.0, 12.0, 11.0, 10.0, 14.0, 13.0, 18.0, 18.0, 23.0, 24.0, 29.0, 34.0, 37.0, 27.0, 36.0, 31.0, 34.0, 31.0, 33.0, 38.0, 41.0, 51.0, 37.0, 41.0, 34.0, 33.0, 28.0, 31.0, 24.0, 17.0, 24.0, 23.0, 21.0, 14.0, 13.0, 15.0, 13.0, 9.0, 9.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.329345703125, -0.31789398193359375, -0.3064422607421875, -0.29499053955078125, -0.283538818359375, -0.27208709716796875, -0.2606353759765625, -0.24918365478515625, -0.23773193359375, -0.22628021240234375, -0.2148284912109375, -0.20337677001953125, -0.191925048828125, -0.18047332763671875, -0.1690216064453125, -0.15756988525390625, -0.1461181640625, -0.13466644287109375, -0.1232147216796875, -0.11176300048828125, -0.100311279296875, -0.08885955810546875, -0.0774078369140625, -0.06595611572265625, -0.05450439453125, -0.04305267333984375, -0.0316009521484375, -0.02014923095703125, -0.008697509765625, 0.00275421142578125, 0.0142059326171875, 0.02565765380859375, 0.037109375, 0.04856109619140625, 0.0600128173828125, 0.07146453857421875, 0.082916259765625, 0.09436798095703125, 0.1058197021484375, 0.11727142333984375, 0.12872314453125, 0.14017486572265625, 0.1516265869140625, 0.16307830810546875, 0.174530029296875, 0.18598175048828125, 0.1974334716796875, 0.20888519287109375, 0.2203369140625, 0.23178863525390625, 0.2432403564453125, 0.25469207763671875, 0.266143798828125, 0.27759552001953125, 0.2890472412109375, 0.30049896240234375, 0.31195068359375, 0.32340240478515625, 0.3348541259765625, 0.34630584716796875, 0.357757568359375, 0.36920928955078125, 0.3806610107421875, 0.39211273193359375, 0.403564453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 5.0, 15.0, 22.0, 17.0, 32.0, 50.0, 72.0, 92.0, 198.0, 272.0, 476.0, 844.0, 1540.0, 3102.0, 6809.0, 17644.0, 71914.0, 771363.0, 2940952.0, 312231.0, 43495.0, 12660.0, 5210.0, 2359.0, 1179.0, 635.0, 406.0, 228.0, 151.0, 74.0, 58.0, 40.0, 30.0, 27.0, 20.0, 9.0, 9.0, 10.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1420440673828125, -1.104400634765625, -1.0667572021484375, -1.02911376953125, -0.9914703369140625, -0.953826904296875, -0.9161834716796875, -0.8785400390625, -0.8408966064453125, -0.803253173828125, -0.7656097412109375, -0.72796630859375, -0.6903228759765625, -0.652679443359375, -0.6150360107421875, -0.577392578125, -0.5397491455078125, -0.502105712890625, -0.4644622802734375, -0.42681884765625, -0.3891754150390625, -0.351531982421875, -0.3138885498046875, -0.2762451171875, -0.2386016845703125, -0.200958251953125, -0.1633148193359375, -0.12567138671875, -0.0880279541015625, -0.050384521484375, -0.0127410888671875, 0.02490234375, 0.0625457763671875, 0.100189208984375, 0.1378326416015625, 0.17547607421875, 0.2131195068359375, 0.250762939453125, 0.2884063720703125, 0.3260498046875, 0.3636932373046875, 0.401336669921875, 0.4389801025390625, 0.47662353515625, 0.5142669677734375, 0.551910400390625, 0.5895538330078125, 0.627197265625, 0.6648406982421875, 0.702484130859375, 0.7401275634765625, 0.77777099609375, 0.8154144287109375, 0.853057861328125, 0.8907012939453125, 0.9283447265625, 0.9659881591796875, 1.003631591796875, 1.0412750244140625, 1.07891845703125, 1.1165618896484375, 1.154205322265625, 1.1918487548828125, 1.2294921875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 9.0, 7.0, 10.0, 5.0, 12.0, 24.0, 31.0, 35.0, 53.0, 82.0, 105.0, 149.0, 287.0, 495.0, 761.0, 702.0, 484.0, 269.0, 180.0, 121.0, 79.0, 48.0, 34.0, 27.0, 15.0, 11.0, 11.0, 7.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.5673828125, -1.5308914184570312, -1.4944000244140625, -1.4579086303710938, -1.421417236328125, -1.3849258422851562, -1.3484344482421875, -1.3119430541992188, -1.27545166015625, -1.2389602661132812, -1.2024688720703125, -1.1659774780273438, -1.129486083984375, -1.0929946899414062, -1.0565032958984375, -1.0200119018554688, -0.9835205078125, -0.9470291137695312, -0.9105377197265625, -0.8740463256835938, -0.837554931640625, -0.8010635375976562, -0.7645721435546875, -0.7280807495117188, -0.69158935546875, -0.6550979614257812, -0.6186065673828125, -0.5821151733398438, -0.545623779296875, -0.5091323852539062, -0.4726409912109375, -0.43614959716796875, -0.399658203125, -0.36316680908203125, -0.3266754150390625, -0.29018402099609375, -0.253692626953125, -0.21720123291015625, -0.1807098388671875, -0.14421844482421875, -0.10772705078125, -0.07123565673828125, -0.0347442626953125, 0.00174713134765625, 0.038238525390625, 0.07472991943359375, 0.1112213134765625, 0.14771270751953125, 0.1842041015625, 0.22069549560546875, 0.2571868896484375, 0.29367828369140625, 0.330169677734375, 0.36666107177734375, 0.4031524658203125, 0.43964385986328125, 0.47613525390625, 0.5126266479492188, 0.5491180419921875, 0.5856094360351562, 0.622100830078125, 0.6585922241210938, 0.6950836181640625, 0.7315750122070312, 0.76806640625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 8.0, 17.0, 29.0, 34.0, 51.0, 88.0, 165.0, 327.0, 744.0, 1720.0, 4312.0, 12276.0, 49394.0, 505873.0, 3352324.0, 220388.0, 31847.0, 8813.0, 3197.0, 1349.0, 584.0, 296.0, 165.0, 83.0, 60.0, 38.0, 21.0, 23.0, 12.0, 13.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.4809722900390625, -1.408233642578125, -1.3354949951171875, -1.26275634765625, -1.1900177001953125, -1.117279052734375, -1.0445404052734375, -0.9718017578125, -0.8990631103515625, -0.826324462890625, -0.7535858154296875, -0.68084716796875, -0.6081085205078125, -0.535369873046875, -0.4626312255859375, -0.389892578125, -0.3171539306640625, -0.244415283203125, -0.1716766357421875, -0.09893798828125, -0.0261993408203125, 0.046539306640625, 0.1192779541015625, 0.1920166015625, 0.2647552490234375, 0.337493896484375, 0.4102325439453125, 0.48297119140625, 0.5557098388671875, 0.628448486328125, 0.7011871337890625, 0.77392578125, 0.8466644287109375, 0.919403076171875, 0.9921417236328125, 1.06488037109375, 1.1376190185546875, 1.210357666015625, 1.2830963134765625, 1.3558349609375, 1.4285736083984375, 1.501312255859375, 1.5740509033203125, 1.64678955078125, 1.7195281982421875, 1.792266845703125, 1.8650054931640625, 1.937744140625, 2.0104827880859375, 2.083221435546875, 2.1559600830078125, 2.22869873046875, 2.3014373779296875, 2.374176025390625, 2.4469146728515625, 2.5196533203125, 2.5923919677734375, 2.665130615234375, 2.7378692626953125, 2.81060791015625, 2.8833465576171875, 2.956085205078125, 3.0288238525390625, 3.1015625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 9.0, 8.0, 23.0, 27.0, 46.0, 112.0, 131.0, 196.0, 176.0, 135.0, 62.0, 34.0, 31.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.513570308685303, -5.218964576721191, -4.924358367919922, -4.6297526359558105, -4.335146427154541, -4.04054069519043, -3.7459347248077393, -3.451328754425049, -3.1567227840423584, -2.862116813659668, -2.5675108432769775, -2.272904872894287, -1.9782990217208862, -1.6836930513381958, -1.389087200164795, -1.0944812297821045, -0.7998752593994141, -0.5052692890167236, -0.21066337823867798, 0.08394253253936768, 0.3785485029220581, 0.6731544733047485, 0.9677603244781494, 1.2623662948608398, 1.5569722652435303, 1.8515782356262207, 2.146184206008911, 2.4407901763916016, 2.735395908355713, 3.0300021171569824, 3.3246078491210938, 3.619213819503784, 3.9138193130493164, 4.208425045013428, 4.503031253814697, 4.797636985778809, 5.092243194580078, 5.3868489265441895, 5.681454658508301, 5.97606086730957, 6.27066707611084, 6.565272808074951, 6.859879016876221, 7.154484748840332, 7.449090957641602, 7.743696689605713, 8.038302421569824, 8.332908630371094, 8.627513885498047, 8.922120094299316, 9.21672534942627, 9.511331558227539, 9.805937767028809, 10.100543975830078, 10.395149230957031, 10.6897554397583, 10.98436164855957, 11.27896785736084, 11.573573112487793, 11.868179321289062, 12.162785530090332, 12.457391738891602, 12.751996994018555, 13.046603202819824, 13.341209411621094]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 6.0, 3.0, 8.0, 8.0, 13.0, 14.0, 14.0, 16.0, 17.0, 17.0, 20.0, 19.0, 23.0, 26.0, 30.0, 32.0, 31.0, 35.0, 42.0, 44.0, 43.0, 43.0, 37.0, 38.0, 38.0, 33.0, 38.0, 29.0, 37.0, 35.0, 22.0, 28.0, 22.0, 16.0, 19.0, 12.0, 13.0, 12.0, 13.0, 8.0, 9.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.8948380947113037, -2.803074359893799, -2.711310386657715, -2.61954665184021, -2.527782678604126, -2.436018943786621, -2.344254970550537, -2.2524912357330322, -2.1607275009155273, -2.0689637660980225, -1.9771997928619385, -1.8854360580444336, -1.7936722040176392, -1.7019083499908447, -1.6101444959640503, -1.5183806419372559, -1.4266167879104614, -1.334852933883667, -1.2430890798568726, -1.1513252258300781, -1.0595614910125732, -0.9677976369857788, -0.8760337829589844, -0.7842699885368347, -0.6925061345100403, -0.6007422804832458, -0.5089784860610962, -0.41721463203430176, -0.3254508078098297, -0.23368698358535767, -0.14192312955856323, -0.050159335136413574, 0.04160451889038086, 0.1333683431148529, 0.22513218224048615, 0.3168960213661194, 0.40865984559059143, 0.5004236698150635, 0.5921875238418579, 0.6839513182640076, 0.775715172290802, 0.8674790263175964, 0.9592428207397461, 1.0510066747665405, 1.142770528793335, 1.2345342636108398, 1.3262982368469238, 1.4180619716644287, 1.5098258256912231, 1.6015896797180176, 1.693353533744812, 1.7851173877716064, 1.8768811225891113, 1.9686449766159058, 2.0604088306427, 2.152172565460205, 2.243936538696289, 2.335700273513794, 2.427464246749878, 2.519227981567383, 2.610991954803467, 2.7027556896209717, 2.7945194244384766, 2.8862833976745605, 2.9780471324920654]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 11.0, 5.0, 6.0, 9.0, 16.0, 10.0, 23.0, 17.0, 26.0, 18.0, 20.0, 23.0, 31.0, 28.0, 26.0, 27.0, 36.0, 27.0, 37.0, 29.0, 40.0, 30.0, 35.0, 39.0, 37.0, 41.0, 42.0, 38.0, 27.0, 27.0, 26.0, 27.0, 21.0, 22.0, 18.0, 13.0, 19.0, 10.0, 12.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.31689453125, -0.3057365417480469, -0.29457855224609375, -0.2834205627441406, -0.2722625732421875, -0.2611045837402344, -0.24994659423828125, -0.23878860473632812, -0.227630615234375, -0.21647262573242188, -0.20531463623046875, -0.19415664672851562, -0.1829986572265625, -0.17184066772460938, -0.16068267822265625, -0.14952468872070312, -0.13836669921875, -0.12720870971679688, -0.11605072021484375, -0.10489273071289062, -0.0937347412109375, -0.08257675170898438, -0.07141876220703125, -0.060260772705078125, -0.049102783203125, -0.037944793701171875, -0.02678680419921875, -0.015628814697265625, -0.0044708251953125, 0.006687164306640625, 0.01784515380859375, 0.029003143310546875, 0.0401611328125, 0.051319122314453125, 0.06247711181640625, 0.07363510131835938, 0.0847930908203125, 0.09595108032226562, 0.10710906982421875, 0.11826705932617188, 0.129425048828125, 0.14058303833007812, 0.15174102783203125, 0.16289901733398438, 0.1740570068359375, 0.18521499633789062, 0.19637298583984375, 0.20753097534179688, 0.21868896484375, 0.22984695434570312, 0.24100494384765625, 0.2521629333496094, 0.2633209228515625, 0.2744789123535156, 0.28563690185546875, 0.2967948913574219, 0.307952880859375, 0.3191108703613281, 0.33026885986328125, 0.3414268493652344, 0.3525848388671875, 0.3637428283691406, 0.37490081787109375, 0.3860588073730469, 0.397216796875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 11.0, 22.0, 25.0, 39.0, 56.0, 86.0, 126.0, 174.0, 289.0, 437.0, 634.0, 1055.0, 1669.0, 2602.0, 4513.0, 7599.0, 13251.0, 23266.0, 41430.0, 72201.0, 132221.0, 358734.0, 183571.0, 86916.0, 50211.0, 28104.0, 16069.0, 9216.0, 5301.0, 3184.0, 2030.0, 1287.0, 757.0, 492.0, 329.0, 198.0, 124.0, 79.0, 72.0, 51.0, 33.0, 21.0, 19.0, 9.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.38818359375, -0.3769874572753906, -0.36579132080078125, -0.3545951843261719, -0.3433990478515625, -0.3322029113769531, -0.32100677490234375, -0.3098106384277344, -0.298614501953125, -0.2874183654785156, -0.27622222900390625, -0.2650260925292969, -0.2538299560546875, -0.24263381958007812, -0.23143768310546875, -0.22024154663085938, -0.20904541015625, -0.19784927368164062, -0.18665313720703125, -0.17545700073242188, -0.1642608642578125, -0.15306472778320312, -0.14186859130859375, -0.13067245483398438, -0.119476318359375, -0.10828018188476562, -0.09708404541015625, -0.08588790893554688, -0.0746917724609375, -0.06349563598632812, -0.05229949951171875, -0.041103363037109375, -0.0299072265625, -0.018711090087890625, -0.00751495361328125, 0.003681182861328125, 0.0148773193359375, 0.026073455810546875, 0.03726959228515625, 0.048465728759765625, 0.059661865234375, 0.07085800170898438, 0.08205413818359375, 0.09325027465820312, 0.1044464111328125, 0.11564254760742188, 0.12683868408203125, 0.13803482055664062, 0.14923095703125, 0.16042709350585938, 0.17162322998046875, 0.18281936645507812, 0.1940155029296875, 0.20521163940429688, 0.21640777587890625, 0.22760391235351562, 0.238800048828125, 0.24999618530273438, 0.26119232177734375, 0.2723884582519531, 0.2835845947265625, 0.2947807312011719, 0.30597686767578125, 0.3171730041503906, 0.328369140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 5.0, 5.0, 7.0, 7.0, 10.0, 10.0, 15.0, 17.0, 17.0, 27.0, 25.0, 30.0, 31.0, 21.0, 50.0, 41.0, 28.0, 41.0, 45.0, 41.0, 1078.0, 50.0, 38.0, 40.0, 32.0, 35.0, 38.0, 38.0, 31.0, 30.0, 22.0, 18.0, 17.0, 14.0, 10.0, 8.0, 10.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3056640625, -0.2951393127441406, -0.28461456298828125, -0.2740898132324219, -0.2635650634765625, -0.2530403137207031, -0.24251556396484375, -0.23199081420898438, -0.221466064453125, -0.21094131469726562, -0.20041656494140625, -0.18989181518554688, -0.1793670654296875, -0.16884231567382812, -0.15831756591796875, -0.14779281616210938, -0.13726806640625, -0.12674331665039062, -0.11621856689453125, -0.10569381713867188, -0.0951690673828125, -0.08464431762695312, -0.07411956787109375, -0.06359481811523438, -0.053070068359375, -0.042545318603515625, -0.03202056884765625, -0.021495819091796875, -0.0109710693359375, -0.000446319580078125, 0.01007843017578125, 0.020603179931640625, 0.0311279296875, 0.041652679443359375, 0.05217742919921875, 0.06270217895507812, 0.0732269287109375, 0.08375167846679688, 0.09427642822265625, 0.10480117797851562, 0.115325927734375, 0.12585067749023438, 0.13637542724609375, 0.14690017700195312, 0.1574249267578125, 0.16794967651367188, 0.17847442626953125, 0.18899917602539062, 0.19952392578125, 0.21004867553710938, 0.22057342529296875, 0.23109817504882812, 0.2416229248046875, 0.2521476745605469, 0.26267242431640625, 0.2731971740722656, 0.283721923828125, 0.2942466735839844, 0.30477142333984375, 0.3152961730957031, 0.3258209228515625, 0.3363456726074219, 0.34687042236328125, 0.3573951721191406, 0.367919921875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 11.0, 11.0, 18.0, 29.0, 30.0, 52.0, 68.0, 123.0, 182.0, 265.0, 419.0, 684.0, 1062.0, 1696.0, 2739.0, 4551.0, 7655.0, 14884.0, 40346.0, 1539477.0, 417542.0, 33608.0, 13531.0, 7109.0, 4120.0, 2525.0, 1569.0, 980.0, 623.0, 422.0, 261.0, 190.0, 101.0, 84.0, 49.0, 39.0, 30.0, 13.0, 9.0, 11.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495849609375, -0.4803199768066406, -0.46479034423828125, -0.4492607116699219, -0.4337310791015625, -0.4182014465332031, -0.40267181396484375, -0.3871421813964844, -0.371612548828125, -0.3560829162597656, -0.34055328369140625, -0.3250236511230469, -0.3094940185546875, -0.2939643859863281, -0.27843475341796875, -0.2629051208496094, -0.24737548828125, -0.23184585571289062, -0.21631622314453125, -0.20078659057617188, -0.1852569580078125, -0.16972732543945312, -0.15419769287109375, -0.13866806030273438, -0.123138427734375, -0.10760879516601562, -0.09207916259765625, -0.07654953002929688, -0.0610198974609375, -0.045490264892578125, -0.02996063232421875, -0.014430999755859375, 0.0010986328125, 0.016628265380859375, 0.03215789794921875, 0.047687530517578125, 0.0632171630859375, 0.07874679565429688, 0.09427642822265625, 0.10980606079101562, 0.125335693359375, 0.14086532592773438, 0.15639495849609375, 0.17192459106445312, 0.1874542236328125, 0.20298385620117188, 0.21851348876953125, 0.23404312133789062, 0.24957275390625, 0.2651023864746094, 0.28063201904296875, 0.2961616516113281, 0.3116912841796875, 0.3272209167480469, 0.34275054931640625, 0.3582801818847656, 0.373809814453125, 0.3893394470214844, 0.40486907958984375, 0.4203987121582031, 0.4359283447265625, 0.4514579772949219, 0.46698760986328125, 0.4825172424316406, 0.498046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 4.0, 7.0, 9.0, 6.0, 12.0, 8.0, 7.0, 20.0, 19.0, 27.0, 31.0, 22.0, 34.0, 63.0, 84.0, 136.0, 124.0, 93.0, 48.0, 35.0, 34.0, 21.0, 24.0, 15.0, 18.0, 13.0, 12.0, 14.0, 11.0, 6.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02947998046875, -0.028584957122802734, -0.02768993377685547, -0.026794910430908203, -0.025899887084960938, -0.025004863739013672, -0.024109840393066406, -0.02321481704711914, -0.022319793701171875, -0.02142477035522461, -0.020529747009277344, -0.019634723663330078, -0.018739700317382812, -0.017844676971435547, -0.01694965362548828, -0.016054630279541016, -0.01515960693359375, -0.014264583587646484, -0.013369560241699219, -0.012474536895751953, -0.011579513549804688, -0.010684490203857422, -0.009789466857910156, -0.00889444351196289, -0.007999420166015625, -0.007104396820068359, -0.006209373474121094, -0.005314350128173828, -0.0044193267822265625, -0.003524303436279297, -0.0026292800903320312, -0.0017342567443847656, -0.0008392333984375, 5.5789947509765625e-05, 0.0009508132934570312, 0.0018458366394042969, 0.0027408599853515625, 0.003635883331298828, 0.004530906677246094, 0.005425930023193359, 0.006320953369140625, 0.007215976715087891, 0.008111000061035156, 0.009006023406982422, 0.009901046752929688, 0.010796070098876953, 0.011691093444824219, 0.012586116790771484, 0.01348114013671875, 0.014376163482666016, 0.015271186828613281, 0.016166210174560547, 0.017061233520507812, 0.017956256866455078, 0.018851280212402344, 0.01974630355834961, 0.020641326904296875, 0.02153635025024414, 0.022431373596191406, 0.023326396942138672, 0.024221420288085938, 0.025116443634033203, 0.02601146697998047, 0.026906490325927734, 0.027801513671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 7.0, 6.0, 7.0, 3.0, 15.0, 13.0, 22.0, 25.0, 23.0, 42.0, 49.0, 73.0, 105.0, 126.0, 293.0, 535.0, 2933.0, 32804.0, 843648.0, 156622.0, 9022.0, 1176.0, 364.0, 167.0, 126.0, 113.0, 52.0, 31.0, 35.0, 18.0, 31.0, 14.0, 11.0, 9.0, 8.0, 9.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.36658477783203125, -0.3542633056640625, -0.34194183349609375, -0.329620361328125, -0.31729888916015625, -0.3049774169921875, -0.29265594482421875, -0.28033447265625, -0.26801300048828125, -0.2556915283203125, -0.24337005615234375, -0.231048583984375, -0.21872711181640625, -0.2064056396484375, -0.19408416748046875, -0.1817626953125, -0.16944122314453125, -0.1571197509765625, -0.14479827880859375, -0.132476806640625, -0.12015533447265625, -0.1078338623046875, -0.09551239013671875, -0.08319091796875, -0.07086944580078125, -0.0585479736328125, -0.04622650146484375, -0.033905029296875, -0.02158355712890625, -0.0092620849609375, 0.00305938720703125, 0.015380859375, 0.02770233154296875, 0.0400238037109375, 0.05234527587890625, 0.064666748046875, 0.07698822021484375, 0.0893096923828125, 0.10163116455078125, 0.11395263671875, 0.12627410888671875, 0.1385955810546875, 0.15091705322265625, 0.163238525390625, 0.17555999755859375, 0.1878814697265625, 0.20020294189453125, 0.2125244140625, 0.22484588623046875, 0.2371673583984375, 0.24948883056640625, 0.261810302734375, 0.27413177490234375, 0.2864532470703125, 0.29877471923828125, 0.31109619140625, 0.32341766357421875, 0.3357391357421875, 0.34806060791015625, 0.360382080078125, 0.37270355224609375, 0.3850250244140625, 0.39734649658203125, 0.40966796875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 25.0, 106.0, 390.0, 353.0, 95.0, 27.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42734280228614807, -0.41263318061828613, -0.3979235589504242, -0.38321393728256226, -0.36850428581237793, -0.353794664144516, -0.33908504247665405, -0.3243754208087921, -0.3096657991409302, -0.29495617747306824, -0.2802465558052063, -0.265536904335022, -0.25082728266716003, -0.2361176609992981, -0.22140803933143616, -0.20669841766357422, -0.1919887661933899, -0.17727914452552795, -0.16256950795650482, -0.14785988628864288, -0.13315024971961975, -0.11844062805175781, -0.10373100638389587, -0.08902137726545334, -0.0743117481470108, -0.05960211902856827, -0.04489249363541603, -0.030182868242263794, -0.015473239123821259, -0.0007636100053787231, 0.013946011662483215, 0.02865564078092575, 0.0433652400970459, 0.058074869215488434, 0.07278449833393097, 0.08749412000179291, 0.10220374912023544, 0.11691337823867798, 0.13162299990653992, 0.14633262157440186, 0.161042258143425, 0.17575187981128693, 0.19046151638031006, 0.205171138048172, 0.21988075971603394, 0.23459039628505707, 0.249300017952919, 0.26400965452194214, 0.2787192761898041, 0.293428897857666, 0.30813851952552795, 0.3228481411933899, 0.3375577926635742, 0.35226741433143616, 0.3669770359992981, 0.38168665766716003, 0.396396279335022, 0.4111059010028839, 0.42581552267074585, 0.4405251741409302, 0.4552347958087921, 0.46994441747665405, 0.484654039144516, 0.49936366081237793, 0.5140733122825623]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 9.0, 11.0, 21.0, 13.0, 32.0, 39.0, 43.0, 56.0, 53.0, 78.0, 65.0, 55.0, 65.0, 65.0, 53.0, 55.0, 65.0, 49.0, 34.0, 31.0, 35.0, 25.0, 13.0, 9.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15926963090896606, -0.15427462756633759, -0.1492796242237091, -0.14428460597991943, -0.13928960263729095, -0.13429459929466248, -0.129299595952034, -0.12430459260940552, -0.11930958181619644, -0.11431457847356796, -0.10931956768035889, -0.10432456433773041, -0.09932956099510193, -0.09433455020189285, -0.08933954685926437, -0.0843445360660553, -0.07934953272342682, -0.07435452938079834, -0.06935951858758926, -0.06436451524496078, -0.05936950817704201, -0.05437450110912323, -0.04937949776649475, -0.044384490698575974, -0.039389483630657196, -0.03439447656273842, -0.02939947135746479, -0.024404466152191162, -0.019409459084272385, -0.014414452016353607, -0.009419446811079979, -0.004424441605806351, 0.0005705654621124268, 0.00556557159870863, 0.010560577735304832, 0.015555583871901035, 0.020550590008497238, 0.025545597076416016, 0.030540602281689644, 0.03553560748696327, 0.04053061455488205, 0.04552562162280083, 0.050520628690719604, 0.055515632033348083, 0.06051063910126686, 0.06550564616918564, 0.07050064951181412, 0.0754956603050232, 0.08049066364765167, 0.08548566699028015, 0.09048067778348923, 0.0954756811261177, 0.10047069191932678, 0.10546569526195526, 0.11046069860458374, 0.11545570194721222, 0.1204507127404213, 0.12544572353363037, 0.13044072687625885, 0.13543573021888733, 0.1404307335615158, 0.1454257369041443, 0.15042075514793396, 0.15541575849056244, 0.16041076183319092]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 8.0, 8.0, 6.0, 7.0, 15.0, 10.0, 21.0, 17.0, 20.0, 24.0, 25.0, 13.0, 37.0, 26.0, 29.0, 21.0, 33.0, 37.0, 30.0, 33.0, 39.0, 27.0, 33.0, 40.0, 43.0, 38.0, 39.0, 39.0, 27.0, 32.0, 26.0, 27.0, 20.0, 26.0, 15.0, 14.0, 18.0, 11.0, 13.0, 6.0, 11.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.321044921875, -0.3098182678222656, -0.29859161376953125, -0.2873649597167969, -0.2761383056640625, -0.2649116516113281, -0.25368499755859375, -0.24245834350585938, -0.231231689453125, -0.22000503540039062, -0.20877838134765625, -0.19755172729492188, -0.1863250732421875, -0.17509841918945312, -0.16387176513671875, -0.15264511108398438, -0.14141845703125, -0.13019180297851562, -0.11896514892578125, -0.10773849487304688, -0.0965118408203125, -0.08528518676757812, -0.07405853271484375, -0.06283187866210938, -0.051605224609375, -0.040378570556640625, -0.02915191650390625, -0.017925262451171875, -0.0066986083984375, 0.004528045654296875, 0.01575469970703125, 0.026981353759765625, 0.0382080078125, 0.049434661865234375, 0.06066131591796875, 0.07188796997070312, 0.0831146240234375, 0.09434127807617188, 0.10556793212890625, 0.11679458618164062, 0.128021240234375, 0.13924789428710938, 0.15047454833984375, 0.16170120239257812, 0.1729278564453125, 0.18415451049804688, 0.19538116455078125, 0.20660781860351562, 0.21783447265625, 0.22906112670898438, 0.24028778076171875, 0.2515144348144531, 0.2627410888671875, 0.2739677429199219, 0.28519439697265625, 0.2964210510253906, 0.307647705078125, 0.3188743591308594, 0.33010101318359375, 0.3413276672363281, 0.3525543212890625, 0.3637809753417969, 0.37500762939453125, 0.3862342834472656, 0.3974609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 12.0, 13.0, 25.0, 20.0, 36.0, 63.0, 94.0, 144.0, 165.0, 220.0, 394.0, 562.0, 858.0, 1331.0, 2172.0, 3299.0, 5295.0, 8897.0, 14895.0, 26358.0, 48740.0, 96675.0, 207526.0, 300714.0, 160083.0, 76312.0, 39304.0, 21688.0, 12571.0, 7584.0, 4472.0, 2789.0, 1867.0, 1082.0, 747.0, 518.0, 316.0, 226.0, 161.0, 92.0, 60.0, 45.0, 38.0, 23.0, 23.0, 14.0, 12.0, 7.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.4521484375, -0.4385833740234375, -0.425018310546875, -0.4114532470703125, -0.39788818359375, -0.3843231201171875, -0.370758056640625, -0.3571929931640625, -0.3436279296875, -0.3300628662109375, -0.316497802734375, -0.3029327392578125, -0.28936767578125, -0.2758026123046875, -0.262237548828125, -0.2486724853515625, -0.235107421875, -0.2215423583984375, -0.207977294921875, -0.1944122314453125, -0.18084716796875, -0.1672821044921875, -0.153717041015625, -0.1401519775390625, -0.1265869140625, -0.1130218505859375, -0.099456787109375, -0.0858917236328125, -0.07232666015625, -0.0587615966796875, -0.045196533203125, -0.0316314697265625, -0.01806640625, -0.0045013427734375, 0.009063720703125, 0.0226287841796875, 0.03619384765625, 0.0497589111328125, 0.063323974609375, 0.0768890380859375, 0.0904541015625, 0.1040191650390625, 0.117584228515625, 0.1311492919921875, 0.14471435546875, 0.1582794189453125, 0.171844482421875, 0.1854095458984375, 0.198974609375, 0.2125396728515625, 0.226104736328125, 0.2396697998046875, 0.25323486328125, 0.2667999267578125, 0.280364990234375, 0.2939300537109375, 0.3074951171875, 0.3210601806640625, 0.334625244140625, 0.3481903076171875, 0.36175537109375, 0.3753204345703125, 0.388885498046875, 0.4024505615234375, 0.416015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 13.0, 14.0, 14.0, 23.0, 17.0, 28.0, 21.0, 28.0, 32.0, 38.0, 46.0, 59.0, 71.0, 107.0, 176.0, 1348.0, 273.0, 179.0, 115.0, 68.0, 47.0, 42.0, 31.0, 35.0, 31.0, 24.0, 17.0, 26.0, 21.0, 11.0, 15.0, 9.0, 10.0, 8.0, 8.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2734375, -1.2307891845703125, -1.188140869140625, -1.1454925537109375, -1.10284423828125, -1.0601959228515625, -1.017547607421875, -0.9748992919921875, -0.9322509765625, -0.8896026611328125, -0.846954345703125, -0.8043060302734375, -0.76165771484375, -0.7190093994140625, -0.676361083984375, -0.6337127685546875, -0.591064453125, -0.5484161376953125, -0.505767822265625, -0.4631195068359375, -0.42047119140625, -0.3778228759765625, -0.335174560546875, -0.2925262451171875, -0.2498779296875, -0.2072296142578125, -0.164581298828125, -0.1219329833984375, -0.07928466796875, -0.0366363525390625, 0.006011962890625, 0.0486602783203125, 0.09130859375, 0.1339569091796875, 0.176605224609375, 0.2192535400390625, 0.26190185546875, 0.3045501708984375, 0.347198486328125, 0.3898468017578125, 0.4324951171875, 0.4751434326171875, 0.517791748046875, 0.5604400634765625, 0.60308837890625, 0.6457366943359375, 0.688385009765625, 0.7310333251953125, 0.773681640625, 0.8163299560546875, 0.858978271484375, 0.9016265869140625, 0.94427490234375, 0.9869232177734375, 1.029571533203125, 1.0722198486328125, 1.1148681640625, 1.1575164794921875, 1.200164794921875, 1.2428131103515625, 1.28546142578125, 1.3281097412109375, 1.370758056640625, 1.4134063720703125, 1.4560546875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 11.0, 4.0, 17.0, 21.0, 15.0, 21.0, 38.0, 48.0, 66.0, 79.0, 125.0, 183.0, 324.0, 553.0, 1044.0, 2986.0, 15692.0, 292514.0, 2706301.0, 112101.0, 9172.0, 2177.0, 897.0, 462.0, 296.0, 172.0, 102.0, 92.0, 42.0, 44.0, 33.0, 20.0, 14.0, 15.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.05487060546875, -1.9769287109375, -1.89898681640625, -1.821044921875, -1.74310302734375, -1.6651611328125, -1.58721923828125, -1.50927734375, -1.43133544921875, -1.3533935546875, -1.27545166015625, -1.197509765625, -1.11956787109375, -1.0416259765625, -0.96368408203125, -0.8857421875, -0.80780029296875, -0.7298583984375, -0.65191650390625, -0.573974609375, -0.49603271484375, -0.4180908203125, -0.34014892578125, -0.26220703125, -0.18426513671875, -0.1063232421875, -0.02838134765625, 0.049560546875, 0.12750244140625, 0.2054443359375, 0.28338623046875, 0.361328125, 0.43927001953125, 0.5172119140625, 0.59515380859375, 0.673095703125, 0.75103759765625, 0.8289794921875, 0.90692138671875, 0.98486328125, 1.06280517578125, 1.1407470703125, 1.21868896484375, 1.296630859375, 1.37457275390625, 1.4525146484375, 1.53045654296875, 1.6083984375, 1.68634033203125, 1.7642822265625, 1.84222412109375, 1.920166015625, 1.99810791015625, 2.0760498046875, 2.15399169921875, 2.23193359375, 2.30987548828125, 2.3878173828125, 2.46575927734375, 2.543701171875, 2.62164306640625, 2.6995849609375, 2.77752685546875, 2.85546875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [354.0, 662.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.026209592819214, -0.17567121982574463, 1.6748671531677246, 3.5254056453704834, 5.375944137573242, 7.226482391357422, 9.077020645141602, 10.927558898925781, 12.778097152709961, 14.62863540649414, 16.47917366027832, 18.3297119140625, 20.18025016784668, 22.03078842163086, 23.881328582763672, 25.73186492919922, 27.58240509033203, 29.43294334411621, 31.28348159790039, 33.1340217590332, 34.98455810546875, 36.83509826660156, 38.68563461303711, 40.53617477416992, 42.38671112060547, 44.23725128173828, 46.08778762817383, 47.93832778930664, 49.78886413574219, 51.639404296875, 53.48994064331055, 55.34048080444336, 57.19102096557617, 59.041561126708984, 60.89209747314453, 62.742637634277344, 64.59317779541016, 66.44371032714844, 68.29425048828125, 70.14479064941406, 71.99533081054688, 73.84587097167969, 75.6964111328125, 77.54694366455078, 79.3974838256836, 81.2480239868164, 83.09856414794922, 84.9490966796875, 86.79963684082031, 88.65017700195312, 90.50071716308594, 92.35124969482422, 94.20178985595703, 96.05233001708984, 97.90287017822266, 99.75340270996094, 101.60394287109375, 103.45448303222656, 105.30502319335938, 107.15555572509766, 109.00609588623047, 110.85663604736328, 112.7071762084961, 114.55770874023438, 116.40824890136719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 10.0, 14.0, 16.0, 18.0, 17.0, 30.0, 29.0, 36.0, 28.0, 42.0, 34.0, 44.0, 38.0, 45.0, 50.0, 49.0, 50.0, 44.0, 31.0, 39.0, 35.0, 36.0, 33.0, 37.0, 22.0, 35.0, 22.0, 21.0, 21.0, 20.0, 13.0, 8.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.105642318725586, -4.958823204040527, -4.812004089355469, -4.665184497833252, -4.518365383148193, -4.371546268463135, -4.224727153778076, -4.077908039093018, -3.93108868598938, -3.7842695713043213, -3.6374502182006836, -3.490631103515625, -3.3438119888305664, -3.1969926357269287, -3.05017352104187, -2.9033541679382324, -2.756535053253174, -2.6097159385681152, -2.4628965854644775, -2.316077470779419, -2.1692581176757812, -2.0224390029907227, -1.875619888305664, -1.728800654411316, -1.5819814205169678, -1.4351621866226196, -1.2883429527282715, -1.141523838043213, -0.9947046041488647, -0.8478853702545166, -0.7010661959648132, -0.5542470216751099, -0.4074277877807617, -0.26060858368873596, -0.1137893795967102, 0.03302982449531555, 0.1798490285873413, 0.32666826248168945, 0.4734874367713928, 0.6203066110610962, 0.7671258449554443, 0.9139450788497925, 1.0607643127441406, 1.2075834274291992, 1.3544026613235474, 1.5012218952178955, 1.648041009902954, 1.7948602437973022, 1.9416794776916504, 2.088498592376709, 2.2353179454803467, 2.3821370601654053, 2.528956413269043, 2.6757755279541016, 2.82259464263916, 2.9694137573242188, 3.1162331104278564, 3.263052225112915, 3.4098715782165527, 3.5566906929016113, 3.70350980758667, 3.8503291606903076, 3.997148275375366, 4.143967628479004, 4.2907867431640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 13.0, 9.0, 7.0, 5.0, 11.0, 11.0, 21.0, 17.0, 15.0, 23.0, 21.0, 37.0, 26.0, 33.0, 30.0, 38.0, 32.0, 35.0, 42.0, 42.0, 37.0, 46.0, 33.0, 50.0, 35.0, 33.0, 32.0, 23.0, 37.0, 36.0, 29.0, 25.0, 16.0, 15.0, 20.0, 14.0, 10.0, 8.0, 5.0, 5.0, 1.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.35843658447265625, -0.3455352783203125, -0.33263397216796875, -0.319732666015625, -0.30683135986328125, -0.2939300537109375, -0.28102874755859375, -0.26812744140625, -0.25522613525390625, -0.2423248291015625, -0.22942352294921875, -0.216522216796875, -0.20362091064453125, -0.1907196044921875, -0.17781829833984375, -0.1649169921875, -0.15201568603515625, -0.1391143798828125, -0.12621307373046875, -0.113311767578125, -0.10041046142578125, -0.0875091552734375, -0.07460784912109375, -0.06170654296875, -0.04880523681640625, -0.0359039306640625, -0.02300262451171875, -0.010101318359375, 0.00279998779296875, 0.0157012939453125, 0.02860260009765625, 0.04150390625, 0.05440521240234375, 0.0673065185546875, 0.08020782470703125, 0.093109130859375, 0.10601043701171875, 0.1189117431640625, 0.13181304931640625, 0.14471435546875, 0.15761566162109375, 0.1705169677734375, 0.18341827392578125, 0.196319580078125, 0.20922088623046875, 0.2221221923828125, 0.23502349853515625, 0.2479248046875, 0.26082611083984375, 0.2737274169921875, 0.28662872314453125, 0.299530029296875, 0.31243133544921875, 0.3253326416015625, 0.33823394775390625, 0.35113525390625, 0.36403656005859375, 0.3769378662109375, 0.38983917236328125, 0.402740478515625, 0.41564178466796875, 0.4285430908203125, 0.44144439697265625, 0.454345703125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 6.0, 12.0, 11.0, 20.0, 29.0, 47.0, 51.0, 79.0, 98.0, 129.0, 212.0, 283.0, 442.0, 637.0, 951.0, 1594.0, 2606.0, 4891.0, 9502.0, 21110.0, 61591.0, 291980.0, 1845406.0, 1612560.0, 243888.0, 55232.0, 20021.0, 9102.0, 4784.0, 2597.0, 1512.0, 924.0, 618.0, 440.0, 269.0, 192.0, 139.0, 91.0, 62.0, 49.0, 33.0, 27.0, 16.0, 12.0, 13.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.91259765625, -0.8857192993164062, -0.8588409423828125, -0.8319625854492188, -0.805084228515625, -0.7782058715820312, -0.7513275146484375, -0.7244491577148438, -0.69757080078125, -0.6706924438476562, -0.6438140869140625, -0.6169357299804688, -0.590057373046875, -0.5631790161132812, -0.5363006591796875, -0.5094223022460938, -0.4825439453125, -0.45566558837890625, -0.4287872314453125, -0.40190887451171875, -0.375030517578125, -0.34815216064453125, -0.3212738037109375, -0.29439544677734375, -0.26751708984375, -0.24063873291015625, -0.2137603759765625, -0.18688201904296875, -0.160003662109375, -0.13312530517578125, -0.1062469482421875, -0.07936859130859375, -0.052490234375, -0.02561187744140625, 0.0012664794921875, 0.02814483642578125, 0.055023193359375, 0.08190155029296875, 0.1087799072265625, 0.13565826416015625, 0.16253662109375, 0.18941497802734375, 0.2162933349609375, 0.24317169189453125, 0.270050048828125, 0.29692840576171875, 0.3238067626953125, 0.35068511962890625, 0.3775634765625, 0.40444183349609375, 0.4313201904296875, 0.45819854736328125, 0.485076904296875, 0.5119552612304688, 0.5388336181640625, 0.5657119750976562, 0.59259033203125, 0.6194686889648438, 0.6463470458984375, 0.6732254028320312, 0.700103759765625, 0.7269821166992188, 0.7538604736328125, 0.7807388305664062, 0.8076171875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 3.0, 19.0, 15.0, 19.0, 28.0, 48.0, 50.0, 79.0, 116.0, 180.0, 346.0, 547.0, 745.0, 640.0, 397.0, 267.0, 165.0, 112.0, 69.0, 58.0, 36.0, 28.0, 24.0, 18.0, 16.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0934295654296875, -1.057952880859375, -1.0224761962890625, -0.98699951171875, -0.9515228271484375, -0.916046142578125, -0.8805694580078125, -0.8450927734375, -0.8096160888671875, -0.774139404296875, -0.7386627197265625, -0.70318603515625, -0.6677093505859375, -0.632232666015625, -0.5967559814453125, -0.561279296875, -0.5258026123046875, -0.490325927734375, -0.4548492431640625, -0.41937255859375, -0.3838958740234375, -0.348419189453125, -0.3129425048828125, -0.2774658203125, -0.2419891357421875, -0.206512451171875, -0.1710357666015625, -0.13555908203125, -0.1000823974609375, -0.064605712890625, -0.0291290283203125, 0.00634765625, 0.0418243408203125, 0.077301025390625, 0.1127777099609375, 0.14825439453125, 0.1837310791015625, 0.219207763671875, 0.2546844482421875, 0.2901611328125, 0.3256378173828125, 0.361114501953125, 0.3965911865234375, 0.43206787109375, 0.4675445556640625, 0.503021240234375, 0.5384979248046875, 0.573974609375, 0.6094512939453125, 0.644927978515625, 0.6804046630859375, 0.71588134765625, 0.7513580322265625, 0.786834716796875, 0.8223114013671875, 0.8577880859375, 0.8932647705078125, 0.928741455078125, 0.9642181396484375, 0.99969482421875, 1.0351715087890625, 1.070648193359375, 1.1061248779296875, 1.1416015625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 4.0, 6.0, 10.0, 15.0, 22.0, 36.0, 39.0, 75.0, 123.0, 172.0, 263.0, 404.0, 657.0, 1048.0, 1916.0, 3209.0, 6636.0, 15286.0, 42345.0, 168976.0, 1453019.0, 2173363.0, 238129.0, 53628.0, 18197.0, 7868.0, 3686.0, 2009.0, 1193.0, 697.0, 454.0, 273.0, 193.0, 108.0, 74.0, 48.0, 34.0, 22.0, 13.0, 12.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4097442626953125, -1.364410400390625, -1.3190765380859375, -1.27374267578125, -1.2284088134765625, -1.183074951171875, -1.1377410888671875, -1.0924072265625, -1.0470733642578125, -1.001739501953125, -0.9564056396484375, -0.91107177734375, -0.8657379150390625, -0.820404052734375, -0.7750701904296875, -0.729736328125, -0.6844024658203125, -0.639068603515625, -0.5937347412109375, -0.54840087890625, -0.5030670166015625, -0.457733154296875, -0.4123992919921875, -0.3670654296875, -0.3217315673828125, -0.276397705078125, -0.2310638427734375, -0.18572998046875, -0.1403961181640625, -0.095062255859375, -0.0497283935546875, -0.00439453125, 0.0409393310546875, 0.086273193359375, 0.1316070556640625, 0.17694091796875, 0.2222747802734375, 0.267608642578125, 0.3129425048828125, 0.3582763671875, 0.4036102294921875, 0.448944091796875, 0.4942779541015625, 0.53961181640625, 0.5849456787109375, 0.630279541015625, 0.6756134033203125, 0.720947265625, 0.7662811279296875, 0.811614990234375, 0.8569488525390625, 0.90228271484375, 0.9476165771484375, 0.992950439453125, 1.0382843017578125, 1.0836181640625, 1.1289520263671875, 1.174285888671875, 1.2196197509765625, 1.26495361328125, 1.3102874755859375, 1.355621337890625, 1.4009552001953125, 1.4462890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 16.0, 39.0, 72.0, 189.0, 247.0, 245.0, 111.0, 42.0, 22.0, 14.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.698354721069336, -8.31443977355957, -7.930525302886963, -7.546610355377197, -7.16269588470459, -6.778780937194824, -6.394865989685059, -6.010951042175293, -5.6270365715026855, -5.24312162399292, -4.8592071533203125, -4.475292205810547, -4.091377258300781, -3.707462787628174, -3.323547840118408, -2.9396331310272217, -2.555718421936035, -2.1718037128448486, -1.7878888845443726, -1.4039740562438965, -1.02005934715271, -0.6361446380615234, -0.2522296905517578, 0.1316850185394287, 0.5155997276306152, 0.8995144963264465, 1.2834292650222778, 1.667344093322754, 2.0512588024139404, 2.435173511505127, 2.8190884590148926, 3.203003168106079, 3.586916923522949, 3.9708316326141357, 4.354746341705322, 4.738661289215088, 5.122575759887695, 5.506490707397461, 5.890405654907227, 6.274320602416992, 6.6582350730896, 7.042150020599365, 7.426064491271973, 7.809979438781738, 8.193894386291504, 8.577808380126953, 8.961723327636719, 9.345638275146484, 9.72955322265625, 10.113468170166016, 10.497383117675781, 10.881298065185547, 11.265212059020996, 11.649127006530762, 12.033041954040527, 12.416956901550293, 12.800870895385742, 13.184785842895508, 13.568700790405273, 13.952615737915039, 14.336529731750488, 14.720444679260254, 15.10435962677002, 15.488274574279785, 15.87218952178955]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 6.0, 8.0, 12.0, 15.0, 10.0, 28.0, 20.0, 24.0, 26.0, 41.0, 27.0, 37.0, 39.0, 47.0, 40.0, 36.0, 39.0, 55.0, 45.0, 38.0, 47.0, 42.0, 41.0, 39.0, 38.0, 29.0, 32.0, 24.0, 23.0, 14.0, 18.0, 8.0, 4.0, 6.0, 9.0, 4.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.924111843109131, -2.822512626647949, -2.7209131717681885, -2.619313955307007, -2.517714738845825, -2.4161152839660645, -2.314516067504883, -2.212916851043701, -2.1113176345825195, -2.009718418121338, -1.9081190824508667, -1.8065197467803955, -1.7049205303192139, -1.6033211946487427, -1.5017218589782715, -1.4001226425170898, -1.2985233068466187, -1.1969239711761475, -1.0953247547149658, -0.9937254190444946, -0.892126202583313, -0.7905268669128418, -0.6889275908470154, -0.587328314781189, -0.48572903871536255, -0.38412976264953613, -0.2825304865837097, -0.1809311807155609, -0.0793319046497345, 0.022267401218414307, 0.12386667728424072, 0.22546595335006714, 0.32706522941589355, 0.42866450548171997, 0.5302637815475464, 0.6318631172180176, 0.7334623336791992, 0.8350616693496704, 0.9366609454154968, 1.0382602214813232, 1.1398594379425049, 1.241458773612976, 1.3430579900741577, 1.444657325744629, 1.5462565422058105, 1.6478558778762817, 1.749455213546753, 1.8510544300079346, 1.9526537656784058, 2.054253101348877, 2.1558523178100586, 2.2574515342712402, 2.359050989151001, 2.4606502056121826, 2.5622494220733643, 2.663848876953125, 2.7654480934143066, 2.8670473098754883, 2.968646764755249, 3.0702459812164307, 3.1718451976776123, 3.273444652557373, 3.3750438690185547, 3.4766430854797363, 3.578242301940918]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 10.0, 12.0, 8.0, 11.0, 14.0, 15.0, 16.0, 19.0, 32.0, 28.0, 21.0, 25.0, 35.0, 36.0, 43.0, 47.0, 47.0, 34.0, 33.0, 54.0, 26.0, 43.0, 31.0, 34.0, 30.0, 39.0, 31.0, 38.0, 28.0, 18.0, 21.0, 29.0, 20.0, 11.0, 2.0, 6.0, 9.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.39306640625, -0.38005828857421875, -0.3670501708984375, -0.35404205322265625, -0.341033935546875, -0.32802581787109375, -0.3150177001953125, -0.30200958251953125, -0.28900146484375, -0.27599334716796875, -0.2629852294921875, -0.24997711181640625, -0.236968994140625, -0.22396087646484375, -0.2109527587890625, -0.19794464111328125, -0.1849365234375, -0.17192840576171875, -0.1589202880859375, -0.14591217041015625, -0.132904052734375, -0.11989593505859375, -0.1068878173828125, -0.09387969970703125, -0.08087158203125, -0.06786346435546875, -0.0548553466796875, -0.04184722900390625, -0.028839111328125, -0.01583099365234375, -0.0028228759765625, 0.01018524169921875, 0.023193359375, 0.03620147705078125, 0.0492095947265625, 0.06221771240234375, 0.075225830078125, 0.08823394775390625, 0.1012420654296875, 0.11425018310546875, 0.12725830078125, 0.14026641845703125, 0.1532745361328125, 0.16628265380859375, 0.179290771484375, 0.19229888916015625, 0.2053070068359375, 0.21831512451171875, 0.2313232421875, 0.24433135986328125, 0.2573394775390625, 0.27034759521484375, 0.283355712890625, 0.29636383056640625, 0.3093719482421875, 0.32238006591796875, 0.33538818359375, 0.34839630126953125, 0.3614044189453125, 0.37441253662109375, 0.387420654296875, 0.40042877197265625, 0.4134368896484375, 0.42644500732421875, 0.439453125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 15.0, 15.0, 30.0, 39.0, 61.0, 94.0, 133.0, 193.0, 305.0, 498.0, 716.0, 1070.0, 1801.0, 2922.0, 4643.0, 8012.0, 13654.0, 24691.0, 44853.0, 79579.0, 131875.0, 185705.0, 193148.0, 144905.0, 90533.0, 51846.0, 28560.0, 15843.0, 8941.0, 5319.0, 3038.0, 1961.0, 1212.0, 802.0, 491.0, 335.0, 228.0, 148.0, 102.0, 66.0, 53.0, 39.0, 21.0, 14.0, 5.0, 11.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.33642578125, -0.32595062255859375, -0.3154754638671875, -0.30500030517578125, -0.294525146484375, -0.28404998779296875, -0.2735748291015625, -0.26309967041015625, -0.25262451171875, -0.24214935302734375, -0.2316741943359375, -0.22119903564453125, -0.210723876953125, -0.20024871826171875, -0.1897735595703125, -0.17929840087890625, -0.1688232421875, -0.15834808349609375, -0.1478729248046875, -0.13739776611328125, -0.126922607421875, -0.11644744873046875, -0.1059722900390625, -0.09549713134765625, -0.08502197265625, -0.07454681396484375, -0.0640716552734375, -0.05359649658203125, -0.043121337890625, -0.03264617919921875, -0.0221710205078125, -0.01169586181640625, -0.001220703125, 0.00925445556640625, 0.0197296142578125, 0.03020477294921875, 0.040679931640625, 0.05115509033203125, 0.0616302490234375, 0.07210540771484375, 0.08258056640625, 0.09305572509765625, 0.1035308837890625, 0.11400604248046875, 0.124481201171875, 0.13495635986328125, 0.1454315185546875, 0.15590667724609375, 0.1663818359375, 0.17685699462890625, 0.1873321533203125, 0.19780731201171875, 0.208282470703125, 0.21875762939453125, 0.2292327880859375, 0.23970794677734375, 0.25018310546875, 0.26065826416015625, 0.2711334228515625, 0.28160858154296875, 0.292083740234375, 0.30255889892578125, 0.3130340576171875, 0.32350921630859375, 0.333984375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 11.0, 11.0, 22.0, 13.0, 15.0, 19.0, 21.0, 21.0, 24.0, 29.0, 36.0, 34.0, 26.0, 34.0, 42.0, 30.0, 37.0, 51.0, 1062.0, 50.0, 41.0, 35.0, 41.0, 37.0, 34.0, 37.0, 29.0, 24.0, 21.0, 20.0, 23.0, 16.0, 9.0, 8.0, 11.0, 6.0, 6.0, 8.0, 4.0, 1.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.3671875, -0.3567237854003906, -0.34626007080078125, -0.3357963562011719, -0.3253326416015625, -0.3148689270019531, -0.30440521240234375, -0.2939414978027344, -0.283477783203125, -0.2730140686035156, -0.26255035400390625, -0.2520866394042969, -0.2416229248046875, -0.23115921020507812, -0.22069549560546875, -0.21023178100585938, -0.19976806640625, -0.18930435180664062, -0.17884063720703125, -0.16837692260742188, -0.1579132080078125, -0.14744949340820312, -0.13698577880859375, -0.12652206420898438, -0.116058349609375, -0.10559463500976562, -0.09513092041015625, -0.08466720581054688, -0.0742034912109375, -0.06373977661132812, -0.05327606201171875, -0.042812347412109375, -0.0323486328125, -0.021884918212890625, -0.01142120361328125, -0.000957489013671875, 0.0095062255859375, 0.019969940185546875, 0.03043365478515625, 0.040897369384765625, 0.051361083984375, 0.061824798583984375, 0.07228851318359375, 0.08275222778320312, 0.0932159423828125, 0.10367965698242188, 0.11414337158203125, 0.12460708618164062, 0.13507080078125, 0.14553451538085938, 0.15599822998046875, 0.16646194458007812, 0.1769256591796875, 0.18738937377929688, 0.19785308837890625, 0.20831680297851562, 0.218780517578125, 0.22924423217773438, 0.23970794677734375, 0.2501716613769531, 0.2606353759765625, 0.2710990905761719, 0.28156280517578125, 0.2920265197753906, 0.302490234375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 19.0, 12.0, 25.0, 35.0, 52.0, 60.0, 91.0, 133.0, 207.0, 358.0, 528.0, 750.0, 1207.0, 1707.0, 2631.0, 4058.0, 6324.0, 10290.0, 18273.0, 40532.0, 373305.0, 1529491.0, 54196.0, 21063.0, 11595.0, 7117.0, 4461.0, 2837.0, 1904.0, 1280.0, 811.0, 560.0, 392.0, 283.0, 165.0, 118.0, 74.0, 56.0, 46.0, 20.0, 22.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.472412109375, -0.45856475830078125, -0.4447174072265625, -0.43087005615234375, -0.417022705078125, -0.40317535400390625, -0.3893280029296875, -0.37548065185546875, -0.36163330078125, -0.34778594970703125, -0.3339385986328125, -0.32009124755859375, -0.306243896484375, -0.29239654541015625, -0.2785491943359375, -0.26470184326171875, -0.2508544921875, -0.23700714111328125, -0.2231597900390625, -0.20931243896484375, -0.195465087890625, -0.18161773681640625, -0.1677703857421875, -0.15392303466796875, -0.14007568359375, -0.12622833251953125, -0.1123809814453125, -0.09853363037109375, -0.084686279296875, -0.07083892822265625, -0.0569915771484375, -0.04314422607421875, -0.029296875, -0.01544952392578125, -0.0016021728515625, 0.01224517822265625, 0.026092529296875, 0.03993988037109375, 0.0537872314453125, 0.06763458251953125, 0.08148193359375, 0.09532928466796875, 0.1091766357421875, 0.12302398681640625, 0.136871337890625, 0.15071868896484375, 0.1645660400390625, 0.17841339111328125, 0.1922607421875, 0.20610809326171875, 0.2199554443359375, 0.23380279541015625, 0.247650146484375, 0.26149749755859375, 0.2753448486328125, 0.28919219970703125, 0.30303955078125, 0.31688690185546875, 0.3307342529296875, 0.34458160400390625, 0.358428955078125, 0.37227630615234375, 0.3861236572265625, 0.39997100830078125, 0.413818359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 2.0, 2.0, 3.0, 13.0, 12.0, 22.0, 20.0, 22.0, 30.0, 31.0, 43.0, 58.0, 61.0, 86.0, 82.0, 80.0, 67.0, 79.0, 55.0, 44.0, 39.0, 31.0, 27.0, 18.0, 15.0, 18.0, 12.0, 6.0, 4.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.031522274017333984, -0.03060436248779297, -0.029686450958251953, -0.028768539428710938, -0.027850627899169922, -0.026932716369628906, -0.02601480484008789, -0.025096893310546875, -0.02417898178100586, -0.023261070251464844, -0.022343158721923828, -0.021425247192382812, -0.020507335662841797, -0.01958942413330078, -0.018671512603759766, -0.01775360107421875, -0.016835689544677734, -0.01591777801513672, -0.014999866485595703, -0.014081954956054688, -0.013164043426513672, -0.012246131896972656, -0.01132822036743164, -0.010410308837890625, -0.00949239730834961, -0.008574485778808594, -0.007656574249267578, -0.0067386627197265625, -0.005820751190185547, -0.004902839660644531, -0.003984928131103516, -0.0030670166015625, -0.0021491050720214844, -0.0012311935424804688, -0.0003132820129394531, 0.0006046295166015625, 0.0015225410461425781, 0.0024404525756835938, 0.0033583641052246094, 0.004276275634765625, 0.005194187164306641, 0.006112098693847656, 0.007030010223388672, 0.007947921752929688, 0.008865833282470703, 0.009783744812011719, 0.010701656341552734, 0.01161956787109375, 0.012537479400634766, 0.013455390930175781, 0.014373302459716797, 0.015291213989257812, 0.016209125518798828, 0.017127037048339844, 0.01804494857788086, 0.018962860107421875, 0.01988077163696289, 0.020798683166503906, 0.021716594696044922, 0.022634506225585938, 0.023552417755126953, 0.02447032928466797, 0.025388240814208984, 0.02630615234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 10.0, 7.0, 18.0, 24.0, 35.0, 42.0, 65.0, 121.0, 170.0, 434.0, 1649.0, 19906.0, 782393.0, 234846.0, 7199.0, 871.0, 307.0, 138.0, 90.0, 67.0, 47.0, 28.0, 25.0, 19.0, 12.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3900337219238281, -0.37601470947265625, -0.3619956970214844, -0.3479766845703125, -0.3339576721191406, -0.31993865966796875, -0.3059196472167969, -0.291900634765625, -0.2778816223144531, -0.26386260986328125, -0.24984359741210938, -0.2358245849609375, -0.22180557250976562, -0.20778656005859375, -0.19376754760742188, -0.17974853515625, -0.16572952270507812, -0.15171051025390625, -0.13769149780273438, -0.1236724853515625, -0.10965347290039062, -0.09563446044921875, -0.08161544799804688, -0.067596435546875, -0.053577423095703125, -0.03955841064453125, -0.025539398193359375, -0.0115203857421875, 0.002498626708984375, 0.01651763916015625, 0.030536651611328125, 0.0445556640625, 0.058574676513671875, 0.07259368896484375, 0.08661270141601562, 0.1006317138671875, 0.11465072631835938, 0.12866973876953125, 0.14268875122070312, 0.156707763671875, 0.17072677612304688, 0.18474578857421875, 0.19876480102539062, 0.2127838134765625, 0.22680282592773438, 0.24082183837890625, 0.2548408508300781, 0.26885986328125, 0.2828788757324219, 0.29689788818359375, 0.3109169006347656, 0.3249359130859375, 0.3389549255371094, 0.35297393798828125, 0.3669929504394531, 0.381011962890625, 0.3950309753417969, 0.40904998779296875, 0.4230690002441406, 0.4370880126953125, 0.4511070251464844, 0.46512603759765625, 0.4791450500488281, 0.4931640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 4.0, 6.0, 2.0, 17.0, 12.0, 20.0, 28.0, 40.0, 70.0, 79.0, 133.0, 138.0, 143.0, 87.0, 66.0, 47.0, 32.0, 19.0, 15.0, 11.0, 6.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1612149029970169, -0.15643617510795593, -0.15165744721889496, -0.14687871932983398, -0.14209997653961182, -0.13732124865055084, -0.13254252076148987, -0.1277637928724289, -0.12298506498336792, -0.11820633709430695, -0.11342760920524597, -0.1086488738656044, -0.10387014597654343, -0.09909141808748245, -0.09431268274784088, -0.08953395485877991, -0.08475522696971893, -0.07997649908065796, -0.07519777119159698, -0.07041903585195541, -0.06564030796289444, -0.060861580073833466, -0.05608284845948219, -0.05130411684513092, -0.046525388956069946, -0.04174666106700897, -0.0369679294526577, -0.03218919783830643, -0.027410469949245453, -0.02263174019753933, -0.017853010445833206, -0.013074278831481934, -0.00829555094242096, -0.003516821190714836, 0.0012619085609912872, 0.006040638312697411, 0.010819368064403534, 0.015598097816109657, 0.02037682756781578, 0.025155559182167053, 0.029934287071228027, 0.034713014960289, 0.039491746574640274, 0.04427047818899155, 0.04904920607805252, 0.053827933967113495, 0.05860666558146477, 0.06338539719581604, 0.06816412508487701, 0.07294285297393799, 0.07772158086299896, 0.08250031620264053, 0.08727904409170151, 0.09205777198076248, 0.09683650732040405, 0.10161523520946503, 0.106393963098526, 0.11117269098758698, 0.11595141887664795, 0.12073015421628952, 0.1255088746547699, 0.13028761744499207, 0.13506634533405304, 0.139845073223114, 0.144623801112175]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 6.0, 12.0, 18.0, 9.0, 14.0, 24.0, 24.0, 19.0, 35.0, 30.0, 42.0, 33.0, 39.0, 44.0, 45.0, 35.0, 57.0, 42.0, 45.0, 31.0, 41.0, 42.0, 41.0, 33.0, 37.0, 28.0, 27.0, 24.0, 21.0, 16.0, 9.0, 15.0, 9.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0973542332649231, -0.09453877061605453, -0.09172330796718597, -0.08890784531831741, -0.08609238266944885, -0.0832769125699997, -0.08046144992113113, -0.07764598727226257, -0.07483052462339401, -0.07201506197452545, -0.06919959932565689, -0.06638413667678833, -0.06356866657733917, -0.06075320765376091, -0.05793774127960205, -0.05512227863073349, -0.05230681598186493, -0.04949135333299637, -0.04667589068412781, -0.04386042430996895, -0.04104496166110039, -0.03822949901223183, -0.03541403263807297, -0.03259856998920441, -0.029783107340335846, -0.026967644691467285, -0.024152180179953575, -0.021336715668439865, -0.018521253019571304, -0.015705790370702744, -0.012890325859189034, -0.010074861347675323, -0.007259398698806763, -0.004443935118615627, -0.0016284715384244919, 0.0011869920417666435, 0.004002455621957779, 0.006817919202148914, 0.00963338278234005, 0.01244884729385376, 0.01526430994272232, 0.01807977259159088, 0.02089523710310459, 0.0237107016146183, 0.026526164263486862, 0.029341626912355423, 0.03215709328651428, 0.03497255593538284, 0.037788018584251404, 0.040603481233119965, 0.043418943881988525, 0.046234410256147385, 0.049049872905015945, 0.051865335553884506, 0.054680801928043365, 0.057496264576911926, 0.06031172722578049, 0.06312718987464905, 0.06594265252351761, 0.06875811517238617, 0.07157358527183533, 0.07438904792070389, 0.07720451056957245, 0.08001997321844101, 0.08283543586730957]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 7.0, 13.0, 9.0, 8.0, 14.0, 16.0, 17.0, 16.0, 31.0, 30.0, 24.0, 25.0, 27.0, 35.0, 49.0, 40.0, 53.0, 33.0, 37.0, 44.0, 36.0, 38.0, 33.0, 37.0, 25.0, 38.0, 36.0, 37.0, 27.0, 22.0, 18.0, 28.0, 21.0, 12.0, 7.0, 3.0, 10.0, 4.0, 8.0, 8.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.395751953125, -0.3827247619628906, -0.36969757080078125, -0.3566703796386719, -0.3436431884765625, -0.3306159973144531, -0.31758880615234375, -0.3045616149902344, -0.291534423828125, -0.2785072326660156, -0.26548004150390625, -0.2524528503417969, -0.2394256591796875, -0.22639846801757812, -0.21337127685546875, -0.20034408569335938, -0.18731689453125, -0.17428970336914062, -0.16126251220703125, -0.14823532104492188, -0.1352081298828125, -0.12218093872070312, -0.10915374755859375, -0.09612655639648438, -0.083099365234375, -0.07007217407226562, -0.05704498291015625, -0.044017791748046875, -0.0309906005859375, -0.017963409423828125, -0.00493621826171875, 0.008090972900390625, 0.0211181640625, 0.034145355224609375, 0.04717254638671875, 0.060199737548828125, 0.0732269287109375, 0.08625411987304688, 0.09928131103515625, 0.11230850219726562, 0.125335693359375, 0.13836288452148438, 0.15139007568359375, 0.16441726684570312, 0.1774444580078125, 0.19047164916992188, 0.20349884033203125, 0.21652603149414062, 0.22955322265625, 0.24258041381835938, 0.25560760498046875, 0.2686347961425781, 0.2816619873046875, 0.2946891784667969, 0.30771636962890625, 0.3207435607910156, 0.333770751953125, 0.3467979431152344, 0.35982513427734375, 0.3728523254394531, 0.3858795166015625, 0.3989067077636719, 0.41193389892578125, 0.4249610900878906, 0.43798828125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 16.0, 22.0, 30.0, 39.0, 55.0, 93.0, 134.0, 272.0, 450.0, 823.0, 1500.0, 3186.0, 7136.0, 18343.0, 70352.0, 435148.0, 412666.0, 67294.0, 17598.0, 6943.0, 3094.0, 1494.0, 776.0, 408.0, 236.0, 147.0, 89.0, 81.0, 40.0, 21.0, 17.0, 6.0, 17.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3642578125, -1.3273696899414062, -1.2904815673828125, -1.2535934448242188, -1.216705322265625, -1.1798171997070312, -1.1429290771484375, -1.1060409545898438, -1.06915283203125, -1.0322647094726562, -0.9953765869140625, -0.9584884643554688, -0.921600341796875, -0.8847122192382812, -0.8478240966796875, -0.8109359741210938, -0.7740478515625, -0.7371597290039062, -0.7002716064453125, -0.6633834838867188, -0.626495361328125, -0.5896072387695312, -0.5527191162109375, -0.5158309936523438, -0.47894287109375, -0.44205474853515625, -0.4051666259765625, -0.36827850341796875, -0.331390380859375, -0.29450225830078125, -0.2576141357421875, -0.22072601318359375, -0.183837890625, -0.14694976806640625, -0.1100616455078125, -0.07317352294921875, -0.036285400390625, 0.00060272216796875, 0.0374908447265625, 0.07437896728515625, 0.11126708984375, 0.14815521240234375, 0.1850433349609375, 0.22193145751953125, 0.258819580078125, 0.29570770263671875, 0.3325958251953125, 0.36948394775390625, 0.4063720703125, 0.44326019287109375, 0.4801483154296875, 0.5170364379882812, 0.553924560546875, 0.5908126831054688, 0.6277008056640625, 0.6645889282226562, 0.70147705078125, 0.7383651733398438, 0.7752532958984375, 0.8121414184570312, 0.849029541015625, 0.8859176635742188, 0.9228057861328125, 0.9596939086914062, 0.99658203125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 12.0, 11.0, 12.0, 23.0, 15.0, 17.0, 24.0, 24.0, 29.0, 43.0, 29.0, 32.0, 53.0, 60.0, 73.0, 87.0, 219.0, 1371.0, 292.0, 150.0, 87.0, 67.0, 46.0, 44.0, 33.0, 31.0, 27.0, 24.0, 19.0, 19.0, 16.0, 8.0, 13.0, 10.0, 11.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5251617431640625, -1.477081298828125, -1.4290008544921875, -1.38092041015625, -1.3328399658203125, -1.284759521484375, -1.2366790771484375, -1.1885986328125, -1.1405181884765625, -1.092437744140625, -1.0443572998046875, -0.99627685546875, -0.9481964111328125, -0.900115966796875, -0.8520355224609375, -0.803955078125, -0.7558746337890625, -0.707794189453125, -0.6597137451171875, -0.61163330078125, -0.5635528564453125, -0.515472412109375, -0.4673919677734375, -0.4193115234375, -0.3712310791015625, -0.323150634765625, -0.2750701904296875, -0.22698974609375, -0.1789093017578125, -0.130828857421875, -0.0827484130859375, -0.03466796875, 0.0134124755859375, 0.061492919921875, 0.1095733642578125, 0.15765380859375, 0.2057342529296875, 0.253814697265625, 0.3018951416015625, 0.3499755859375, 0.3980560302734375, 0.446136474609375, 0.4942169189453125, 0.54229736328125, 0.5903778076171875, 0.638458251953125, 0.6865386962890625, 0.734619140625, 0.7826995849609375, 0.830780029296875, 0.8788604736328125, 0.92694091796875, 0.9750213623046875, 1.023101806640625, 1.0711822509765625, 1.1192626953125, 1.1673431396484375, 1.215423583984375, 1.2635040283203125, 1.31158447265625, 1.3596649169921875, 1.407745361328125, 1.4558258056640625, 1.50390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 16.0, 8.0, 8.0, 15.0, 21.0, 30.0, 34.0, 53.0, 58.0, 90.0, 142.0, 190.0, 310.0, 565.0, 1062.0, 2743.0, 13536.0, 210609.0, 2762600.0, 137835.0, 10743.0, 2495.0, 985.0, 558.0, 270.0, 199.0, 138.0, 95.0, 64.0, 53.0, 54.0, 24.0, 24.0, 16.0, 15.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.775390625, -2.69708251953125, -2.6187744140625, -2.54046630859375, -2.462158203125, -2.38385009765625, -2.3055419921875, -2.22723388671875, -2.14892578125, -2.07061767578125, -1.9923095703125, -1.91400146484375, -1.835693359375, -1.75738525390625, -1.6790771484375, -1.60076904296875, -1.5224609375, -1.44415283203125, -1.3658447265625, -1.28753662109375, -1.209228515625, -1.13092041015625, -1.0526123046875, -0.97430419921875, -0.89599609375, -0.81768798828125, -0.7393798828125, -0.66107177734375, -0.582763671875, -0.50445556640625, -0.4261474609375, -0.34783935546875, -0.26953125, -0.19122314453125, -0.1129150390625, -0.03460693359375, 0.043701171875, 0.12200927734375, 0.2003173828125, 0.27862548828125, 0.35693359375, 0.43524169921875, 0.5135498046875, 0.59185791015625, 0.670166015625, 0.74847412109375, 0.8267822265625, 0.90509033203125, 0.9833984375, 1.06170654296875, 1.1400146484375, 1.21832275390625, 1.296630859375, 1.37493896484375, 1.4532470703125, 1.53155517578125, 1.60986328125, 1.68817138671875, 1.7664794921875, 1.84478759765625, 1.923095703125, 2.00140380859375, 2.0797119140625, 2.15802001953125, 2.236328125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 181.0, 828.0, 8.0, 2.0], "bins": [-82.7947006225586, -81.44242858886719, -80.09014892578125, -78.73787689208984, -77.38560485839844, -76.03333282470703, -74.6810531616211, -73.32878112792969, -71.97650909423828, -70.62423706054688, -69.27195739746094, -67.91968536376953, -66.56741333007812, -65.21514129638672, -63.86286544799805, -62.510589599609375, -61.15831756591797, -59.8060417175293, -58.45376968383789, -57.10149383544922, -55.74922180175781, -54.39694595336914, -53.044673919677734, -51.69239807128906, -50.34012222290039, -48.98784637451172, -47.63557434082031, -46.28329849243164, -44.931026458740234, -43.57875061035156, -42.226478576660156, -40.874202728271484, -39.52193069458008, -38.169654846191406, -36.8173828125, -35.46510696411133, -34.11283493041992, -32.76055908203125, -31.408287048339844, -30.056011199951172, -28.703737258911133, -27.351463317871094, -25.999189376831055, -24.646915435791016, -23.294641494750977, -21.942367553710938, -20.590091705322266, -19.23781967163086, -17.885543823242188, -16.53326988220215, -15.18099594116211, -13.82872200012207, -12.476448059082031, -11.124174118041992, -9.771899223327637, -8.419625282287598, -7.067352294921875, -5.715078353881836, -4.362804412841797, -3.0105299949645996, -1.6582560539245605, -0.3059821128845215, 1.0462923049926758, 2.398566246032715, 3.750840425491333]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 9.0, 13.0, 7.0, 14.0, 17.0, 19.0, 20.0, 14.0, 16.0, 33.0, 28.0, 33.0, 43.0, 35.0, 37.0, 45.0, 28.0, 42.0, 49.0, 48.0, 41.0, 38.0, 51.0, 35.0, 44.0, 36.0, 37.0, 21.0, 25.0, 19.0, 13.0, 15.0, 15.0, 6.0, 13.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7381715774536133, -3.615029811859131, -3.4918880462646484, -3.368746280670166, -3.2456047534942627, -3.1224629878997803, -2.999321222305298, -2.8761794567108154, -2.753037929534912, -2.6298961639404297, -2.5067543983459473, -2.383612632751465, -2.2604711055755615, -2.137329339981079, -2.0141875743865967, -1.8910458087921143, -1.7679040431976318, -1.6447622776031494, -1.5216206312179565, -1.3984788656234741, -1.2753372192382812, -1.1521954536437988, -1.0290536880493164, -0.9059119820594788, -0.7827702760696411, -0.6596285700798035, -0.5364868640899658, -0.4133450984954834, -0.29020339250564575, -0.1670616865158081, -0.043919920921325684, 0.07922178506851196, 0.2023634910583496, 0.32550519704818726, 0.4486469328403473, 0.5717886686325073, 0.694930374622345, 0.8180720806121826, 0.941213846206665, 1.0643556118011475, 1.1874972581863403, 1.3106390237808228, 1.4337806701660156, 1.556922435760498, 1.6800642013549805, 1.8032058477401733, 1.9263476133346558, 2.0494892597198486, 2.172631025314331, 2.2957727909088135, 2.418914556503296, 2.542056083679199, 2.6651978492736816, 2.788339614868164, 2.9114813804626465, 3.034623146057129, 3.1577649116516113, 3.2809066772460938, 3.404048442840576, 3.5271902084350586, 3.650331735610962, 3.7734735012054443, 3.8966152667999268, 4.01975679397583, 4.1428985595703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 8.0, 9.0, 9.0, 20.0, 19.0, 16.0, 20.0, 29.0, 17.0, 34.0, 42.0, 41.0, 35.0, 43.0, 41.0, 25.0, 45.0, 43.0, 42.0, 49.0, 44.0, 28.0, 43.0, 36.0, 37.0, 38.0, 29.0, 28.0, 26.0, 23.0, 18.0, 6.0, 15.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4912109375, -0.4763031005859375, -0.461395263671875, -0.4464874267578125, -0.43157958984375, -0.4166717529296875, -0.401763916015625, -0.3868560791015625, -0.3719482421875, -0.3570404052734375, -0.342132568359375, -0.3272247314453125, -0.31231689453125, -0.2974090576171875, -0.282501220703125, -0.2675933837890625, -0.252685546875, -0.2377777099609375, -0.222869873046875, -0.2079620361328125, -0.19305419921875, -0.1781463623046875, -0.163238525390625, -0.1483306884765625, -0.1334228515625, -0.1185150146484375, -0.103607177734375, -0.0886993408203125, -0.07379150390625, -0.0588836669921875, -0.043975830078125, -0.0290679931640625, -0.01416015625, 0.0007476806640625, 0.015655517578125, 0.0305633544921875, 0.04547119140625, 0.0603790283203125, 0.075286865234375, 0.0901947021484375, 0.1051025390625, 0.1200103759765625, 0.134918212890625, 0.1498260498046875, 0.16473388671875, 0.1796417236328125, 0.194549560546875, 0.2094573974609375, 0.224365234375, 0.2392730712890625, 0.254180908203125, 0.2690887451171875, 0.28399658203125, 0.2989044189453125, 0.313812255859375, 0.3287200927734375, 0.3436279296875, 0.3585357666015625, 0.373443603515625, 0.3883514404296875, 0.40325927734375, 0.4181671142578125, 0.433074951171875, 0.4479827880859375, 0.462890625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 5.0, 11.0, 15.0, 20.0, 19.0, 30.0, 47.0, 62.0, 88.0, 100.0, 185.0, 262.0, 432.0, 650.0, 1100.0, 1973.0, 3738.0, 8681.0, 24537.0, 114668.0, 1564168.0, 2258974.0, 163555.0, 31052.0, 10258.0, 4285.0, 2201.0, 1181.0, 673.0, 420.0, 272.0, 173.0, 126.0, 100.0, 65.0, 33.0, 30.0, 16.0, 23.0, 11.0, 14.0, 8.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0], "bins": [-1.5849609375, -1.5422210693359375, -1.499481201171875, -1.4567413330078125, -1.41400146484375, -1.3712615966796875, -1.328521728515625, -1.2857818603515625, -1.2430419921875, -1.2003021240234375, -1.157562255859375, -1.1148223876953125, -1.07208251953125, -1.0293426513671875, -0.986602783203125, -0.9438629150390625, -0.901123046875, -0.8583831787109375, -0.815643310546875, -0.7729034423828125, -0.73016357421875, -0.6874237060546875, -0.644683837890625, -0.6019439697265625, -0.5592041015625, -0.5164642333984375, -0.473724365234375, -0.4309844970703125, -0.38824462890625, -0.3455047607421875, -0.302764892578125, -0.2600250244140625, -0.21728515625, -0.1745452880859375, -0.131805419921875, -0.0890655517578125, -0.04632568359375, -0.0035858154296875, 0.039154052734375, 0.0818939208984375, 0.1246337890625, 0.1673736572265625, 0.210113525390625, 0.2528533935546875, 0.29559326171875, 0.3383331298828125, 0.381072998046875, 0.4238128662109375, 0.466552734375, 0.5092926025390625, 0.552032470703125, 0.5947723388671875, 0.63751220703125, 0.6802520751953125, 0.722991943359375, 0.7657318115234375, 0.8084716796875, 0.8512115478515625, 0.893951416015625, 0.9366912841796875, 0.97943115234375, 1.0221710205078125, 1.064910888671875, 1.1076507568359375, 1.150390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 6.0, 14.0, 16.0, 19.0, 20.0, 44.0, 64.0, 76.0, 108.0, 164.0, 264.0, 382.0, 536.0, 659.0, 511.0, 393.0, 232.0, 179.0, 97.0, 63.0, 48.0, 22.0, 33.0, 25.0, 19.0, 10.0, 10.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.13671875, -1.10467529296875, -1.0726318359375, -1.04058837890625, -1.008544921875, -0.97650146484375, -0.9444580078125, -0.91241455078125, -0.88037109375, -0.84832763671875, -0.8162841796875, -0.78424072265625, -0.752197265625, -0.72015380859375, -0.6881103515625, -0.65606689453125, -0.6240234375, -0.59197998046875, -0.5599365234375, -0.52789306640625, -0.495849609375, -0.46380615234375, -0.4317626953125, -0.39971923828125, -0.36767578125, -0.33563232421875, -0.3035888671875, -0.27154541015625, -0.239501953125, -0.20745849609375, -0.1754150390625, -0.14337158203125, -0.111328125, -0.07928466796875, -0.0472412109375, -0.01519775390625, 0.016845703125, 0.04888916015625, 0.0809326171875, 0.11297607421875, 0.14501953125, 0.17706298828125, 0.2091064453125, 0.24114990234375, 0.273193359375, 0.30523681640625, 0.3372802734375, 0.36932373046875, 0.4013671875, 0.43341064453125, 0.4654541015625, 0.49749755859375, 0.529541015625, 0.56158447265625, 0.5936279296875, 0.62567138671875, 0.65771484375, 0.68975830078125, 0.7218017578125, 0.75384521484375, 0.785888671875, 0.81793212890625, 0.8499755859375, 0.88201904296875, 0.9140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 7.0, 18.0, 17.0, 36.0, 39.0, 87.0, 113.0, 176.0, 264.0, 416.0, 716.0, 1184.0, 2135.0, 3860.0, 7555.0, 16320.0, 44193.0, 179314.0, 1597830.0, 2033554.0, 219498.0, 50708.0, 18277.0, 8318.0, 4176.0, 2206.0, 1257.0, 761.0, 444.0, 246.0, 179.0, 115.0, 81.0, 49.0, 32.0, 25.0, 14.0, 14.0, 9.0, 8.0, 10.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.275390625, -1.2299346923828125, -1.184478759765625, -1.1390228271484375, -1.09356689453125, -1.0481109619140625, -1.002655029296875, -0.9571990966796875, -0.9117431640625, -0.8662872314453125, -0.820831298828125, -0.7753753662109375, -0.72991943359375, -0.6844635009765625, -0.639007568359375, -0.5935516357421875, -0.548095703125, -0.5026397705078125, -0.457183837890625, -0.4117279052734375, -0.36627197265625, -0.3208160400390625, -0.275360107421875, -0.2299041748046875, -0.1844482421875, -0.1389923095703125, -0.093536376953125, -0.0480804443359375, -0.00262451171875, 0.0428314208984375, 0.088287353515625, 0.1337432861328125, 0.17919921875, 0.2246551513671875, 0.270111083984375, 0.3155670166015625, 0.36102294921875, 0.4064788818359375, 0.451934814453125, 0.4973907470703125, 0.5428466796875, 0.5883026123046875, 0.633758544921875, 0.6792144775390625, 0.72467041015625, 0.7701263427734375, 0.815582275390625, 0.8610382080078125, 0.906494140625, 0.9519500732421875, 0.997406005859375, 1.0428619384765625, 1.08831787109375, 1.1337738037109375, 1.179229736328125, 1.2246856689453125, 1.2701416015625, 1.3155975341796875, 1.361053466796875, 1.4065093994140625, 1.45196533203125, 1.4974212646484375, 1.542877197265625, 1.5883331298828125, 1.6337890625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 16.0, 15.0, 19.0, 32.0, 31.0, 62.0, 59.0, 66.0, 104.0, 110.0, 95.0, 94.0, 63.0, 61.0, 49.0, 33.0, 22.0, 20.0, 5.0, 11.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.770090103149414, -5.6255059242248535, -5.480922222137451, -5.336338043212891, -5.19175386428833, -5.0471696853637695, -4.902585983276367, -4.758001804351807, -4.613417625427246, -4.4688334465026855, -4.324249744415283, -4.179665565490723, -4.035081386566162, -3.8904974460601807, -3.745913505554199, -3.6013293266296387, -3.4567456245422363, -3.312161684036255, -3.1675775051116943, -3.022993564605713, -2.8784093856811523, -2.733825445175171, -2.5892415046691895, -2.444657325744629, -2.3000733852386475, -2.155489444732666, -2.0109052658081055, -1.866321325302124, -1.721737265586853, -1.577153205871582, -1.4325692653656006, -1.2879852056503296, -1.1434006690979004, -0.9988166093826294, -0.8542326092720032, -0.709648609161377, -0.565064549446106, -0.42048048973083496, -0.27589648962020874, -0.13131248950958252, 0.013271570205688477, 0.15785560011863708, 0.3024396300315857, 0.4470236599445343, 0.5916076898574829, 0.7361917495727539, 0.8807757496833801, 1.0253597497940063, 1.1699438095092773, 1.3145278692245483, 1.4591119289398193, 1.6036958694458008, 1.7482799291610718, 1.8928639888763428, 2.037447929382324, 2.1820321083068848, 2.326616048812866, 2.4711999893188477, 2.615784168243408, 2.7603681087493896, 2.904952049255371, 3.0495362281799316, 3.194120168685913, 3.3387041091918945, 3.483288288116455]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 2.0, 7.0, 5.0, 8.0, 12.0, 17.0, 14.0, 19.0, 20.0, 13.0, 21.0, 34.0, 29.0, 25.0, 38.0, 33.0, 50.0, 40.0, 37.0, 38.0, 52.0, 37.0, 38.0, 33.0, 31.0, 33.0, 38.0, 36.0, 34.0, 24.0, 22.0, 20.0, 21.0, 21.0, 12.0, 14.0, 13.0, 8.0, 8.0, 10.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.679152727127075, -2.5888547897338867, -2.4985570907592773, -2.408259153366089, -2.3179612159729004, -2.227663516998291, -2.1373655796051025, -2.047067642211914, -1.9567698240280151, -1.8664720058441162, -1.7761740684509277, -1.6858762502670288, -1.5955784320831299, -1.5052804946899414, -1.4149826765060425, -1.3246848583221436, -1.234386920928955, -1.1440891027450562, -1.0537911653518677, -0.9634933471679688, -0.873195469379425, -0.7828975915908813, -0.6925997734069824, -0.6023018956184387, -0.512004017829895, -0.4217061400413513, -0.33140829205513, -0.2411104440689087, -0.150812566280365, -0.06051468849182129, 0.029783129692077637, 0.12008100748062134, 0.21037864685058594, 0.30067652463912964, 0.39097437262535095, 0.48127222061157227, 0.571570098400116, 0.6618679761886597, 0.7521657943725586, 0.8424636721611023, 0.932761549949646, 1.023059368133545, 1.1133573055267334, 1.2036551237106323, 1.2939529418945312, 1.3842508792877197, 1.4745486974716187, 1.5648465156555176, 1.655144453048706, 1.745442271232605, 1.8357402086257935, 1.9260380268096924, 2.016335964202881, 2.1066336631774902, 2.1969316005706787, 2.287229537963867, 2.3775272369384766, 2.467825174331665, 2.5581228733062744, 2.648420810699463, 2.7387187480926514, 2.82901668548584, 2.919314384460449, 3.0096123218536377, 3.099910259246826]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 6.0, 11.0, 5.0, 22.0, 13.0, 20.0, 22.0, 25.0, 41.0, 22.0, 30.0, 29.0, 30.0, 34.0, 28.0, 31.0, 46.0, 43.0, 33.0, 41.0, 41.0, 42.0, 40.0, 39.0, 39.0, 34.0, 37.0, 28.0, 24.0, 24.0, 20.0, 17.0, 11.0, 9.0, 14.0, 7.0, 6.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4248046875, -0.4113883972167969, -0.39797210693359375, -0.3845558166503906, -0.3711395263671875, -0.3577232360839844, -0.34430694580078125, -0.3308906555175781, -0.317474365234375, -0.3040580749511719, -0.29064178466796875, -0.2772254943847656, -0.2638092041015625, -0.2503929138183594, -0.23697662353515625, -0.22356033325195312, -0.21014404296875, -0.19672775268554688, -0.18331146240234375, -0.16989517211914062, -0.1564788818359375, -0.14306259155273438, -0.12964630126953125, -0.11623001098632812, -0.102813720703125, -0.08939743041992188, -0.07598114013671875, -0.06256484985351562, -0.0491485595703125, -0.035732269287109375, -0.02231597900390625, -0.008899688720703125, 0.0045166015625, 0.017932891845703125, 0.03134918212890625, 0.044765472412109375, 0.0581817626953125, 0.07159805297851562, 0.08501434326171875, 0.09843063354492188, 0.111846923828125, 0.12526321411132812, 0.13867950439453125, 0.15209579467773438, 0.1655120849609375, 0.17892837524414062, 0.19234466552734375, 0.20576095581054688, 0.21917724609375, 0.23259353637695312, 0.24600982666015625, 0.2594261169433594, 0.2728424072265625, 0.2862586975097656, 0.29967498779296875, 0.3130912780761719, 0.326507568359375, 0.3399238586425781, 0.35334014892578125, 0.3667564392089844, 0.3801727294921875, 0.3935890197753906, 0.40700531005859375, 0.4204216003417969, 0.433837890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 13.0, 19.0, 33.0, 39.0, 55.0, 105.0, 159.0, 250.0, 429.0, 728.0, 1201.0, 2194.0, 4038.0, 7645.0, 15342.0, 31259.0, 66438.0, 152883.0, 366560.0, 225679.0, 90092.0, 41834.0, 20048.0, 9879.0, 5134.0, 2741.0, 1453.0, 850.0, 550.0, 318.0, 212.0, 116.0, 100.0, 37.0, 37.0, 18.0, 19.0, 13.0, 9.0, 6.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27734375, -0.26859283447265625, -0.2598419189453125, -0.25109100341796875, -0.242340087890625, -0.23358917236328125, -0.2248382568359375, -0.21608734130859375, -0.20733642578125, -0.19858551025390625, -0.1898345947265625, -0.18108367919921875, -0.172332763671875, -0.16358184814453125, -0.1548309326171875, -0.14608001708984375, -0.1373291015625, -0.12857818603515625, -0.1198272705078125, -0.11107635498046875, -0.102325439453125, -0.09357452392578125, -0.0848236083984375, -0.07607269287109375, -0.06732177734375, -0.05857086181640625, -0.0498199462890625, -0.04106903076171875, -0.032318115234375, -0.02356719970703125, -0.0148162841796875, -0.00606536865234375, 0.002685546875, 0.01143646240234375, 0.0201873779296875, 0.02893829345703125, 0.037689208984375, 0.04644012451171875, 0.0551910400390625, 0.06394195556640625, 0.07269287109375, 0.08144378662109375, 0.0901947021484375, 0.09894561767578125, 0.107696533203125, 0.11644744873046875, 0.1251983642578125, 0.13394927978515625, 0.1427001953125, 0.15145111083984375, 0.1602020263671875, 0.16895294189453125, 0.177703857421875, 0.18645477294921875, 0.1952056884765625, 0.20395660400390625, 0.21270751953125, 0.22145843505859375, 0.2302093505859375, 0.23896026611328125, 0.247711181640625, 0.25646209716796875, 0.2652130126953125, 0.27396392822265625, 0.28271484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 10.0, 11.0, 15.0, 12.0, 12.0, 22.0, 18.0, 26.0, 14.0, 28.0, 34.0, 32.0, 33.0, 40.0, 44.0, 34.0, 30.0, 1058.0, 45.0, 51.0, 45.0, 40.0, 38.0, 46.0, 27.0, 36.0, 28.0, 27.0, 21.0, 20.0, 25.0, 14.0, 16.0, 15.0, 14.0, 10.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.2999916076660156, -0.28992462158203125, -0.2798576354980469, -0.2697906494140625, -0.2597236633300781, -0.24965667724609375, -0.23958969116210938, -0.229522705078125, -0.21945571899414062, -0.20938873291015625, -0.19932174682617188, -0.1892547607421875, -0.17918777465820312, -0.16912078857421875, -0.15905380249023438, -0.14898681640625, -0.13891983032226562, -0.12885284423828125, -0.11878585815429688, -0.1087188720703125, -0.09865188598632812, -0.08858489990234375, -0.07851791381835938, -0.068450927734375, -0.058383941650390625, -0.04831695556640625, -0.038249969482421875, -0.0281829833984375, -0.018115997314453125, -0.00804901123046875, 0.002017974853515625, 0.0120849609375, 0.022151947021484375, 0.03221893310546875, 0.042285919189453125, 0.0523529052734375, 0.062419891357421875, 0.07248687744140625, 0.08255386352539062, 0.092620849609375, 0.10268783569335938, 0.11275482177734375, 0.12282180786132812, 0.1328887939453125, 0.14295578002929688, 0.15302276611328125, 0.16308975219726562, 0.17315673828125, 0.18322372436523438, 0.19329071044921875, 0.20335769653320312, 0.2134246826171875, 0.22349166870117188, 0.23355865478515625, 0.24362564086914062, 0.253692626953125, 0.2637596130371094, 0.27382659912109375, 0.2838935852050781, 0.2939605712890625, 0.3040275573730469, 0.31409454345703125, 0.3241615295410156, 0.334228515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 1.0, 4.0, 7.0, 6.0, 14.0, 18.0, 29.0, 46.0, 62.0, 91.0, 126.0, 208.0, 244.0, 408.0, 701.0, 1035.0, 1841.0, 2844.0, 4802.0, 8587.0, 18246.0, 63681.0, 1843082.0, 105263.0, 22019.0, 9939.0, 5322.0, 3098.0, 1942.0, 1241.0, 804.0, 484.0, 310.0, 219.0, 111.0, 109.0, 55.0, 32.0, 34.0, 10.0, 20.0, 14.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3445625305175781, -0.33292388916015625, -0.3212852478027344, -0.3096466064453125, -0.2980079650878906, -0.28636932373046875, -0.2747306823730469, -0.263092041015625, -0.2514533996582031, -0.23981475830078125, -0.22817611694335938, -0.2165374755859375, -0.20489883422851562, -0.19326019287109375, -0.18162155151367188, -0.16998291015625, -0.15834426879882812, -0.14670562744140625, -0.13506698608398438, -0.1234283447265625, -0.11178970336914062, -0.10015106201171875, -0.08851242065429688, -0.076873779296875, -0.06523513793945312, -0.05359649658203125, -0.041957855224609375, -0.0303192138671875, -0.018680572509765625, -0.00704193115234375, 0.004596710205078125, 0.0162353515625, 0.027873992919921875, 0.03951263427734375, 0.051151275634765625, 0.0627899169921875, 0.07442855834960938, 0.08606719970703125, 0.09770584106445312, 0.109344482421875, 0.12098312377929688, 0.13262176513671875, 0.14426040649414062, 0.1558990478515625, 0.16753768920898438, 0.17917633056640625, 0.19081497192382812, 0.20245361328125, 0.21409225463867188, 0.22573089599609375, 0.23736953735351562, 0.2490081787109375, 0.2606468200683594, 0.27228546142578125, 0.2839241027832031, 0.295562744140625, 0.3072013854980469, 0.31884002685546875, 0.3304786682128906, 0.3421173095703125, 0.3537559509277344, 0.36539459228515625, 0.3770332336425781, 0.388671875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 6.0, 7.0, 15.0, 14.0, 13.0, 12.0, 14.0, 22.0, 23.0, 41.0, 30.0, 46.0, 58.0, 54.0, 54.0, 61.0, 51.0, 55.0, 57.0, 51.0, 45.0, 37.0, 37.0, 35.0, 22.0, 20.0, 21.0, 9.0, 12.0, 15.0, 9.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00989532470703125, -0.009566307067871094, -0.009237289428710938, -0.008908271789550781, -0.008579254150390625, -0.008250236511230469, -0.007921218872070312, -0.007592201232910156, -0.00726318359375, -0.006934165954589844, -0.0066051483154296875, -0.006276130676269531, -0.005947113037109375, -0.005618095397949219, -0.0052890777587890625, -0.004960060119628906, -0.00463104248046875, -0.004302024841308594, -0.0039730072021484375, -0.0036439895629882812, -0.003314971923828125, -0.0029859542846679688, -0.0026569366455078125, -0.0023279190063476562, -0.0019989013671875, -0.0016698837280273438, -0.0013408660888671875, -0.0010118484497070312, -0.000682830810546875, -0.00035381317138671875, -2.47955322265625e-05, 0.00030422210693359375, 0.00063323974609375, 0.0009622573852539062, 0.0012912750244140625, 0.0016202926635742188, 0.001949310302734375, 0.0022783279418945312, 0.0026073455810546875, 0.0029363632202148438, 0.003265380859375, 0.0035943984985351562, 0.0039234161376953125, 0.004252433776855469, 0.004581451416015625, 0.004910469055175781, 0.0052394866943359375, 0.005568504333496094, 0.00589752197265625, 0.006226539611816406, 0.0065555572509765625, 0.006884574890136719, 0.007213592529296875, 0.007542610168457031, 0.007871627807617188, 0.008200645446777344, 0.0085296630859375, 0.008858680725097656, 0.009187698364257812, 0.009516716003417969, 0.009845733642578125, 0.010174751281738281, 0.010503768920898438, 0.010832786560058594, 0.01116180419921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 4.0, 3.0, 7.0, 6.0, 7.0, 12.0, 16.0, 19.0, 26.0, 43.0, 49.0, 60.0, 91.0, 149.0, 220.0, 446.0, 1567.0, 19510.0, 736325.0, 280628.0, 7414.0, 941.0, 366.0, 194.0, 132.0, 87.0, 57.0, 45.0, 22.0, 22.0, 19.0, 10.0, 10.0, 4.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.197265625, -0.1919116973876953, -0.18655776977539062, -0.18120384216308594, -0.17584991455078125, -0.17049598693847656, -0.16514205932617188, -0.1597881317138672, -0.1544342041015625, -0.1490802764892578, -0.14372634887695312, -0.13837242126464844, -0.13301849365234375, -0.12766456604003906, -0.12231063842773438, -0.11695671081542969, -0.111602783203125, -0.10624885559082031, -0.10089492797851562, -0.09554100036621094, -0.09018707275390625, -0.08483314514160156, -0.07947921752929688, -0.07412528991699219, -0.0687713623046875, -0.06341743469238281, -0.058063507080078125, -0.05270957946777344, -0.04735565185546875, -0.04200172424316406, -0.036647796630859375, -0.03129386901855469, -0.02593994140625, -0.020586013793945312, -0.015232086181640625, -0.009878158569335938, -0.00452423095703125, 0.0008296966552734375, 0.006183624267578125, 0.011537551879882812, 0.0168914794921875, 0.022245407104492188, 0.027599334716796875, 0.03295326232910156, 0.03830718994140625, 0.04366111755371094, 0.049015045166015625, 0.05436897277832031, 0.059722900390625, 0.06507682800292969, 0.07043075561523438, 0.07578468322753906, 0.08113861083984375, 0.08649253845214844, 0.09184646606445312, 0.09720039367675781, 0.1025543212890625, 0.10790824890136719, 0.11326217651367188, 0.11861610412597656, 0.12397003173828125, 0.12932395935058594, 0.13467788696289062, 0.1400318145751953, 0.1453857421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 30.0, 147.0, 446.0, 301.0, 71.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05420726537704468, -0.049967505037784576, -0.045727748423814774, -0.04148798808455467, -0.03724823147058487, -0.03300847113132477, -0.028768710792064667, -0.024528952315449715, -0.020289193838834763, -0.01604943536221981, -0.011809675954282284, -0.007569916546344757, -0.003330158069729805, 0.0009096004068851471, 0.005149360746145248, 0.0093891192227602, 0.013628877699375153, 0.017868636175990105, 0.022108394652605057, 0.026348154991865158, 0.03058791346848011, 0.03482767194509506, 0.039067432284355164, 0.043307192623615265, 0.04754694923758507, 0.05178670957684517, 0.05602646619081497, 0.06026622653007507, 0.06450598686933517, 0.06874574720859528, 0.07298550009727478, 0.07722526043653488, 0.08146502077579498, 0.08570478111505508, 0.08994454145431519, 0.09418429434299469, 0.09842405468225479, 0.10266381502151489, 0.106903575360775, 0.1111433357000351, 0.1153830885887146, 0.1196228489279747, 0.1238626092672348, 0.1281023621559143, 0.132342129945755, 0.1365818828344345, 0.140821635723114, 0.1450614035129547, 0.1493011713027954, 0.15354092419147491, 0.1577806919813156, 0.16202044486999512, 0.16626021265983582, 0.17049996554851532, 0.17473971843719482, 0.17897948622703552, 0.18321923911571503, 0.18745899200439453, 0.19169875979423523, 0.19593851268291473, 0.20017828047275543, 0.20441803336143494, 0.20865780115127563, 0.21289755403995514, 0.21713730692863464]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 9.0, 9.0, 27.0, 28.0, 20.0, 40.0, 56.0, 47.0, 70.0, 64.0, 60.0, 75.0, 66.0, 73.0, 79.0, 61.0, 51.0, 38.0, 40.0, 32.0, 15.0, 8.0, 8.0, 10.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050609290599823, -0.04921359568834305, -0.0478179007768631, -0.04642220586538315, -0.0450265109539032, -0.04363081604242325, -0.0422351211309433, -0.04083942621946335, -0.0394437313079834, -0.03804803639650345, -0.0366523414850235, -0.03525664657354355, -0.0338609516620636, -0.03246525675058365, -0.0310695618391037, -0.02967386692762375, -0.0282781720161438, -0.02688247710466385, -0.0254867821931839, -0.02409108728170395, -0.022695392370224, -0.02129969745874405, -0.0199040025472641, -0.01850830763578415, -0.0171126127243042, -0.01571691781282425, -0.0143212229013443, -0.01292552798986435, -0.0115298330783844, -0.01013413816690445, -0.0087384432554245, -0.0073427483439445496, -0.0059470534324646, -0.00455135852098465, -0.0031556636095046997, -0.0017599686980247498, -0.0003642737865447998, 0.0010314211249351501, 0.0024271160364151, 0.00382281094789505, 0.005218505859375, 0.00661420077085495, 0.0080098956823349, 0.00940559059381485, 0.0108012855052948, 0.01219698041677475, 0.0135926753282547, 0.01498837023973465, 0.0163840651512146, 0.01777976006269455, 0.0191754549741745, 0.02057114988565445, 0.0219668447971344, 0.02336253970861435, 0.0247582346200943, 0.02615392953157425, 0.0275496244430542, 0.02894531935453415, 0.0303410142660141, 0.03173670917749405, 0.033132404088974, 0.03452809900045395, 0.0359237939119339, 0.03731948882341385, 0.0387151837348938]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 5.0, 7.0, 12.0, 5.0, 21.0, 13.0, 22.0, 23.0, 27.0, 36.0, 23.0, 29.0, 31.0, 29.0, 36.0, 27.0, 33.0, 44.0, 40.0, 37.0, 43.0, 40.0, 41.0, 41.0, 37.0, 38.0, 36.0, 35.0, 28.0, 24.0, 25.0, 23.0, 12.0, 12.0, 10.0, 12.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.424072265625, -0.41065216064453125, -0.3972320556640625, -0.38381195068359375, -0.370391845703125, -0.35697174072265625, -0.3435516357421875, -0.33013153076171875, -0.31671142578125, -0.30329132080078125, -0.2898712158203125, -0.27645111083984375, -0.263031005859375, -0.24961090087890625, -0.2361907958984375, -0.22277069091796875, -0.2093505859375, -0.19593048095703125, -0.1825103759765625, -0.16909027099609375, -0.155670166015625, -0.14225006103515625, -0.1288299560546875, -0.11540985107421875, -0.10198974609375, -0.08856964111328125, -0.0751495361328125, -0.06172943115234375, -0.048309326171875, -0.03488922119140625, -0.0214691162109375, -0.00804901123046875, 0.00537109375, 0.01879119873046875, 0.0322113037109375, 0.04563140869140625, 0.059051513671875, 0.07247161865234375, 0.0858917236328125, 0.09931182861328125, 0.11273193359375, 0.12615203857421875, 0.1395721435546875, 0.15299224853515625, 0.166412353515625, 0.17983245849609375, 0.1932525634765625, 0.20667266845703125, 0.2200927734375, 0.23351287841796875, 0.2469329833984375, 0.26035308837890625, 0.273773193359375, 0.28719329833984375, 0.3006134033203125, 0.31403350830078125, 0.32745361328125, 0.34087371826171875, 0.3542938232421875, 0.36771392822265625, 0.381134033203125, 0.39455413818359375, 0.4079742431640625, 0.42139434814453125, 0.434814453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 8.0, 28.0, 18.0, 28.0, 49.0, 54.0, 103.0, 153.0, 174.0, 292.0, 426.0, 665.0, 1052.0, 1557.0, 2716.0, 4310.0, 7393.0, 13151.0, 25996.0, 56669.0, 136158.0, 368581.0, 250920.0, 92817.0, 39982.0, 19404.0, 10358.0, 5906.0, 3516.0, 2131.0, 1346.0, 866.0, 546.0, 349.0, 255.0, 194.0, 114.0, 84.0, 43.0, 41.0, 31.0, 20.0, 15.0, 7.0, 4.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.751251220703125, -0.72515869140625, -0.699066162109375, -0.6729736328125, -0.646881103515625, -0.62078857421875, -0.594696044921875, -0.568603515625, -0.542510986328125, -0.51641845703125, -0.490325927734375, -0.4642333984375, -0.438140869140625, -0.41204833984375, -0.385955810546875, -0.35986328125, -0.333770751953125, -0.30767822265625, -0.281585693359375, -0.2554931640625, -0.229400634765625, -0.20330810546875, -0.177215576171875, -0.151123046875, -0.125030517578125, -0.09893798828125, -0.072845458984375, -0.0467529296875, -0.020660400390625, 0.00543212890625, 0.031524658203125, 0.0576171875, 0.083709716796875, 0.10980224609375, 0.135894775390625, 0.1619873046875, 0.188079833984375, 0.21417236328125, 0.240264892578125, 0.266357421875, 0.292449951171875, 0.31854248046875, 0.344635009765625, 0.3707275390625, 0.396820068359375, 0.42291259765625, 0.449005126953125, 0.47509765625, 0.501190185546875, 0.52728271484375, 0.553375244140625, 0.5794677734375, 0.605560302734375, 0.63165283203125, 0.657745361328125, 0.683837890625, 0.709930419921875, 0.73602294921875, 0.762115478515625, 0.7882080078125, 0.814300537109375, 0.84039306640625, 0.866485595703125, 0.892578125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 12.0, 12.0, 14.0, 22.0, 10.0, 20.0, 22.0, 26.0, 37.0, 35.0, 56.0, 54.0, 65.0, 99.0, 150.0, 239.0, 1289.0, 204.0, 126.0, 72.0, 74.0, 50.0, 41.0, 33.0, 50.0, 38.0, 22.0, 20.0, 14.0, 24.0, 23.0, 14.0, 15.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.33203125, -1.2919158935546875, -1.251800537109375, -1.2116851806640625, -1.17156982421875, -1.1314544677734375, -1.091339111328125, -1.0512237548828125, -1.0111083984375, -0.9709930419921875, -0.930877685546875, -0.8907623291015625, -0.85064697265625, -0.8105316162109375, -0.770416259765625, -0.7303009033203125, -0.690185546875, -0.6500701904296875, -0.609954833984375, -0.5698394775390625, -0.52972412109375, -0.4896087646484375, -0.449493408203125, -0.4093780517578125, -0.3692626953125, -0.3291473388671875, -0.289031982421875, -0.2489166259765625, -0.20880126953125, -0.1686859130859375, -0.128570556640625, -0.0884552001953125, -0.04833984375, -0.0082244873046875, 0.031890869140625, 0.0720062255859375, 0.11212158203125, 0.1522369384765625, 0.192352294921875, 0.2324676513671875, 0.2725830078125, 0.3126983642578125, 0.352813720703125, 0.3929290771484375, 0.43304443359375, 0.4731597900390625, 0.513275146484375, 0.5533905029296875, 0.593505859375, 0.6336212158203125, 0.673736572265625, 0.7138519287109375, 0.75396728515625, 0.7940826416015625, 0.834197998046875, 0.8743133544921875, 0.9144287109375, 0.9545440673828125, 0.994659423828125, 1.0347747802734375, 1.07489013671875, 1.1150054931640625, 1.155120849609375, 1.1952362060546875, 1.2353515625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 12.0, 15.0, 13.0, 20.0, 17.0, 28.0, 39.0, 40.0, 64.0, 91.0, 108.0, 180.0, 269.0, 497.0, 1236.0, 4183.0, 22677.0, 292369.0, 2675323.0, 129503.0, 13975.0, 2894.0, 951.0, 426.0, 250.0, 139.0, 91.0, 65.0, 44.0, 44.0, 42.0, 33.0, 16.0, 14.0, 10.0, 7.0, 10.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.95086669921875, -2.8568115234375, -2.76275634765625, -2.668701171875, -2.57464599609375, -2.4805908203125, -2.38653564453125, -2.29248046875, -2.19842529296875, -2.1043701171875, -2.01031494140625, -1.916259765625, -1.82220458984375, -1.7281494140625, -1.63409423828125, -1.5400390625, -1.44598388671875, -1.3519287109375, -1.25787353515625, -1.163818359375, -1.06976318359375, -0.9757080078125, -0.88165283203125, -0.78759765625, -0.69354248046875, -0.5994873046875, -0.50543212890625, -0.411376953125, -0.31732177734375, -0.2232666015625, -0.12921142578125, -0.03515625, 0.05889892578125, 0.1529541015625, 0.24700927734375, 0.341064453125, 0.43511962890625, 0.5291748046875, 0.62322998046875, 0.71728515625, 0.81134033203125, 0.9053955078125, 0.99945068359375, 1.093505859375, 1.18756103515625, 1.2816162109375, 1.37567138671875, 1.4697265625, 1.56378173828125, 1.6578369140625, 1.75189208984375, 1.845947265625, 1.94000244140625, 2.0340576171875, 2.12811279296875, 2.22216796875, 2.31622314453125, 2.4102783203125, 2.50433349609375, 2.598388671875, 2.69244384765625, 2.7864990234375, 2.88055419921875, 2.974609375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [8.0, 24.0, 129.0, 278.0, 324.0, 176.0, 60.0, 16.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7160799503326416, -1.3029026985168457, -0.889725387096405, -0.47654807567596436, -0.06337082386016846, 0.349806547164917, 0.7629837989807129, 1.1761610507965088, 1.5893383026123047, 2.0025155544281006, 2.4156928062438965, 2.8288702964782715, 3.2420473098754883, 3.6552248001098633, 4.068402290344238, 4.481579303741455, 4.894756317138672, 5.307933807373047, 5.721110820770264, 6.134288311004639, 6.5474653244018555, 6.9606428146362305, 7.3738203048706055, 7.786997318267822, 8.200174331665039, 8.613351821899414, 9.026529312133789, 9.439705848693848, 9.852883338928223, 10.266060829162598, 10.679238319396973, 11.092414855957031, 11.505593299865723, 11.918770790100098, 12.331948280334473, 12.745124816894531, 13.158302307128906, 13.571479797363281, 13.984657287597656, 14.397834777832031, 14.81101131439209, 15.224188804626465, 15.63736629486084, 16.0505428314209, 16.463720321655273, 16.87689781188965, 17.290075302124023, 17.7032527923584, 18.116430282592773, 18.52960777282715, 18.942785263061523, 19.3559627532959, 19.769140243530273, 20.182315826416016, 20.59549331665039, 21.008670806884766, 21.42184829711914, 21.835025787353516, 22.24820327758789, 22.661380767822266, 23.07455825805664, 23.487735748291016, 23.900911331176758, 24.314088821411133, 24.727266311645508]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 5.0, 12.0, 11.0, 16.0, 19.0, 15.0, 14.0, 21.0, 17.0, 16.0, 36.0, 39.0, 40.0, 36.0, 40.0, 45.0, 42.0, 49.0, 54.0, 39.0, 40.0, 32.0, 46.0, 34.0, 25.0, 31.0, 28.0, 26.0, 22.0, 18.0, 17.0, 15.0, 13.0, 10.0, 13.0, 8.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.2601494789123535, -4.133118152618408, -4.006086826324463, -3.8790555000305176, -3.7520241737365723, -3.624992847442627, -3.4979615211486816, -3.3709301948547363, -3.243898868560791, -3.1168675422668457, -2.9898362159729004, -2.862804889678955, -2.7357735633850098, -2.6087422370910645, -2.481710910797119, -2.354679584503174, -2.2276484966278076, -2.1006171703338623, -1.973585844039917, -1.8465545177459717, -1.7195231914520264, -1.592491865158081, -1.4654606580734253, -1.33842933177948, -1.2113980054855347, -1.0843666791915894, -0.957335352897644, -0.8303040862083435, -0.7032727599143982, -0.5762414336204529, -0.44921016693115234, -0.32217884063720703, -0.19514751434326172, -0.0681162029504776, 0.05891510844230652, 0.18594640493392944, 0.31297773122787476, 0.44000905752182007, 0.5670403242111206, 0.6940716505050659, 0.8211029767990112, 0.9481343030929565, 1.0751656293869019, 1.2021968364715576, 1.329228162765503, 1.4562594890594482, 1.5832908153533936, 1.7103221416473389, 1.8373534679412842, 1.9643847942352295, 2.091416120529175, 2.21844744682312, 2.3454787731170654, 2.4725100994110107, 2.599541187286377, 2.7265725135803223, 2.8536038398742676, 2.980635166168213, 3.107666492462158, 3.2346978187561035, 3.361729145050049, 3.488760471343994, 3.6157917976379395, 3.7428231239318848, 3.86985445022583]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 13.0, 8.0, 15.0, 18.0, 32.0, 40.0, 37.0, 26.0, 24.0, 32.0, 42.0, 40.0, 36.0, 36.0, 39.0, 45.0, 55.0, 41.0, 38.0, 44.0, 40.0, 47.0, 25.0, 37.0, 36.0, 23.0, 17.0, 17.0, 9.0, 14.0, 11.0, 7.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.56396484375, -0.5480079650878906, -0.5320510864257812, -0.5160942077636719, -0.5001373291015625, -0.4841804504394531, -0.46822357177734375, -0.4522666931152344, -0.436309814453125, -0.4203529357910156, -0.40439605712890625, -0.3884391784667969, -0.3724822998046875, -0.3565254211425781, -0.34056854248046875, -0.3246116638183594, -0.30865478515625, -0.2926979064941406, -0.27674102783203125, -0.2607841491699219, -0.2448272705078125, -0.22887039184570312, -0.21291351318359375, -0.19695663452148438, -0.180999755859375, -0.16504287719726562, -0.14908599853515625, -0.13312911987304688, -0.1171722412109375, -0.10121536254882812, -0.08525848388671875, -0.06930160522460938, -0.0533447265625, -0.037387847900390625, -0.02143096923828125, -0.005474090576171875, 0.0104827880859375, 0.026439666748046875, 0.04239654541015625, 0.058353424072265625, 0.074310302734375, 0.09026718139648438, 0.10622406005859375, 0.12218093872070312, 0.1381378173828125, 0.15409469604492188, 0.17005157470703125, 0.18600845336914062, 0.20196533203125, 0.21792221069335938, 0.23387908935546875, 0.24983596801757812, 0.2657928466796875, 0.2817497253417969, 0.29770660400390625, 0.3136634826660156, 0.329620361328125, 0.3455772399902344, 0.36153411865234375, 0.3774909973144531, 0.3934478759765625, 0.4094047546386719, 0.42536163330078125, 0.4413185119628906, 0.457275390625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 6.0, 9.0, 6.0, 16.0, 16.0, 36.0, 25.0, 40.0, 54.0, 88.0, 123.0, 171.0, 225.0, 391.0, 585.0, 910.0, 1629.0, 3143.0, 7338.0, 22505.0, 110825.0, 1405318.0, 2384347.0, 204754.0, 33475.0, 9825.0, 3821.0, 1763.0, 1011.0, 630.0, 408.0, 237.0, 159.0, 86.0, 92.0, 63.0, 46.0, 23.0, 16.0, 11.0, 23.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6201171875, -1.574005126953125, -1.52789306640625, -1.481781005859375, -1.4356689453125, -1.389556884765625, -1.34344482421875, -1.297332763671875, -1.251220703125, -1.205108642578125, -1.15899658203125, -1.112884521484375, -1.0667724609375, -1.020660400390625, -0.97454833984375, -0.928436279296875, -0.88232421875, -0.836212158203125, -0.79010009765625, -0.743988037109375, -0.6978759765625, -0.651763916015625, -0.60565185546875, -0.559539794921875, -0.513427734375, -0.467315673828125, -0.42120361328125, -0.375091552734375, -0.3289794921875, -0.282867431640625, -0.23675537109375, -0.190643310546875, -0.14453125, -0.098419189453125, -0.05230712890625, -0.006195068359375, 0.0399169921875, 0.086029052734375, 0.13214111328125, 0.178253173828125, 0.224365234375, 0.270477294921875, 0.31658935546875, 0.362701416015625, 0.4088134765625, 0.454925537109375, 0.50103759765625, 0.547149658203125, 0.59326171875, 0.639373779296875, 0.68548583984375, 0.731597900390625, 0.7777099609375, 0.823822021484375, 0.86993408203125, 0.916046142578125, 0.962158203125, 1.008270263671875, 1.05438232421875, 1.100494384765625, 1.1466064453125, 1.192718505859375, 1.23883056640625, 1.284942626953125, 1.3310546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 1.0, 8.0, 7.0, 17.0, 26.0, 34.0, 55.0, 103.0, 164.0, 289.0, 529.0, 902.0, 865.0, 464.0, 248.0, 138.0, 89.0, 50.0, 25.0, 19.0, 13.0, 12.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.412109375, -2.354522705078125, -2.29693603515625, -2.239349365234375, -2.1817626953125, -2.124176025390625, -2.06658935546875, -2.009002685546875, -1.951416015625, -1.893829345703125, -1.83624267578125, -1.778656005859375, -1.7210693359375, -1.663482666015625, -1.60589599609375, -1.548309326171875, -1.49072265625, -1.433135986328125, -1.37554931640625, -1.317962646484375, -1.2603759765625, -1.202789306640625, -1.14520263671875, -1.087615966796875, -1.030029296875, -0.972442626953125, -0.91485595703125, -0.857269287109375, -0.7996826171875, -0.742095947265625, -0.68450927734375, -0.626922607421875, -0.5693359375, -0.511749267578125, -0.45416259765625, -0.396575927734375, -0.3389892578125, -0.281402587890625, -0.22381591796875, -0.166229248046875, -0.108642578125, -0.051055908203125, 0.00653076171875, 0.064117431640625, 0.1217041015625, 0.179290771484375, 0.23687744140625, 0.294464111328125, 0.35205078125, 0.409637451171875, 0.46722412109375, 0.524810791015625, 0.5823974609375, 0.639984130859375, 0.69757080078125, 0.755157470703125, 0.812744140625, 0.870330810546875, 0.92791748046875, 0.985504150390625, 1.0430908203125, 1.100677490234375, 1.15826416015625, 1.215850830078125, 1.2734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 9.0, 13.0, 30.0, 58.0, 94.0, 210.0, 449.0, 1243.0, 4132.0, 19233.0, 353002.0, 3714241.0, 87075.0, 10266.0, 2612.0, 892.0, 360.0, 161.0, 76.0, 43.0, 34.0, 16.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.185546875, -3.048919677734375, -2.91229248046875, -2.775665283203125, -2.6390380859375, -2.502410888671875, -2.36578369140625, -2.229156494140625, -2.092529296875, -1.955902099609375, -1.81927490234375, -1.682647705078125, -1.5460205078125, -1.409393310546875, -1.27276611328125, -1.136138916015625, -0.99951171875, -0.862884521484375, -0.72625732421875, -0.589630126953125, -0.4530029296875, -0.316375732421875, -0.17974853515625, -0.043121337890625, 0.093505859375, 0.230133056640625, 0.36676025390625, 0.503387451171875, 0.6400146484375, 0.776641845703125, 0.91326904296875, 1.049896240234375, 1.1865234375, 1.323150634765625, 1.45977783203125, 1.596405029296875, 1.7330322265625, 1.869659423828125, 2.00628662109375, 2.142913818359375, 2.279541015625, 2.416168212890625, 2.55279541015625, 2.689422607421875, 2.8260498046875, 2.962677001953125, 3.09930419921875, 3.235931396484375, 3.37255859375, 3.509185791015625, 3.64581298828125, 3.782440185546875, 3.9190673828125, 4.055694580078125, 4.19232177734375, 4.328948974609375, 4.465576171875, 4.602203369140625, 4.73883056640625, 4.875457763671875, 5.0120849609375, 5.148712158203125, 5.28533935546875, 5.421966552734375, 5.55859375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 20.0, 56.0, 145.0, 256.0, 296.0, 140.0, 52.0, 29.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.151822566986084, -5.599461555480957, -5.04710054397583, -4.494739532470703, -3.9423787593841553, -3.3900177478790283, -2.8376569747924805, -2.2852959632873535, -1.7329349517822266, -1.1805739402770996, -0.6282130479812622, -0.0758521556854248, 0.47650885581970215, 1.028869867324829, 1.581230640411377, 2.133591651916504, 2.685952663421631, 3.238313674926758, 3.7906746864318848, 4.343035697937012, 4.8953962326049805, 5.447757720947266, 6.000118255615234, 6.552479267120361, 7.104840278625488, 7.657201290130615, 8.209562301635742, 8.761922836303711, 9.314284324645996, 9.866644859313965, 10.41900634765625, 10.971366882324219, 11.523727416992188, 12.076087951660156, 12.628449440002441, 13.18080997467041, 13.733171463012695, 14.285531997680664, 14.837892532348633, 15.390254020690918, 15.942615509033203, 16.494976043701172, 17.04733657836914, 17.599699020385742, 18.15205955505371, 18.70442008972168, 19.25678062438965, 19.80914306640625, 20.36150360107422, 20.913864135742188, 21.466224670410156, 22.018587112426758, 22.570947647094727, 23.123308181762695, 23.675668716430664, 24.228031158447266, 24.7803897857666, 25.33275032043457, 25.88511085510254, 26.43747329711914, 26.98983383178711, 27.542194366455078, 28.094554901123047, 28.646915435791016, 29.199277877807617]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 2.0, 9.0, 7.0, 14.0, 10.0, 20.0, 17.0, 19.0, 19.0, 28.0, 26.0, 37.0, 40.0, 40.0, 27.0, 35.0, 43.0, 48.0, 48.0, 42.0, 51.0, 50.0, 45.0, 42.0, 42.0, 46.0, 41.0, 19.0, 31.0, 22.0, 14.0, 14.0, 9.0, 9.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8337321281433105, -4.694365978240967, -4.555000305175781, -4.4156341552734375, -4.276268482208252, -4.136902332305908, -3.9975364208221436, -3.858170509338379, -3.7188045978546143, -3.5794386863708496, -3.440072774887085, -3.3007068634033203, -3.1613407135009766, -3.021975040435791, -2.8826088905334473, -2.7432429790496826, -2.603877067565918, -2.4645111560821533, -2.3251452445983887, -2.185779333114624, -2.0464134216308594, -1.9070473909378052, -1.767681360244751, -1.6283154487609863, -1.4889495372772217, -1.349583625793457, -1.2102177143096924, -1.0708516836166382, -0.9314857721328735, -0.7921198606491089, -0.6527538895606995, -0.51338791847229, -0.3740224838256836, -0.23465654253959656, -0.09529060125350952, 0.044075340032577515, 0.18344128131866455, 0.3228071928024292, 0.4621731638908386, 0.601539134979248, 0.7409050464630127, 0.8802709579467773, 1.019636869430542, 1.1590029001235962, 1.2983688116073608, 1.4377347230911255, 1.5771007537841797, 1.7164666652679443, 1.855832576751709, 1.9951984882354736, 2.1345643997192383, 2.273930311203003, 2.4132962226867676, 2.5526623725891113, 2.692028284072876, 2.8313941955566406, 2.9707601070404053, 3.11012601852417, 3.2494919300079346, 3.388857841491699, 3.528223991394043, 3.6675896644592285, 3.8069558143615723, 3.946321725845337, 4.085687637329102]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 15.0, 16.0, 14.0, 17.0, 25.0, 23.0, 21.0, 34.0, 24.0, 31.0, 30.0, 29.0, 41.0, 42.0, 39.0, 46.0, 37.0, 30.0, 37.0, 35.0, 45.0, 43.0, 37.0, 39.0, 27.0, 30.0, 28.0, 22.0, 23.0, 16.0, 15.0, 15.0, 6.0, 10.0, 12.0, 5.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.5244140625, -0.509796142578125, -0.49517822265625, -0.480560302734375, -0.4659423828125, -0.451324462890625, -0.43670654296875, -0.422088623046875, -0.407470703125, -0.392852783203125, -0.37823486328125, -0.363616943359375, -0.3489990234375, -0.334381103515625, -0.31976318359375, -0.305145263671875, -0.29052734375, -0.275909423828125, -0.26129150390625, -0.246673583984375, -0.2320556640625, -0.217437744140625, -0.20281982421875, -0.188201904296875, -0.173583984375, -0.158966064453125, -0.14434814453125, -0.129730224609375, -0.1151123046875, -0.100494384765625, -0.08587646484375, -0.071258544921875, -0.056640625, -0.042022705078125, -0.02740478515625, -0.012786865234375, 0.0018310546875, 0.016448974609375, 0.03106689453125, 0.045684814453125, 0.060302734375, 0.074920654296875, 0.08953857421875, 0.104156494140625, 0.1187744140625, 0.133392333984375, 0.14801025390625, 0.162628173828125, 0.17724609375, 0.191864013671875, 0.20648193359375, 0.221099853515625, 0.2357177734375, 0.250335693359375, 0.26495361328125, 0.279571533203125, 0.294189453125, 0.308807373046875, 0.32342529296875, 0.338043212890625, 0.3526611328125, 0.367279052734375, 0.38189697265625, 0.396514892578125, 0.4111328125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 16.0, 31.0, 46.0, 61.0, 81.0, 122.0, 168.0, 314.0, 574.0, 981.0, 1997.0, 3942.0, 9110.0, 23969.0, 70065.0, 214041.0, 427199.0, 194275.0, 63191.0, 22014.0, 8464.0, 3655.0, 1837.0, 962.0, 536.0, 322.0, 189.0, 108.0, 103.0, 51.0, 29.0, 20.0, 13.0, 13.0, 9.0, 10.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.327392578125, -0.31664276123046875, -0.3058929443359375, -0.29514312744140625, -0.284393310546875, -0.27364349365234375, -0.2628936767578125, -0.25214385986328125, -0.24139404296875, -0.23064422607421875, -0.2198944091796875, -0.20914459228515625, -0.198394775390625, -0.18764495849609375, -0.1768951416015625, -0.16614532470703125, -0.1553955078125, -0.14464569091796875, -0.1338958740234375, -0.12314605712890625, -0.112396240234375, -0.10164642333984375, -0.0908966064453125, -0.08014678955078125, -0.06939697265625, -0.05864715576171875, -0.0478973388671875, -0.03714752197265625, -0.026397705078125, -0.01564788818359375, -0.0048980712890625, 0.00585174560546875, 0.0166015625, 0.02735137939453125, 0.0381011962890625, 0.04885101318359375, 0.059600830078125, 0.07035064697265625, 0.0811004638671875, 0.09185028076171875, 0.10260009765625, 0.11334991455078125, 0.1240997314453125, 0.13484954833984375, 0.145599365234375, 0.15634918212890625, 0.1670989990234375, 0.17784881591796875, 0.1885986328125, 0.19934844970703125, 0.2100982666015625, 0.22084808349609375, 0.231597900390625, 0.24234771728515625, 0.2530975341796875, 0.26384735107421875, 0.27459716796875, 0.28534698486328125, 0.2960968017578125, 0.30684661865234375, 0.317596435546875, 0.32834625244140625, 0.3390960693359375, 0.34984588623046875, 0.360595703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 7.0, 8.0, 18.0, 10.0, 17.0, 16.0, 18.0, 21.0, 28.0, 20.0, 21.0, 29.0, 34.0, 39.0, 36.0, 36.0, 42.0, 34.0, 46.0, 1073.0, 46.0, 36.0, 34.0, 32.0, 34.0, 26.0, 34.0, 30.0, 26.0, 26.0, 16.0, 14.0, 15.0, 18.0, 18.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.350830078125, -0.33953094482421875, -0.3282318115234375, -0.31693267822265625, -0.305633544921875, -0.29433441162109375, -0.2830352783203125, -0.27173614501953125, -0.26043701171875, -0.24913787841796875, -0.2378387451171875, -0.22653961181640625, -0.215240478515625, -0.20394134521484375, -0.1926422119140625, -0.18134307861328125, -0.1700439453125, -0.15874481201171875, -0.1474456787109375, -0.13614654541015625, -0.124847412109375, -0.11354827880859375, -0.1022491455078125, -0.09095001220703125, -0.07965087890625, -0.06835174560546875, -0.0570526123046875, -0.04575347900390625, -0.034454345703125, -0.02315521240234375, -0.0118560791015625, -0.00055694580078125, 0.0107421875, 0.02204132080078125, 0.0333404541015625, 0.04463958740234375, 0.055938720703125, 0.06723785400390625, 0.0785369873046875, 0.08983612060546875, 0.10113525390625, 0.11243438720703125, 0.1237335205078125, 0.13503265380859375, 0.146331787109375, 0.15763092041015625, 0.1689300537109375, 0.18022918701171875, 0.1915283203125, 0.20282745361328125, 0.2141265869140625, 0.22542572021484375, 0.236724853515625, 0.24802398681640625, 0.2593231201171875, 0.27062225341796875, 0.28192138671875, 0.29322052001953125, 0.3045196533203125, 0.31581878662109375, 0.327117919921875, 0.33841705322265625, 0.3497161865234375, 0.36101531982421875, 0.372314453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 7.0, 10.0, 13.0, 24.0, 34.0, 60.0, 61.0, 139.0, 210.0, 337.0, 649.0, 1194.0, 2352.0, 5213.0, 12411.0, 41902.0, 1843244.0, 151967.0, 22059.0, 7958.0, 3538.0, 1702.0, 835.0, 487.0, 259.0, 148.0, 105.0, 55.0, 44.0, 26.0, 17.0, 17.0, 7.0, 7.0, 3.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.481689453125, -0.4660301208496094, -0.45037078857421875, -0.4347114562988281, -0.4190521240234375, -0.4033927917480469, -0.38773345947265625, -0.3720741271972656, -0.356414794921875, -0.3407554626464844, -0.32509613037109375, -0.3094367980957031, -0.2937774658203125, -0.2781181335449219, -0.26245880126953125, -0.24679946899414062, -0.23114013671875, -0.21548080444335938, -0.19982147216796875, -0.18416213989257812, -0.1685028076171875, -0.15284347534179688, -0.13718414306640625, -0.12152481079101562, -0.105865478515625, -0.09020614624023438, -0.07454681396484375, -0.058887481689453125, -0.0432281494140625, -0.027568817138671875, -0.01190948486328125, 0.003749847412109375, 0.0194091796875, 0.035068511962890625, 0.05072784423828125, 0.06638717651367188, 0.0820465087890625, 0.09770584106445312, 0.11336517333984375, 0.12902450561523438, 0.144683837890625, 0.16034317016601562, 0.17600250244140625, 0.19166183471679688, 0.2073211669921875, 0.22298049926757812, 0.23863983154296875, 0.2542991638183594, 0.26995849609375, 0.2856178283691406, 0.30127716064453125, 0.3169364929199219, 0.3325958251953125, 0.3482551574707031, 0.36391448974609375, 0.3795738220214844, 0.395233154296875, 0.4108924865722656, 0.42655181884765625, 0.4422111511230469, 0.4578704833984375, 0.4735298156738281, 0.48918914794921875, 0.5048484802246094, 0.5205078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 14.0, 21.0, 22.0, 28.0, 38.0, 72.0, 115.0, 127.0, 142.0, 110.0, 102.0, 67.0, 30.0, 27.0, 20.0, 12.0, 8.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024261474609375, -0.02349066734313965, -0.022719860076904297, -0.021949052810668945, -0.021178245544433594, -0.020407438278198242, -0.01963663101196289, -0.01886582374572754, -0.018095016479492188, -0.017324209213256836, -0.016553401947021484, -0.015782594680786133, -0.015011787414550781, -0.01424098014831543, -0.013470172882080078, -0.012699365615844727, -0.011928558349609375, -0.011157751083374023, -0.010386943817138672, -0.00961613655090332, -0.008845329284667969, -0.008074522018432617, -0.007303714752197266, -0.006532907485961914, -0.0057621002197265625, -0.004991292953491211, -0.004220485687255859, -0.003449678421020508, -0.0026788711547851562, -0.0019080638885498047, -0.0011372566223144531, -0.00036644935607910156, 0.00040435791015625, 0.0011751651763916016, 0.0019459724426269531, 0.0027167797088623047, 0.0034875869750976562, 0.004258394241333008, 0.005029201507568359, 0.005800008773803711, 0.0065708160400390625, 0.007341623306274414, 0.008112430572509766, 0.008883237838745117, 0.009654045104980469, 0.01042485237121582, 0.011195659637451172, 0.011966466903686523, 0.012737274169921875, 0.013508081436157227, 0.014278888702392578, 0.01504969596862793, 0.01582050323486328, 0.016591310501098633, 0.017362117767333984, 0.018132925033569336, 0.018903732299804688, 0.01967453956604004, 0.02044534683227539, 0.021216154098510742, 0.021986961364746094, 0.022757768630981445, 0.023528575897216797, 0.02429938316345215, 0.0250701904296875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 1.0, 5.0, 4.0, 6.0, 7.0, 12.0, 17.0, 21.0, 36.0, 58.0, 91.0, 184.0, 718.0, 11071.0, 965361.0, 68499.0, 1809.0, 321.0, 120.0, 68.0, 42.0, 39.0, 21.0, 13.0, 6.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38232421875, -0.370635986328125, -0.35894775390625, -0.347259521484375, -0.3355712890625, -0.323883056640625, -0.31219482421875, -0.300506591796875, -0.288818359375, -0.277130126953125, -0.26544189453125, -0.253753662109375, -0.2420654296875, -0.230377197265625, -0.21868896484375, -0.207000732421875, -0.1953125, -0.183624267578125, -0.17193603515625, -0.160247802734375, -0.1485595703125, -0.136871337890625, -0.12518310546875, -0.113494873046875, -0.101806640625, -0.090118408203125, -0.07843017578125, -0.066741943359375, -0.0550537109375, -0.043365478515625, -0.03167724609375, -0.019989013671875, -0.00830078125, 0.003387451171875, 0.01507568359375, 0.026763916015625, 0.0384521484375, 0.050140380859375, 0.06182861328125, 0.073516845703125, 0.085205078125, 0.096893310546875, 0.10858154296875, 0.120269775390625, 0.1319580078125, 0.143646240234375, 0.15533447265625, 0.167022705078125, 0.1787109375, 0.190399169921875, 0.20208740234375, 0.213775634765625, 0.2254638671875, 0.237152099609375, 0.24884033203125, 0.260528564453125, 0.272216796875, 0.283905029296875, 0.29559326171875, 0.307281494140625, 0.3189697265625, 0.330657958984375, 0.34234619140625, 0.354034423828125, 0.36572265625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 6.0, 12.0, 39.0, 123.0, 322.0, 319.0, 118.0, 37.0, 15.0, 9.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14149564504623413, -0.13642992079257965, -0.13136419653892517, -0.1262984573841095, -0.12123273313045502, -0.11616700887680054, -0.11110127717256546, -0.10603554546833038, -0.1009698212146759, -0.09590409696102142, -0.09083836525678635, -0.08577263355255127, -0.08070690929889679, -0.07564118504524231, -0.07057545334100723, -0.06550972163677216, -0.060443997383117676, -0.0553782694041729, -0.05031254142522812, -0.04524681344628334, -0.04018108546733856, -0.035115357488393784, -0.030049629509449005, -0.024983901530504227, -0.019918173551559448, -0.01485244557261467, -0.009786717593669891, -0.004720989614725113, 0.00034473836421966553, 0.005410466343164444, 0.010476194322109222, 0.015541922301054, 0.02060765027999878, 0.025673378258943558, 0.030739106237888336, 0.035804834216833115, 0.04087056219577789, 0.04593629017472267, 0.05100201815366745, 0.05606774613261223, 0.06113347411155701, 0.06619919836521149, 0.07126493006944656, 0.07633066177368164, 0.08139638602733612, 0.0864621102809906, 0.09152784198522568, 0.09659357368946075, 0.10165929794311523, 0.10672502219676971, 0.11179075390100479, 0.11685648560523987, 0.12192220985889435, 0.12698793411254883, 0.1320536732673645, 0.13711939752101898, 0.14218512177467346, 0.14725084602832794, 0.15231657028198242, 0.1573823094367981, 0.16244803369045258, 0.16751375794410706, 0.17257949709892273, 0.1776452213525772, 0.1827109456062317]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 10.0, 4.0, 8.0, 9.0, 5.0, 13.0, 16.0, 16.0, 22.0, 23.0, 26.0, 39.0, 38.0, 32.0, 43.0, 37.0, 43.0, 36.0, 45.0, 48.0, 31.0, 46.0, 43.0, 40.0, 46.0, 29.0, 31.0, 41.0, 28.0, 22.0, 21.0, 14.0, 22.0, 10.0, 11.0, 7.0, 14.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.023356854915618896, -0.022606655955314636, -0.021856456995010376, -0.021106258034706116, -0.020356059074401855, -0.019605860114097595, -0.018855661153793335, -0.018105462193489075, -0.017355263233184814, -0.016605064272880554, -0.015854865312576294, -0.015104666352272034, -0.014354467391967773, -0.013604268431663513, -0.012854069471359253, -0.012103870511054993, -0.011353671550750732, -0.010603472590446472, -0.009853273630142212, -0.009103074669837952, -0.008352875709533691, -0.007602676749229431, -0.006852477788925171, -0.006102278828620911, -0.00535207986831665, -0.00460188090801239, -0.00385168194770813, -0.0031014829874038696, -0.0023512840270996094, -0.0016010850667953491, -0.0008508861064910889, -0.00010068714618682861, 0.0006495118141174316, 0.001399710774421692, 0.002149909734725952, 0.0029001086950302124, 0.0036503076553344727, 0.004400506615638733, 0.005150705575942993, 0.005900904536247253, 0.006651103496551514, 0.007401302456855774, 0.008151501417160034, 0.008901700377464294, 0.009651899337768555, 0.010402098298072815, 0.011152297258377075, 0.011902496218681335, 0.012652695178985596, 0.013402894139289856, 0.014153093099594116, 0.014903292059898376, 0.015653491020202637, 0.016403689980506897, 0.017153888940811157, 0.017904087901115417, 0.018654286861419678, 0.019404485821723938, 0.020154684782028198, 0.02090488374233246, 0.02165508270263672, 0.02240528166294098, 0.02315548062324524, 0.0239056795835495, 0.02465587854385376]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 6.0, 5.0, 7.0, 14.0, 16.0, 16.0, 17.0, 26.0, 19.0, 22.0, 34.0, 25.0, 31.0, 30.0, 30.0, 39.0, 45.0, 35.0, 49.0, 35.0, 31.0, 38.0, 35.0, 44.0, 44.0, 36.0, 37.0, 30.0, 29.0, 28.0, 21.0, 23.0, 19.0, 13.0, 15.0, 7.0, 10.0, 11.0, 5.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.5244140625, -0.509796142578125, -0.49517822265625, -0.480560302734375, -0.4659423828125, -0.451324462890625, -0.43670654296875, -0.422088623046875, -0.407470703125, -0.392852783203125, -0.37823486328125, -0.363616943359375, -0.3489990234375, -0.334381103515625, -0.31976318359375, -0.305145263671875, -0.29052734375, -0.275909423828125, -0.26129150390625, -0.246673583984375, -0.2320556640625, -0.217437744140625, -0.20281982421875, -0.188201904296875, -0.173583984375, -0.158966064453125, -0.14434814453125, -0.129730224609375, -0.1151123046875, -0.100494384765625, -0.08587646484375, -0.071258544921875, -0.056640625, -0.042022705078125, -0.02740478515625, -0.012786865234375, 0.0018310546875, 0.016448974609375, 0.03106689453125, 0.045684814453125, 0.060302734375, 0.074920654296875, 0.08953857421875, 0.104156494140625, 0.1187744140625, 0.133392333984375, 0.14801025390625, 0.162628173828125, 0.17724609375, 0.191864013671875, 0.20648193359375, 0.221099853515625, 0.2357177734375, 0.250335693359375, 0.26495361328125, 0.279571533203125, 0.294189453125, 0.308807373046875, 0.32342529296875, 0.338043212890625, 0.3526611328125, 0.367279052734375, 0.38189697265625, 0.396514892578125, 0.4111328125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 7.0, 13.0, 15.0, 25.0, 44.0, 65.0, 87.0, 159.0, 230.0, 460.0, 984.0, 2216.0, 6320.0, 28433.0, 320977.0, 630135.0, 44902.0, 8237.0, 2777.0, 1160.0, 548.0, 272.0, 177.0, 100.0, 66.0, 45.0, 35.0, 20.0, 10.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.70599365234375, -2.6190185546875, -2.53204345703125, -2.445068359375, -2.35809326171875, -2.2711181640625, -2.18414306640625, -2.09716796875, -2.01019287109375, -1.9232177734375, -1.83624267578125, -1.749267578125, -1.66229248046875, -1.5753173828125, -1.48834228515625, -1.4013671875, -1.31439208984375, -1.2274169921875, -1.14044189453125, -1.053466796875, -0.96649169921875, -0.8795166015625, -0.79254150390625, -0.70556640625, -0.61859130859375, -0.5316162109375, -0.44464111328125, -0.357666015625, -0.27069091796875, -0.1837158203125, -0.09674072265625, -0.009765625, 0.07720947265625, 0.1641845703125, 0.25115966796875, 0.338134765625, 0.42510986328125, 0.5120849609375, 0.59906005859375, 0.68603515625, 0.77301025390625, 0.8599853515625, 0.94696044921875, 1.033935546875, 1.12091064453125, 1.2078857421875, 1.29486083984375, 1.3818359375, 1.46881103515625, 1.5557861328125, 1.64276123046875, 1.729736328125, 1.81671142578125, 1.9036865234375, 1.99066162109375, 2.07763671875, 2.16461181640625, 2.2515869140625, 2.33856201171875, 2.425537109375, 2.51251220703125, 2.5994873046875, 2.68646240234375, 2.7734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 8.0, 10.0, 6.0, 11.0, 9.0, 20.0, 16.0, 31.0, 23.0, 31.0, 31.0, 43.0, 64.0, 61.0, 97.0, 141.0, 212.0, 1362.0, 231.0, 134.0, 90.0, 69.0, 64.0, 34.0, 36.0, 33.0, 22.0, 31.0, 17.0, 21.0, 10.0, 12.0, 7.0, 12.0, 6.0, 5.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4694976806640625, -1.421417236328125, -1.3733367919921875, -1.32525634765625, -1.2771759033203125, -1.229095458984375, -1.1810150146484375, -1.1329345703125, -1.0848541259765625, -1.036773681640625, -0.9886932373046875, -0.94061279296875, -0.8925323486328125, -0.844451904296875, -0.7963714599609375, -0.748291015625, -0.7002105712890625, -0.652130126953125, -0.6040496826171875, -0.55596923828125, -0.5078887939453125, -0.459808349609375, -0.4117279052734375, -0.3636474609375, -0.3155670166015625, -0.267486572265625, -0.2194061279296875, -0.17132568359375, -0.1232452392578125, -0.075164794921875, -0.0270843505859375, 0.02099609375, 0.0690765380859375, 0.117156982421875, 0.1652374267578125, 0.21331787109375, 0.2613983154296875, 0.309478759765625, 0.3575592041015625, 0.4056396484375, 0.4537200927734375, 0.501800537109375, 0.5498809814453125, 0.59796142578125, 0.6460418701171875, 0.694122314453125, 0.7422027587890625, 0.790283203125, 0.8383636474609375, 0.886444091796875, 0.9345245361328125, 0.98260498046875, 1.0306854248046875, 1.078765869140625, 1.1268463134765625, 1.1749267578125, 1.2230072021484375, 1.271087646484375, 1.3191680908203125, 1.36724853515625, 1.4153289794921875, 1.463409423828125, 1.5114898681640625, 1.5595703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 14.0, 13.0, 18.0, 22.0, 28.0, 48.0, 62.0, 88.0, 154.0, 356.0, 808.0, 2397.0, 10924.0, 410220.0, 2686207.0, 28080.0, 3958.0, 1234.0, 438.0, 230.0, 112.0, 75.0, 58.0, 34.0, 31.0, 16.0, 8.0, 13.0, 10.0, 8.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.31793212890625, -4.1749267578125, -4.03192138671875, -3.888916015625, -3.74591064453125, -3.6029052734375, -3.45989990234375, -3.31689453125, -3.17388916015625, -3.0308837890625, -2.88787841796875, -2.744873046875, -2.60186767578125, -2.4588623046875, -2.31585693359375, -2.1728515625, -2.02984619140625, -1.8868408203125, -1.74383544921875, -1.600830078125, -1.45782470703125, -1.3148193359375, -1.17181396484375, -1.02880859375, -0.88580322265625, -0.7427978515625, -0.59979248046875, -0.456787109375, -0.31378173828125, -0.1707763671875, -0.02777099609375, 0.115234375, 0.25823974609375, 0.4012451171875, 0.54425048828125, 0.687255859375, 0.83026123046875, 0.9732666015625, 1.11627197265625, 1.25927734375, 1.40228271484375, 1.5452880859375, 1.68829345703125, 1.831298828125, 1.97430419921875, 2.1173095703125, 2.26031494140625, 2.4033203125, 2.54632568359375, 2.6893310546875, 2.83233642578125, 2.975341796875, 3.11834716796875, 3.2613525390625, 3.40435791015625, 3.54736328125, 3.69036865234375, 3.8333740234375, 3.97637939453125, 4.119384765625, 4.26239013671875, 4.4053955078125, 4.54840087890625, 4.69140625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 87.0, 925.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.180527210235596, -2.9515085220336914, -0.7224898338317871, 1.5065288543701172, 3.7355475425720215, 5.964566707611084, 8.193584442138672, 10.422603607177734, 12.651622772216797, 14.88064193725586, 17.109661102294922, 19.33867835998535, 21.567697525024414, 23.796716690063477, 26.025733947753906, 28.25475311279297, 30.48377227783203, 32.712791442871094, 34.941810607910156, 37.17082977294922, 39.39984893798828, 41.628868103027344, 43.85788345336914, 46.0869026184082, 48.315921783447266, 50.54494094848633, 52.77396011352539, 55.00297927856445, 57.23199462890625, 59.46101379394531, 61.690032958984375, 63.91905212402344, 66.1480712890625, 68.37709045410156, 70.60610961914062, 72.83512878417969, 75.06414794921875, 77.29316711425781, 79.52218627929688, 81.75120544433594, 83.980224609375, 86.20924377441406, 88.43826293945312, 90.66728210449219, 92.89630126953125, 95.12532043457031, 97.35433959960938, 99.58335876464844, 101.81237030029297, 104.04138946533203, 106.2704086303711, 108.49942779541016, 110.72844696044922, 112.95746612548828, 115.18648529052734, 117.41549682617188, 119.64451599121094, 121.87353515625, 124.10255432128906, 126.33157348632812, 128.5605926513672, 130.78961181640625, 133.0186309814453, 135.24765014648438, 137.47666931152344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 8.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 11.0, 12.0, 19.0, 18.0, 19.0, 16.0, 25.0, 26.0, 28.0, 41.0, 38.0, 35.0, 38.0, 37.0, 55.0, 41.0, 44.0, 39.0, 38.0, 26.0, 39.0, 36.0, 37.0, 30.0, 34.0, 34.0, 30.0, 25.0, 22.0, 19.0, 15.0, 15.0, 3.0, 7.0, 8.0, 6.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.278147220611572, -4.1318464279174805, -3.9855451583862305, -3.8392441272735596, -3.6929430961608887, -3.5466420650482178, -3.400341033935547, -3.254040002822876, -3.107738971710205, -2.961437940597534, -2.8151369094848633, -2.6688358783721924, -2.5225348472595215, -2.3762338161468506, -2.2299327850341797, -2.083631753921509, -1.937330722808838, -1.791029691696167, -1.644728660583496, -1.4984276294708252, -1.3521265983581543, -1.2058255672454834, -1.0595245361328125, -0.9132235050201416, -0.7669224739074707, -0.6206214427947998, -0.4743204116821289, -0.328019380569458, -0.1817183494567871, -0.03541731834411621, 0.11088371276855469, 0.2571847438812256, 0.4034852981567383, 0.5497863292694092, 0.6960873603820801, 0.842388391494751, 0.9886894226074219, 1.1349904537200928, 1.2812914848327637, 1.4275925159454346, 1.5738935470581055, 1.7201945781707764, 1.8664956092834473, 2.012796640396118, 2.159097671508789, 2.30539870262146, 2.451699733734131, 2.5980007648468018, 2.7443017959594727, 2.8906028270721436, 3.0369038581848145, 3.1832048892974854, 3.3295059204101562, 3.475806951522827, 3.622107982635498, 3.768409013748169, 3.91471004486084, 4.06101131439209, 4.207312107086182, 4.353612899780273, 4.499914169311523, 4.646215438842773, 4.792516231536865, 4.938817024230957, 5.085118293762207]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 16.0, 8.0, 10.0, 15.0, 14.0, 22.0, 19.0, 17.0, 28.0, 25.0, 28.0, 28.0, 33.0, 38.0, 41.0, 40.0, 37.0, 27.0, 37.0, 36.0, 45.0, 39.0, 37.0, 32.0, 46.0, 42.0, 28.0, 24.0, 29.0, 20.0, 20.0, 24.0, 10.0, 13.0, 9.0, 13.0, 13.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.48995208740234375, -0.4740447998046875, -0.45813751220703125, -0.442230224609375, -0.42632293701171875, -0.4104156494140625, -0.39450836181640625, -0.37860107421875, -0.36269378662109375, -0.3467864990234375, -0.33087921142578125, -0.314971923828125, -0.29906463623046875, -0.2831573486328125, -0.26725006103515625, -0.2513427734375, -0.23543548583984375, -0.2195281982421875, -0.20362091064453125, -0.187713623046875, -0.17180633544921875, -0.1558990478515625, -0.13999176025390625, -0.12408447265625, -0.10817718505859375, -0.0922698974609375, -0.07636260986328125, -0.060455322265625, -0.04454803466796875, -0.0286407470703125, -0.01273345947265625, 0.003173828125, 0.01908111572265625, 0.0349884033203125, 0.05089569091796875, 0.066802978515625, 0.08271026611328125, 0.0986175537109375, 0.11452484130859375, 0.13043212890625, 0.14633941650390625, 0.1622467041015625, 0.17815399169921875, 0.194061279296875, 0.20996856689453125, 0.2258758544921875, 0.24178314208984375, 0.2576904296875, 0.27359771728515625, 0.2895050048828125, 0.30541229248046875, 0.321319580078125, 0.33722686767578125, 0.3531341552734375, 0.36904144287109375, 0.38494873046875, 0.40085601806640625, 0.4167633056640625, 0.43267059326171875, 0.448577880859375, 0.46448516845703125, 0.4803924560546875, 0.49629974365234375, 0.51220703125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 7.0, 17.0, 21.0, 27.0, 42.0, 58.0, 107.0, 160.0, 272.0, 501.0, 943.0, 2162.0, 6311.0, 28359.0, 328732.0, 3318998.0, 461081.0, 34858.0, 7151.0, 2306.0, 1010.0, 482.0, 265.0, 171.0, 88.0, 52.0, 37.0, 22.0, 10.0, 13.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.1050872802734375, -2.044158935546875, -1.9832305908203125, -1.92230224609375, -1.8613739013671875, -1.800445556640625, -1.7395172119140625, -1.6785888671875, -1.6176605224609375, -1.556732177734375, -1.4958038330078125, -1.43487548828125, -1.3739471435546875, -1.313018798828125, -1.2520904541015625, -1.191162109375, -1.1302337646484375, -1.069305419921875, -1.0083770751953125, -0.94744873046875, -0.8865203857421875, -0.825592041015625, -0.7646636962890625, -0.7037353515625, -0.6428070068359375, -0.581878662109375, -0.5209503173828125, -0.46002197265625, -0.3990936279296875, -0.338165283203125, -0.2772369384765625, -0.21630859375, -0.1553802490234375, -0.094451904296875, -0.0335235595703125, 0.02740478515625, 0.0883331298828125, 0.149261474609375, 0.2101898193359375, 0.2711181640625, 0.3320465087890625, 0.392974853515625, 0.4539031982421875, 0.51483154296875, 0.5757598876953125, 0.636688232421875, 0.6976165771484375, 0.758544921875, 0.8194732666015625, 0.880401611328125, 0.9413299560546875, 1.00225830078125, 1.0631866455078125, 1.124114990234375, 1.1850433349609375, 1.2459716796875, 1.3069000244140625, 1.367828369140625, 1.4287567138671875, 1.48968505859375, 1.5506134033203125, 1.611541748046875, 1.6724700927734375, 1.7333984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 7.0, 7.0, 14.0, 25.0, 34.0, 53.0, 77.0, 124.0, 170.0, 310.0, 455.0, 695.0, 691.0, 474.0, 288.0, 194.0, 141.0, 92.0, 55.0, 42.0, 45.0, 25.0, 19.0, 5.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.2796478271484375, -1.237030029296875, -1.1944122314453125, -1.15179443359375, -1.1091766357421875, -1.066558837890625, -1.0239410400390625, -0.9813232421875, -0.9387054443359375, -0.896087646484375, -0.8534698486328125, -0.81085205078125, -0.7682342529296875, -0.725616455078125, -0.6829986572265625, -0.640380859375, -0.5977630615234375, -0.555145263671875, -0.5125274658203125, -0.46990966796875, -0.4272918701171875, -0.384674072265625, -0.3420562744140625, -0.2994384765625, -0.2568206787109375, -0.214202880859375, -0.1715850830078125, -0.12896728515625, -0.0863494873046875, -0.043731689453125, -0.0011138916015625, 0.04150390625, 0.0841217041015625, 0.126739501953125, 0.1693572998046875, 0.21197509765625, 0.2545928955078125, 0.297210693359375, 0.3398284912109375, 0.3824462890625, 0.4250640869140625, 0.467681884765625, 0.5102996826171875, 0.55291748046875, 0.5955352783203125, 0.638153076171875, 0.6807708740234375, 0.723388671875, 0.7660064697265625, 0.808624267578125, 0.8512420654296875, 0.89385986328125, 0.9364776611328125, 0.979095458984375, 1.0217132568359375, 1.0643310546875, 1.1069488525390625, 1.149566650390625, 1.1921844482421875, 1.23480224609375, 1.2774200439453125, 1.320037841796875, 1.3626556396484375, 1.4052734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 2.0, 9.0, 11.0, 23.0, 40.0, 69.0, 110.0, 185.0, 409.0, 824.0, 2114.0, 7696.0, 60359.0, 2528151.0, 1540188.0, 44571.0, 6403.0, 1727.0, 737.0, 314.0, 154.0, 88.0, 35.0, 23.0, 12.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.451141357421875, -3.33587646484375, -3.220611572265625, -3.1053466796875, -2.990081787109375, -2.87481689453125, -2.759552001953125, -2.644287109375, -2.529022216796875, -2.41375732421875, -2.298492431640625, -2.1832275390625, -2.067962646484375, -1.95269775390625, -1.837432861328125, -1.72216796875, -1.606903076171875, -1.49163818359375, -1.376373291015625, -1.2611083984375, -1.145843505859375, -1.03057861328125, -0.915313720703125, -0.800048828125, -0.684783935546875, -0.56951904296875, -0.454254150390625, -0.3389892578125, -0.223724365234375, -0.10845947265625, 0.006805419921875, 0.1220703125, 0.237335205078125, 0.35260009765625, 0.467864990234375, 0.5831298828125, 0.698394775390625, 0.81365966796875, 0.928924560546875, 1.044189453125, 1.159454345703125, 1.27471923828125, 1.389984130859375, 1.5052490234375, 1.620513916015625, 1.73577880859375, 1.851043701171875, 1.96630859375, 2.081573486328125, 2.19683837890625, 2.312103271484375, 2.4273681640625, 2.542633056640625, 2.65789794921875, 2.773162841796875, 2.888427734375, 3.003692626953125, 3.11895751953125, 3.234222412109375, 3.3494873046875, 3.464752197265625, 3.58001708984375, 3.695281982421875, 3.810546875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 12.0, 21.0, 22.0, 42.0, 90.0, 133.0, 168.0, 146.0, 132.0, 95.0, 59.0, 38.0, 14.0, 12.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.334183692932129, -12.053131103515625, -11.772079467773438, -11.491026878356934, -11.20997428894043, -10.928922653198242, -10.647870063781738, -10.36681842803955, -10.085765838623047, -9.804713249206543, -9.523661613464355, -9.242609024047852, -8.961557388305664, -8.68050479888916, -8.399452209472656, -8.118400573730469, -7.837347984313965, -7.556295871734619, -7.275243759155273, -6.9941911697387695, -6.713139057159424, -6.432086944580078, -6.151034355163574, -5.8699822425842285, -5.588930130004883, -5.307878017425537, -5.026825904846191, -4.7457733154296875, -4.464721202850342, -4.183669090270996, -3.9026167392730713, -3.6215643882751465, -3.340513229370117, -3.0594611167907715, -2.7784087657928467, -2.497356414794922, -2.216304302215576, -1.935252070426941, -1.6541998386383057, -1.3731476068496704, -1.0920953750610352, -0.8110431432723999, -0.5299909114837646, -0.2489386796951294, 0.03211355209350586, 0.3131657838821411, 0.5942180156707764, 0.8752702474594116, 1.1563224792480469, 1.4373747110366821, 1.7184269428253174, 1.9994791746139526, 2.280531406402588, 2.5615835189819336, 2.8426358699798584, 3.123688220977783, 3.404740333557129, 3.6857924461364746, 3.9668447971343994, 4.247897148132324, 4.52894926071167, 4.810001373291016, 5.0910539627075195, 5.372106075286865, 5.653158187866211]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 4.0, 7.0, 7.0, 6.0, 5.0, 8.0, 8.0, 15.0, 15.0, 16.0, 14.0, 17.0, 30.0, 19.0, 31.0, 31.0, 37.0, 30.0, 27.0, 42.0, 47.0, 38.0, 47.0, 38.0, 40.0, 28.0, 27.0, 36.0, 34.0, 36.0, 29.0, 28.0, 18.0, 19.0, 21.0, 28.0, 21.0, 20.0, 14.0, 10.0, 9.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.615499973297119, -3.510424852371216, -3.4053499698638916, -3.3002748489379883, -3.195199728012085, -3.0901246070861816, -2.9850497245788574, -2.879974603652954, -2.774899482727051, -2.6698243618011475, -2.5647494792938232, -2.45967435836792, -2.3545992374420166, -2.2495241165161133, -2.144449234008789, -2.0393741130828857, -1.934299111366272, -1.8292241096496582, -1.7241489887237549, -1.6190739870071411, -1.5139988660812378, -1.408923864364624, -1.3038487434387207, -1.198773741722107, -1.0936987400054932, -0.9886236786842346, -0.8835486173629761, -0.7784736156463623, -0.673398494720459, -0.5683234930038452, -0.46324843168258667, -0.3581733703613281, -0.2530982494354248, -0.14802318811416626, -0.04294814169406891, 0.06212690472602844, 0.167201966047287, 0.27227699756622314, 0.3773520588874817, 0.48242712020874023, 0.5875021815299988, 0.6925772428512573, 0.7976523041725159, 0.9027273654937744, 1.0078023672103882, 1.112877368927002, 1.2179524898529053, 1.3230276107788086, 1.4281026124954224, 1.5331776142120361, 1.6382527351379395, 1.7433277368545532, 1.8484028577804565, 1.9534778594970703, 2.0585529804229736, 2.163628101348877, 2.268702983856201, 2.3737781047821045, 2.4788529872894287, 2.583928108215332, 2.6890032291412354, 2.7940783500671387, 2.899153232574463, 3.004228353500366, 3.1093034744262695]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 4.0, 15.0, 23.0, 10.0, 15.0, 20.0, 22.0, 25.0, 21.0, 35.0, 36.0, 34.0, 36.0, 30.0, 46.0, 36.0, 39.0, 42.0, 51.0, 37.0, 39.0, 42.0, 48.0, 38.0, 29.0, 28.0, 24.0, 26.0, 19.0, 24.0, 23.0, 13.0, 17.0, 11.0, 6.0, 13.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.6025390625, -0.5857391357421875, -0.568939208984375, -0.5521392822265625, -0.53533935546875, -0.5185394287109375, -0.501739501953125, -0.4849395751953125, -0.4681396484375, -0.4513397216796875, -0.434539794921875, -0.4177398681640625, -0.40093994140625, -0.3841400146484375, -0.367340087890625, -0.3505401611328125, -0.333740234375, -0.3169403076171875, -0.300140380859375, -0.2833404541015625, -0.26654052734375, -0.2497406005859375, -0.232940673828125, -0.2161407470703125, -0.1993408203125, -0.1825408935546875, -0.165740966796875, -0.1489410400390625, -0.13214111328125, -0.1153411865234375, -0.098541259765625, -0.0817413330078125, -0.06494140625, -0.0481414794921875, -0.031341552734375, -0.0145416259765625, 0.00225830078125, 0.0190582275390625, 0.035858154296875, 0.0526580810546875, 0.0694580078125, 0.0862579345703125, 0.103057861328125, 0.1198577880859375, 0.13665771484375, 0.1534576416015625, 0.170257568359375, 0.1870574951171875, 0.203857421875, 0.2206573486328125, 0.237457275390625, 0.2542572021484375, 0.27105712890625, 0.2878570556640625, 0.304656982421875, 0.3214569091796875, 0.3382568359375, 0.3550567626953125, 0.371856689453125, 0.3886566162109375, 0.40545654296875, 0.4222564697265625, 0.439056396484375, 0.4558563232421875, 0.47265625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 17.0, 15.0, 22.0, 37.0, 40.0, 36.0, 94.0, 117.0, 146.0, 208.0, 272.0, 400.0, 563.0, 793.0, 1173.0, 2014.0, 3415.0, 6393.0, 12891.0, 29413.0, 68909.0, 165875.0, 325103.0, 242774.0, 105103.0, 43224.0, 18648.0, 8960.0, 4572.0, 2552.0, 1525.0, 964.0, 657.0, 456.0, 311.0, 229.0, 162.0, 124.0, 92.0, 66.0, 59.0, 31.0, 25.0, 16.0, 15.0, 5.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1900634765625, -0.18407440185546875, -0.1780853271484375, -0.17209625244140625, -0.166107177734375, -0.16011810302734375, -0.1541290283203125, -0.14813995361328125, -0.14215087890625, -0.13616180419921875, -0.1301727294921875, -0.12418365478515625, -0.118194580078125, -0.11220550537109375, -0.1062164306640625, -0.10022735595703125, -0.09423828125, -0.08824920654296875, -0.0822601318359375, -0.07627105712890625, -0.070281982421875, -0.06429290771484375, -0.0583038330078125, -0.05231475830078125, -0.04632568359375, -0.04033660888671875, -0.0343475341796875, -0.02835845947265625, -0.022369384765625, -0.01638031005859375, -0.0103912353515625, -0.00440216064453125, 0.0015869140625, 0.00757598876953125, 0.0135650634765625, 0.01955413818359375, 0.025543212890625, 0.03153228759765625, 0.0375213623046875, 0.04351043701171875, 0.04949951171875, 0.05548858642578125, 0.0614776611328125, 0.06746673583984375, 0.073455810546875, 0.07944488525390625, 0.0854339599609375, 0.09142303466796875, 0.097412109375, 0.10340118408203125, 0.1093902587890625, 0.11537933349609375, 0.121368408203125, 0.12735748291015625, 0.1333465576171875, 0.13933563232421875, 0.14532470703125, 0.15131378173828125, 0.1573028564453125, 0.16329193115234375, 0.169281005859375, 0.17527008056640625, 0.1812591552734375, 0.18724822998046875, 0.1932373046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 11.0, 8.0, 10.0, 18.0, 18.0, 16.0, 23.0, 15.0, 28.0, 27.0, 32.0, 37.0, 30.0, 45.0, 48.0, 39.0, 34.0, 39.0, 1064.0, 47.0, 36.0, 43.0, 36.0, 42.0, 43.0, 23.0, 21.0, 21.0, 26.0, 21.0, 19.0, 16.0, 16.0, 8.0, 6.0, 6.0, 15.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.3638725280761719, -0.35103607177734375, -0.3381996154785156, -0.3253631591796875, -0.3125267028808594, -0.29969024658203125, -0.2868537902832031, -0.274017333984375, -0.2611808776855469, -0.24834442138671875, -0.23550796508789062, -0.2226715087890625, -0.20983505249023438, -0.19699859619140625, -0.18416213989257812, -0.17132568359375, -0.15848922729492188, -0.14565277099609375, -0.13281631469726562, -0.1199798583984375, -0.10714340209960938, -0.09430694580078125, -0.08147048950195312, -0.068634033203125, -0.055797576904296875, -0.04296112060546875, -0.030124664306640625, -0.0172882080078125, -0.004451751708984375, 0.00838470458984375, 0.021221160888671875, 0.0340576171875, 0.046894073486328125, 0.05973052978515625, 0.07256698608398438, 0.0854034423828125, 0.09823989868164062, 0.11107635498046875, 0.12391281127929688, 0.136749267578125, 0.14958572387695312, 0.16242218017578125, 0.17525863647460938, 0.1880950927734375, 0.20093154907226562, 0.21376800537109375, 0.22660446166992188, 0.23944091796875, 0.2522773742675781, 0.26511383056640625, 0.2779502868652344, 0.2907867431640625, 0.3036231994628906, 0.31645965576171875, 0.3292961120605469, 0.342132568359375, 0.3549690246582031, 0.36780548095703125, 0.3806419372558594, 0.3934783935546875, 0.4063148498535156, 0.41915130615234375, 0.4319877624511719, 0.44482421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 7.0, 10.0, 10.0, 8.0, 12.0, 22.0, 28.0, 42.0, 64.0, 117.0, 187.0, 310.0, 588.0, 1098.0, 2688.0, 6494.0, 19737.0, 168855.0, 1847260.0, 33014.0, 9602.0, 3641.0, 1603.0, 770.0, 369.0, 220.0, 126.0, 83.0, 45.0, 37.0, 31.0, 14.0, 12.0, 8.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4267578125, -0.41262054443359375, -0.3984832763671875, -0.38434600830078125, -0.370208740234375, -0.35607147216796875, -0.3419342041015625, -0.32779693603515625, -0.31365966796875, -0.29952239990234375, -0.2853851318359375, -0.27124786376953125, -0.257110595703125, -0.24297332763671875, -0.2288360595703125, -0.21469879150390625, -0.2005615234375, -0.18642425537109375, -0.1722869873046875, -0.15814971923828125, -0.144012451171875, -0.12987518310546875, -0.1157379150390625, -0.10160064697265625, -0.08746337890625, -0.07332611083984375, -0.0591888427734375, -0.04505157470703125, -0.030914306640625, -0.01677703857421875, -0.0026397705078125, 0.01149749755859375, 0.025634765625, 0.03977203369140625, 0.0539093017578125, 0.06804656982421875, 0.082183837890625, 0.09632110595703125, 0.1104583740234375, 0.12459564208984375, 0.13873291015625, 0.15287017822265625, 0.1670074462890625, 0.18114471435546875, 0.195281982421875, 0.20941925048828125, 0.2235565185546875, 0.23769378662109375, 0.2518310546875, 0.26596832275390625, 0.2801055908203125, 0.29424285888671875, 0.308380126953125, 0.32251739501953125, 0.3366546630859375, 0.35079193115234375, 0.36492919921875, 0.37906646728515625, 0.3932037353515625, 0.40734100341796875, 0.421478271484375, 0.43561553955078125, 0.4497528076171875, 0.46389007568359375, 0.47802734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 7.0, 24.0, 42.0, 64.0, 115.0, 149.0, 168.0, 159.0, 94.0, 65.0, 40.0, 18.0, 14.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.031524658203125, -0.030612468719482422, -0.029700279235839844, -0.028788089752197266, -0.027875900268554688, -0.02696371078491211, -0.02605152130126953, -0.025139331817626953, -0.024227142333984375, -0.023314952850341797, -0.02240276336669922, -0.02149057388305664, -0.020578384399414062, -0.019666194915771484, -0.018754005432128906, -0.017841815948486328, -0.01692962646484375, -0.016017436981201172, -0.015105247497558594, -0.014193058013916016, -0.013280868530273438, -0.01236867904663086, -0.011456489562988281, -0.010544300079345703, -0.009632110595703125, -0.008719921112060547, -0.007807731628417969, -0.006895542144775391, -0.0059833526611328125, -0.005071163177490234, -0.004158973693847656, -0.003246784210205078, -0.0023345947265625, -0.0014224052429199219, -0.0005102157592773438, 0.0004019737243652344, 0.0013141632080078125, 0.0022263526916503906, 0.0031385421752929688, 0.004050731658935547, 0.004962921142578125, 0.005875110626220703, 0.006787300109863281, 0.007699489593505859, 0.008611679077148438, 0.009523868560791016, 0.010436058044433594, 0.011348247528076172, 0.01226043701171875, 0.013172626495361328, 0.014084815979003906, 0.014997005462646484, 0.015909194946289062, 0.01682138442993164, 0.01773357391357422, 0.018645763397216797, 0.019557952880859375, 0.020470142364501953, 0.02138233184814453, 0.02229452133178711, 0.023206710815429688, 0.024118900299072266, 0.025031089782714844, 0.025943279266357422, 0.02685546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 7.0, 10.0, 13.0, 16.0, 38.0, 105.0, 416.0, 2040.0, 13259.0, 1010695.0, 18642.0, 2556.0, 474.0, 128.0, 54.0, 24.0, 15.0, 7.0, 8.0, 3.0, 4.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44384765625, -0.4288330078125, -0.413818359375, -0.3988037109375, -0.3837890625, -0.3687744140625, -0.353759765625, -0.3387451171875, -0.32373046875, -0.3087158203125, -0.293701171875, -0.2786865234375, -0.263671875, -0.2486572265625, -0.233642578125, -0.2186279296875, -0.20361328125, -0.1885986328125, -0.173583984375, -0.1585693359375, -0.1435546875, -0.1285400390625, -0.113525390625, -0.0985107421875, -0.08349609375, -0.0684814453125, -0.053466796875, -0.0384521484375, -0.0234375, -0.0084228515625, 0.006591796875, 0.0216064453125, 0.03662109375, 0.0516357421875, 0.066650390625, 0.0816650390625, 0.0966796875, 0.1116943359375, 0.126708984375, 0.1417236328125, 0.15673828125, 0.1717529296875, 0.186767578125, 0.2017822265625, 0.216796875, 0.2318115234375, 0.246826171875, 0.2618408203125, 0.27685546875, 0.2918701171875, 0.306884765625, 0.3218994140625, 0.3369140625, 0.3519287109375, 0.366943359375, 0.3819580078125, 0.39697265625, 0.4119873046875, 0.427001953125, 0.4420166015625, 0.45703125, 0.4720458984375, 0.487060546875, 0.5020751953125, 0.51708984375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 16.0, 56.0, 333.0, 480.0, 106.0, 13.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28422310948371887, -0.27478501200675964, -0.2653469145298004, -0.2559088170528412, -0.24647073447704315, -0.23703263700008392, -0.2275945544242859, -0.21815645694732666, -0.20871835947036743, -0.1992802619934082, -0.18984216451644897, -0.18040408194065094, -0.1709659844636917, -0.16152788698673248, -0.15208980441093445, -0.14265170693397522, -0.133213609457016, -0.12377551198005676, -0.11433742195367813, -0.1048993319272995, -0.09546123445034027, -0.08602313697338104, -0.07658504694700241, -0.06714695692062378, -0.05770885944366455, -0.04827076569199562, -0.03883267194032669, -0.02939457818865776, -0.01995648443698883, -0.0105183906853199, -0.0010802969336509705, 0.008357793092727661, 0.017795860767364502, 0.027233954519033432, 0.03667204827070236, 0.04611014202237129, 0.05554823577404022, 0.06498633325099945, 0.07442442327737808, 0.08386251330375671, 0.09330061078071594, 0.10273870825767517, 0.1121767982840538, 0.12161488831043243, 0.13105298578739166, 0.1404910832643509, 0.14992916584014893, 0.15936726331710815, 0.16880536079406738, 0.1782434582710266, 0.18768155574798584, 0.19711963832378387, 0.2065577358007431, 0.21599583327770233, 0.22543391585350037, 0.2348720133304596, 0.24431011080741882, 0.25374820828437805, 0.2631863057613373, 0.2726244032382965, 0.28206247091293335, 0.2915005683898926, 0.3009386658668518, 0.31037676334381104, 0.31981486082077026]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 13.0, 15.0, 12.0, 14.0, 26.0, 30.0, 41.0, 32.0, 36.0, 40.0, 49.0, 52.0, 64.0, 63.0, 56.0, 68.0, 54.0, 56.0, 50.0, 33.0, 36.0, 26.0, 31.0, 25.0, 15.0, 20.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04205822944641113, -0.040676165372133255, -0.03929410129785538, -0.0379120409488678, -0.03652997687458992, -0.03514791280031204, -0.03376585245132446, -0.032383788377046585, -0.031001724302768707, -0.02961966022849083, -0.0282375980168581, -0.026855535805225372, -0.025473471730947495, -0.024091407656669617, -0.022709345445036888, -0.02132728323340416, -0.019945219159126282, -0.018563155084848404, -0.017181092873215675, -0.015799030661582947, -0.014416966587305069, -0.013034903444349766, -0.011652840301394463, -0.01027077715843916, -0.008888714015483856, -0.007506650872528553, -0.00612458772957325, -0.004742524586617947, -0.0033604614436626434, -0.0019783983007073402, -0.000596335157752037, 0.0007857279852032661, 0.0021677911281585693, 0.0035498542711138725, 0.004931917414069176, 0.006313980557024479, 0.007696043699979782, 0.009078106842935085, 0.010460169985890388, 0.011842233128845692, 0.013224296271800995, 0.014606359414756298, 0.0159884225577116, 0.01737048476934433, 0.018752548843622208, 0.020134612917900085, 0.021516675129532814, 0.022898737341165543, 0.02428080141544342, 0.025662865489721298, 0.027044927701354027, 0.028426989912986755, 0.029809053987264633, 0.03119111806154251, 0.03257317841053009, 0.03395524248480797, 0.035337306559085846, 0.036719370633363724, 0.0381014347076416, 0.03948349505662918, 0.04086555913090706, 0.042247623205184937, 0.043629683554172516, 0.045011747628450394, 0.04639381170272827]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 15.0, 22.0, 11.0, 15.0, 20.0, 21.0, 25.0, 23.0, 35.0, 33.0, 31.0, 44.0, 29.0, 45.0, 33.0, 42.0, 39.0, 54.0, 37.0, 38.0, 38.0, 50.0, 38.0, 31.0, 27.0, 23.0, 30.0, 17.0, 20.0, 26.0, 15.0, 15.0, 10.0, 7.0, 13.0, 7.0, 7.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.6015625, -0.5847816467285156, -0.5680007934570312, -0.5512199401855469, -0.5344390869140625, -0.5176582336425781, -0.5008773803710938, -0.4840965270996094, -0.467315673828125, -0.4505348205566406, -0.43375396728515625, -0.4169731140136719, -0.4001922607421875, -0.3834114074707031, -0.36663055419921875, -0.3498497009277344, -0.33306884765625, -0.3162879943847656, -0.29950714111328125, -0.2827262878417969, -0.2659454345703125, -0.24916458129882812, -0.23238372802734375, -0.21560287475585938, -0.198822021484375, -0.18204116821289062, -0.16526031494140625, -0.14847946166992188, -0.1316986083984375, -0.11491775512695312, -0.09813690185546875, -0.08135604858398438, -0.0645751953125, -0.047794342041015625, -0.03101348876953125, -0.014232635498046875, 0.0025482177734375, 0.019329071044921875, 0.03610992431640625, 0.052890777587890625, 0.069671630859375, 0.08645248413085938, 0.10323333740234375, 0.12001419067382812, 0.1367950439453125, 0.15357589721679688, 0.17035675048828125, 0.18713760375976562, 0.20391845703125, 0.22069931030273438, 0.23748016357421875, 0.2542610168457031, 0.2710418701171875, 0.2878227233886719, 0.30460357666015625, 0.3213844299316406, 0.338165283203125, 0.3549461364746094, 0.37172698974609375, 0.3885078430175781, 0.4052886962890625, 0.4220695495605469, 0.43885040283203125, 0.4556312561035156, 0.472412109375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 16.0, 22.0, 34.0, 42.0, 72.0, 122.0, 185.0, 315.0, 498.0, 831.0, 1486.0, 2682.0, 5177.0, 10125.0, 21113.0, 48187.0, 124325.0, 389485.0, 272914.0, 96209.0, 38940.0, 17199.0, 8587.0, 4394.0, 2373.0, 1314.0, 718.0, 448.0, 284.0, 170.0, 91.0, 55.0, 41.0, 28.0, 19.0, 16.0, 10.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8920059204101562, -0.8631134033203125, -0.8342208862304688, -0.805328369140625, -0.7764358520507812, -0.7475433349609375, -0.7186508178710938, -0.68975830078125, -0.6608657836914062, -0.6319732666015625, -0.6030807495117188, -0.574188232421875, -0.5452957153320312, -0.5164031982421875, -0.48751068115234375, -0.4586181640625, -0.42972564697265625, -0.4008331298828125, -0.37194061279296875, -0.343048095703125, -0.31415557861328125, -0.2852630615234375, -0.25637054443359375, -0.22747802734375, -0.19858551025390625, -0.1696929931640625, -0.14080047607421875, -0.111907958984375, -0.08301544189453125, -0.0541229248046875, -0.02523040771484375, 0.003662109375, 0.03255462646484375, 0.0614471435546875, 0.09033966064453125, 0.119232177734375, 0.14812469482421875, 0.1770172119140625, 0.20590972900390625, 0.23480224609375, 0.26369476318359375, 0.2925872802734375, 0.32147979736328125, 0.350372314453125, 0.37926483154296875, 0.4081573486328125, 0.43704986572265625, 0.4659423828125, 0.49483489990234375, 0.5237274169921875, 0.5526199340820312, 0.581512451171875, 0.6104049682617188, 0.6392974853515625, 0.6681900024414062, 0.69708251953125, 0.7259750366210938, 0.7548675537109375, 0.7837600708007812, 0.812652587890625, 0.8415451049804688, 0.8704376220703125, 0.8993301391601562, 0.92822265625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 7.0, 12.0, 11.0, 17.0, 13.0, 20.0, 32.0, 23.0, 31.0, 32.0, 34.0, 43.0, 45.0, 65.0, 103.0, 181.0, 1367.0, 314.0, 183.0, 92.0, 58.0, 47.0, 34.0, 41.0, 33.0, 25.0, 23.0, 26.0, 20.0, 15.0, 14.0, 13.0, 14.0, 9.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0], "bins": [-1.830078125, -1.7777099609375, -1.725341796875, -1.6729736328125, -1.62060546875, -1.5682373046875, -1.515869140625, -1.4635009765625, -1.4111328125, -1.3587646484375, -1.306396484375, -1.2540283203125, -1.20166015625, -1.1492919921875, -1.096923828125, -1.0445556640625, -0.9921875, -0.9398193359375, -0.887451171875, -0.8350830078125, -0.78271484375, -0.7303466796875, -0.677978515625, -0.6256103515625, -0.5732421875, -0.5208740234375, -0.468505859375, -0.4161376953125, -0.36376953125, -0.3114013671875, -0.259033203125, -0.2066650390625, -0.154296875, -0.1019287109375, -0.049560546875, 0.0028076171875, 0.05517578125, 0.1075439453125, 0.159912109375, 0.2122802734375, 0.2646484375, 0.3170166015625, 0.369384765625, 0.4217529296875, 0.47412109375, 0.5264892578125, 0.578857421875, 0.6312255859375, 0.68359375, 0.7359619140625, 0.788330078125, 0.8406982421875, 0.89306640625, 0.9454345703125, 0.997802734375, 1.0501708984375, 1.1025390625, 1.1549072265625, 1.207275390625, 1.2596435546875, 1.31201171875, 1.3643798828125, 1.416748046875, 1.4691162109375, 1.521484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 17.0, 25.0, 30.0, 89.0, 175.0, 338.0, 859.0, 4778.0, 1735730.0, 1397497.0, 4629.0, 841.0, 340.0, 160.0, 67.0, 42.0, 33.0, 10.0, 10.0, 7.0, 8.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.3203125, -7.09149169921875, -6.8626708984375, -6.63385009765625, -6.405029296875, -6.17620849609375, -5.9473876953125, -5.71856689453125, -5.48974609375, -5.26092529296875, -5.0321044921875, -4.80328369140625, -4.574462890625, -4.34564208984375, -4.1168212890625, -3.88800048828125, -3.6591796875, -3.43035888671875, -3.2015380859375, -2.97271728515625, -2.743896484375, -2.51507568359375, -2.2862548828125, -2.05743408203125, -1.82861328125, -1.59979248046875, -1.3709716796875, -1.14215087890625, -0.913330078125, -0.68450927734375, -0.4556884765625, -0.22686767578125, 0.001953125, 0.23077392578125, 0.4595947265625, 0.68841552734375, 0.917236328125, 1.14605712890625, 1.3748779296875, 1.60369873046875, 1.83251953125, 2.06134033203125, 2.2901611328125, 2.51898193359375, 2.747802734375, 2.97662353515625, 3.2054443359375, 3.43426513671875, 3.6630859375, 3.89190673828125, 4.1207275390625, 4.34954833984375, 4.578369140625, 4.80718994140625, 5.0360107421875, 5.26483154296875, 5.49365234375, 5.72247314453125, 5.9512939453125, 6.18011474609375, 6.408935546875, 6.63775634765625, 6.8665771484375, 7.09539794921875, 7.32421875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 5.0, 66.0, 408.0, 442.0, 84.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3541646003723145, -1.7754302024841309, -1.1966956853866577, -0.6179611682891846, -0.03922677040100098, 0.5395076274871826, 1.1182422637939453, 1.696976661682129, 2.2757110595703125, 2.854445457458496, 3.4331798553466797, 4.011914253234863, 4.590648651123047, 5.1693830490112305, 5.748117923736572, 6.326852321624756, 6.9055867195129395, 7.484321117401123, 8.063055992126465, 8.641790390014648, 9.220524787902832, 9.799259185791016, 10.3779935836792, 10.956727981567383, 11.535462379455566, 12.11419677734375, 12.692931175231934, 13.271665573120117, 13.8503999710083, 14.429134368896484, 15.007869720458984, 15.586603164672852, 16.16533851623535, 16.74407386779785, 17.32280731201172, 17.90154266357422, 18.480276107788086, 19.059011459350586, 19.637744903564453, 20.216480255126953, 20.79521369934082, 21.37394905090332, 21.952682495117188, 22.531417846679688, 23.110151290893555, 23.688886642456055, 24.267620086669922, 24.846355438232422, 25.425090789794922, 26.003826141357422, 26.58255958557129, 27.16129493713379, 27.740028381347656, 28.318763732910156, 28.897497177124023, 29.476232528686523, 30.05496597290039, 30.63370132446289, 31.212434768676758, 31.791170120239258, 32.369903564453125, 32.948638916015625, 33.527374267578125, 34.10610580444336, 34.68484115600586]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 8.0, 7.0, 10.0, 12.0, 18.0, 18.0, 11.0, 23.0, 30.0, 29.0, 33.0, 28.0, 43.0, 38.0, 33.0, 45.0, 33.0, 41.0, 40.0, 41.0, 37.0, 50.0, 38.0, 41.0, 27.0, 41.0, 29.0, 27.0, 32.0, 14.0, 17.0, 18.0, 15.0, 10.0, 8.0, 4.0, 13.0, 7.0, 5.0, 2.0, 6.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-5.041223526000977, -4.903148174285889, -4.765072822570801, -4.626996994018555, -4.488921642303467, -4.350846290588379, -4.212770938873291, -4.074695587158203, -3.936619758605957, -3.798544406890869, -3.660468816757202, -3.5223934650421143, -3.3843178749084473, -3.2462425231933594, -3.1081671714782715, -2.9700915813446045, -2.8320162296295166, -2.6939408779144287, -2.5558652877807617, -2.417789936065674, -2.279714345932007, -2.141638994216919, -2.003563404083252, -1.865488052368164, -1.7274125814437866, -1.5893371105194092, -1.4512616395950317, -1.3131861686706543, -1.1751108169555664, -1.0370352268218994, -0.8989598751068115, -0.7608844041824341, -0.6228091716766357, -0.4847337007522583, -0.34665825963020325, -0.2085828185081482, -0.07050734758377075, 0.06756812334060669, 0.20564353466033936, 0.3437190055847168, 0.48179447650909424, 0.6198699474334717, 0.7579454183578491, 0.8960208296775818, 1.0340962409973145, 1.1721718311309814, 1.3102471828460693, 1.4483226537704468, 1.5863981246948242, 1.7244735956192017, 1.862549066543579, 2.000624418258667, 2.138700008392334, 2.276775360107422, 2.4148507118225098, 2.5529263019561768, 2.6910018920898438, 2.8290772438049316, 2.9671528339385986, 3.1052281856536865, 3.2433037757873535, 3.3813791275024414, 3.5194544792175293, 3.6575300693511963, 3.795605421066284]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 9.0, 10.0, 9.0, 13.0, 11.0, 24.0, 22.0, 19.0, 23.0, 32.0, 28.0, 29.0, 32.0, 34.0, 41.0, 32.0, 36.0, 33.0, 32.0, 49.0, 39.0, 53.0, 26.0, 33.0, 28.0, 33.0, 42.0, 32.0, 30.0, 20.0, 25.0, 9.0, 15.0, 20.0, 11.0, 6.0, 15.0, 7.0, 9.0, 5.0, 7.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.56689453125, -0.5507621765136719, -0.5346298217773438, -0.5184974670410156, -0.5023651123046875, -0.4862327575683594, -0.47010040283203125, -0.4539680480957031, -0.437835693359375, -0.4217033386230469, -0.40557098388671875, -0.3894386291503906, -0.3733062744140625, -0.3571739196777344, -0.34104156494140625, -0.3249092102050781, -0.30877685546875, -0.2926445007324219, -0.27651214599609375, -0.2603797912597656, -0.2442474365234375, -0.22811508178710938, -0.21198272705078125, -0.19585037231445312, -0.179718017578125, -0.16358566284179688, -0.14745330810546875, -0.13132095336914062, -0.1151885986328125, -0.09905624389648438, -0.08292388916015625, -0.06679153442382812, -0.0506591796875, -0.034526824951171875, -0.01839447021484375, -0.002262115478515625, 0.0138702392578125, 0.030002593994140625, 0.04613494873046875, 0.062267303466796875, 0.078399658203125, 0.09453201293945312, 0.11066436767578125, 0.12679672241210938, 0.1429290771484375, 0.15906143188476562, 0.17519378662109375, 0.19132614135742188, 0.20745849609375, 0.22359085083007812, 0.23972320556640625, 0.2558555603027344, 0.2719879150390625, 0.2881202697753906, 0.30425262451171875, 0.3203849792480469, 0.336517333984375, 0.3526496887207031, 0.36878204345703125, 0.3849143981933594, 0.4010467529296875, 0.4171791076660156, 0.43331146240234375, 0.4494438171386719, 0.465576171875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 8.0, 12.0, 12.0, 23.0, 40.0, 46.0, 69.0, 96.0, 133.0, 187.0, 283.0, 408.0, 690.0, 1049.0, 1808.0, 3279.0, 6645.0, 14585.0, 42957.0, 178419.0, 1047236.0, 2189829.0, 552400.0, 102930.0, 28622.0, 10951.0, 5006.0, 2612.0, 1519.0, 859.0, 533.0, 341.0, 210.0, 130.0, 101.0, 67.0, 52.0, 38.0, 20.0, 25.0, 18.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.037109375, -1.0050201416015625, -0.972930908203125, -0.9408416748046875, -0.90875244140625, -0.8766632080078125, -0.844573974609375, -0.8124847412109375, -0.7803955078125, -0.7483062744140625, -0.716217041015625, -0.6841278076171875, -0.65203857421875, -0.6199493408203125, -0.587860107421875, -0.5557708740234375, -0.523681640625, -0.4915924072265625, -0.459503173828125, -0.4274139404296875, -0.39532470703125, -0.3632354736328125, -0.331146240234375, -0.2990570068359375, -0.2669677734375, -0.2348785400390625, -0.202789306640625, -0.1707000732421875, -0.13861083984375, -0.1065216064453125, -0.074432373046875, -0.0423431396484375, -0.01025390625, 0.0218353271484375, 0.053924560546875, 0.0860137939453125, 0.11810302734375, 0.1501922607421875, 0.182281494140625, 0.2143707275390625, 0.2464599609375, 0.2785491943359375, 0.310638427734375, 0.3427276611328125, 0.37481689453125, 0.4069061279296875, 0.438995361328125, 0.4710845947265625, 0.503173828125, 0.5352630615234375, 0.567352294921875, 0.5994415283203125, 0.63153076171875, 0.6636199951171875, 0.695709228515625, 0.7277984619140625, 0.7598876953125, 0.7919769287109375, 0.824066162109375, 0.8561553955078125, 0.88824462890625, 0.9203338623046875, 0.952423095703125, 0.9845123291015625, 1.0166015625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 6.0, 12.0, 24.0, 23.0, 48.0, 57.0, 82.0, 121.0, 229.0, 404.0, 686.0, 831.0, 568.0, 343.0, 220.0, 134.0, 90.0, 61.0, 37.0, 22.0, 18.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8818359375, -1.83404541015625, -1.7862548828125, -1.73846435546875, -1.690673828125, -1.64288330078125, -1.5950927734375, -1.54730224609375, -1.49951171875, -1.45172119140625, -1.4039306640625, -1.35614013671875, -1.308349609375, -1.26055908203125, -1.2127685546875, -1.16497802734375, -1.1171875, -1.06939697265625, -1.0216064453125, -0.97381591796875, -0.926025390625, -0.87823486328125, -0.8304443359375, -0.78265380859375, -0.73486328125, -0.68707275390625, -0.6392822265625, -0.59149169921875, -0.543701171875, -0.49591064453125, -0.4481201171875, -0.40032958984375, -0.3525390625, -0.30474853515625, -0.2569580078125, -0.20916748046875, -0.161376953125, -0.11358642578125, -0.0657958984375, -0.01800537109375, 0.02978515625, 0.07757568359375, 0.1253662109375, 0.17315673828125, 0.220947265625, 0.26873779296875, 0.3165283203125, 0.36431884765625, 0.412109375, 0.45989990234375, 0.5076904296875, 0.55548095703125, 0.603271484375, 0.65106201171875, 0.6988525390625, 0.74664306640625, 0.79443359375, 0.84222412109375, 0.8900146484375, 0.93780517578125, 0.985595703125, 1.03338623046875, 1.0811767578125, 1.12896728515625, 1.1767578125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 10.0, 16.0, 35.0, 46.0, 83.0, 132.0, 263.0, 754.0, 3144.0, 22355.0, 1910064.0, 2228938.0, 23599.0, 3319.0, 867.0, 277.0, 144.0, 66.0, 44.0, 34.0, 24.0, 16.0, 12.0, 10.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4613037109375, -4.289794921875, -4.1182861328125, -3.94677734375, -3.7752685546875, -3.603759765625, -3.4322509765625, -3.2607421875, -3.0892333984375, -2.917724609375, -2.7462158203125, -2.57470703125, -2.4031982421875, -2.231689453125, -2.0601806640625, -1.888671875, -1.7171630859375, -1.545654296875, -1.3741455078125, -1.20263671875, -1.0311279296875, -0.859619140625, -0.6881103515625, -0.5166015625, -0.3450927734375, -0.173583984375, -0.0020751953125, 0.16943359375, 0.3409423828125, 0.512451171875, 0.6839599609375, 0.85546875, 1.0269775390625, 1.198486328125, 1.3699951171875, 1.54150390625, 1.7130126953125, 1.884521484375, 2.0560302734375, 2.2275390625, 2.3990478515625, 2.570556640625, 2.7420654296875, 2.91357421875, 3.0850830078125, 3.256591796875, 3.4281005859375, 3.599609375, 3.7711181640625, 3.942626953125, 4.1141357421875, 4.28564453125, 4.4571533203125, 4.628662109375, 4.8001708984375, 4.9716796875, 5.1431884765625, 5.314697265625, 5.4862060546875, 5.65771484375, 5.8292236328125, 6.000732421875, 6.1722412109375, 6.34375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 15.0, 27.0, 99.0, 213.0, 313.0, 198.0, 94.0, 30.0, 16.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.104403495788574, -7.610931396484375, -7.117458820343018, -6.62398624420166, -6.130514144897461, -5.637042045593262, -5.143569469451904, -4.650096893310547, -4.156624794006348, -3.6631524562835693, -3.169680118560791, -2.6762077808380127, -2.1827354431152344, -1.689263105392456, -1.1957907676696777, -0.7023184299468994, -0.2088460922241211, 0.2846262454986572, 0.7780985832214355, 1.2715709209442139, 1.7650432586669922, 2.2585155963897705, 2.751987934112549, 3.245460271835327, 3.7389326095581055, 4.232404708862305, 4.725877285003662, 5.2193498611450195, 5.712821960449219, 6.206294059753418, 6.699766635894775, 7.193239212036133, 7.686710357666016, 8.180182456970215, 8.673654556274414, 9.16712760925293, 9.660599708557129, 10.154071807861328, 10.647544860839844, 11.141016960144043, 11.634489059448242, 12.127961158752441, 12.62143325805664, 13.114906311035156, 13.608378410339355, 14.101850509643555, 14.59532356262207, 15.08879566192627, 15.582267761230469, 16.075740814208984, 16.569211959838867, 17.062685012817383, 17.556156158447266, 18.04962921142578, 18.543102264404297, 19.03657341003418, 19.530046463012695, 20.02351951599121, 20.516990661621094, 21.01046371459961, 21.503936767578125, 21.997407913208008, 22.490880966186523, 22.984352111816406, 23.477825164794922]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 9.0, 5.0, 14.0, 18.0, 16.0, 15.0, 13.0, 21.0, 24.0, 31.0, 32.0, 41.0, 37.0, 42.0, 35.0, 31.0, 48.0, 51.0, 45.0, 42.0, 31.0, 33.0, 34.0, 40.0, 29.0, 39.0, 33.0, 34.0, 18.0, 29.0, 16.0, 21.0, 15.0, 8.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.131260395050049, -4.013218402862549, -3.8951761722564697, -3.7771339416503906, -3.6590919494628906, -3.5410499572753906, -3.4230077266693115, -3.3049654960632324, -3.1869235038757324, -3.0688815116882324, -2.9508392810821533, -2.832797050476074, -2.714755058288574, -2.596713066101074, -2.478670835494995, -2.360628604888916, -2.242586612701416, -2.124544620513916, -2.006502389907837, -1.8884602785110474, -1.7704181671142578, -1.6523760557174683, -1.5343339443206787, -1.4162918329238892, -1.2982497215270996, -1.18020761013031, -1.0621654987335205, -0.944123387336731, -0.8260812759399414, -0.7080391645431519, -0.5899970531463623, -0.47195494174957275, -0.3539125919342041, -0.23587048053741455, -0.117828369140625, 0.00021374225616455078, 0.1182558536529541, 0.23629796504974365, 0.3543400764465332, 0.47238218784332275, 0.5904242992401123, 0.7084664106369019, 0.8265085220336914, 0.944550633430481, 1.0625927448272705, 1.18063485622406, 1.2986769676208496, 1.4167190790176392, 1.5347611904144287, 1.6528033018112183, 1.7708454132080078, 1.8888875246047974, 2.006929636001587, 2.124971866607666, 2.243013858795166, 2.361055850982666, 2.479098081588745, 2.597140312194824, 2.715182304382324, 2.833224296569824, 2.9512665271759033, 3.0693087577819824, 3.1873507499694824, 3.3053927421569824, 3.4234349727630615]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 12.0, 7.0, 17.0, 12.0, 16.0, 18.0, 26.0, 19.0, 20.0, 28.0, 32.0, 39.0, 42.0, 24.0, 40.0, 54.0, 34.0, 43.0, 47.0, 47.0, 36.0, 44.0, 36.0, 33.0, 35.0, 27.0, 27.0, 14.0, 39.0, 22.0, 16.0, 15.0, 12.0, 8.0, 10.0, 13.0, 9.0, 1.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5751953125, -0.5582504272460938, -0.5413055419921875, -0.5243606567382812, -0.507415771484375, -0.49047088623046875, -0.4735260009765625, -0.45658111572265625, -0.43963623046875, -0.42269134521484375, -0.4057464599609375, -0.38880157470703125, -0.371856689453125, -0.35491180419921875, -0.3379669189453125, -0.32102203369140625, -0.3040771484375, -0.28713226318359375, -0.2701873779296875, -0.25324249267578125, -0.236297607421875, -0.21935272216796875, -0.2024078369140625, -0.18546295166015625, -0.16851806640625, -0.15157318115234375, -0.1346282958984375, -0.11768341064453125, -0.100738525390625, -0.08379364013671875, -0.0668487548828125, -0.04990386962890625, -0.032958984375, -0.01601409912109375, 0.0009307861328125, 0.01787567138671875, 0.034820556640625, 0.05176544189453125, 0.0687103271484375, 0.08565521240234375, 0.10260009765625, 0.11954498291015625, 0.1364898681640625, 0.15343475341796875, 0.170379638671875, 0.18732452392578125, 0.2042694091796875, 0.22121429443359375, 0.2381591796875, 0.25510406494140625, 0.2720489501953125, 0.28899383544921875, 0.305938720703125, 0.32288360595703125, 0.3398284912109375, 0.35677337646484375, 0.37371826171875, 0.39066314697265625, 0.4076080322265625, 0.42455291748046875, 0.441497802734375, 0.45844268798828125, 0.4753875732421875, 0.49233245849609375, 0.50927734375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 25.0, 26.0, 44.0, 47.0, 99.0, 140.0, 197.0, 288.0, 468.0, 708.0, 1120.0, 1809.0, 2891.0, 4617.0, 7686.0, 12836.0, 21523.0, 36788.0, 63343.0, 108728.0, 174655.0, 210473.0, 161219.0, 98596.0, 57266.0, 33509.0, 19549.0, 11557.0, 6801.0, 4320.0, 2587.0, 1611.0, 1030.0, 674.0, 423.0, 311.0, 174.0, 124.0, 90.0, 58.0, 50.0, 22.0, 14.0, 10.0, 8.0, 7.0, 10.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09735107421875, -0.09434700012207031, -0.09134292602539062, -0.08833885192871094, -0.08533477783203125, -0.08233070373535156, -0.07932662963867188, -0.07632255554199219, -0.0733184814453125, -0.07031440734863281, -0.06731033325195312, -0.06430625915527344, -0.06130218505859375, -0.05829811096191406, -0.055294036865234375, -0.05228996276855469, -0.049285888671875, -0.04628181457519531, -0.043277740478515625, -0.04027366638183594, -0.03726959228515625, -0.03426551818847656, -0.031261444091796875, -0.028257369995117188, -0.0252532958984375, -0.022249221801757812, -0.019245147705078125, -0.016241073608398438, -0.01323699951171875, -0.010232925415039062, -0.007228851318359375, -0.0042247772216796875, -0.001220703125, 0.0017833709716796875, 0.004787445068359375, 0.0077915191650390625, 0.01079559326171875, 0.013799667358398438, 0.016803741455078125, 0.019807815551757812, 0.0228118896484375, 0.025815963745117188, 0.028820037841796875, 0.03182411193847656, 0.03482818603515625, 0.03783226013183594, 0.040836334228515625, 0.04384040832519531, 0.046844482421875, 0.04984855651855469, 0.052852630615234375, 0.05585670471191406, 0.05886077880859375, 0.06186485290527344, 0.06486892700195312, 0.06787300109863281, 0.0708770751953125, 0.07388114929199219, 0.07688522338867188, 0.07988929748535156, 0.08289337158203125, 0.08589744567871094, 0.08890151977539062, 0.09190559387207031, 0.09490966796875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 8.0, 12.0, 5.0, 7.0, 12.0, 14.0, 13.0, 11.0, 24.0, 20.0, 27.0, 25.0, 30.0, 39.0, 25.0, 27.0, 32.0, 49.0, 32.0, 38.0, 1061.0, 42.0, 35.0, 35.0, 48.0, 40.0, 24.0, 38.0, 22.0, 29.0, 30.0, 27.0, 23.0, 20.0, 23.0, 9.0, 5.0, 14.0, 5.0, 10.0, 5.0, 9.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.411865234375, -0.3993415832519531, -0.38681793212890625, -0.3742942810058594, -0.3617706298828125, -0.3492469787597656, -0.33672332763671875, -0.3241996765136719, -0.311676025390625, -0.2991523742675781, -0.28662872314453125, -0.2741050720214844, -0.2615814208984375, -0.24905776977539062, -0.23653411865234375, -0.22401046752929688, -0.21148681640625, -0.19896316528320312, -0.18643951416015625, -0.17391586303710938, -0.1613922119140625, -0.14886856079101562, -0.13634490966796875, -0.12382125854492188, -0.111297607421875, -0.09877395629882812, -0.08625030517578125, -0.07372665405273438, -0.0612030029296875, -0.048679351806640625, -0.03615570068359375, -0.023632049560546875, -0.0111083984375, 0.001415252685546875, 0.01393890380859375, 0.026462554931640625, 0.0389862060546875, 0.051509857177734375, 0.06403350830078125, 0.07655715942382812, 0.089080810546875, 0.10160446166992188, 0.11412811279296875, 0.12665176391601562, 0.1391754150390625, 0.15169906616210938, 0.16422271728515625, 0.17674636840820312, 0.18927001953125, 0.20179367065429688, 0.21431732177734375, 0.22684097290039062, 0.2393646240234375, 0.2518882751464844, 0.26441192626953125, 0.2769355773925781, 0.289459228515625, 0.3019828796386719, 0.31450653076171875, 0.3270301818847656, 0.3395538330078125, 0.3520774841308594, 0.36460113525390625, 0.3771247863769531, 0.3896484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 26.0, 27.0, 61.0, 86.0, 135.0, 289.0, 514.0, 1093.0, 2177.0, 4722.0, 11215.0, 33736.0, 1712231.0, 288723.0, 25228.0, 9061.0, 3933.0, 1830.0, 955.0, 481.0, 250.0, 130.0, 79.0, 34.0, 22.0, 21.0, 11.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2728538513183594, -0.26372528076171875, -0.2545967102050781, -0.2454681396484375, -0.23633956909179688, -0.22721099853515625, -0.21808242797851562, -0.208953857421875, -0.19982528686523438, -0.19069671630859375, -0.18156814575195312, -0.1724395751953125, -0.16331100463867188, -0.15418243408203125, -0.14505386352539062, -0.13592529296875, -0.12679672241210938, -0.11766815185546875, -0.10853958129882812, -0.0994110107421875, -0.09028244018554688, -0.08115386962890625, -0.07202529907226562, -0.062896728515625, -0.053768157958984375, -0.04463958740234375, -0.035511016845703125, -0.0263824462890625, -0.017253875732421875, -0.00812530517578125, 0.001003265380859375, 0.0101318359375, 0.019260406494140625, 0.02838897705078125, 0.037517547607421875, 0.0466461181640625, 0.055774688720703125, 0.06490325927734375, 0.07403182983398438, 0.083160400390625, 0.09228897094726562, 0.10141754150390625, 0.11054611206054688, 0.1196746826171875, 0.12880325317382812, 0.13793182373046875, 0.14706039428710938, 0.15618896484375, 0.16531753540039062, 0.17444610595703125, 0.18357467651367188, 0.1927032470703125, 0.20183181762695312, 0.21096038818359375, 0.22008895874023438, 0.229217529296875, 0.23834609985351562, 0.24747467041015625, 0.2566032409667969, 0.2657318115234375, 0.2748603820800781, 0.28398895263671875, 0.2931175231933594, 0.30224609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 7.0, 3.0, 5.0, 14.0, 13.0, 26.0, 37.0, 43.0, 53.0, 64.0, 70.0, 90.0, 81.0, 69.0, 92.0, 75.0, 51.0, 53.0, 48.0, 30.0, 16.0, 25.0, 12.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01343536376953125, -0.01303720474243164, -0.012639045715332031, -0.012240886688232422, -0.011842727661132812, -0.011444568634033203, -0.011046409606933594, -0.010648250579833984, -0.010250091552734375, -0.009851932525634766, -0.009453773498535156, -0.009055614471435547, -0.008657455444335938, -0.008259296417236328, -0.007861137390136719, -0.007462978363037109, -0.0070648193359375, -0.006666660308837891, -0.006268501281738281, -0.005870342254638672, -0.0054721832275390625, -0.005074024200439453, -0.004675865173339844, -0.004277706146240234, -0.003879547119140625, -0.0034813880920410156, -0.0030832290649414062, -0.002685070037841797, -0.0022869110107421875, -0.0018887519836425781, -0.0014905929565429688, -0.0010924339294433594, -0.00069427490234375, -0.0002961158752441406, 0.00010204315185546875, 0.0005002021789550781, 0.0008983612060546875, 0.0012965202331542969, 0.0016946792602539062, 0.0020928382873535156, 0.002490997314453125, 0.0028891563415527344, 0.0032873153686523438, 0.003685474395751953, 0.0040836334228515625, 0.004481792449951172, 0.004879951477050781, 0.005278110504150391, 0.00567626953125, 0.006074428558349609, 0.006472587585449219, 0.006870746612548828, 0.0072689056396484375, 0.007667064666748047, 0.008065223693847656, 0.008463382720947266, 0.008861541748046875, 0.009259700775146484, 0.009657859802246094, 0.010056018829345703, 0.010454177856445312, 0.010852336883544922, 0.011250495910644531, 0.01164865493774414, 0.01204681396484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 12.0, 17.0, 19.0, 39.0, 41.0, 53.0, 97.0, 168.0, 315.0, 1492.0, 137932.0, 903346.0, 4081.0, 417.0, 190.0, 109.0, 73.0, 53.0, 32.0, 10.0, 19.0, 7.0, 6.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19733428955078125, -0.1905670166015625, -0.18379974365234375, -0.177032470703125, -0.17026519775390625, -0.1634979248046875, -0.15673065185546875, -0.14996337890625, -0.14319610595703125, -0.1364288330078125, -0.12966156005859375, -0.122894287109375, -0.11612701416015625, -0.1093597412109375, -0.10259246826171875, -0.0958251953125, -0.08905792236328125, -0.0822906494140625, -0.07552337646484375, -0.068756103515625, -0.06198883056640625, -0.0552215576171875, -0.04845428466796875, -0.04168701171875, -0.03491973876953125, -0.0281524658203125, -0.02138519287109375, -0.014617919921875, -0.00785064697265625, -0.0010833740234375, 0.00568389892578125, 0.012451171875, 0.01921844482421875, 0.0259857177734375, 0.03275299072265625, 0.039520263671875, 0.04628753662109375, 0.0530548095703125, 0.05982208251953125, 0.06658935546875, 0.07335662841796875, 0.0801239013671875, 0.08689117431640625, 0.093658447265625, 0.10042572021484375, 0.1071929931640625, 0.11396026611328125, 0.1207275390625, 0.12749481201171875, 0.1342620849609375, 0.14102935791015625, 0.147796630859375, 0.15456390380859375, 0.1613311767578125, 0.16809844970703125, 0.17486572265625, 0.18163299560546875, 0.1884002685546875, 0.19516754150390625, 0.201934814453125, 0.20870208740234375, 0.2154693603515625, 0.22223663330078125, 0.22900390625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 150.0, 730.0, 122.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26916176080703735, -0.2641236186027527, -0.25908544659614563, -0.25404730439186096, -0.2490091472864151, -0.24397099018096924, -0.23893283307552338, -0.23389467597007751, -0.22885653376579285, -0.22381837666034698, -0.21878021955490112, -0.21374207735061646, -0.2087039202451706, -0.20366576313972473, -0.19862760603427887, -0.193589448928833, -0.18855130672454834, -0.18351314961910248, -0.17847499251365662, -0.17343685030937195, -0.1683986932039261, -0.16336053609848022, -0.15832237899303436, -0.1532842218875885, -0.14824606478214264, -0.14320790767669678, -0.13816975057125092, -0.13313160836696625, -0.12809345126152039, -0.12305529415607452, -0.11801713705062866, -0.1129789873957634, -0.10794083774089813, -0.10290268063545227, -0.097864530980587, -0.09282637387514114, -0.08778822422027588, -0.08275006711483002, -0.07771191000938416, -0.07267376035451889, -0.06763560324907303, -0.06259744614362717, -0.0575592964887619, -0.05252113938331604, -0.047482989728450775, -0.04244483262300491, -0.03740667924284935, -0.03236852586269379, -0.027330372482538223, -0.02229221910238266, -0.017254065722227097, -0.012215910479426384, -0.007177757099270821, -0.0021396037191152573, 0.0028985515236854553, 0.007936704903841019, 0.012974858283996582, 0.018013011664152145, 0.02305116504430771, 0.02808932028710842, 0.033127471804618835, 0.0381656289100647, 0.04320378229022026, 0.048241935670375824, 0.05328008905053139]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 5.0, 9.0, 12.0, 12.0, 11.0, 11.0, 17.0, 18.0, 25.0, 24.0, 26.0, 24.0, 41.0, 28.0, 36.0, 52.0, 37.0, 36.0, 39.0, 44.0, 49.0, 41.0, 43.0, 28.0, 34.0, 34.0, 44.0, 34.0, 28.0, 26.0, 16.0, 16.0, 10.0, 16.0, 11.0, 8.0, 13.0, 10.0, 9.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.017004013061523438, -0.016484690830111504, -0.01596536859869957, -0.015446046367287636, -0.014926724135875702, -0.014407401904463768, -0.013888079673051834, -0.0133687574416399, -0.012849435210227966, -0.012330112978816032, -0.011810790747404099, -0.011291468515992165, -0.01077214628458023, -0.010252824053168297, -0.009733501821756363, -0.009214179590344429, -0.008694857358932495, -0.008175535127520561, -0.007656212896108627, -0.007136890664696693, -0.0066175684332847595, -0.006098246201872826, -0.005578923970460892, -0.005059601739048958, -0.004540279507637024, -0.00402095727622509, -0.003501635044813156, -0.0029823128134012222, -0.0024629905819892883, -0.0019436683505773544, -0.0014243461191654205, -0.0009050238877534866, -0.00038570165634155273, 0.00013362057507038116, 0.0006529428064823151, 0.001172265037894249, 0.0016915872693061829, 0.0022109095007181168, 0.0027302317321300507, 0.0032495539635419846, 0.0037688761949539185, 0.004288198426365852, 0.004807520657777786, 0.00532684288918972, 0.005846165120601654, 0.006365487352013588, 0.006884809583425522, 0.007404131814837456, 0.00792345404624939, 0.008442776277661324, 0.008962098509073257, 0.009481420740485191, 0.010000742971897125, 0.01052006520330906, 0.011039387434720993, 0.011558709666132927, 0.01207803189754486, 0.012597354128956795, 0.013116676360368729, 0.013635998591780663, 0.014155320823192596, 0.01467464305460453, 0.015193965286016464, 0.015713287517428398, 0.016232609748840332]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 11.0, 6.0, 19.0, 12.0, 16.0, 19.0, 25.0, 21.0, 18.0, 29.0, 31.0, 42.0, 39.0, 24.0, 43.0, 50.0, 41.0, 40.0, 45.0, 46.0, 37.0, 44.0, 34.0, 35.0, 34.0, 28.0, 25.0, 20.0, 34.0, 22.0, 17.0, 17.0, 8.0, 8.0, 10.0, 13.0, 9.0, 1.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57373046875, -0.5568008422851562, -0.5398712158203125, -0.5229415893554688, -0.506011962890625, -0.48908233642578125, -0.4721527099609375, -0.45522308349609375, -0.43829345703125, -0.42136383056640625, -0.4044342041015625, -0.38750457763671875, -0.370574951171875, -0.35364532470703125, -0.3367156982421875, -0.31978607177734375, -0.3028564453125, -0.28592681884765625, -0.2689971923828125, -0.25206756591796875, -0.235137939453125, -0.21820831298828125, -0.2012786865234375, -0.18434906005859375, -0.16741943359375, -0.15048980712890625, -0.1335601806640625, -0.11663055419921875, -0.099700927734375, -0.08277130126953125, -0.0658416748046875, -0.04891204833984375, -0.031982421875, -0.01505279541015625, 0.0018768310546875, 0.01880645751953125, 0.035736083984375, 0.05266571044921875, 0.0695953369140625, 0.08652496337890625, 0.10345458984375, 0.12038421630859375, 0.1373138427734375, 0.15424346923828125, 0.171173095703125, 0.18810272216796875, 0.2050323486328125, 0.22196197509765625, 0.2388916015625, 0.25582122802734375, 0.2727508544921875, 0.28968048095703125, 0.306610107421875, 0.32353973388671875, 0.3404693603515625, 0.35739898681640625, 0.37432861328125, 0.39125823974609375, 0.4081878662109375, 0.42511749267578125, 0.442047119140625, 0.45897674560546875, 0.4759063720703125, 0.49283599853515625, 0.509765625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 12.0, 20.0, 43.0, 35.0, 70.0, 110.0, 174.0, 248.0, 371.0, 589.0, 1048.0, 1735.0, 3078.0, 5343.0, 9799.0, 18210.0, 34910.0, 72425.0, 173004.0, 378536.0, 189798.0, 78449.0, 37215.0, 19372.0, 10307.0, 5681.0, 3222.0, 1838.0, 1071.0, 643.0, 421.0, 246.0, 158.0, 118.0, 61.0, 64.0, 42.0, 24.0, 20.0, 12.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.69189453125, -0.6718673706054688, -0.6518402099609375, -0.6318130493164062, -0.611785888671875, -0.5917587280273438, -0.5717315673828125, -0.5517044067382812, -0.53167724609375, -0.5116500854492188, -0.4916229248046875, -0.47159576416015625, -0.451568603515625, -0.43154144287109375, -0.4115142822265625, -0.39148712158203125, -0.3714599609375, -0.35143280029296875, -0.3314056396484375, -0.31137847900390625, -0.291351318359375, -0.27132415771484375, -0.2512969970703125, -0.23126983642578125, -0.21124267578125, -0.19121551513671875, -0.1711883544921875, -0.15116119384765625, -0.131134033203125, -0.11110687255859375, -0.0910797119140625, -0.07105255126953125, -0.051025390625, -0.03099822998046875, -0.0109710693359375, 0.00905609130859375, 0.029083251953125, 0.04911041259765625, 0.0691375732421875, 0.08916473388671875, 0.10919189453125, 0.12921905517578125, 0.1492462158203125, 0.16927337646484375, 0.189300537109375, 0.20932769775390625, 0.2293548583984375, 0.24938201904296875, 0.2694091796875, 0.28943634033203125, 0.3094635009765625, 0.32949066162109375, 0.349517822265625, 0.36954498291015625, 0.3895721435546875, 0.40959930419921875, 0.42962646484375, 0.44965362548828125, 0.4696807861328125, 0.48970794677734375, 0.509735107421875, 0.5297622680664062, 0.5497894287109375, 0.5698165893554688, 0.58984375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 6.0, 4.0, 8.0, 14.0, 8.0, 12.0, 11.0, 18.0, 19.0, 17.0, 30.0, 26.0, 28.0, 31.0, 35.0, 46.0, 56.0, 72.0, 113.0, 205.0, 1402.0, 302.0, 142.0, 58.0, 63.0, 35.0, 38.0, 32.0, 39.0, 27.0, 14.0, 19.0, 18.0, 17.0, 19.0, 10.0, 15.0, 12.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5439453125, -1.490264892578125, -1.43658447265625, -1.382904052734375, -1.3292236328125, -1.275543212890625, -1.22186279296875, -1.168182373046875, -1.114501953125, -1.060821533203125, -1.00714111328125, -0.953460693359375, -0.8997802734375, -0.846099853515625, -0.79241943359375, -0.738739013671875, -0.68505859375, -0.631378173828125, -0.57769775390625, -0.524017333984375, -0.4703369140625, -0.416656494140625, -0.36297607421875, -0.309295654296875, -0.255615234375, -0.201934814453125, -0.14825439453125, -0.094573974609375, -0.0408935546875, 0.012786865234375, 0.06646728515625, 0.120147705078125, 0.173828125, 0.227508544921875, 0.28118896484375, 0.334869384765625, 0.3885498046875, 0.442230224609375, 0.49591064453125, 0.549591064453125, 0.603271484375, 0.656951904296875, 0.71063232421875, 0.764312744140625, 0.8179931640625, 0.871673583984375, 0.92535400390625, 0.979034423828125, 1.03271484375, 1.086395263671875, 1.14007568359375, 1.193756103515625, 1.2474365234375, 1.301116943359375, 1.35479736328125, 1.408477783203125, 1.462158203125, 1.515838623046875, 1.56951904296875, 1.623199462890625, 1.6768798828125, 1.730560302734375, 1.78424072265625, 1.837921142578125, 1.8916015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 15.0, 13.0, 14.0, 24.0, 29.0, 29.0, 36.0, 52.0, 73.0, 93.0, 151.0, 206.0, 353.0, 693.0, 2411.0, 28235.0, 2524246.0, 574401.0, 11396.0, 1637.0, 600.0, 306.0, 196.0, 117.0, 84.0, 68.0, 36.0, 39.0, 31.0, 21.0, 27.0, 15.0, 16.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.873046875, -3.75860595703125, -3.6441650390625, -3.52972412109375, -3.415283203125, -3.30084228515625, -3.1864013671875, -3.07196044921875, -2.95751953125, -2.84307861328125, -2.7286376953125, -2.61419677734375, -2.499755859375, -2.38531494140625, -2.2708740234375, -2.15643310546875, -2.0419921875, -1.92755126953125, -1.8131103515625, -1.69866943359375, -1.584228515625, -1.46978759765625, -1.3553466796875, -1.24090576171875, -1.12646484375, -1.01202392578125, -0.8975830078125, -0.78314208984375, -0.668701171875, -0.55426025390625, -0.4398193359375, -0.32537841796875, -0.2109375, -0.09649658203125, 0.0179443359375, 0.13238525390625, 0.246826171875, 0.36126708984375, 0.4757080078125, 0.59014892578125, 0.70458984375, 0.81903076171875, 0.9334716796875, 1.04791259765625, 1.162353515625, 1.27679443359375, 1.3912353515625, 1.50567626953125, 1.6201171875, 1.73455810546875, 1.8489990234375, 1.96343994140625, 2.077880859375, 2.19232177734375, 2.3067626953125, 2.42120361328125, 2.53564453125, 2.65008544921875, 2.7645263671875, 2.87896728515625, 2.993408203125, 3.10784912109375, 3.2222900390625, 3.33673095703125, 3.451171875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 23.0, 658.0, 329.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5358285903930664, -2.6199288368225098, -1.7040292024612427, -0.7881295680999756, 0.12777018547058105, 1.0436697006225586, 1.9595694541931152, 2.875469207763672, 3.7913689613342285, 4.707268714904785, 5.623168468475342, 6.539068222045898, 7.454967498779297, 8.370866775512695, 9.28676700592041, 10.202667236328125, 11.118566513061523, 12.034465789794922, 12.950366020202637, 13.866265296936035, 14.78216552734375, 15.698064804077148, 16.613964080810547, 17.529865264892578, 18.445764541625977, 19.361663818359375, 20.277563095092773, 21.193464279174805, 22.109363555908203, 23.0252628326416, 23.941162109375, 24.85706329345703, 25.77296257019043, 26.688861846923828, 27.604761123657227, 28.520662307739258, 29.436561584472656, 30.352460861206055, 31.268360137939453, 32.184261322021484, 33.10015869140625, 34.01605987548828, 34.93195724487305, 35.84785842895508, 36.763755798339844, 37.679656982421875, 38.595558166503906, 39.51145553588867, 40.4273567199707, 41.343257904052734, 42.2591552734375, 43.17505645751953, 44.0909538269043, 45.00685501098633, 45.92275619506836, 46.838653564453125, 47.754554748535156, 48.67045593261719, 49.58635330200195, 50.502254486083984, 51.41815185546875, 52.33405303955078, 53.24995422363281, 54.16585159301758, 55.08175277709961]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 11.0, 13.0, 5.0, 19.0, 17.0, 19.0, 22.0, 18.0, 18.0, 25.0, 24.0, 20.0, 27.0, 31.0, 33.0, 37.0, 34.0, 30.0, 37.0, 28.0, 40.0, 36.0, 35.0, 29.0, 37.0, 37.0, 37.0, 25.0, 24.0, 30.0, 26.0, 21.0, 28.0, 17.0, 14.0, 16.0, 13.0, 12.0, 10.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.216878414154053, -4.09588098526001, -3.974883794784546, -3.853886604309082, -3.732889175415039, -3.611891984939575, -3.4908947944641113, -3.3698973655700684, -3.2489001750946045, -3.1279029846191406, -3.0069055557250977, -2.885908365249634, -2.764910936355591, -2.643913745880127, -2.522916316986084, -2.40191912651062, -2.2809219360351562, -2.1599247455596924, -2.0389273166656494, -1.9179301261901855, -1.7969328165054321, -1.6759355068206787, -1.5549381971359253, -1.4339408874511719, -1.312943458557129, -1.1919461488723755, -1.070948839187622, -0.9499515891075134, -0.8289543390274048, -0.7079570293426514, -0.586959719657898, -0.4659624695777893, -0.34496521949768066, -0.22396793961524963, -0.10297064483165741, 0.018026649951934814, 0.13902392983436584, 0.2600212097167969, 0.3810185194015503, 0.5020157694816589, 0.6230130791664124, 0.7440103888511658, 0.8650076389312744, 0.9860049486160278, 1.1070022583007812, 1.2279994487762451, 1.348996877670288, 1.469994068145752, 1.5909913778305054, 1.7119886875152588, 1.8329859972000122, 1.9539833068847656, 2.0749804973602295, 2.1959776878356934, 2.3169751167297363, 2.4379723072052, 2.558969736099243, 2.679966926574707, 2.80096435546875, 2.921961545944214, 3.042958974838257, 3.1639561653137207, 3.2849535942077637, 3.4059507846832275, 3.5269479751586914]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 9.0, 20.0, 11.0, 15.0, 19.0, 22.0, 29.0, 11.0, 39.0, 25.0, 29.0, 28.0, 41.0, 49.0, 41.0, 34.0, 49.0, 40.0, 45.0, 36.0, 34.0, 34.0, 45.0, 31.0, 28.0, 30.0, 29.0, 21.0, 37.0, 18.0, 21.0, 6.0, 12.0, 9.0, 9.0, 7.0, 4.0, 6.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5413589477539062, -0.5236358642578125, -0.5059127807617188, -0.488189697265625, -0.47046661376953125, -0.4527435302734375, -0.43502044677734375, -0.41729736328125, -0.39957427978515625, -0.3818511962890625, -0.36412811279296875, -0.346405029296875, -0.32868194580078125, -0.3109588623046875, -0.29323577880859375, -0.2755126953125, -0.25778961181640625, -0.2400665283203125, -0.22234344482421875, -0.204620361328125, -0.18689727783203125, -0.1691741943359375, -0.15145111083984375, -0.13372802734375, -0.11600494384765625, -0.0982818603515625, -0.08055877685546875, -0.062835693359375, -0.04511260986328125, -0.0273895263671875, -0.00966644287109375, 0.008056640625, 0.02577972412109375, 0.0435028076171875, 0.06122589111328125, 0.078948974609375, 0.09667205810546875, 0.1143951416015625, 0.13211822509765625, 0.14984130859375, 0.16756439208984375, 0.1852874755859375, 0.20301055908203125, 0.220733642578125, 0.23845672607421875, 0.2561798095703125, 0.27390289306640625, 0.2916259765625, 0.30934906005859375, 0.3270721435546875, 0.34479522705078125, 0.362518310546875, 0.38024139404296875, 0.3979644775390625, 0.41568756103515625, 0.43341064453125, 0.45113372802734375, 0.4688568115234375, 0.48657989501953125, 0.504302978515625, 0.5220260620117188, 0.5397491455078125, 0.5574722290039062, 0.5751953125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 10.0, 6.0, 11.0, 16.0, 14.0, 25.0, 37.0, 40.0, 68.0, 90.0, 125.0, 211.0, 335.0, 580.0, 1188.0, 2617.0, 7096.0, 23254.0, 126352.0, 1205427.0, 2458441.0, 305735.0, 44143.0, 11290.0, 3679.0, 1598.0, 767.0, 395.0, 232.0, 141.0, 99.0, 68.0, 48.0, 34.0, 18.0, 24.0, 16.0, 8.0, 12.0, 5.0, 7.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.300689697265625, -1.25762939453125, -1.214569091796875, -1.1715087890625, -1.128448486328125, -1.08538818359375, -1.042327880859375, -0.999267578125, -0.956207275390625, -0.91314697265625, -0.870086669921875, -0.8270263671875, -0.783966064453125, -0.74090576171875, -0.697845458984375, -0.65478515625, -0.611724853515625, -0.56866455078125, -0.525604248046875, -0.4825439453125, -0.439483642578125, -0.39642333984375, -0.353363037109375, -0.310302734375, -0.267242431640625, -0.22418212890625, -0.181121826171875, -0.1380615234375, -0.095001220703125, -0.05194091796875, -0.008880615234375, 0.0341796875, 0.077239990234375, 0.12030029296875, 0.163360595703125, 0.2064208984375, 0.249481201171875, 0.29254150390625, 0.335601806640625, 0.378662109375, 0.421722412109375, 0.46478271484375, 0.507843017578125, 0.5509033203125, 0.593963623046875, 0.63702392578125, 0.680084228515625, 0.72314453125, 0.766204833984375, 0.80926513671875, 0.852325439453125, 0.8953857421875, 0.938446044921875, 0.98150634765625, 1.024566650390625, 1.067626953125, 1.110687255859375, 1.15374755859375, 1.196807861328125, 1.2398681640625, 1.282928466796875, 1.32598876953125, 1.369049072265625, 1.412109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 7.0, 19.0, 28.0, 28.0, 42.0, 57.0, 89.0, 152.0, 233.0, 407.0, 632.0, 688.0, 585.0, 369.0, 219.0, 153.0, 90.0, 81.0, 50.0, 35.0, 22.0, 16.0, 18.0, 11.0, 7.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1538543701171875, -1.113372802734375, -1.0728912353515625, -1.03240966796875, -0.9919281005859375, -0.951446533203125, -0.9109649658203125, -0.8704833984375, -0.8300018310546875, -0.789520263671875, -0.7490386962890625, -0.70855712890625, -0.6680755615234375, -0.627593994140625, -0.5871124267578125, -0.546630859375, -0.5061492919921875, -0.465667724609375, -0.4251861572265625, -0.38470458984375, -0.3442230224609375, -0.303741455078125, -0.2632598876953125, -0.2227783203125, -0.1822967529296875, -0.141815185546875, -0.1013336181640625, -0.06085205078125, -0.0203704833984375, 0.020111083984375, 0.0605926513671875, 0.10107421875, 0.1415557861328125, 0.182037353515625, 0.2225189208984375, 0.26300048828125, 0.3034820556640625, 0.343963623046875, 0.3844451904296875, 0.4249267578125, 0.4654083251953125, 0.505889892578125, 0.5463714599609375, 0.58685302734375, 0.6273345947265625, 0.667816162109375, 0.7082977294921875, 0.748779296875, 0.7892608642578125, 0.829742431640625, 0.8702239990234375, 0.91070556640625, 0.9511871337890625, 0.991668701171875, 1.0321502685546875, 1.0726318359375, 1.1131134033203125, 1.153594970703125, 1.1940765380859375, 1.23455810546875, 1.2750396728515625, 1.315521240234375, 1.3560028076171875, 1.396484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 3.0, 4.0, 7.0, 18.0, 13.0, 26.0, 28.0, 39.0, 52.0, 94.0, 160.0, 271.0, 681.0, 2139.0, 11582.0, 218029.0, 3852197.0, 98287.0, 7826.0, 1655.0, 558.0, 232.0, 139.0, 90.0, 44.0, 31.0, 27.0, 16.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.0390625, -4.892578125, -4.74609375, -4.599609375, -4.453125, -4.306640625, -4.16015625, -4.013671875, -3.8671875, -3.720703125, -3.57421875, -3.427734375, -3.28125, -3.134765625, -2.98828125, -2.841796875, -2.6953125, -2.548828125, -2.40234375, -2.255859375, -2.109375, -1.962890625, -1.81640625, -1.669921875, -1.5234375, -1.376953125, -1.23046875, -1.083984375, -0.9375, -0.791015625, -0.64453125, -0.498046875, -0.3515625, -0.205078125, -0.05859375, 0.087890625, 0.234375, 0.380859375, 0.52734375, 0.673828125, 0.8203125, 0.966796875, 1.11328125, 1.259765625, 1.40625, 1.552734375, 1.69921875, 1.845703125, 1.9921875, 2.138671875, 2.28515625, 2.431640625, 2.578125, 2.724609375, 2.87109375, 3.017578125, 3.1640625, 3.310546875, 3.45703125, 3.603515625, 3.75, 3.896484375, 4.04296875, 4.189453125, 4.3359375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 23.0, 43.0, 105.0, 203.0, 244.0, 200.0, 111.0, 56.0, 11.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.992700576782227, -13.608741760253906, -13.224782943725586, -12.840824127197266, -12.456865310668945, -12.072906494140625, -11.688947677612305, -11.304988861083984, -10.921030044555664, -10.537071228027344, -10.153112411499023, -9.769153594970703, -9.385194778442383, -9.001235961914062, -8.617277145385742, -8.233318328857422, -7.849360466003418, -7.465401649475098, -7.081442832946777, -6.697484016418457, -6.313525199890137, -5.929566383361816, -5.545608043670654, -5.161649227142334, -4.777690410614014, -4.393731594085693, -4.009772777557373, -3.625814199447632, -3.2418553829193115, -2.857896566390991, -2.47393798828125, -2.0899791717529297, -1.7060203552246094, -1.322061538696289, -0.9381028413772583, -0.5541441440582275, -0.17018532752990723, 0.21377348899841309, 0.5977320671081543, 0.9816908836364746, 1.365649700164795, 1.7496085166931152, 2.1335673332214355, 2.5175259113311768, 2.901484727859497, 3.2854435443878174, 3.6694021224975586, 4.053360939025879, 4.437319755554199, 4.8212785720825195, 5.20523738861084, 5.58919620513916, 5.9731550216674805, 6.357113838195801, 6.741072177886963, 7.125030994415283, 7.5089898109436035, 7.892948627471924, 8.276906967163086, 8.660865783691406, 9.044824600219727, 9.428783416748047, 9.812742233276367, 10.196701049804688, 10.580659866333008]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 7.0, 17.0, 15.0, 12.0, 21.0, 16.0, 18.0, 21.0, 28.0, 27.0, 28.0, 23.0, 23.0, 37.0, 27.0, 32.0, 37.0, 28.0, 45.0, 36.0, 40.0, 37.0, 39.0, 29.0, 30.0, 32.0, 27.0, 27.0, 35.0, 18.0, 24.0, 20.0, 21.0, 16.0, 14.0, 19.0, 7.0, 10.0, 7.0, 10.0, 8.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.09420108795166, -3.0003137588500977, -2.906426429748535, -2.8125391006469727, -2.71865177154541, -2.6247644424438477, -2.530877113342285, -2.4369897842407227, -2.34310245513916, -2.2492151260375977, -2.155327796936035, -2.0614404678344727, -1.9675531387329102, -1.8736658096313477, -1.7797785997390747, -1.6858912706375122, -1.5920040607452393, -1.4981167316436768, -1.4042294025421143, -1.3103420734405518, -1.2164547443389893, -1.1225674152374268, -1.0286802053451538, -0.9347928762435913, -0.8409055471420288, -0.7470182180404663, -0.6531308889389038, -0.5592436194419861, -0.4653562903404236, -0.3714689612388611, -0.27758169174194336, -0.18369436264038086, -0.08980679512023926, 0.004080519080162048, 0.09796783328056335, 0.19185513257980347, 0.28574246168136597, 0.37962979078292847, 0.4735170602798462, 0.5674043893814087, 0.6612917184829712, 0.7551790475845337, 0.8490663766860962, 0.9429536461830139, 1.0368409156799316, 1.1307282447814941, 1.2246155738830566, 1.3185029029846191, 1.4123902320861816, 1.5062775611877441, 1.6001648902893066, 1.6940522193908691, 1.7879395484924316, 1.8818268775939941, 1.975714087486267, 2.069601535797119, 2.1634888648986816, 2.257376194000244, 2.3512635231018066, 2.445150852203369, 2.5390381813049316, 2.632925510406494, 2.7268128395080566, 2.820700168609619, 2.9145872592926025]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 8.0, 8.0, 8.0, 20.0, 14.0, 18.0, 22.0, 18.0, 18.0, 21.0, 26.0, 30.0, 26.0, 28.0, 32.0, 34.0, 39.0, 42.0, 38.0, 32.0, 37.0, 37.0, 38.0, 33.0, 40.0, 33.0, 33.0, 30.0, 28.0, 34.0, 25.0, 30.0, 16.0, 19.0, 11.0, 13.0, 10.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.50244140625, -0.4862060546875, -0.469970703125, -0.4537353515625, -0.4375, -0.4212646484375, -0.405029296875, -0.3887939453125, -0.37255859375, -0.3563232421875, -0.340087890625, -0.3238525390625, -0.3076171875, -0.2913818359375, -0.275146484375, -0.2589111328125, -0.24267578125, -0.2264404296875, -0.210205078125, -0.1939697265625, -0.177734375, -0.1614990234375, -0.145263671875, -0.1290283203125, -0.11279296875, -0.0965576171875, -0.080322265625, -0.0640869140625, -0.0478515625, -0.0316162109375, -0.015380859375, 0.0008544921875, 0.01708984375, 0.0333251953125, 0.049560546875, 0.0657958984375, 0.08203125, 0.0982666015625, 0.114501953125, 0.1307373046875, 0.14697265625, 0.1632080078125, 0.179443359375, 0.1956787109375, 0.2119140625, 0.2281494140625, 0.244384765625, 0.2606201171875, 0.27685546875, 0.2930908203125, 0.309326171875, 0.3255615234375, 0.341796875, 0.3580322265625, 0.374267578125, 0.3905029296875, 0.40673828125, 0.4229736328125, 0.439208984375, 0.4554443359375, 0.4716796875, 0.4879150390625, 0.504150390625, 0.5203857421875, 0.53662109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 10.0, 19.0, 32.0, 37.0, 43.0, 67.0, 112.0, 136.0, 187.0, 273.0, 384.0, 559.0, 812.0, 1123.0, 1611.0, 2206.0, 3131.0, 4419.0, 6390.0, 9049.0, 12891.0, 18777.0, 27296.0, 38853.0, 57449.0, 83213.0, 117781.0, 150004.0, 145144.0, 112100.0, 79091.0, 53648.0, 37127.0, 25337.0, 17652.0, 12369.0, 8595.0, 5940.0, 4163.0, 2917.0, 2252.0, 1594.0, 1123.0, 712.0, 540.0, 448.0, 282.0, 204.0, 140.0, 108.0, 69.0, 58.0, 40.0, 14.0, 13.0, 4.0, 2.0, 4.0], "bins": [-0.0570068359375, -0.05532646179199219, -0.053646087646484375, -0.05196571350097656, -0.05028533935546875, -0.04860496520996094, -0.046924591064453125, -0.04524421691894531, -0.0435638427734375, -0.04188346862792969, -0.040203094482421875, -0.03852272033691406, -0.03684234619140625, -0.03516197204589844, -0.033481597900390625, -0.03180122375488281, -0.030120849609375, -0.028440475463867188, -0.026760101318359375, -0.025079727172851562, -0.02339935302734375, -0.021718978881835938, -0.020038604736328125, -0.018358230590820312, -0.0166778564453125, -0.014997482299804688, -0.013317108154296875, -0.011636734008789062, -0.00995635986328125, -0.008275985717773438, -0.006595611572265625, -0.0049152374267578125, -0.00323486328125, -0.0015544891357421875, 0.000125885009765625, 0.0018062591552734375, 0.00348663330078125, 0.0051670074462890625, 0.006847381591796875, 0.008527755737304688, 0.0102081298828125, 0.011888504028320312, 0.013568878173828125, 0.015249252319335938, 0.01692962646484375, 0.018610000610351562, 0.020290374755859375, 0.021970748901367188, 0.023651123046875, 0.025331497192382812, 0.027011871337890625, 0.028692245483398438, 0.03037261962890625, 0.03205299377441406, 0.033733367919921875, 0.03541374206542969, 0.0370941162109375, 0.03877449035644531, 0.040454864501953125, 0.04213523864746094, 0.04381561279296875, 0.04549598693847656, 0.047176361083984375, 0.04885673522949219, 0.050537109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 13.0, 7.0, 9.0, 11.0, 12.0, 19.0, 22.0, 22.0, 22.0, 21.0, 26.0, 37.0, 30.0, 49.0, 32.0, 35.0, 34.0, 48.0, 1056.0, 45.0, 46.0, 40.0, 42.0, 32.0, 36.0, 47.0, 31.0, 26.0, 30.0, 18.0, 24.0, 26.0, 18.0, 12.0, 12.0, 6.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4638671875, -0.44913482666015625, -0.4344024658203125, -0.41967010498046875, -0.404937744140625, -0.39020538330078125, -0.3754730224609375, -0.36074066162109375, -0.34600830078125, -0.33127593994140625, -0.3165435791015625, -0.30181121826171875, -0.287078857421875, -0.27234649658203125, -0.2576141357421875, -0.24288177490234375, -0.2281494140625, -0.21341705322265625, -0.1986846923828125, -0.18395233154296875, -0.169219970703125, -0.15448760986328125, -0.1397552490234375, -0.12502288818359375, -0.11029052734375, -0.09555816650390625, -0.0808258056640625, -0.06609344482421875, -0.051361083984375, -0.03662872314453125, -0.0218963623046875, -0.00716400146484375, 0.007568359375, 0.02230072021484375, 0.0370330810546875, 0.05176544189453125, 0.066497802734375, 0.08123016357421875, 0.0959625244140625, 0.11069488525390625, 0.12542724609375, 0.14015960693359375, 0.1548919677734375, 0.16962432861328125, 0.184356689453125, 0.19908905029296875, 0.2138214111328125, 0.22855377197265625, 0.2432861328125, 0.25801849365234375, 0.2727508544921875, 0.28748321533203125, 0.302215576171875, 0.31694793701171875, 0.3316802978515625, 0.34641265869140625, 0.36114501953125, 0.37587738037109375, 0.3906097412109375, 0.40534210205078125, 0.420074462890625, 0.43480682373046875, 0.4495391845703125, 0.46427154541015625, 0.47900390625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 6.0, 9.0, 11.0, 18.0, 28.0, 40.0, 45.0, 77.0, 109.0, 140.0, 254.0, 338.0, 485.0, 732.0, 1088.0, 1599.0, 2564.0, 4011.0, 6923.0, 12628.0, 26400.0, 112291.0, 1769712.0, 102063.0, 25476.0, 11902.0, 6886.0, 3922.0, 2514.0, 1628.0, 1027.0, 712.0, 482.0, 325.0, 209.0, 134.0, 98.0, 88.0, 51.0, 28.0, 32.0, 12.0, 8.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1248779296875, -0.12049293518066406, -0.11610794067382812, -0.11172294616699219, -0.10733795166015625, -0.10295295715332031, -0.09856796264648438, -0.09418296813964844, -0.0897979736328125, -0.08541297912597656, -0.08102798461914062, -0.07664299011230469, -0.07225799560546875, -0.06787300109863281, -0.06348800659179688, -0.05910301208496094, -0.054718017578125, -0.05033302307128906, -0.045948028564453125, -0.04156303405761719, -0.03717803955078125, -0.03279304504394531, -0.028408050537109375, -0.024023056030273438, -0.0196380615234375, -0.015253067016601562, -0.010868072509765625, -0.0064830780029296875, -0.00209808349609375, 0.0022869110107421875, 0.006671905517578125, 0.011056900024414062, 0.01544189453125, 0.019826889038085938, 0.024211883544921875, 0.028596878051757812, 0.03298187255859375, 0.03736686706542969, 0.041751861572265625, 0.04613685607910156, 0.0505218505859375, 0.05490684509277344, 0.059291839599609375, 0.06367683410644531, 0.06806182861328125, 0.07244682312011719, 0.07683181762695312, 0.08121681213378906, 0.085601806640625, 0.08998680114746094, 0.09437179565429688, 0.09875679016113281, 0.10314178466796875, 0.10752677917480469, 0.11191177368164062, 0.11629676818847656, 0.1206817626953125, 0.12506675720214844, 0.12945175170898438, 0.1338367462158203, 0.13822174072265625, 0.1426067352294922, 0.14699172973632812, 0.15137672424316406, 0.15576171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 5.0, 14.0, 11.0, 19.0, 17.0, 23.0, 19.0, 25.0, 28.0, 28.0, 27.0, 34.0, 30.0, 35.0, 29.0, 31.0, 40.0, 33.0, 44.0, 33.0, 33.0, 37.0, 37.0, 29.0, 40.0, 34.0, 29.0, 36.0, 28.0, 24.0, 19.0, 10.0, 11.0, 16.0, 15.0, 14.0, 8.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005550384521484375, -0.005357980728149414, -0.005165576934814453, -0.004973173141479492, -0.004780769348144531, -0.00458836555480957, -0.004395961761474609, -0.0042035579681396484, -0.0040111541748046875, -0.0038187503814697266, -0.0036263465881347656, -0.0034339427947998047, -0.0032415390014648438, -0.003049135208129883, -0.002856731414794922, -0.002664327621459961, -0.002471923828125, -0.002279520034790039, -0.002087116241455078, -0.0018947124481201172, -0.0017023086547851562, -0.0015099048614501953, -0.0013175010681152344, -0.0011250972747802734, -0.0009326934814453125, -0.0007402896881103516, -0.0005478858947753906, -0.0003554821014404297, -0.00016307830810546875, 2.9325485229492188e-05, 0.00022172927856445312, 0.00041413307189941406, 0.000606536865234375, 0.0007989406585693359, 0.0009913444519042969, 0.0011837482452392578, 0.0013761520385742188, 0.0015685558319091797, 0.0017609596252441406, 0.0019533634185791016, 0.0021457672119140625, 0.0023381710052490234, 0.0025305747985839844, 0.0027229785919189453, 0.0029153823852539062, 0.003107786178588867, 0.003300189971923828, 0.003492593765258789, 0.00368499755859375, 0.003877401351928711, 0.004069805145263672, 0.004262208938598633, 0.004454612731933594, 0.004647016525268555, 0.004839420318603516, 0.0050318241119384766, 0.0052242279052734375, 0.0054166316986083984, 0.005609035491943359, 0.00580143928527832, 0.005993843078613281, 0.006186246871948242, 0.006378650665283203, 0.006571054458618164, 0.006763458251953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 11.0, 10.0, 2.0, 12.0, 12.0, 18.0, 12.0, 14.0, 21.0, 36.0, 40.0, 44.0, 76.0, 90.0, 125.0, 128.0, 209.0, 359.0, 1228.0, 68747.0, 962875.0, 12611.0, 750.0, 313.0, 157.0, 145.0, 94.0, 72.0, 69.0, 48.0, 43.0, 34.0, 26.0, 21.0, 22.0, 14.0, 12.0, 11.0, 9.0, 6.0, 8.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.12300491333007812, -0.11942291259765625, -0.11584091186523438, -0.1122589111328125, -0.10867691040039062, -0.10509490966796875, -0.10151290893554688, -0.097930908203125, -0.09434890747070312, -0.09076690673828125, -0.08718490600585938, -0.0836029052734375, -0.08002090454101562, -0.07643890380859375, -0.07285690307617188, -0.06927490234375, -0.06569290161132812, -0.06211090087890625, -0.058528900146484375, -0.0549468994140625, -0.051364898681640625, -0.04778289794921875, -0.044200897216796875, -0.040618896484375, -0.037036895751953125, -0.03345489501953125, -0.029872894287109375, -0.0262908935546875, -0.022708892822265625, -0.01912689208984375, -0.015544891357421875, -0.011962890625, -0.008380889892578125, -0.00479888916015625, -0.001216888427734375, 0.0023651123046875, 0.005947113037109375, 0.00952911376953125, 0.013111114501953125, 0.016693115234375, 0.020275115966796875, 0.02385711669921875, 0.027439117431640625, 0.0310211181640625, 0.034603118896484375, 0.03818511962890625, 0.041767120361328125, 0.04534912109375, 0.048931121826171875, 0.05251312255859375, 0.056095123291015625, 0.0596771240234375, 0.06325912475585938, 0.06684112548828125, 0.07042312622070312, 0.074005126953125, 0.07758712768554688, 0.08116912841796875, 0.08475112915039062, 0.0883331298828125, 0.09191513061523438, 0.09549713134765625, 0.09907913208007812, 0.1026611328125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 19.0, 255.0, 703.0, 38.0, 2.0], "bins": [-0.2405931055545807, -0.23666276037693024, -0.2327324002981186, -0.22880205512046814, -0.2248716950416565, -0.22094134986400604, -0.2170110046863556, -0.21308064460754395, -0.2091502994298935, -0.20521995425224304, -0.2012895941734314, -0.19735924899578094, -0.1934289038181305, -0.18949854373931885, -0.1855681985616684, -0.18163783848285675, -0.1777074933052063, -0.17377714812755585, -0.1698467880487442, -0.16591644287109375, -0.1619860827922821, -0.15805573761463165, -0.1541253924369812, -0.15019503235816956, -0.1462646871805191, -0.14233434200286865, -0.138403981924057, -0.13447363674640656, -0.1305432915687561, -0.12661293148994446, -0.122682586312294, -0.11875223368406296, -0.11482187360525131, -0.11089152097702026, -0.10696117579936981, -0.10303082317113876, -0.09910047054290771, -0.09517011791467667, -0.09123976528644562, -0.08730942010879517, -0.08337906748056412, -0.07944871485233307, -0.07551836967468262, -0.07158801704645157, -0.06765766441822052, -0.06372731178998947, -0.05979696288704872, -0.05586661398410797, -0.05193626135587692, -0.048005908727645874, -0.044075559824705124, -0.040145210921764374, -0.036214858293533325, -0.03228450566530228, -0.028354156762361526, -0.024423805996775627, -0.020493457093834877, -0.016563106328248978, -0.012632755562663078, -0.008702404797077179, -0.00477205403149128, -0.0008417032659053802, 0.003088647499680519, 0.0070189982652664185, 0.010949349030852318]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 15.0, 8.0, 31.0, 31.0, 38.0, 43.0, 34.0, 37.0, 41.0, 60.0, 52.0, 42.0, 47.0, 48.0, 55.0, 56.0, 58.0, 43.0, 38.0, 27.0, 27.0, 27.0, 22.0, 25.0, 17.0, 13.0, 9.0, 8.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02219676971435547, -0.021458376199007034, -0.0207199826836586, -0.019981589168310165, -0.01924319565296173, -0.018504802137613297, -0.017766408622264862, -0.017028015106916428, -0.016289621591567993, -0.015551228076219559, -0.014812834560871124, -0.01407444104552269, -0.013336047530174255, -0.012597654014825821, -0.011859260499477386, -0.011120866984128952, -0.010382473468780518, -0.009644079953432083, -0.008905686438083649, -0.008167292922735214, -0.00742889940738678, -0.006690505892038345, -0.005952112376689911, -0.0052137188613414764, -0.004475325345993042, -0.0037369318306446075, -0.002998538315296173, -0.0022601447999477386, -0.0015217512845993042, -0.0007833577692508698, -4.49642539024353e-05, 0.0006934292614459991, 0.0014318227767944336, 0.002170216292142868, 0.0029086098074913025, 0.003647003322839737, 0.004385396838188171, 0.005123790353536606, 0.00586218386888504, 0.006600577384233475, 0.007338970899581909, 0.008077364414930344, 0.008815757930278778, 0.009554151445627213, 0.010292544960975647, 0.011030938476324081, 0.011769331991672516, 0.01250772550702095, 0.013246119022369385, 0.01398451253771782, 0.014722906053066254, 0.015461299568414688, 0.016199693083763123, 0.016938086599111557, 0.01767648011445999, 0.018414873629808426, 0.01915326714515686, 0.019891660660505295, 0.02063005417585373, 0.021368447691202164, 0.022106841206550598, 0.022845234721899033, 0.023583628237247467, 0.0243220217525959, 0.025060415267944336]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 8.0, 9.0, 7.0, 20.0, 15.0, 18.0, 23.0, 17.0, 19.0, 20.0, 25.0, 31.0, 27.0, 27.0, 33.0, 33.0, 42.0, 41.0, 36.0, 35.0, 34.0, 37.0, 39.0, 33.0, 39.0, 34.0, 32.0, 30.0, 32.0, 30.0, 25.0, 29.0, 22.0, 14.0, 12.0, 11.0, 10.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.50146484375, -0.4852294921875, -0.468994140625, -0.4527587890625, -0.4365234375, -0.4202880859375, -0.404052734375, -0.3878173828125, -0.37158203125, -0.3553466796875, -0.339111328125, -0.3228759765625, -0.306640625, -0.2904052734375, -0.274169921875, -0.2579345703125, -0.24169921875, -0.2254638671875, -0.209228515625, -0.1929931640625, -0.1767578125, -0.1605224609375, -0.144287109375, -0.1280517578125, -0.11181640625, -0.0955810546875, -0.079345703125, -0.0631103515625, -0.046875, -0.0306396484375, -0.014404296875, 0.0018310546875, 0.01806640625, 0.0343017578125, 0.050537109375, 0.0667724609375, 0.0830078125, 0.0992431640625, 0.115478515625, 0.1317138671875, 0.14794921875, 0.1641845703125, 0.180419921875, 0.1966552734375, 0.212890625, 0.2291259765625, 0.245361328125, 0.2615966796875, 0.27783203125, 0.2940673828125, 0.310302734375, 0.3265380859375, 0.3427734375, 0.3590087890625, 0.375244140625, 0.3914794921875, 0.40771484375, 0.4239501953125, 0.440185546875, 0.4564208984375, 0.47265625, 0.4888916015625, 0.505126953125, 0.5213623046875, 0.53759765625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 11.0, 18.0, 19.0, 24.0, 44.0, 57.0, 62.0, 102.0, 152.0, 179.0, 256.0, 368.0, 565.0, 982.0, 1342.0, 2058.0, 3393.0, 5465.0, 9381.0, 16785.0, 31002.0, 58587.0, 114600.0, 233659.0, 280422.0, 136479.0, 68928.0, 36293.0, 19345.0, 10843.0, 6394.0, 3893.0, 2339.0, 1435.0, 981.0, 583.0, 414.0, 286.0, 246.0, 166.0, 111.0, 73.0, 55.0, 37.0, 34.0, 20.0, 17.0, 12.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.62890625, -0.6093292236328125, -0.589752197265625, -0.5701751708984375, -0.55059814453125, -0.5310211181640625, -0.511444091796875, -0.4918670654296875, -0.4722900390625, -0.4527130126953125, -0.433135986328125, -0.4135589599609375, -0.39398193359375, -0.3744049072265625, -0.354827880859375, -0.3352508544921875, -0.315673828125, -0.2960968017578125, -0.276519775390625, -0.2569427490234375, -0.23736572265625, -0.2177886962890625, -0.198211669921875, -0.1786346435546875, -0.1590576171875, -0.1394805908203125, -0.119903564453125, -0.1003265380859375, -0.08074951171875, -0.0611724853515625, -0.041595458984375, -0.0220184326171875, -0.00244140625, 0.0171356201171875, 0.036712646484375, 0.0562896728515625, 0.07586669921875, 0.0954437255859375, 0.115020751953125, 0.1345977783203125, 0.1541748046875, 0.1737518310546875, 0.193328857421875, 0.2129058837890625, 0.23248291015625, 0.2520599365234375, 0.271636962890625, 0.2912139892578125, 0.310791015625, 0.3303680419921875, 0.349945068359375, 0.3695220947265625, 0.38909912109375, 0.4086761474609375, 0.428253173828125, 0.4478302001953125, 0.4674072265625, 0.4869842529296875, 0.506561279296875, 0.5261383056640625, 0.54571533203125, 0.5652923583984375, 0.584869384765625, 0.6044464111328125, 0.6240234375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 13.0, 11.0, 14.0, 18.0, 21.0, 26.0, 30.0, 22.0, 29.0, 37.0, 34.0, 57.0, 59.0, 81.0, 110.0, 200.0, 1391.0, 232.0, 122.0, 100.0, 64.0, 48.0, 46.0, 38.0, 23.0, 32.0, 26.0, 20.0, 25.0, 14.0, 11.0, 13.0, 11.0, 8.0, 11.0, 6.0, 2.0, 1.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59765625, -1.54705810546875, -1.4964599609375, -1.44586181640625, -1.395263671875, -1.34466552734375, -1.2940673828125, -1.24346923828125, -1.19287109375, -1.14227294921875, -1.0916748046875, -1.04107666015625, -0.990478515625, -0.93988037109375, -0.8892822265625, -0.83868408203125, -0.7880859375, -0.73748779296875, -0.6868896484375, -0.63629150390625, -0.585693359375, -0.53509521484375, -0.4844970703125, -0.43389892578125, -0.38330078125, -0.33270263671875, -0.2821044921875, -0.23150634765625, -0.180908203125, -0.13031005859375, -0.0797119140625, -0.02911376953125, 0.021484375, 0.07208251953125, 0.1226806640625, 0.17327880859375, 0.223876953125, 0.27447509765625, 0.3250732421875, 0.37567138671875, 0.42626953125, 0.47686767578125, 0.5274658203125, 0.57806396484375, 0.628662109375, 0.67926025390625, 0.7298583984375, 0.78045654296875, 0.8310546875, 0.88165283203125, 0.9322509765625, 0.98284912109375, 1.033447265625, 1.08404541015625, 1.1346435546875, 1.18524169921875, 1.23583984375, 1.28643798828125, 1.3370361328125, 1.38763427734375, 1.438232421875, 1.48883056640625, 1.5394287109375, 1.59002685546875, 1.640625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 12.0, 13.0, 16.0, 27.0, 32.0, 45.0, 56.0, 100.0, 141.0, 253.0, 473.0, 1561.0, 8392.0, 385658.0, 2722618.0, 21903.0, 2769.0, 780.0, 314.0, 186.0, 103.0, 68.0, 56.0, 37.0, 19.0, 15.0, 10.0, 13.0, 11.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.33984375, -5.18365478515625, -5.0274658203125, -4.87127685546875, -4.715087890625, -4.55889892578125, -4.4027099609375, -4.24652099609375, -4.09033203125, -3.93414306640625, -3.7779541015625, -3.62176513671875, -3.465576171875, -3.30938720703125, -3.1531982421875, -2.99700927734375, -2.8408203125, -2.68463134765625, -2.5284423828125, -2.37225341796875, -2.216064453125, -2.05987548828125, -1.9036865234375, -1.74749755859375, -1.59130859375, -1.43511962890625, -1.2789306640625, -1.12274169921875, -0.966552734375, -0.81036376953125, -0.6541748046875, -0.49798583984375, -0.341796875, -0.18560791015625, -0.0294189453125, 0.12677001953125, 0.282958984375, 0.43914794921875, 0.5953369140625, 0.75152587890625, 0.90771484375, 1.06390380859375, 1.2200927734375, 1.37628173828125, 1.532470703125, 1.68865966796875, 1.8448486328125, 2.00103759765625, 2.1572265625, 2.31341552734375, 2.4696044921875, 2.62579345703125, 2.781982421875, 2.93817138671875, 3.0943603515625, 3.25054931640625, 3.40673828125, 3.56292724609375, 3.7191162109375, 3.87530517578125, 4.031494140625, 4.18768310546875, 4.3438720703125, 4.50006103515625, 4.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 23.0, 246.0, 580.0, 152.0, 11.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166410446166992, -3.5154452323913574, -2.8644797801971436, -2.2135143280029297, -1.562549114227295, -0.9115839004516602, -0.2606184482574463, 0.3903470039367676, 1.0413122177124023, 1.6922775506973267, 2.343242883682251, 2.994208335876465, 3.6451735496520996, 4.296138763427734, 4.947104454040527, 5.598069667816162, 6.249034881591797, 6.900000095367432, 7.550965309143066, 8.20193099975586, 8.852895736694336, 9.503861427307129, 10.154827117919922, 10.805791854858398, 11.456757545471191, 12.107723236083984, 12.758687973022461, 13.409653663635254, 14.060619354248047, 14.711584091186523, 15.362549781799316, 16.01351547241211, 16.66448211669922, 17.315446853637695, 17.966413497924805, 18.61737823486328, 19.268342971801758, 19.919307708740234, 20.570274353027344, 21.22123908996582, 21.872203826904297, 22.523168563842773, 23.174135208129883, 23.82509994506836, 24.476064682006836, 25.127029418945312, 25.777996063232422, 26.4289608001709, 27.079927444458008, 27.730892181396484, 28.381858825683594, 29.03282356262207, 29.683788299560547, 30.334754943847656, 30.985719680786133, 31.63668441772461, 32.28765106201172, 32.93861770629883, 33.58958053588867, 34.24054718017578, 34.89151382446289, 35.542476654052734, 36.193443298339844, 36.84440994262695, 37.4953727722168]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 8.0, 3.0, 15.0, 6.0, 13.0, 15.0, 16.0, 28.0, 27.0, 26.0, 42.0, 26.0, 25.0, 24.0, 43.0, 31.0, 39.0, 35.0, 37.0, 35.0, 36.0, 37.0, 43.0, 31.0, 30.0, 38.0, 32.0, 28.0, 28.0, 25.0, 18.0, 18.0, 25.0, 14.0, 14.0, 11.0, 24.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6120781898498535, -4.476400852203369, -4.340723514556885, -4.2050461769104, -4.069368839263916, -3.9336915016174316, -3.798013925552368, -3.662336587905884, -3.5266592502593994, -3.390981912612915, -3.2553045749664307, -3.1196272373199463, -2.983949661254883, -2.8482723236083984, -2.712594985961914, -2.5769176483154297, -2.4412403106689453, -2.305562973022461, -2.1698856353759766, -2.034208297729492, -1.8985308408737183, -1.7628535032272339, -1.62717604637146, -1.4914987087249756, -1.3558213710784912, -1.2201440334320068, -1.0844666957855225, -0.9487892389297485, -0.8131119012832642, -0.6774345636367798, -0.5417571663856506, -0.4060797691345215, -0.2704029083251953, -0.13472554087638855, 0.0009518265724182129, 0.13662919402122498, 0.27230656147003174, 0.4079838991165161, 0.5436612963676453, 0.6793386936187744, 0.8150160312652588, 0.9506933689117432, 1.0863707065582275, 1.2220481634140015, 1.3577255010604858, 1.4934028387069702, 1.6290802955627441, 1.7647576332092285, 1.900434970855713, 2.0361123085021973, 2.1717896461486816, 2.307466983795166, 2.4431443214416504, 2.5788216590881348, 2.7144992351531982, 2.8501765727996826, 2.985853910446167, 3.1215312480926514, 3.2572085857391357, 3.39288592338562, 3.5285634994506836, 3.664240837097168, 3.7999181747436523, 3.9355955123901367, 4.071272850036621]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 8.0, 8.0, 11.0, 7.0, 16.0, 14.0, 19.0, 19.0, 23.0, 22.0, 19.0, 28.0, 32.0, 31.0, 28.0, 29.0, 34.0, 29.0, 29.0, 49.0, 37.0, 35.0, 29.0, 38.0, 20.0, 33.0, 37.0, 31.0, 25.0, 31.0, 25.0, 37.0, 24.0, 19.0, 14.0, 16.0, 11.0, 19.0, 9.0, 7.0, 4.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.51416015625, -0.49794769287109375, -0.4817352294921875, -0.46552276611328125, -0.449310302734375, -0.43309783935546875, -0.4168853759765625, -0.40067291259765625, -0.38446044921875, -0.36824798583984375, -0.3520355224609375, -0.33582305908203125, -0.319610595703125, -0.30339813232421875, -0.2871856689453125, -0.27097320556640625, -0.2547607421875, -0.23854827880859375, -0.2223358154296875, -0.20612335205078125, -0.189910888671875, -0.17369842529296875, -0.1574859619140625, -0.14127349853515625, -0.12506103515625, -0.10884857177734375, -0.0926361083984375, -0.07642364501953125, -0.060211181640625, -0.04399871826171875, -0.0277862548828125, -0.01157379150390625, 0.004638671875, 0.02085113525390625, 0.0370635986328125, 0.05327606201171875, 0.069488525390625, 0.08570098876953125, 0.1019134521484375, 0.11812591552734375, 0.13433837890625, 0.15055084228515625, 0.1667633056640625, 0.18297576904296875, 0.199188232421875, 0.21540069580078125, 0.2316131591796875, 0.24782562255859375, 0.2640380859375, 0.28025054931640625, 0.2964630126953125, 0.31267547607421875, 0.328887939453125, 0.34510040283203125, 0.3613128662109375, 0.37752532958984375, 0.39373779296875, 0.40995025634765625, 0.4261627197265625, 0.44237518310546875, 0.458587646484375, 0.47480010986328125, 0.4910125732421875, 0.5072250366210938, 0.5234375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 11.0, 6.0, 12.0, 12.0, 16.0, 11.0, 19.0, 22.0, 30.0, 36.0, 52.0, 69.0, 110.0, 156.0, 245.0, 500.0, 919.0, 2050.0, 5371.0, 16530.0, 69237.0, 533180.0, 2789465.0, 665025.0, 82650.0, 18570.0, 5680.0, 2126.0, 937.0, 456.0, 220.0, 151.0, 108.0, 63.0, 49.0, 35.0, 31.0, 21.0, 20.0, 20.0, 13.0, 11.0, 6.0, 13.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3896484375, -1.3455963134765625, -1.301544189453125, -1.2574920654296875, -1.21343994140625, -1.1693878173828125, -1.125335693359375, -1.0812835693359375, -1.0372314453125, -0.9931793212890625, -0.949127197265625, -0.9050750732421875, -0.86102294921875, -0.8169708251953125, -0.772918701171875, -0.7288665771484375, -0.684814453125, -0.6407623291015625, -0.596710205078125, -0.5526580810546875, -0.50860595703125, -0.4645538330078125, -0.420501708984375, -0.3764495849609375, -0.3323974609375, -0.2883453369140625, -0.244293212890625, -0.2002410888671875, -0.15618896484375, -0.1121368408203125, -0.068084716796875, -0.0240325927734375, 0.02001953125, 0.0640716552734375, 0.108123779296875, 0.1521759033203125, 0.19622802734375, 0.2402801513671875, 0.284332275390625, 0.3283843994140625, 0.3724365234375, 0.4164886474609375, 0.460540771484375, 0.5045928955078125, 0.54864501953125, 0.5926971435546875, 0.636749267578125, 0.6808013916015625, 0.724853515625, 0.7689056396484375, 0.812957763671875, 0.8570098876953125, 0.90106201171875, 0.9451141357421875, 0.989166259765625, 1.0332183837890625, 1.0772705078125, 1.1213226318359375, 1.165374755859375, 1.2094268798828125, 1.25347900390625, 1.2975311279296875, 1.341583251953125, 1.3856353759765625, 1.4296875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 10.0, 7.0, 5.0, 12.0, 12.0, 12.0, 23.0, 38.0, 42.0, 41.0, 69.0, 115.0, 140.0, 200.0, 323.0, 486.0, 611.0, 560.0, 455.0, 264.0, 176.0, 124.0, 87.0, 55.0, 52.0, 32.0, 22.0, 27.0, 15.0, 10.0, 13.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0850982666015625, -1.052032470703125, -1.0189666748046875, -0.98590087890625, -0.9528350830078125, -0.919769287109375, -0.8867034912109375, -0.8536376953125, -0.8205718994140625, -0.787506103515625, -0.7544403076171875, -0.72137451171875, -0.6883087158203125, -0.655242919921875, -0.6221771240234375, -0.589111328125, -0.5560455322265625, -0.522979736328125, -0.4899139404296875, -0.45684814453125, -0.4237823486328125, -0.390716552734375, -0.3576507568359375, -0.3245849609375, -0.2915191650390625, -0.258453369140625, -0.2253875732421875, -0.19232177734375, -0.1592559814453125, -0.126190185546875, -0.0931243896484375, -0.06005859375, -0.0269927978515625, 0.006072998046875, 0.0391387939453125, 0.07220458984375, 0.1052703857421875, 0.138336181640625, 0.1714019775390625, 0.2044677734375, 0.2375335693359375, 0.270599365234375, 0.3036651611328125, 0.33673095703125, 0.3697967529296875, 0.402862548828125, 0.4359283447265625, 0.468994140625, 0.5020599365234375, 0.535125732421875, 0.5681915283203125, 0.60125732421875, 0.6343231201171875, 0.667388916015625, 0.7004547119140625, 0.7335205078125, 0.7665863037109375, 0.799652099609375, 0.8327178955078125, 0.86578369140625, 0.8988494873046875, 0.931915283203125, 0.9649810791015625, 0.998046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 14.0, 10.0, 16.0, 14.0, 22.0, 22.0, 33.0, 44.0, 65.0, 89.0, 161.0, 292.0, 897.0, 3909.0, 45663.0, 3676780.0, 451360.0, 11865.0, 1758.0, 563.0, 240.0, 140.0, 88.0, 38.0, 46.0, 41.0, 20.0, 15.0, 13.0, 14.0, 5.0, 10.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.68359375, -4.5262451171875, -4.368896484375, -4.2115478515625, -4.05419921875, -3.8968505859375, -3.739501953125, -3.5821533203125, -3.4248046875, -3.2674560546875, -3.110107421875, -2.9527587890625, -2.79541015625, -2.6380615234375, -2.480712890625, -2.3233642578125, -2.166015625, -2.0086669921875, -1.851318359375, -1.6939697265625, -1.53662109375, -1.3792724609375, -1.221923828125, -1.0645751953125, -0.9072265625, -0.7498779296875, -0.592529296875, -0.4351806640625, -0.27783203125, -0.1204833984375, 0.036865234375, 0.1942138671875, 0.3515625, 0.5089111328125, 0.666259765625, 0.8236083984375, 0.98095703125, 1.1383056640625, 1.295654296875, 1.4530029296875, 1.6103515625, 1.7677001953125, 1.925048828125, 2.0823974609375, 2.23974609375, 2.3970947265625, 2.554443359375, 2.7117919921875, 2.869140625, 3.0264892578125, 3.183837890625, 3.3411865234375, 3.49853515625, 3.6558837890625, 3.813232421875, 3.9705810546875, 4.1279296875, 4.2852783203125, 4.442626953125, 4.5999755859375, 4.75732421875, 4.9146728515625, 5.072021484375, 5.2293701171875, 5.38671875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 10.0, 18.0, 22.0, 14.0, 42.0, 63.0, 70.0, 95.0, 91.0, 102.0, 94.0, 90.0, 76.0, 76.0, 46.0, 31.0, 25.0, 12.0, 9.0, 7.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.252429485321045, -5.108919143676758, -4.965409278869629, -4.821898937225342, -4.678388595581055, -4.534878253936768, -4.3913679122924805, -4.247858047485352, -4.1043477058410645, -3.9608373641967773, -3.8173272609710693, -3.6738171577453613, -3.530306816101074, -3.386796474456787, -3.243286371231079, -3.099776268005371, -2.956265926361084, -2.812755584716797, -2.669245481491089, -2.525735378265381, -2.3822250366210938, -2.2387146949768066, -2.0952045917510986, -1.951694369316101, -1.8081841468811035, -1.664673924446106, -1.5211637020111084, -1.3776534795761108, -1.2341432571411133, -1.0906330347061157, -0.9471228122711182, -0.8036125898361206, -0.6601028442382812, -0.5165926218032837, -0.37308239936828613, -0.22957217693328857, -0.08606195449829102, 0.05744826793670654, 0.2009584903717041, 0.34446871280670166, 0.4879789352416992, 0.6314891576766968, 0.7749993801116943, 0.9185096025466919, 1.0620198249816895, 1.205530047416687, 1.3490402698516846, 1.4925504922866821, 1.6360607147216797, 1.7795709371566772, 1.9230811595916748, 2.066591262817383, 2.21010160446167, 2.353611946105957, 2.497122049331665, 2.640632152557373, 2.78414249420166, 2.9276528358459473, 3.0711629390716553, 3.2146730422973633, 3.3581833839416504, 3.5016937255859375, 3.6452038288116455, 3.7887139320373535, 3.9322242736816406]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 4.0, 10.0, 9.0, 5.0, 15.0, 14.0, 15.0, 15.0, 18.0, 22.0, 23.0, 33.0, 37.0, 37.0, 41.0, 40.0, 47.0, 43.0, 33.0, 43.0, 37.0, 43.0, 39.0, 40.0, 40.0, 34.0, 32.0, 24.0, 29.0, 24.0, 32.0, 20.0, 26.0, 8.0, 10.0, 9.0, 6.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.3280394077301025, -3.22735595703125, -3.1266725063323975, -3.025989055633545, -2.9253053665161133, -2.82462215423584, -2.723938465118408, -2.6232550144195557, -2.522571563720703, -2.4218881130218506, -2.321204662322998, -2.2205212116241455, -2.119837760925293, -2.0191540718078613, -1.9184706211090088, -1.8177871704101562, -1.7171037197113037, -1.6164202690124512, -1.5157368183135986, -1.4150532484054565, -1.314369797706604, -1.2136863470077515, -1.1130027770996094, -1.0123193264007568, -0.9116358757019043, -0.8109524250030518, -0.7102689146995544, -0.6095854043960571, -0.5089019536972046, -0.40821850299835205, -0.30753499269485474, -0.20685148239135742, -0.10616803169250488, -0.005484551191329956, 0.09519892930984497, 0.1958824098110199, 0.2965658903121948, 0.39724934101104736, 0.4979328513145447, 0.598616361618042, 0.6992998123168945, 0.7999832630157471, 0.9006667733192444, 1.0013502836227417, 1.1020337343215942, 1.2027171850204468, 1.3034007549285889, 1.4040842056274414, 1.504767656326294, 1.6054511070251465, 1.706134557723999, 1.8068181276321411, 1.9075015783309937, 2.0081849098205566, 2.1088685989379883, 2.209552049636841, 2.3102355003356934, 2.410918951034546, 2.5116024017333984, 2.612285852432251, 2.7129693031311035, 2.813652992248535, 2.9143364429473877, 3.0150198936462402, 3.1157033443450928]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 4.0, 5.0, 9.0, 10.0, 7.0, 19.0, 12.0, 19.0, 17.0, 19.0, 27.0, 30.0, 21.0, 33.0, 29.0, 41.0, 32.0, 49.0, 40.0, 29.0, 39.0, 33.0, 30.0, 37.0, 28.0, 31.0, 40.0, 33.0, 38.0, 31.0, 29.0, 28.0, 15.0, 20.0, 26.0, 14.0, 12.0, 11.0, 16.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56201171875, -0.5449676513671875, -0.527923583984375, -0.5108795166015625, -0.49383544921875, -0.4767913818359375, -0.459747314453125, -0.4427032470703125, -0.4256591796875, -0.4086151123046875, -0.391571044921875, -0.3745269775390625, -0.35748291015625, -0.3404388427734375, -0.323394775390625, -0.3063507080078125, -0.289306640625, -0.2722625732421875, -0.255218505859375, -0.2381744384765625, -0.22113037109375, -0.2040863037109375, -0.187042236328125, -0.1699981689453125, -0.1529541015625, -0.1359100341796875, -0.118865966796875, -0.1018218994140625, -0.08477783203125, -0.0677337646484375, -0.050689697265625, -0.0336456298828125, -0.0166015625, 0.0004425048828125, 0.017486572265625, 0.0345306396484375, 0.05157470703125, 0.0686187744140625, 0.085662841796875, 0.1027069091796875, 0.1197509765625, 0.1367950439453125, 0.153839111328125, 0.1708831787109375, 0.18792724609375, 0.2049713134765625, 0.222015380859375, 0.2390594482421875, 0.256103515625, 0.2731475830078125, 0.290191650390625, 0.3072357177734375, 0.32427978515625, 0.3413238525390625, 0.358367919921875, 0.3754119873046875, 0.3924560546875, 0.4095001220703125, 0.426544189453125, 0.4435882568359375, 0.46063232421875, 0.4776763916015625, 0.494720458984375, 0.5117645263671875, 0.52880859375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 21.0, 41.0, 40.0, 81.0, 116.0, 151.0, 231.0, 390.0, 517.0, 719.0, 1014.0, 1444.0, 2132.0, 2944.0, 4466.0, 6585.0, 9829.0, 15051.0, 22775.0, 35114.0, 55542.0, 88014.0, 132216.0, 172731.0, 163476.0, 117366.0, 75850.0, 48475.0, 30863.0, 19781.0, 12904.0, 8677.0, 5968.0, 4063.0, 2840.0, 1875.0, 1290.0, 878.0, 673.0, 399.0, 302.0, 222.0, 152.0, 108.0, 73.0, 43.0, 44.0, 21.0, 14.0, 12.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.0679931640625, -0.06598424911499023, -0.06397533416748047, -0.0619664192199707, -0.05995750427246094, -0.05794858932495117, -0.055939674377441406, -0.05393075942993164, -0.051921844482421875, -0.04991292953491211, -0.047904014587402344, -0.04589509963989258, -0.04388618469238281, -0.04187726974487305, -0.03986835479736328, -0.037859439849853516, -0.03585052490234375, -0.033841609954833984, -0.03183269500732422, -0.029823780059814453, -0.027814865112304688, -0.025805950164794922, -0.023797035217285156, -0.02178812026977539, -0.019779205322265625, -0.01777029037475586, -0.015761375427246094, -0.013752460479736328, -0.011743545532226562, -0.009734630584716797, -0.007725715637207031, -0.005716800689697266, -0.0037078857421875, -0.0016989707946777344, 0.00030994415283203125, 0.002318859100341797, 0.0043277740478515625, 0.006336688995361328, 0.008345603942871094, 0.01035451889038086, 0.012363433837890625, 0.01437234878540039, 0.016381263732910156, 0.018390178680419922, 0.020399093627929688, 0.022408008575439453, 0.02441692352294922, 0.026425838470458984, 0.02843475341796875, 0.030443668365478516, 0.03245258331298828, 0.03446149826049805, 0.03647041320800781, 0.03847932815551758, 0.040488243103027344, 0.04249715805053711, 0.044506072998046875, 0.04651498794555664, 0.048523902893066406, 0.05053281784057617, 0.05254173278808594, 0.0545506477355957, 0.05655956268310547, 0.058568477630615234, 0.060577392578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 3.0, 7.0, 3.0, 9.0, 8.0, 15.0, 17.0, 19.0, 19.0, 13.0, 24.0, 18.0, 27.0, 26.0, 27.0, 29.0, 31.0, 42.0, 41.0, 40.0, 45.0, 1070.0, 41.0, 45.0, 46.0, 43.0, 41.0, 36.0, 30.0, 21.0, 30.0, 25.0, 25.0, 21.0, 15.0, 18.0, 11.0, 8.0, 4.0, 7.0, 8.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.492034912109375, -0.47479248046875, -0.457550048828125, -0.4403076171875, -0.423065185546875, -0.40582275390625, -0.388580322265625, -0.371337890625, -0.354095458984375, -0.33685302734375, -0.319610595703125, -0.3023681640625, -0.285125732421875, -0.26788330078125, -0.250640869140625, -0.2333984375, -0.216156005859375, -0.19891357421875, -0.181671142578125, -0.1644287109375, -0.147186279296875, -0.12994384765625, -0.112701416015625, -0.095458984375, -0.078216552734375, -0.06097412109375, -0.043731689453125, -0.0264892578125, -0.009246826171875, 0.00799560546875, 0.025238037109375, 0.04248046875, 0.059722900390625, 0.07696533203125, 0.094207763671875, 0.1114501953125, 0.128692626953125, 0.14593505859375, 0.163177490234375, 0.180419921875, 0.197662353515625, 0.21490478515625, 0.232147216796875, 0.2493896484375, 0.266632080078125, 0.28387451171875, 0.301116943359375, 0.318359375, 0.335601806640625, 0.35284423828125, 0.370086669921875, 0.3873291015625, 0.404571533203125, 0.42181396484375, 0.439056396484375, 0.456298828125, 0.473541259765625, 0.49078369140625, 0.508026123046875, 0.5252685546875, 0.542510986328125, 0.55975341796875, 0.576995849609375, 0.59423828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 13.0, 33.0, 33.0, 66.0, 87.0, 124.0, 166.0, 245.0, 338.0, 495.0, 702.0, 954.0, 1400.0, 1974.0, 3081.0, 4721.0, 7461.0, 12708.0, 26963.0, 105866.0, 1730294.0, 133277.0, 29540.0, 13629.0, 7879.0, 4763.0, 3282.0, 2083.0, 1499.0, 986.0, 730.0, 494.0, 359.0, 258.0, 178.0, 133.0, 79.0, 59.0, 38.0, 41.0, 24.0, 15.0, 10.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11749267578125, -0.11351680755615234, -0.10954093933105469, -0.10556507110595703, -0.10158920288085938, -0.09761333465576172, -0.09363746643066406, -0.0896615982055664, -0.08568572998046875, -0.0817098617553711, -0.07773399353027344, -0.07375812530517578, -0.06978225708007812, -0.06580638885498047, -0.06183052062988281, -0.057854652404785156, -0.0538787841796875, -0.049902915954589844, -0.04592704772949219, -0.04195117950439453, -0.037975311279296875, -0.03399944305419922, -0.030023574829101562, -0.026047706604003906, -0.02207183837890625, -0.018095970153808594, -0.014120101928710938, -0.010144233703613281, -0.006168365478515625, -0.0021924972534179688, 0.0017833709716796875, 0.005759239196777344, 0.009735107421875, 0.013710975646972656, 0.017686843872070312, 0.02166271209716797, 0.025638580322265625, 0.02961444854736328, 0.03359031677246094, 0.037566184997558594, 0.04154205322265625, 0.045517921447753906, 0.04949378967285156, 0.05346965789794922, 0.057445526123046875, 0.06142139434814453, 0.06539726257324219, 0.06937313079833984, 0.0733489990234375, 0.07732486724853516, 0.08130073547363281, 0.08527660369873047, 0.08925247192382812, 0.09322834014892578, 0.09720420837402344, 0.1011800765991211, 0.10515594482421875, 0.1091318130493164, 0.11310768127441406, 0.11708354949951172, 0.12105941772460938, 0.12503528594970703, 0.1290111541748047, 0.13298702239990234, 0.136962890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 11.0, 10.0, 9.0, 12.0, 14.0, 16.0, 19.0, 23.0, 38.0, 34.0, 32.0, 35.0, 46.0, 36.0, 49.0, 37.0, 28.0, 35.0, 32.0, 31.0, 41.0, 45.0, 33.0, 33.0, 38.0, 38.0, 26.0, 35.0, 18.0, 22.0, 11.0, 23.0, 16.0, 9.0, 10.0, 9.0, 14.0, 5.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.01073455810546875, -0.01043248176574707, -0.01013040542602539, -0.009828329086303711, -0.009526252746582031, -0.009224176406860352, -0.008922100067138672, -0.008620023727416992, -0.008317947387695312, -0.008015871047973633, -0.007713794708251953, -0.0074117183685302734, -0.007109642028808594, -0.006807565689086914, -0.006505489349365234, -0.006203413009643555, -0.005901336669921875, -0.005599260330200195, -0.005297183990478516, -0.004995107650756836, -0.004693031311035156, -0.0043909549713134766, -0.004088878631591797, -0.003786802291870117, -0.0034847259521484375, -0.003182649612426758, -0.002880573272705078, -0.0025784969329833984, -0.0022764205932617188, -0.001974344253540039, -0.0016722679138183594, -0.0013701915740966797, -0.001068115234375, -0.0007660388946533203, -0.0004639625549316406, -0.00016188621520996094, 0.00014019012451171875, 0.00044226646423339844, 0.0007443428039550781, 0.0010464191436767578, 0.0013484954833984375, 0.0016505718231201172, 0.0019526481628417969, 0.0022547245025634766, 0.0025568008422851562, 0.002858877182006836, 0.0031609535217285156, 0.0034630298614501953, 0.003765106201171875, 0.004067182540893555, 0.004369258880615234, 0.004671335220336914, 0.004973411560058594, 0.0052754878997802734, 0.005577564239501953, 0.005879640579223633, 0.0061817169189453125, 0.006483793258666992, 0.006785869598388672, 0.0070879459381103516, 0.007390022277832031, 0.007692098617553711, 0.00799417495727539, 0.00829625129699707, 0.00859832763671875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 9.0, 9.0, 11.0, 10.0, 10.0, 16.0, 22.0, 13.0, 24.0, 24.0, 43.0, 53.0, 77.0, 94.0, 114.0, 169.0, 292.0, 637.0, 5728.0, 1014948.0, 24270.0, 828.0, 327.0, 199.0, 127.0, 104.0, 87.0, 58.0, 41.0, 40.0, 39.0, 20.0, 19.0, 16.0, 14.0, 11.0, 8.0, 13.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16796875, -0.16209983825683594, -0.15623092651367188, -0.1503620147705078, -0.14449310302734375, -0.1386241912841797, -0.13275527954101562, -0.12688636779785156, -0.1210174560546875, -0.11514854431152344, -0.10927963256835938, -0.10341072082519531, -0.09754180908203125, -0.09167289733886719, -0.08580398559570312, -0.07993507385253906, -0.074066162109375, -0.06819725036621094, -0.062328338623046875, -0.05645942687988281, -0.05059051513671875, -0.04472160339355469, -0.038852691650390625, -0.03298377990722656, -0.0271148681640625, -0.021245956420898438, -0.015377044677734375, -0.009508132934570312, -0.00363922119140625, 0.0022296905517578125, 0.008098602294921875, 0.013967514038085938, 0.01983642578125, 0.025705337524414062, 0.031574249267578125, 0.03744316101074219, 0.04331207275390625, 0.04918098449707031, 0.055049896240234375, 0.06091880798339844, 0.0667877197265625, 0.07265663146972656, 0.07852554321289062, 0.08439445495605469, 0.09026336669921875, 0.09613227844238281, 0.10200119018554688, 0.10787010192871094, 0.113739013671875, 0.11960792541503906, 0.12547683715820312, 0.1313457489013672, 0.13721466064453125, 0.1430835723876953, 0.14895248413085938, 0.15482139587402344, 0.1606903076171875, 0.16655921936035156, 0.17242813110351562, 0.1782970428466797, 0.18416595458984375, 0.1900348663330078, 0.19590377807617188, 0.20177268981933594, 0.2076416015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 42.0, 915.0, 55.0], "bins": [-0.5463700890541077, -0.5376310348510742, -0.5288920402526855, -0.5201529860496521, -0.5114139318466187, -0.5026748776435852, -0.49393585324287415, -0.4851968288421631, -0.47645777463912964, -0.4677187502384186, -0.45897969603538513, -0.4502406716346741, -0.4415016174316406, -0.43276259303092957, -0.4240235388278961, -0.41528451442718506, -0.4065454602241516, -0.39780643582344055, -0.3890673816204071, -0.38032835721969604, -0.3715893030166626, -0.36285027861595154, -0.3541112244129181, -0.34537220001220703, -0.33663317561149597, -0.3278941512107849, -0.31915509700775146, -0.3104160726070404, -0.30167701840400696, -0.2929379940032959, -0.28419893980026245, -0.2754599153995514, -0.26672089099884033, -0.2579818665981293, -0.24924281239509583, -0.24050377309322357, -0.23176473379135132, -0.22302569448947906, -0.2142866551876068, -0.20554763078689575, -0.1968085765838623, -0.18806953728199005, -0.1793304979801178, -0.17059145867824554, -0.1618524193763733, -0.15311338007450104, -0.14437434077262878, -0.13563531637191772, -0.12689627707004547, -0.11815723776817322, -0.10941819846630096, -0.10067915916442871, -0.09194011986255646, -0.0832010805606842, -0.07446204870939255, -0.0657230094075203, -0.056983962655067444, -0.04824492335319519, -0.03950588405132294, -0.030766848474740982, -0.02202780917286873, -0.013288769870996475, -0.00454973429441452, 0.004189305007457733, 0.012928342446684837]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 19.0, 13.0, 6.0, 23.0, 20.0, 28.0, 31.0, 23.0, 36.0, 31.0, 40.0, 47.0, 42.0, 45.0, 46.0, 50.0, 49.0, 51.0, 49.0, 48.0, 56.0, 39.0, 29.0, 32.0, 24.0, 24.0, 23.0, 14.0, 14.0, 9.0, 5.0, 12.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04046356678009033, -0.0393192321062088, -0.03817489743232727, -0.03703056648373604, -0.03588623180985451, -0.03474189713597298, -0.033597566187381744, -0.032453231513500214, -0.03130889683961868, -0.030164562165737152, -0.02902022935450077, -0.02787589654326439, -0.02673156186938286, -0.025587227195501328, -0.024442894384264946, -0.023298561573028564, -0.022154226899147034, -0.021009892225265503, -0.01986555941402912, -0.01872122660279274, -0.01757689192891121, -0.01643255725502968, -0.015288224443793297, -0.01414389070123434, -0.012999556958675385, -0.011855223216116428, -0.010710889473557472, -0.009566555730998516, -0.00842222198843956, -0.007277888245880604, -0.006133554503321648, -0.0049892207607626915, -0.0038448870182037354, -0.002700553275644779, -0.001556219533085823, -0.0004118857905268669, 0.0007324479520320892, 0.0018767816945910454, 0.0030211154371500015, 0.004165449179708958, 0.005309782922267914, 0.00645411666482687, 0.007598450407385826, 0.008742784149944782, 0.009887117892503738, 0.011031451635062695, 0.01217578537762165, 0.013320119120180607, 0.014464452862739563, 0.01560878660529852, 0.016753120347857475, 0.017897453159093857, 0.019041787832975388, 0.02018612250685692, 0.0213304553180933, 0.02247478812932968, 0.023619122803211212, 0.024763457477092743, 0.025907790288329124, 0.027052123099565506, 0.028196457773447037, 0.029340792447328568, 0.03048512525856495, 0.03162945806980133, 0.03277379274368286]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 4.0, 6.0, 9.0, 9.0, 8.0, 20.0, 10.0, 20.0, 17.0, 17.0, 27.0, 32.0, 22.0, 30.0, 32.0, 38.0, 33.0, 48.0, 40.0, 31.0, 39.0, 33.0, 28.0, 38.0, 28.0, 31.0, 40.0, 33.0, 40.0, 29.0, 30.0, 28.0, 15.0, 20.0, 25.0, 14.0, 14.0, 10.0, 16.0, 5.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56298828125, -0.545928955078125, -0.52886962890625, -0.511810302734375, -0.4947509765625, -0.477691650390625, -0.46063232421875, -0.443572998046875, -0.426513671875, -0.409454345703125, -0.39239501953125, -0.375335693359375, -0.3582763671875, -0.341217041015625, -0.32415771484375, -0.307098388671875, -0.2900390625, -0.272979736328125, -0.25592041015625, -0.238861083984375, -0.2218017578125, -0.204742431640625, -0.18768310546875, -0.170623779296875, -0.153564453125, -0.136505126953125, -0.11944580078125, -0.102386474609375, -0.0853271484375, -0.068267822265625, -0.05120849609375, -0.034149169921875, -0.01708984375, -3.0517578125e-05, 0.01702880859375, 0.034088134765625, 0.0511474609375, 0.068206787109375, 0.08526611328125, 0.102325439453125, 0.119384765625, 0.136444091796875, 0.15350341796875, 0.170562744140625, 0.1876220703125, 0.204681396484375, 0.22174072265625, 0.238800048828125, 0.255859375, 0.272918701171875, 0.28997802734375, 0.307037353515625, 0.3240966796875, 0.341156005859375, 0.35821533203125, 0.375274658203125, 0.392333984375, 0.409393310546875, 0.42645263671875, 0.443511962890625, 0.4605712890625, 0.477630615234375, 0.49468994140625, 0.511749267578125, 0.52880859375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 15.0, 16.0, 30.0, 43.0, 54.0, 69.0, 98.0, 135.0, 200.0, 310.0, 481.0, 751.0, 1246.0, 2062.0, 3589.0, 6787.0, 13576.0, 29911.0, 70758.0, 184529.0, 367321.0, 216487.0, 83123.0, 33852.0, 15432.0, 7524.0, 4106.0, 2178.0, 1328.0, 847.0, 533.0, 334.0, 253.0, 155.0, 119.0, 84.0, 50.0, 40.0, 28.0, 23.0, 10.0, 12.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 5.0], "bins": [-0.8046875, -0.782073974609375, -0.75946044921875, -0.736846923828125, -0.7142333984375, -0.691619873046875, -0.66900634765625, -0.646392822265625, -0.623779296875, -0.601165771484375, -0.57855224609375, -0.555938720703125, -0.5333251953125, -0.510711669921875, -0.48809814453125, -0.465484619140625, -0.44287109375, -0.420257568359375, -0.39764404296875, -0.375030517578125, -0.3524169921875, -0.329803466796875, -0.30718994140625, -0.284576416015625, -0.261962890625, -0.239349365234375, -0.21673583984375, -0.194122314453125, -0.1715087890625, -0.148895263671875, -0.12628173828125, -0.103668212890625, -0.0810546875, -0.058441162109375, -0.03582763671875, -0.013214111328125, 0.0093994140625, 0.032012939453125, 0.05462646484375, 0.077239990234375, 0.099853515625, 0.122467041015625, 0.14508056640625, 0.167694091796875, 0.1903076171875, 0.212921142578125, 0.23553466796875, 0.258148193359375, 0.28076171875, 0.303375244140625, 0.32598876953125, 0.348602294921875, 0.3712158203125, 0.393829345703125, 0.41644287109375, 0.439056396484375, 0.461669921875, 0.484283447265625, 0.50689697265625, 0.529510498046875, 0.5521240234375, 0.574737548828125, 0.59735107421875, 0.619964599609375, 0.642578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 5.0, 6.0, 7.0, 14.0, 8.0, 19.0, 17.0, 20.0, 33.0, 25.0, 30.0, 39.0, 37.0, 54.0, 65.0, 93.0, 133.0, 253.0, 1444.0, 250.0, 108.0, 76.0, 55.0, 37.0, 33.0, 31.0, 27.0, 15.0, 29.0, 16.0, 19.0, 12.0, 8.0, 7.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.986328125, -1.921051025390625, -1.85577392578125, -1.790496826171875, -1.7252197265625, -1.659942626953125, -1.59466552734375, -1.529388427734375, -1.464111328125, -1.398834228515625, -1.33355712890625, -1.268280029296875, -1.2030029296875, -1.137725830078125, -1.07244873046875, -1.007171630859375, -0.94189453125, -0.876617431640625, -0.81134033203125, -0.746063232421875, -0.6807861328125, -0.615509033203125, -0.55023193359375, -0.484954833984375, -0.419677734375, -0.354400634765625, -0.28912353515625, -0.223846435546875, -0.1585693359375, -0.093292236328125, -0.02801513671875, 0.037261962890625, 0.1025390625, 0.167816162109375, 0.23309326171875, 0.298370361328125, 0.3636474609375, 0.428924560546875, 0.49420166015625, 0.559478759765625, 0.624755859375, 0.690032958984375, 0.75531005859375, 0.820587158203125, 0.8858642578125, 0.951141357421875, 1.01641845703125, 1.081695556640625, 1.14697265625, 1.212249755859375, 1.27752685546875, 1.342803955078125, 1.4080810546875, 1.473358154296875, 1.53863525390625, 1.603912353515625, 1.669189453125, 1.734466552734375, 1.79974365234375, 1.865020751953125, 1.9302978515625, 1.995574951171875, 2.06085205078125, 2.126129150390625, 2.19140625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 11.0, 6.0, 15.0, 19.0, 23.0, 30.0, 34.0, 53.0, 67.0, 108.0, 171.0, 323.0, 905.0, 4334.0, 82329.0, 2933081.0, 116842.0, 5315.0, 997.0, 413.0, 165.0, 106.0, 70.0, 59.0, 50.0, 39.0, 26.0, 22.0, 18.0, 10.0, 14.0, 9.0, 7.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.49468994140625, -4.3565673828125, -4.21844482421875, -4.080322265625, -3.94219970703125, -3.8040771484375, -3.66595458984375, -3.52783203125, -3.38970947265625, -3.2515869140625, -3.11346435546875, -2.975341796875, -2.83721923828125, -2.6990966796875, -2.56097412109375, -2.4228515625, -2.28472900390625, -2.1466064453125, -2.00848388671875, -1.870361328125, -1.73223876953125, -1.5941162109375, -1.45599365234375, -1.31787109375, -1.17974853515625, -1.0416259765625, -0.90350341796875, -0.765380859375, -0.62725830078125, -0.4891357421875, -0.35101318359375, -0.212890625, -0.07476806640625, 0.0633544921875, 0.20147705078125, 0.339599609375, 0.47772216796875, 0.6158447265625, 0.75396728515625, 0.89208984375, 1.03021240234375, 1.1683349609375, 1.30645751953125, 1.444580078125, 1.58270263671875, 1.7208251953125, 1.85894775390625, 1.9970703125, 2.13519287109375, 2.2733154296875, 2.41143798828125, 2.549560546875, 2.68768310546875, 2.8258056640625, 2.96392822265625, 3.10205078125, 3.24017333984375, 3.3782958984375, 3.51641845703125, 3.654541015625, 3.79266357421875, 3.9307861328125, 4.06890869140625, 4.20703125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 16.0, 33.0, 69.0, 143.0, 189.0, 203.0, 163.0, 88.0, 58.0, 27.0, 13.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.853670120239258, -8.662105560302734, -8.470541000366211, -8.278977394104004, -8.08741283416748, -7.895848274230957, -7.704283714294434, -7.512719631195068, -7.321155071258545, -7.1295905113220215, -6.938026428222656, -6.746461868286133, -6.554897785186768, -6.363333225250244, -6.171769142150879, -5.9802045822143555, -5.788640022277832, -5.597075462341309, -5.405511379241943, -5.21394681930542, -5.022382736206055, -4.830818176269531, -4.639253616333008, -4.447689533233643, -4.256125450134277, -4.064560890197754, -3.8729968070983887, -3.6814322471618652, -3.489867925643921, -3.2983036041259766, -3.1067392826080322, -2.915174961090088, -2.7236104011535645, -2.53204607963562, -2.340481758117676, -2.1489171981811523, -1.957352876663208, -1.7657885551452637, -1.5742242336273193, -1.3826597929000854, -1.1910954713821411, -0.999531090259552, -0.8079667091369629, -0.6164023876190186, -0.42483800649642944, -0.23327362537384033, -0.041709303855895996, 0.1498551368713379, 0.3414194583892822, 0.5329838395118713, 0.7245482206344604, 0.9161125421524048, 1.1076769828796387, 1.299241304397583, 1.4908056259155273, 1.6823700666427612, 1.8739343881607056, 2.0654988288879395, 2.257063150405884, 2.448627471923828, 2.6401917934417725, 2.831756114959717, 3.0233206748962402, 3.2148849964141846, 3.406449317932129]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 2.0, 3.0, 9.0, 11.0, 14.0, 12.0, 16.0, 28.0, 20.0, 15.0, 22.0, 27.0, 35.0, 27.0, 23.0, 26.0, 39.0, 32.0, 31.0, 44.0, 48.0, 41.0, 43.0, 28.0, 44.0, 38.0, 33.0, 31.0, 21.0, 25.0, 25.0, 22.0, 21.0, 26.0, 25.0, 15.0, 15.0, 11.0, 9.0, 5.0, 5.0, 7.0, 9.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.718386173248291, -4.570075988769531, -4.42176628112793, -4.27345609664917, -4.12514591217041, -3.9768362045288086, -3.828526020050049, -3.680216073989868, -3.5319061279296875, -3.383596181869507, -3.235286235809326, -3.0869760513305664, -2.9386661052703857, -2.790356159210205, -2.6420459747314453, -2.4937360286712646, -2.345426082611084, -2.1971161365509033, -2.0488061904907227, -1.900496006011963, -1.7521860599517822, -1.6038761138916016, -1.4555660486221313, -1.3072559833526611, -1.1589460372924805, -1.0106360912322998, -0.8623260259628296, -0.7140160202980042, -0.5657060146331787, -0.41739600896835327, -0.26908600330352783, -0.12077593803405762, 0.02753448486328125, 0.1758444905281067, 0.32415449619293213, 0.47246450185775757, 0.620774507522583, 0.7690845131874084, 0.9173945188522339, 1.065704584121704, 1.2140145301818848, 1.3623244762420654, 1.5106345415115356, 1.6589446067810059, 1.8072545528411865, 1.9555644989013672, 2.103874683380127, 2.2521846294403076, 2.4004945755004883, 2.548804521560669, 2.6971144676208496, 2.8454246520996094, 2.99373459815979, 3.1420445442199707, 3.2903547286987305, 3.438664674758911, 3.586974620819092, 3.7352845668792725, 3.883594512939453, 4.031904697418213, 4.180214881896973, 4.328524589538574, 4.476834774017334, 4.625144958496094, 4.773454666137695]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 5.0, 13.0, 4.0, 20.0, 18.0, 13.0, 17.0, 26.0, 28.0, 19.0, 32.0, 29.0, 27.0, 30.0, 38.0, 31.0, 46.0, 36.0, 38.0, 30.0, 33.0, 28.0, 37.0, 37.0, 29.0, 31.0, 36.0, 29.0, 35.0, 20.0, 24.0, 19.0, 21.0, 19.0, 7.0, 19.0, 10.0, 6.0, 13.0, 5.0, 5.0, 3.0, 7.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5307235717773438, -0.5131072998046875, -0.49549102783203125, -0.477874755859375, -0.46025848388671875, -0.4426422119140625, -0.42502593994140625, -0.40740966796875, -0.38979339599609375, -0.3721771240234375, -0.35456085205078125, -0.336944580078125, -0.31932830810546875, -0.3017120361328125, -0.28409576416015625, -0.2664794921875, -0.24886322021484375, -0.2312469482421875, -0.21363067626953125, -0.196014404296875, -0.17839813232421875, -0.1607818603515625, -0.14316558837890625, -0.12554931640625, -0.10793304443359375, -0.0903167724609375, -0.07270050048828125, -0.055084228515625, -0.03746795654296875, -0.0198516845703125, -0.00223541259765625, 0.015380859375, 0.03299713134765625, 0.0506134033203125, 0.06822967529296875, 0.085845947265625, 0.10346221923828125, 0.1210784912109375, 0.13869476318359375, 0.15631103515625, 0.17392730712890625, 0.1915435791015625, 0.20915985107421875, 0.226776123046875, 0.24439239501953125, 0.2620086669921875, 0.27962493896484375, 0.2972412109375, 0.31485748291015625, 0.3324737548828125, 0.35009002685546875, 0.367706298828125, 0.38532257080078125, 0.4029388427734375, 0.42055511474609375, 0.43817138671875, 0.45578765869140625, 0.4734039306640625, 0.49102020263671875, 0.508636474609375, 0.5262527465820312, 0.5438690185546875, 0.5614852905273438, 0.5791015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 10.0, 10.0, 13.0, 20.0, 33.0, 37.0, 72.0, 76.0, 120.0, 188.0, 286.0, 455.0, 730.0, 1146.0, 2063.0, 3657.0, 6773.0, 13840.0, 32154.0, 95222.0, 370229.0, 1479061.0, 1589538.0, 424121.0, 108641.0, 35811.0, 14563.0, 6993.0, 3621.0, 2026.0, 1105.0, 600.0, 375.0, 241.0, 151.0, 87.0, 70.0, 53.0, 29.0, 21.0, 13.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0625, -1.0312881469726562, -1.0000762939453125, -0.9688644409179688, -0.937652587890625, -0.9064407348632812, -0.8752288818359375, -0.8440170288085938, -0.81280517578125, -0.7815933227539062, -0.7503814697265625, -0.7191696166992188, -0.687957763671875, -0.6567459106445312, -0.6255340576171875, -0.5943222045898438, -0.5631103515625, -0.5318984985351562, -0.5006866455078125, -0.46947479248046875, -0.438262939453125, -0.40705108642578125, -0.3758392333984375, -0.34462738037109375, -0.31341552734375, -0.28220367431640625, -0.2509918212890625, -0.21977996826171875, -0.188568115234375, -0.15735626220703125, -0.1261444091796875, -0.09493255615234375, -0.063720703125, -0.03250885009765625, -0.0012969970703125, 0.02991485595703125, 0.061126708984375, 0.09233856201171875, 0.1235504150390625, 0.15476226806640625, 0.18597412109375, 0.21718597412109375, 0.2483978271484375, 0.27960968017578125, 0.310821533203125, 0.34203338623046875, 0.3732452392578125, 0.40445709228515625, 0.4356689453125, 0.46688079833984375, 0.4980926513671875, 0.5293045043945312, 0.560516357421875, 0.5917282104492188, 0.6229400634765625, 0.6541519165039062, 0.68536376953125, 0.7165756225585938, 0.7477874755859375, 0.7789993286132812, 0.810211181640625, 0.8414230346679688, 0.8726348876953125, 0.9038467407226562, 0.93505859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 6.0, 4.0, 12.0, 14.0, 12.0, 14.0, 13.0, 34.0, 33.0, 56.0, 83.0, 115.0, 143.0, 199.0, 251.0, 408.0, 486.0, 534.0, 457.0, 334.0, 215.0, 156.0, 108.0, 88.0, 54.0, 49.0, 44.0, 37.0, 26.0, 22.0, 14.0, 13.0, 14.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.10546875, -1.071044921875, -1.03662109375, -1.002197265625, -0.9677734375, -0.933349609375, -0.89892578125, -0.864501953125, -0.830078125, -0.795654296875, -0.76123046875, -0.726806640625, -0.6923828125, -0.657958984375, -0.62353515625, -0.589111328125, -0.5546875, -0.520263671875, -0.48583984375, -0.451416015625, -0.4169921875, -0.382568359375, -0.34814453125, -0.313720703125, -0.279296875, -0.244873046875, -0.21044921875, -0.176025390625, -0.1416015625, -0.107177734375, -0.07275390625, -0.038330078125, -0.00390625, 0.030517578125, 0.06494140625, 0.099365234375, 0.1337890625, 0.168212890625, 0.20263671875, 0.237060546875, 0.271484375, 0.305908203125, 0.34033203125, 0.374755859375, 0.4091796875, 0.443603515625, 0.47802734375, 0.512451171875, 0.546875, 0.581298828125, 0.61572265625, 0.650146484375, 0.6845703125, 0.718994140625, 0.75341796875, 0.787841796875, 0.822265625, 0.856689453125, 0.89111328125, 0.925537109375, 0.9599609375, 0.994384765625, 1.02880859375, 1.063232421875, 1.09765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 12.0, 14.0, 19.0, 22.0, 31.0, 40.0, 57.0, 68.0, 77.0, 142.0, 243.0, 536.0, 1628.0, 7516.0, 72381.0, 3090059.0, 981940.0, 32691.0, 4523.0, 1217.0, 404.0, 244.0, 138.0, 76.0, 59.0, 24.0, 28.0, 22.0, 11.0, 9.0, 12.0, 4.0, 5.0, 7.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.849822998046875, -3.72503662109375, -3.600250244140625, -3.4754638671875, -3.350677490234375, -3.22589111328125, -3.101104736328125, -2.976318359375, -2.851531982421875, -2.72674560546875, -2.601959228515625, -2.4771728515625, -2.352386474609375, -2.22760009765625, -2.102813720703125, -1.97802734375, -1.853240966796875, -1.72845458984375, -1.603668212890625, -1.4788818359375, -1.354095458984375, -1.22930908203125, -1.104522705078125, -0.979736328125, -0.854949951171875, -0.73016357421875, -0.605377197265625, -0.4805908203125, -0.355804443359375, -0.23101806640625, -0.106231689453125, 0.0185546875, 0.143341064453125, 0.26812744140625, 0.392913818359375, 0.5177001953125, 0.642486572265625, 0.76727294921875, 0.892059326171875, 1.016845703125, 1.141632080078125, 1.26641845703125, 1.391204833984375, 1.5159912109375, 1.640777587890625, 1.76556396484375, 1.890350341796875, 2.01513671875, 2.139923095703125, 2.26470947265625, 2.389495849609375, 2.5142822265625, 2.639068603515625, 2.76385498046875, 2.888641357421875, 3.013427734375, 3.138214111328125, 3.26300048828125, 3.387786865234375, 3.5125732421875, 3.637359619140625, 3.76214599609375, 3.886932373046875, 4.01171875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 15.0, 80.0, 185.0, 308.0, 240.0, 114.0, 43.0, 15.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.981155395507812, -23.49833106994629, -23.015506744384766, -22.532684326171875, -22.04986000061035, -21.567035675048828, -21.084211349487305, -20.60138702392578, -20.11856460571289, -19.635740280151367, -19.152915954589844, -18.670093536376953, -18.18726921081543, -17.704444885253906, -17.221620559692383, -16.73879623413086, -16.255971908569336, -15.773147583007812, -15.290324211120605, -14.807499885559082, -14.324676513671875, -13.841852188110352, -13.359027862548828, -12.876203536987305, -12.393380165100098, -11.910555839538574, -11.427732467651367, -10.944908142089844, -10.46208381652832, -9.979260444641113, -9.49643611907959, -9.013612747192383, -8.53078842163086, -8.047964096069336, -7.565140724182129, -7.0823163986206055, -6.59949254989624, -6.116668701171875, -5.633844375610352, -5.151020526885986, -4.668197154998779, -4.185373306274414, -3.7025492191314697, -3.2197251319885254, -2.73690128326416, -2.254077434539795, -1.7712533473968506, -1.2884292602539062, -0.805605411529541, -0.32278144359588623, 0.16004252433776855, 0.6428664922714233, 1.1256904602050781, 1.6085143089294434, 2.0913383960723877, 2.574162483215332, 3.0569863319396973, 3.5398101806640625, 4.022634506225586, 4.505458354949951, 4.988282203674316, 5.471106052398682, 5.953929901123047, 6.43675422668457, 6.9195780754089355]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 8.0, 7.0, 4.0, 5.0, 13.0, 6.0, 8.0, 13.0, 15.0, 12.0, 11.0, 20.0, 24.0, 31.0, 28.0, 27.0, 36.0, 39.0, 38.0, 39.0, 32.0, 47.0, 38.0, 47.0, 43.0, 47.0, 34.0, 34.0, 37.0, 34.0, 37.0, 29.0, 29.0, 11.0, 26.0, 21.0, 14.0, 11.0, 7.0, 10.0, 10.0, 4.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.6101937294006348, -3.492225408554077, -3.3742573261260986, -3.256289005279541, -3.1383209228515625, -3.020352602005005, -2.9023842811584473, -2.7844161987304688, -2.6664481163024902, -2.5484797954559326, -2.430511713027954, -2.3125433921813965, -2.194575309753418, -2.0766069889068604, -1.9586387872695923, -1.8406705856323242, -1.7227022647857666, -1.6047340631484985, -1.4867658615112305, -1.3687975406646729, -1.2508294582366943, -1.1328611373901367, -1.0148929357528687, -0.8969247341156006, -0.7789565324783325, -0.6609883308410645, -0.5430201292037964, -0.42505186796188354, -0.3070836663246155, -0.1891154646873474, -0.07114720344543457, 0.046820998191833496, 0.16478943824768066, 0.28275763988494873, 0.4007258713245392, 0.5186941027641296, 0.6366623044013977, 0.7546305060386658, 0.8725987672805786, 0.9905669689178467, 1.1085351705551147, 1.2265033721923828, 1.3444715738296509, 1.462439775466919, 1.5804080963134766, 1.698376178741455, 1.8163444995880127, 1.9343127012252808, 2.052280902862549, 2.1702492237091064, 2.288217306137085, 2.4061856269836426, 2.524153709411621, 2.6421220302581787, 2.7600903511047363, 2.878058433532715, 2.9960265159606934, 3.113994836807251, 3.2319629192352295, 3.349931240081787, 3.4678993225097656, 3.5858676433563232, 3.703835964202881, 3.8218040466308594, 3.939772367477417]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 7.0, 6.0, 12.0, 14.0, 11.0, 15.0, 13.0, 21.0, 19.0, 20.0, 29.0, 24.0, 20.0, 33.0, 42.0, 46.0, 30.0, 35.0, 38.0, 43.0, 33.0, 32.0, 27.0, 21.0, 30.0, 37.0, 36.0, 43.0, 38.0, 28.0, 22.0, 24.0, 19.0, 25.0, 15.0, 13.0, 9.0, 15.0, 7.0, 11.0, 3.0, 5.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.529296875, -0.5128250122070312, -0.4963531494140625, -0.47988128662109375, -0.463409423828125, -0.44693756103515625, -0.4304656982421875, -0.41399383544921875, -0.39752197265625, -0.38105010986328125, -0.3645782470703125, -0.34810638427734375, -0.331634521484375, -0.31516265869140625, -0.2986907958984375, -0.28221893310546875, -0.2657470703125, -0.24927520751953125, -0.2328033447265625, -0.21633148193359375, -0.199859619140625, -0.18338775634765625, -0.1669158935546875, -0.15044403076171875, -0.13397216796875, -0.11750030517578125, -0.1010284423828125, -0.08455657958984375, -0.068084716796875, -0.05161285400390625, -0.0351409912109375, -0.01866912841796875, -0.002197265625, 0.01427459716796875, 0.0307464599609375, 0.04721832275390625, 0.063690185546875, 0.08016204833984375, 0.0966339111328125, 0.11310577392578125, 0.12957763671875, 0.14604949951171875, 0.1625213623046875, 0.17899322509765625, 0.195465087890625, 0.21193695068359375, 0.2284088134765625, 0.24488067626953125, 0.2613525390625, 0.27782440185546875, 0.2942962646484375, 0.31076812744140625, 0.327239990234375, 0.34371185302734375, 0.3601837158203125, 0.37665557861328125, 0.39312744140625, 0.40959930419921875, 0.4260711669921875, 0.44254302978515625, 0.459014892578125, 0.47548675537109375, 0.4919586181640625, 0.5084304809570312, 0.52490234375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 14.0, 17.0, 34.0, 44.0, 55.0, 95.0, 131.0, 182.0, 306.0, 466.0, 698.0, 976.0, 1424.0, 2154.0, 3297.0, 4780.0, 7213.0, 11112.0, 16913.0, 26185.0, 40560.0, 63195.0, 96534.0, 143826.0, 178842.0, 151734.0, 104175.0, 67498.0, 44014.0, 28110.0, 18404.0, 12002.0, 8014.0, 5231.0, 3497.0, 2294.0, 1456.0, 992.0, 676.0, 464.0, 319.0, 208.0, 147.0, 88.0, 68.0, 51.0, 22.0, 11.0, 9.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.06494140625, -0.06300783157348633, -0.061074256896972656, -0.059140682220458984, -0.05720710754394531, -0.05527353286743164, -0.05333995819091797, -0.0514063835144043, -0.049472808837890625, -0.04753923416137695, -0.04560565948486328, -0.04367208480834961, -0.04173851013183594, -0.039804935455322266, -0.037871360778808594, -0.03593778610229492, -0.03400421142578125, -0.03207063674926758, -0.030137062072753906, -0.028203487396240234, -0.026269912719726562, -0.02433633804321289, -0.02240276336669922, -0.020469188690185547, -0.018535614013671875, -0.016602039337158203, -0.014668464660644531, -0.01273488998413086, -0.010801315307617188, -0.008867740631103516, -0.006934165954589844, -0.005000591278076172, -0.0030670166015625, -0.0011334419250488281, 0.0008001327514648438, 0.0027337074279785156, 0.0046672821044921875, 0.006600856781005859, 0.008534431457519531, 0.010468006134033203, 0.012401580810546875, 0.014335155487060547, 0.01626873016357422, 0.01820230484008789, 0.020135879516601562, 0.022069454193115234, 0.024003028869628906, 0.025936603546142578, 0.02787017822265625, 0.029803752899169922, 0.031737327575683594, 0.033670902252197266, 0.03560447692871094, 0.03753805160522461, 0.03947162628173828, 0.04140520095825195, 0.043338775634765625, 0.0452723503112793, 0.04720592498779297, 0.04913949966430664, 0.05107307434082031, 0.053006649017333984, 0.054940223693847656, 0.05687379837036133, 0.058807373046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 5.0, 4.0, 6.0, 14.0, 11.0, 7.0, 14.0, 20.0, 24.0, 22.0, 34.0, 22.0, 23.0, 26.0, 42.0, 31.0, 34.0, 45.0, 41.0, 43.0, 1059.0, 46.0, 38.0, 36.0, 32.0, 37.0, 41.0, 31.0, 29.0, 26.0, 24.0, 20.0, 16.0, 21.0, 16.0, 18.0, 17.0, 9.0, 9.0, 6.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.486236572265625, -0.47100830078125, -0.455780029296875, -0.4405517578125, -0.425323486328125, -0.41009521484375, -0.394866943359375, -0.379638671875, -0.364410400390625, -0.34918212890625, -0.333953857421875, -0.3187255859375, -0.303497314453125, -0.28826904296875, -0.273040771484375, -0.2578125, -0.242584228515625, -0.22735595703125, -0.212127685546875, -0.1968994140625, -0.181671142578125, -0.16644287109375, -0.151214599609375, -0.135986328125, -0.120758056640625, -0.10552978515625, -0.090301513671875, -0.0750732421875, -0.059844970703125, -0.04461669921875, -0.029388427734375, -0.01416015625, 0.001068115234375, 0.01629638671875, 0.031524658203125, 0.0467529296875, 0.061981201171875, 0.07720947265625, 0.092437744140625, 0.107666015625, 0.122894287109375, 0.13812255859375, 0.153350830078125, 0.1685791015625, 0.183807373046875, 0.19903564453125, 0.214263916015625, 0.2294921875, 0.244720458984375, 0.25994873046875, 0.275177001953125, 0.2904052734375, 0.305633544921875, 0.32086181640625, 0.336090087890625, 0.351318359375, 0.366546630859375, 0.38177490234375, 0.397003173828125, 0.4122314453125, 0.427459716796875, 0.44268798828125, 0.457916259765625, 0.47314453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 9.0, 8.0, 15.0, 27.0, 33.0, 59.0, 62.0, 101.0, 162.0, 237.0, 320.0, 523.0, 699.0, 1138.0, 1669.0, 2628.0, 4105.0, 6890.0, 12279.0, 25992.0, 109124.0, 1762356.0, 111396.0, 26070.0, 12509.0, 7015.0, 4097.0, 2546.0, 1620.0, 1109.0, 737.0, 510.0, 358.0, 238.0, 156.0, 100.0, 68.0, 57.0, 34.0, 23.0, 23.0, 9.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1446533203125, -0.14046096801757812, -0.13626861572265625, -0.13207626342773438, -0.1278839111328125, -0.12369155883789062, -0.11949920654296875, -0.11530685424804688, -0.111114501953125, -0.10692214965820312, -0.10272979736328125, -0.09853744506835938, -0.0943450927734375, -0.09015274047851562, -0.08596038818359375, -0.08176803588867188, -0.07757568359375, -0.07338333129882812, -0.06919097900390625, -0.06499862670898438, -0.0608062744140625, -0.056613922119140625, -0.05242156982421875, -0.048229217529296875, -0.044036865234375, -0.039844512939453125, -0.03565216064453125, -0.031459808349609375, -0.0272674560546875, -0.023075103759765625, -0.01888275146484375, -0.014690399169921875, -0.010498046875, -0.006305694580078125, -0.00211334228515625, 0.002079010009765625, 0.0062713623046875, 0.010463714599609375, 0.01465606689453125, 0.018848419189453125, 0.023040771484375, 0.027233123779296875, 0.03142547607421875, 0.035617828369140625, 0.0398101806640625, 0.044002532958984375, 0.04819488525390625, 0.052387237548828125, 0.05657958984375, 0.060771942138671875, 0.06496429443359375, 0.06915664672851562, 0.0733489990234375, 0.07754135131835938, 0.08173370361328125, 0.08592605590820312, 0.090118408203125, 0.09431076049804688, 0.09850311279296875, 0.10269546508789062, 0.1068878173828125, 0.11108016967773438, 0.11527252197265625, 0.11946487426757812, 0.1236572265625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 0.0, 7.0, 9.0, 7.0, 11.0, 7.0, 10.0, 9.0, 10.0, 19.0, 17.0, 25.0, 23.0, 31.0, 25.0, 35.0, 31.0, 27.0, 41.0, 33.0, 37.0, 35.0, 37.0, 29.0, 42.0, 34.0, 38.0, 30.0, 39.0, 36.0, 29.0, 30.0, 28.0, 20.0, 21.0, 13.0, 20.0, 17.0, 15.0, 17.0, 8.0, 11.0, 7.0, 12.0, 2.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.00689697265625, -0.006680786609649658, -0.006464600563049316, -0.006248414516448975, -0.006032228469848633, -0.005816042423248291, -0.005599856376647949, -0.005383670330047607, -0.005167484283447266, -0.004951298236846924, -0.004735112190246582, -0.00451892614364624, -0.0043027400970458984, -0.004086554050445557, -0.003870368003845215, -0.003654181957244873, -0.0034379959106445312, -0.0032218098640441895, -0.0030056238174438477, -0.002789437770843506, -0.002573251724243164, -0.0023570656776428223, -0.0021408796310424805, -0.0019246935844421387, -0.0017085075378417969, -0.001492321491241455, -0.0012761354446411133, -0.0010599493980407715, -0.0008437633514404297, -0.0006275773048400879, -0.0004113912582397461, -0.0001952052116394043, 2.09808349609375e-05, 0.0002371668815612793, 0.0004533529281616211, 0.0006695389747619629, 0.0008857250213623047, 0.0011019110679626465, 0.0013180971145629883, 0.00153428316116333, 0.0017504692077636719, 0.0019666552543640137, 0.0021828413009643555, 0.0023990273475646973, 0.002615213394165039, 0.002831399440765381, 0.0030475854873657227, 0.0032637715339660645, 0.0034799575805664062, 0.003696143627166748, 0.00391232967376709, 0.004128515720367432, 0.0043447017669677734, 0.004560887813568115, 0.004777073860168457, 0.004993259906768799, 0.005209445953369141, 0.005425631999969482, 0.005641818046569824, 0.005858004093170166, 0.006074190139770508, 0.00629037618637085, 0.006506562232971191, 0.006722748279571533, 0.006938934326171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 14.0, 5.0, 14.0, 13.0, 13.0, 21.0, 13.0, 22.0, 13.0, 30.0, 32.0, 38.0, 69.0, 72.0, 109.0, 119.0, 197.0, 328.0, 813.0, 15694.0, 1019939.0, 9238.0, 676.0, 299.0, 180.0, 127.0, 89.0, 76.0, 58.0, 43.0, 30.0, 27.0, 22.0, 19.0, 15.0, 11.0, 12.0, 5.0, 11.0, 10.0, 8.0, 4.0, 5.0, 0.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13591766357421875, -0.1314544677734375, -0.12699127197265625, -0.122528076171875, -0.11806488037109375, -0.1136016845703125, -0.10913848876953125, -0.10467529296875, -0.10021209716796875, -0.0957489013671875, -0.09128570556640625, -0.086822509765625, -0.08235931396484375, -0.0778961181640625, -0.07343292236328125, -0.0689697265625, -0.06450653076171875, -0.0600433349609375, -0.05558013916015625, -0.051116943359375, -0.04665374755859375, -0.0421905517578125, -0.03772735595703125, -0.03326416015625, -0.02880096435546875, -0.0243377685546875, -0.01987457275390625, -0.015411376953125, -0.01094818115234375, -0.0064849853515625, -0.00202178955078125, 0.00244140625, 0.00690460205078125, 0.0113677978515625, 0.01583099365234375, 0.020294189453125, 0.02475738525390625, 0.0292205810546875, 0.03368377685546875, 0.03814697265625, 0.04261016845703125, 0.0470733642578125, 0.05153656005859375, 0.055999755859375, 0.06046295166015625, 0.0649261474609375, 0.06938934326171875, 0.0738525390625, 0.07831573486328125, 0.0827789306640625, 0.08724212646484375, 0.091705322265625, 0.09616851806640625, 0.1006317138671875, 0.10509490966796875, 0.10955810546875, 0.11402130126953125, 0.1184844970703125, 0.12294769287109375, 0.127410888671875, 0.13187408447265625, 0.1363372802734375, 0.14080047607421875, 0.145263671875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 28.0, 815.0, 170.0], "bins": [-0.2968924641609192, -0.29216238856315613, -0.2874322831630707, -0.2827022075653076, -0.27797213196754456, -0.2732420563697815, -0.26851195096969604, -0.263781875371933, -0.2590517997741699, -0.25432172417640686, -0.2495916336774826, -0.24486154317855835, -0.2401314675807953, -0.23540137708187103, -0.23067128658294678, -0.22594121098518372, -0.22121110558509827, -0.216481015086174, -0.21175093948841095, -0.2070208489894867, -0.20229077339172363, -0.19756068289279938, -0.19283059239387512, -0.18810051679611206, -0.183370441198349, -0.17864035069942474, -0.17391027510166168, -0.16918018460273743, -0.16445010900497437, -0.1597200185060501, -0.15498992800712585, -0.1502598524093628, -0.14552976191043854, -0.14079967141151428, -0.13606959581375122, -0.13133950531482697, -0.1266094297170639, -0.12187933921813965, -0.11714925616979599, -0.11241917312145233, -0.10768908262252808, -0.10295899957418442, -0.09822891652584076, -0.0934988260269165, -0.08876874297857285, -0.08403865993022919, -0.07930857688188553, -0.07457849383354187, -0.06984841078519821, -0.06511832773685455, -0.060388240963220596, -0.05565815791487694, -0.05092807114124298, -0.04619798809289932, -0.041467905044555664, -0.03673781827092171, -0.03200773522257805, -0.02727765031158924, -0.022547565400600433, -0.017817482352256775, -0.013087397441267967, -0.00835731253027916, -0.003627229481935501, 0.0011028572916984558, 0.0058329408057034016]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 15.0, 26.0, 25.0, 31.0, 31.0, 36.0, 42.0, 35.0, 51.0, 54.0, 46.0, 49.0, 51.0, 63.0, 54.0, 54.0, 44.0, 46.0, 48.0, 33.0, 19.0, 21.0, 21.0, 23.0, 10.0, 20.0, 7.0, 10.0, 7.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0325319766998291, -0.0316428542137146, -0.030753733590245247, -0.029864612966775894, -0.028975490480661392, -0.02808636799454689, -0.027197247371077538, -0.026308126747608185, -0.025419004261493683, -0.02452988177537918, -0.023640761151909828, -0.022751640528440475, -0.021862518042325974, -0.02097339555621147, -0.02008427493274212, -0.019195154309272766, -0.018306031823158264, -0.017416909337043762, -0.01652778871357441, -0.015638668090105057, -0.014749545603990555, -0.013860424049198627, -0.0129713024944067, -0.012082180939614773, -0.011193059384822845, -0.010303937830030918, -0.00941481627523899, -0.008525694720447063, -0.007636573165655136, -0.006747451610863209, -0.005858330056071281, -0.004969208501279354, -0.004080086946487427, -0.0031909653916954994, -0.002301843836903572, -0.0014127222821116447, -0.0005236007273197174, 0.00036552082747220993, 0.0012546423822641373, 0.0021437639370560646, 0.003032885491847992, 0.003922007046639919, 0.004811128601431847, 0.005700250156223774, 0.006589371711015701, 0.007478493265807629, 0.008367614820599556, 0.009256736375391483, 0.01014585793018341, 0.011034979484975338, 0.011924101039767265, 0.012813222594559193, 0.01370234414935112, 0.014591465704143047, 0.015480587258934975, 0.016369707882404327, 0.01725883036851883, 0.01814795285463333, 0.019037073478102684, 0.019926194101572037, 0.02081531658768654, 0.02170443907380104, 0.022593559697270393, 0.023482680320739746, 0.024371802806854248]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 3.0, 7.0, 8.0, 5.0, 11.0, 16.0, 10.0, 14.0, 13.0, 22.0, 14.0, 26.0, 23.0, 25.0, 23.0, 33.0, 41.0, 46.0, 31.0, 33.0, 40.0, 44.0, 29.0, 34.0, 28.0, 19.0, 32.0, 37.0, 35.0, 45.0, 37.0, 26.0, 25.0, 25.0, 17.0, 24.0, 18.0, 13.0, 9.0, 14.0, 6.0, 13.0, 2.0, 6.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.53125, -0.5147552490234375, -0.498260498046875, -0.4817657470703125, -0.46527099609375, -0.4487762451171875, -0.432281494140625, -0.4157867431640625, -0.3992919921875, -0.3827972412109375, -0.366302490234375, -0.3498077392578125, -0.33331298828125, -0.3168182373046875, -0.300323486328125, -0.2838287353515625, -0.267333984375, -0.2508392333984375, -0.234344482421875, -0.2178497314453125, -0.20135498046875, -0.1848602294921875, -0.168365478515625, -0.1518707275390625, -0.1353759765625, -0.1188812255859375, -0.102386474609375, -0.0858917236328125, -0.06939697265625, -0.0529022216796875, -0.036407470703125, -0.0199127197265625, -0.00341796875, 0.0130767822265625, 0.029571533203125, 0.0460662841796875, 0.06256103515625, 0.0790557861328125, 0.095550537109375, 0.1120452880859375, 0.1285400390625, 0.1450347900390625, 0.161529541015625, 0.1780242919921875, 0.19451904296875, 0.2110137939453125, 0.227508544921875, 0.2440032958984375, 0.260498046875, 0.2769927978515625, 0.293487548828125, 0.3099822998046875, 0.32647705078125, 0.3429718017578125, 0.359466552734375, 0.3759613037109375, 0.3924560546875, 0.4089508056640625, 0.425445556640625, 0.4419403076171875, 0.45843505859375, 0.4749298095703125, 0.491424560546875, 0.5079193115234375, 0.5244140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 18.0, 17.0, 36.0, 44.0, 67.0, 101.0, 121.0, 202.0, 230.0, 365.0, 498.0, 781.0, 1126.0, 1719.0, 2574.0, 3986.0, 6444.0, 10211.0, 17359.0, 31209.0, 59240.0, 118316.0, 220851.0, 252543.0, 150509.0, 75723.0, 39153.0, 21471.0, 12314.0, 7449.0, 4605.0, 3055.0, 2064.0, 1313.0, 850.0, 617.0, 413.0, 282.0, 192.0, 136.0, 105.0, 55.0, 44.0, 39.0, 28.0, 15.0, 13.0, 12.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.61572265625, -0.596588134765625, -0.57745361328125, -0.558319091796875, -0.5391845703125, -0.520050048828125, -0.50091552734375, -0.481781005859375, -0.462646484375, -0.443511962890625, -0.42437744140625, -0.405242919921875, -0.3861083984375, -0.366973876953125, -0.34783935546875, -0.328704833984375, -0.3095703125, -0.290435791015625, -0.27130126953125, -0.252166748046875, -0.2330322265625, -0.213897705078125, -0.19476318359375, -0.175628662109375, -0.156494140625, -0.137359619140625, -0.11822509765625, -0.099090576171875, -0.0799560546875, -0.060821533203125, -0.04168701171875, -0.022552490234375, -0.00341796875, 0.015716552734375, 0.03485107421875, 0.053985595703125, 0.0731201171875, 0.092254638671875, 0.11138916015625, 0.130523681640625, 0.149658203125, 0.168792724609375, 0.18792724609375, 0.207061767578125, 0.2261962890625, 0.245330810546875, 0.26446533203125, 0.283599853515625, 0.302734375, 0.321868896484375, 0.34100341796875, 0.360137939453125, 0.3792724609375, 0.398406982421875, 0.41754150390625, 0.436676025390625, 0.455810546875, 0.474945068359375, 0.49407958984375, 0.513214111328125, 0.5323486328125, 0.551483154296875, 0.57061767578125, 0.589752197265625, 0.60888671875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 3.0, 22.0, 8.0, 11.0, 13.0, 13.0, 13.0, 32.0, 29.0, 29.0, 39.0, 42.0, 59.0, 81.0, 114.0, 175.0, 285.0, 1299.0, 184.0, 134.0, 83.0, 60.0, 51.0, 35.0, 36.0, 26.0, 31.0, 19.0, 20.0, 22.0, 14.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9267578125, -1.8685302734375, -1.810302734375, -1.7520751953125, -1.69384765625, -1.6356201171875, -1.577392578125, -1.5191650390625, -1.4609375, -1.4027099609375, -1.344482421875, -1.2862548828125, -1.22802734375, -1.1697998046875, -1.111572265625, -1.0533447265625, -0.9951171875, -0.9368896484375, -0.878662109375, -0.8204345703125, -0.76220703125, -0.7039794921875, -0.645751953125, -0.5875244140625, -0.529296875, -0.4710693359375, -0.412841796875, -0.3546142578125, -0.29638671875, -0.2381591796875, -0.179931640625, -0.1217041015625, -0.0634765625, -0.0052490234375, 0.052978515625, 0.1112060546875, 0.16943359375, 0.2276611328125, 0.285888671875, 0.3441162109375, 0.40234375, 0.4605712890625, 0.518798828125, 0.5770263671875, 0.63525390625, 0.6934814453125, 0.751708984375, 0.8099365234375, 0.8681640625, 0.9263916015625, 0.984619140625, 1.0428466796875, 1.10107421875, 1.1593017578125, 1.217529296875, 1.2757568359375, 1.333984375, 1.3922119140625, 1.450439453125, 1.5086669921875, 1.56689453125, 1.6251220703125, 1.683349609375, 1.7415771484375, 1.7998046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 4.0, 8.0, 8.0, 11.0, 12.0, 25.0, 25.0, 40.0, 46.0, 48.0, 72.0, 123.0, 141.0, 234.0, 458.0, 1074.0, 3685.0, 17659.0, 159829.0, 2418918.0, 498145.0, 35704.0, 6223.0, 1643.0, 618.0, 283.0, 198.0, 121.0, 94.0, 72.0, 32.0, 28.0, 26.0, 21.0, 20.0, 7.0, 16.0, 7.0, 5.0, 4.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.24468994140625, -2.1690673828125, -2.09344482421875, -2.017822265625, -1.94219970703125, -1.8665771484375, -1.79095458984375, -1.71533203125, -1.63970947265625, -1.5640869140625, -1.48846435546875, -1.412841796875, -1.33721923828125, -1.2615966796875, -1.18597412109375, -1.1103515625, -1.03472900390625, -0.9591064453125, -0.88348388671875, -0.807861328125, -0.73223876953125, -0.6566162109375, -0.58099365234375, -0.50537109375, -0.42974853515625, -0.3541259765625, -0.27850341796875, -0.202880859375, -0.12725830078125, -0.0516357421875, 0.02398681640625, 0.099609375, 0.17523193359375, 0.2508544921875, 0.32647705078125, 0.402099609375, 0.47772216796875, 0.5533447265625, 0.62896728515625, 0.70458984375, 0.78021240234375, 0.8558349609375, 0.93145751953125, 1.007080078125, 1.08270263671875, 1.1583251953125, 1.23394775390625, 1.3095703125, 1.38519287109375, 1.4608154296875, 1.53643798828125, 1.612060546875, 1.68768310546875, 1.7633056640625, 1.83892822265625, 1.91455078125, 1.99017333984375, 2.0657958984375, 2.14141845703125, 2.217041015625, 2.29266357421875, 2.3682861328125, 2.44390869140625, 2.51953125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 29.0, 120.0, 300.0, 344.0, 160.0, 44.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.600311279296875, -5.230874061584473, -4.8614373207092285, -4.492000102996826, -4.122562885284424, -3.7531259059906006, -3.3836889266967773, -3.014251708984375, -2.6448147296905518, -2.2753777503967285, -1.9059405326843262, -1.536503553390503, -1.1670664548873901, -0.7976293563842773, -0.4281923770904541, -0.05875515937805176, 0.3106818199157715, 0.6801189184188843, 1.049556016921997, 1.4189929962158203, 1.788430094718933, 2.157867193222046, 2.527304172515869, 2.8967413902282715, 3.2661783695220947, 3.635615348815918, 4.00505256652832, 4.374489784240723, 4.743926525115967, 5.113363742828369, 5.482800483703613, 5.852237701416016, 6.221674919128418, 6.59111213684082, 6.9605488777160645, 7.329986095428467, 7.699423313140869, 8.068860054016113, 8.438297271728516, 8.807734489440918, 9.17717170715332, 9.546608924865723, 9.916046142578125, 10.285482406616211, 10.654919624328613, 11.024356842041016, 11.393794059753418, 11.76323127746582, 12.132667541503906, 12.502104759216309, 12.871541976928711, 13.240978240966797, 13.6104154586792, 13.979852676391602, 14.349289894104004, 14.718727111816406, 15.088164329528809, 15.457601547241211, 15.827038764953613, 16.196475982666016, 16.5659122467041, 16.93535041809082, 17.304786682128906, 17.674224853515625, 18.04366111755371]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 13.0, 9.0, 10.0, 10.0, 10.0, 12.0, 25.0, 17.0, 16.0, 37.0, 30.0, 22.0, 30.0, 30.0, 26.0, 40.0, 37.0, 42.0, 40.0, 43.0, 32.0, 35.0, 25.0, 42.0, 37.0, 37.0, 37.0, 22.0, 41.0, 25.0, 22.0, 18.0, 21.0, 17.0, 12.0, 16.0, 10.0, 9.0, 5.0, 12.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.332038879394531, -4.194317817687988, -4.056596755981445, -3.9188759326934814, -3.7811548709869385, -3.6434340476989746, -3.5057129859924316, -3.3679919242858887, -3.2302708625793457, -3.0925498008728027, -2.954828977584839, -2.817107915878296, -2.679386854171753, -2.541666030883789, -2.403944969177246, -2.266223907470703, -2.1285030841827393, -1.9907821416854858, -1.8530610799789429, -1.7153401374816895, -1.5776190757751465, -1.439898133277893, -1.3021771907806396, -1.1644561290740967, -1.0267351865768433, -0.8890141844749451, -0.7512931823730469, -0.6135722398757935, -0.47585123777389526, -0.33813023567199707, -0.20040929317474365, -0.06268829107284546, 0.07503271102905273, 0.21275369822978973, 0.35047468543052673, 0.48819565773010254, 0.6259166598320007, 0.7636376619338989, 0.9013586044311523, 1.0390796661376953, 1.1768006086349487, 1.3145215511322021, 1.4522426128387451, 1.5899635553359985, 1.727684497833252, 1.865405559539795, 2.003126621246338, 2.1408474445343018, 2.2785685062408447, 2.4162895679473877, 2.5540103912353516, 2.6917314529418945, 2.8294525146484375, 2.9671735763549805, 3.1048943996429443, 3.2426154613494873, 3.380336284637451, 3.518057346343994, 3.655778169631958, 3.793499231338501, 3.931220293045044, 4.068941116333008, 4.206662178039551, 4.344383239746094, 4.482104301452637]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 5.0, 9.0, 6.0, 9.0, 17.0, 14.0, 19.0, 17.0, 31.0, 21.0, 32.0, 28.0, 28.0, 32.0, 29.0, 35.0, 33.0, 47.0, 42.0, 28.0, 33.0, 40.0, 40.0, 42.0, 43.0, 32.0, 27.0, 28.0, 35.0, 21.0, 25.0, 20.0, 26.0, 21.0, 23.0, 10.0, 6.0, 4.0, 4.0, 3.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.55859375, -0.540985107421875, -0.52337646484375, -0.505767822265625, -0.4881591796875, -0.470550537109375, -0.45294189453125, -0.435333251953125, -0.417724609375, -0.400115966796875, -0.38250732421875, -0.364898681640625, -0.3472900390625, -0.329681396484375, -0.31207275390625, -0.294464111328125, -0.27685546875, -0.259246826171875, -0.24163818359375, -0.224029541015625, -0.2064208984375, -0.188812255859375, -0.17120361328125, -0.153594970703125, -0.135986328125, -0.118377685546875, -0.10076904296875, -0.083160400390625, -0.0655517578125, -0.047943115234375, -0.03033447265625, -0.012725830078125, 0.0048828125, 0.022491455078125, 0.04010009765625, 0.057708740234375, 0.0753173828125, 0.092926025390625, 0.11053466796875, 0.128143310546875, 0.145751953125, 0.163360595703125, 0.18096923828125, 0.198577880859375, 0.2161865234375, 0.233795166015625, 0.25140380859375, 0.269012451171875, 0.28662109375, 0.304229736328125, 0.32183837890625, 0.339447021484375, 0.3570556640625, 0.374664306640625, 0.39227294921875, 0.409881591796875, 0.427490234375, 0.445098876953125, 0.46270751953125, 0.480316162109375, 0.4979248046875, 0.515533447265625, 0.53314208984375, 0.550750732421875, 0.568359375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 17.0, 11.0, 23.0, 21.0, 47.0, 39.0, 55.0, 87.0, 123.0, 140.0, 211.0, 265.0, 342.0, 498.0, 740.0, 1071.0, 1648.0, 2614.0, 4270.0, 7726.0, 15178.0, 34508.0, 106124.0, 472766.0, 2097479.0, 1118060.0, 221284.0, 60205.0, 22863.0, 10807.0, 5702.0, 3310.0, 1996.0, 1191.0, 877.0, 542.0, 386.0, 318.0, 202.0, 156.0, 84.0, 75.0, 56.0, 40.0, 43.0, 23.0, 23.0, 3.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0380859375, -1.0063934326171875, -0.974700927734375, -0.9430084228515625, -0.91131591796875, -0.8796234130859375, -0.847930908203125, -0.8162384033203125, -0.7845458984375, -0.7528533935546875, -0.721160888671875, -0.6894683837890625, -0.65777587890625, -0.6260833740234375, -0.594390869140625, -0.5626983642578125, -0.531005859375, -0.4993133544921875, -0.467620849609375, -0.4359283447265625, -0.40423583984375, -0.3725433349609375, -0.340850830078125, -0.3091583251953125, -0.2774658203125, -0.2457733154296875, -0.214080810546875, -0.1823883056640625, -0.15069580078125, -0.1190032958984375, -0.087310791015625, -0.0556182861328125, -0.02392578125, 0.0077667236328125, 0.039459228515625, 0.0711517333984375, 0.10284423828125, 0.1345367431640625, 0.166229248046875, 0.1979217529296875, 0.2296142578125, 0.2613067626953125, 0.292999267578125, 0.3246917724609375, 0.35638427734375, 0.3880767822265625, 0.419769287109375, 0.4514617919921875, 0.483154296875, 0.5148468017578125, 0.546539306640625, 0.5782318115234375, 0.60992431640625, 0.6416168212890625, 0.673309326171875, 0.7050018310546875, 0.7366943359375, 0.7683868408203125, 0.800079345703125, 0.8317718505859375, 0.86346435546875, 0.8951568603515625, 0.926849365234375, 0.9585418701171875, 0.990234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 13.0, 8.0, 13.0, 18.0, 32.0, 37.0, 36.0, 83.0, 97.0, 141.0, 213.0, 361.0, 539.0, 717.0, 602.0, 405.0, 233.0, 148.0, 95.0, 81.0, 55.0, 33.0, 23.0, 20.0, 12.0, 8.0, 10.0, 2.0, 7.0, 5.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2226104736328125, -1.182525634765625, -1.1424407958984375, -1.10235595703125, -1.0622711181640625, -1.022186279296875, -0.9821014404296875, -0.9420166015625, -0.9019317626953125, -0.861846923828125, -0.8217620849609375, -0.78167724609375, -0.7415924072265625, -0.701507568359375, -0.6614227294921875, -0.621337890625, -0.5812530517578125, -0.541168212890625, -0.5010833740234375, -0.46099853515625, -0.4209136962890625, -0.380828857421875, -0.3407440185546875, -0.3006591796875, -0.2605743408203125, -0.220489501953125, -0.1804046630859375, -0.14031982421875, -0.1002349853515625, -0.060150146484375, -0.0200653076171875, 0.02001953125, 0.0601043701171875, 0.100189208984375, 0.1402740478515625, 0.18035888671875, 0.2204437255859375, 0.260528564453125, 0.3006134033203125, 0.3406982421875, 0.3807830810546875, 0.420867919921875, 0.4609527587890625, 0.50103759765625, 0.5411224365234375, 0.581207275390625, 0.6212921142578125, 0.661376953125, 0.7014617919921875, 0.741546630859375, 0.7816314697265625, 0.82171630859375, 0.8618011474609375, 0.901885986328125, 0.9419708251953125, 0.9820556640625, 1.0221405029296875, 1.062225341796875, 1.1023101806640625, 1.14239501953125, 1.1824798583984375, 1.222564697265625, 1.2626495361328125, 1.302734375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 3.0, 7.0, 10.0, 14.0, 13.0, 24.0, 28.0, 52.0, 91.0, 174.0, 321.0, 658.0, 1577.0, 4756.0, 22948.0, 336649.0, 3651541.0, 154327.0, 14895.0, 3673.0, 1337.0, 539.0, 270.0, 125.0, 65.0, 65.0, 34.0, 22.0, 16.0, 8.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.98248291015625, -3.8555908203125, -3.72869873046875, -3.601806640625, -3.47491455078125, -3.3480224609375, -3.22113037109375, -3.09423828125, -2.96734619140625, -2.8404541015625, -2.71356201171875, -2.586669921875, -2.45977783203125, -2.3328857421875, -2.20599365234375, -2.0791015625, -1.95220947265625, -1.8253173828125, -1.69842529296875, -1.571533203125, -1.44464111328125, -1.3177490234375, -1.19085693359375, -1.06396484375, -0.93707275390625, -0.8101806640625, -0.68328857421875, -0.556396484375, -0.42950439453125, -0.3026123046875, -0.17572021484375, -0.048828125, 0.07806396484375, 0.2049560546875, 0.33184814453125, 0.458740234375, 0.58563232421875, 0.7125244140625, 0.83941650390625, 0.96630859375, 1.09320068359375, 1.2200927734375, 1.34698486328125, 1.473876953125, 1.60076904296875, 1.7276611328125, 1.85455322265625, 1.9814453125, 2.10833740234375, 2.2352294921875, 2.36212158203125, 2.489013671875, 2.61590576171875, 2.7427978515625, 2.86968994140625, 2.99658203125, 3.12347412109375, 3.2503662109375, 3.37725830078125, 3.504150390625, 3.63104248046875, 3.7579345703125, 3.88482666015625, 4.01171875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 31.0, 187.0, 501.0, 240.0, 45.0, 5.0, 2.0, 3.0], "bins": [-49.20568084716797, -48.3653450012207, -47.52500534057617, -46.684669494628906, -45.84433364868164, -45.003997802734375, -44.163658142089844, -43.32332229614258, -42.48298645019531, -41.64265060424805, -40.802310943603516, -39.96197509765625, -39.121639251708984, -38.28130340576172, -37.44096374511719, -36.60062789916992, -35.760292053222656, -34.91995620727539, -34.07961654663086, -33.239280700683594, -32.39894485473633, -31.55860710144043, -30.71826934814453, -29.877933502197266, -29.037593841552734, -28.197256088256836, -27.35692024230957, -26.516582489013672, -25.676246643066406, -24.835908889770508, -23.99557113647461, -23.155235290527344, -22.314899444580078, -21.47456169128418, -20.634225845336914, -19.793888092041016, -18.95355224609375, -18.11321449279785, -17.272876739501953, -16.432540893554688, -15.592205047607422, -14.75186824798584, -13.911531448364258, -13.07119369506836, -12.230857849121094, -11.390520095825195, -10.550183296203613, -9.709846496582031, -8.86950969696045, -8.029172897338867, -7.188836097717285, -6.348498821258545, -5.508162021636963, -4.667825222015381, -3.8274879455566406, -2.9871511459350586, -2.1468143463134766, -1.306477427482605, -0.4661405086517334, 0.37419652938842773, 1.2145333290100098, 2.054870128631592, 2.895207405090332, 3.735544204711914, 4.575881004333496]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 3.0, 11.0, 9.0, 15.0, 13.0, 7.0, 17.0, 21.0, 21.0, 34.0, 30.0, 27.0, 38.0, 42.0, 44.0, 50.0, 45.0, 44.0, 41.0, 48.0, 47.0, 33.0, 32.0, 44.0, 39.0, 39.0, 29.0, 34.0, 26.0, 25.0, 13.0, 13.0, 13.0, 9.0, 12.0, 10.0, 8.0, 5.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8542869091033936, -3.723174810409546, -3.5920629501342773, -3.4609508514404297, -3.329838991165161, -3.1987268924713135, -3.067615032196045, -2.9365029335021973, -2.8053908348083496, -2.674278736114502, -2.5431668758392334, -2.4120547771453857, -2.280942916870117, -2.1498308181762695, -2.018718719482422, -1.8876068592071533, -1.7564949989318848, -1.6253830194473267, -1.4942710399627686, -1.363158941268921, -1.2320470809936523, -1.1009349822998047, -0.9698230028152466, -0.8387110233306885, -0.7075990438461304, -0.5764870643615723, -0.4453750550746918, -0.3142630457878113, -0.18315106630325317, -0.05203908681869507, 0.07907295227050781, 0.21018493175506592, 0.3412966728210449, 0.472408652305603, 0.6035206317901611, 0.734632670879364, 0.8657446503639221, 0.9968566298484802, 1.127968668937683, 1.2590806484222412, 1.3901926279067993, 1.5213046073913574, 1.6524165868759155, 1.7835285663604736, 1.9146406650543213, 2.04575252532959, 2.1768646240234375, 2.307976722717285, 2.4390885829925537, 2.5702006816864014, 2.70131254196167, 2.8324246406555176, 2.963536500930786, 3.094648599624634, 3.2257604598999023, 3.35687255859375, 3.4879846572875977, 3.6190967559814453, 3.750208616256714, 3.8813207149505615, 4.01243257522583, 4.143544673919678, 4.274656772613525, 4.405768394470215, 4.5368804931640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 11.0, 17.0, 12.0, 16.0, 26.0, 18.0, 28.0, 25.0, 29.0, 40.0, 35.0, 47.0, 37.0, 37.0, 32.0, 45.0, 44.0, 40.0, 46.0, 53.0, 30.0, 30.0, 43.0, 31.0, 39.0, 31.0, 20.0, 27.0, 13.0, 17.0, 9.0, 10.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5647201538085938, -0.5444793701171875, -0.5242385864257812, -0.503997802734375, -0.48375701904296875, -0.4635162353515625, -0.44327545166015625, -0.42303466796875, -0.40279388427734375, -0.3825531005859375, -0.36231231689453125, -0.342071533203125, -0.32183074951171875, -0.3015899658203125, -0.28134918212890625, -0.2611083984375, -0.24086761474609375, -0.2206268310546875, -0.20038604736328125, -0.180145263671875, -0.15990447998046875, -0.1396636962890625, -0.11942291259765625, -0.09918212890625, -0.07894134521484375, -0.0587005615234375, -0.03845977783203125, -0.018218994140625, 0.00202178955078125, 0.0222625732421875, 0.04250335693359375, 0.062744140625, 0.08298492431640625, 0.1032257080078125, 0.12346649169921875, 0.143707275390625, 0.16394805908203125, 0.1841888427734375, 0.20442962646484375, 0.22467041015625, 0.24491119384765625, 0.2651519775390625, 0.28539276123046875, 0.305633544921875, 0.32587432861328125, 0.3461151123046875, 0.36635589599609375, 0.3865966796875, 0.40683746337890625, 0.4270782470703125, 0.44731903076171875, 0.467559814453125, 0.48780059814453125, 0.5080413818359375, 0.5282821655273438, 0.54852294921875, 0.5687637329101562, 0.5890045166015625, 0.6092453002929688, 0.629486083984375, 0.6497268676757812, 0.6699676513671875, 0.6902084350585938, 0.71044921875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 10.0, 6.0, 10.0, 18.0, 14.0, 31.0, 45.0, 48.0, 81.0, 150.0, 217.0, 303.0, 433.0, 623.0, 998.0, 1494.0, 2360.0, 3686.0, 5875.0, 9301.0, 15324.0, 25142.0, 44294.0, 77796.0, 138604.0, 210869.0, 204417.0, 129627.0, 72998.0, 41383.0, 23699.0, 14501.0, 8835.0, 5422.0, 3496.0, 2206.0, 1444.0, 956.0, 608.0, 393.0, 262.0, 187.0, 112.0, 83.0, 70.0, 45.0, 26.0, 21.0, 11.0, 8.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06964111328125, -0.06731510162353516, -0.06498908996582031, -0.06266307830810547, -0.060337066650390625, -0.05801105499267578, -0.05568504333496094, -0.053359031677246094, -0.05103302001953125, -0.048707008361816406, -0.04638099670410156, -0.04405498504638672, -0.041728973388671875, -0.03940296173095703, -0.03707695007324219, -0.034750938415527344, -0.0324249267578125, -0.030098915100097656, -0.027772903442382812, -0.02544689178466797, -0.023120880126953125, -0.02079486846923828, -0.018468856811523438, -0.016142845153808594, -0.01381683349609375, -0.011490821838378906, -0.009164810180664062, -0.006838798522949219, -0.004512786865234375, -0.0021867752075195312, 0.0001392364501953125, 0.0024652481079101562, 0.004791259765625, 0.007117271423339844, 0.009443283081054688, 0.011769294738769531, 0.014095306396484375, 0.01642131805419922, 0.018747329711914062, 0.021073341369628906, 0.02339935302734375, 0.025725364685058594, 0.028051376342773438, 0.03037738800048828, 0.032703399658203125, 0.03502941131591797, 0.03735542297363281, 0.039681434631347656, 0.0420074462890625, 0.044333457946777344, 0.04665946960449219, 0.04898548126220703, 0.051311492919921875, 0.05363750457763672, 0.05596351623535156, 0.058289527893066406, 0.06061553955078125, 0.0629415512084961, 0.06526756286621094, 0.06759357452392578, 0.06991958618164062, 0.07224559783935547, 0.07457160949707031, 0.07689762115478516, 0.0792236328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 4.0, 8.0, 12.0, 15.0, 13.0, 11.0, 13.0, 16.0, 26.0, 28.0, 27.0, 34.0, 23.0, 21.0, 29.0, 39.0, 28.0, 36.0, 40.0, 1065.0, 39.0, 45.0, 32.0, 39.0, 39.0, 32.0, 33.0, 31.0, 29.0, 34.0, 22.0, 29.0, 15.0, 20.0, 8.0, 9.0, 16.0, 10.0, 7.0, 5.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43701171875, -0.42236328125, -0.40771484375, -0.39306640625, -0.37841796875, -0.36376953125, -0.34912109375, -0.33447265625, -0.31982421875, -0.30517578125, -0.29052734375, -0.27587890625, -0.26123046875, -0.24658203125, -0.23193359375, -0.21728515625, -0.20263671875, -0.18798828125, -0.17333984375, -0.15869140625, -0.14404296875, -0.12939453125, -0.11474609375, -0.10009765625, -0.08544921875, -0.07080078125, -0.05615234375, -0.04150390625, -0.02685546875, -0.01220703125, 0.00244140625, 0.01708984375, 0.03173828125, 0.04638671875, 0.06103515625, 0.07568359375, 0.09033203125, 0.10498046875, 0.11962890625, 0.13427734375, 0.14892578125, 0.16357421875, 0.17822265625, 0.19287109375, 0.20751953125, 0.22216796875, 0.23681640625, 0.25146484375, 0.26611328125, 0.28076171875, 0.29541015625, 0.31005859375, 0.32470703125, 0.33935546875, 0.35400390625, 0.36865234375, 0.38330078125, 0.39794921875, 0.41259765625, 0.42724609375, 0.44189453125, 0.45654296875, 0.47119140625, 0.48583984375, 0.50048828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 15.0, 27.0, 22.0, 46.0, 58.0, 81.0, 105.0, 142.0, 261.0, 307.0, 482.0, 709.0, 972.0, 1482.0, 2219.0, 3429.0, 5378.0, 8826.0, 15889.0, 37677.0, 277440.0, 1631703.0, 60613.0, 20529.0, 10584.0, 6265.0, 3917.0, 2500.0, 1722.0, 1163.0, 804.0, 523.0, 376.0, 233.0, 212.0, 103.0, 86.0, 74.0, 29.0, 34.0, 27.0, 15.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1395263671875, -0.13544368743896484, -0.1313610076904297, -0.12727832794189453, -0.12319564819335938, -0.11911296844482422, -0.11503028869628906, -0.1109476089477539, -0.10686492919921875, -0.1027822494506836, -0.09869956970214844, -0.09461688995361328, -0.09053421020507812, -0.08645153045654297, -0.08236885070800781, -0.07828617095947266, -0.0742034912109375, -0.07012081146240234, -0.06603813171386719, -0.06195545196533203, -0.057872772216796875, -0.05379009246826172, -0.04970741271972656, -0.045624732971191406, -0.04154205322265625, -0.037459373474121094, -0.03337669372558594, -0.02929401397705078, -0.025211334228515625, -0.02112865447998047, -0.017045974731445312, -0.012963294982910156, -0.008880615234375, -0.004797935485839844, -0.0007152557373046875, 0.0033674240112304688, 0.007450103759765625, 0.011532783508300781, 0.015615463256835938, 0.019698143005371094, 0.02378082275390625, 0.027863502502441406, 0.03194618225097656, 0.03602886199951172, 0.040111541748046875, 0.04419422149658203, 0.04827690124511719, 0.052359580993652344, 0.0564422607421875, 0.060524940490722656, 0.06460762023925781, 0.06869029998779297, 0.07277297973632812, 0.07685565948486328, 0.08093833923339844, 0.0850210189819336, 0.08910369873046875, 0.0931863784790039, 0.09726905822753906, 0.10135173797607422, 0.10543441772460938, 0.10951709747314453, 0.11359977722167969, 0.11768245697021484, 0.12176513671875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 11.0, 11.0, 6.0, 12.0, 18.0, 9.0, 21.0, 26.0, 23.0, 34.0, 40.0, 54.0, 57.0, 54.0, 58.0, 56.0, 50.0, 50.0, 59.0, 42.0, 54.0, 47.0, 34.0, 34.0, 28.0, 25.0, 12.0, 15.0, 13.0, 11.0, 11.0, 4.0, 7.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.008948564529418945, -0.00867319107055664, -0.008397817611694336, -0.008122444152832031, -0.007847070693969727, -0.007571697235107422, -0.007296323776245117, -0.0070209503173828125, -0.006745576858520508, -0.006470203399658203, -0.0061948299407958984, -0.005919456481933594, -0.005644083023071289, -0.005368709564208984, -0.00509333610534668, -0.004817962646484375, -0.00454258918762207, -0.004267215728759766, -0.003991842269897461, -0.0037164688110351562, -0.0034410953521728516, -0.003165721893310547, -0.002890348434448242, -0.0026149749755859375, -0.002339601516723633, -0.002064228057861328, -0.0017888545989990234, -0.0015134811401367188, -0.001238107681274414, -0.0009627342224121094, -0.0006873607635498047, -0.0004119873046875, -0.0001366138458251953, 0.00013875961303710938, 0.00041413307189941406, 0.0006895065307617188, 0.0009648799896240234, 0.0012402534484863281, 0.0015156269073486328, 0.0017910003662109375, 0.002066373825073242, 0.002341747283935547, 0.0026171207427978516, 0.0028924942016601562, 0.003167867660522461, 0.0034432411193847656, 0.0037186145782470703, 0.003993988037109375, 0.00426936149597168, 0.004544734954833984, 0.004820108413696289, 0.005095481872558594, 0.0053708553314208984, 0.005646228790283203, 0.005921602249145508, 0.0061969757080078125, 0.006472349166870117, 0.006747722625732422, 0.0070230960845947266, 0.007298469543457031, 0.007573843002319336, 0.00784921646118164, 0.008124589920043945, 0.00839996337890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 3.0, 9.0, 13.0, 11.0, 16.0, 16.0, 31.0, 50.0, 46.0, 85.0, 116.0, 137.0, 255.0, 610.0, 11392.0, 1031311.0, 3175.0, 479.0, 240.0, 139.0, 110.0, 81.0, 44.0, 39.0, 31.0, 17.0, 16.0, 16.0, 13.0, 7.0, 12.0, 8.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16432952880859375, -0.1587371826171875, -0.15314483642578125, -0.147552490234375, -0.14196014404296875, -0.1363677978515625, -0.13077545166015625, -0.12518310546875, -0.11959075927734375, -0.1139984130859375, -0.10840606689453125, -0.102813720703125, -0.09722137451171875, -0.0916290283203125, -0.08603668212890625, -0.0804443359375, -0.07485198974609375, -0.0692596435546875, -0.06366729736328125, -0.058074951171875, -0.05248260498046875, -0.0468902587890625, -0.04129791259765625, -0.03570556640625, -0.03011322021484375, -0.0245208740234375, -0.01892852783203125, -0.013336181640625, -0.00774383544921875, -0.0021514892578125, 0.00344085693359375, 0.009033203125, 0.01462554931640625, 0.0202178955078125, 0.02581024169921875, 0.031402587890625, 0.03699493408203125, 0.0425872802734375, 0.04817962646484375, 0.05377197265625, 0.05936431884765625, 0.0649566650390625, 0.07054901123046875, 0.076141357421875, 0.08173370361328125, 0.0873260498046875, 0.09291839599609375, 0.0985107421875, 0.10410308837890625, 0.1096954345703125, 0.11528778076171875, 0.120880126953125, 0.12647247314453125, 0.1320648193359375, 0.13765716552734375, 0.14324951171875, 0.14884185791015625, 0.1544342041015625, 0.16002655029296875, 0.165618896484375, 0.17121124267578125, 0.1768035888671875, 0.18239593505859375, 0.18798828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 24.0, 620.0, 370.0, 3.0], "bins": [-0.23439927399158478, -0.23061445355415344, -0.2268296331167221, -0.22304481267929077, -0.21925999224185944, -0.2154751718044281, -0.21169035136699677, -0.20790553092956543, -0.2041206955909729, -0.20033587515354156, -0.19655105471611023, -0.1927662342786789, -0.18898141384124756, -0.18519659340381622, -0.1814117729663849, -0.17762693762779236, -0.17384213209152222, -0.17005731165409088, -0.16627249121665955, -0.1624876707792282, -0.15870285034179688, -0.15491802990436554, -0.1511332094669342, -0.14734837412834167, -0.14356356859207153, -0.1397787481546402, -0.13599392771720886, -0.13220910727977753, -0.1284242868423462, -0.12463946640491486, -0.12085463851690292, -0.11706981807947159, -0.11328499764204025, -0.10950017720460892, -0.10571535676717758, -0.10193053632974625, -0.09814570844173431, -0.09436088800430298, -0.09057606756687164, -0.08679124712944031, -0.08300642669200897, -0.07922160625457764, -0.0754367858171463, -0.07165196537971497, -0.06786714494228363, -0.0640823245048523, -0.06029749661684036, -0.05651267617940903, -0.05272785201668739, -0.04894303157925606, -0.045158207416534424, -0.04137338697910309, -0.03758856654167175, -0.03380374610424042, -0.030018923804163933, -0.026234101504087448, -0.022449281066656113, -0.018664460629224777, -0.014879638329148293, -0.011094816960394382, -0.007309995591640472, -0.003525175154209137, 0.0002596471458673477, 0.004044469445943832, 0.007829288952052593]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 11.0, 16.0, 22.0, 16.0, 18.0, 24.0, 20.0, 20.0, 29.0, 30.0, 30.0, 42.0, 37.0, 32.0, 55.0, 32.0, 54.0, 54.0, 33.0, 45.0, 42.0, 46.0, 42.0, 33.0, 35.0, 28.0, 28.0, 20.0, 17.0, 15.0, 13.0, 7.0, 8.0, 11.0, 4.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.02178424596786499, -0.021189220249652863, -0.020594192668795586, -0.01999916508793831, -0.01940413936972618, -0.018809113651514053, -0.018214086070656776, -0.0176190584897995, -0.017024032771587372, -0.016429007053375244, -0.015833979472517967, -0.015238952822983265, -0.014643926173448563, -0.01404889952391386, -0.013453872874379158, -0.012858846224844456, -0.012263819575309753, -0.011668792925775051, -0.011073766276240349, -0.010478739626705647, -0.009883712977170944, -0.009288686327636242, -0.00869365967810154, -0.008098633028566837, -0.007503606379032135, -0.006908579729497433, -0.00631355307996273, -0.005718526430428028, -0.005123499780893326, -0.0045284731313586235, -0.003933446481823921, -0.003338419832289219, -0.0027433931827545166, -0.0021483665332198143, -0.001553339883685112, -0.0009583132341504097, -0.0003632865846157074, 0.0002317400649189949, 0.0008267667144536972, 0.0014217933639883995, 0.002016820013523102, 0.002611846663057804, 0.0032068733125925064, 0.0038018999621272087, 0.004396926611661911, 0.004991953261196613, 0.005586979910731316, 0.006182006560266018, 0.00677703320980072, 0.0073720598593354225, 0.007967086508870125, 0.008562113158404827, 0.00915713980793953, 0.009752166457474232, 0.010347193107008934, 0.010942219756543636, 0.011537246406078339, 0.012132273055613041, 0.012727299705147743, 0.013322326354682446, 0.013917353004217148, 0.01451237965375185, 0.015107406303286552, 0.01570243388414383, 0.016297459602355957]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 8.0, 9.0, 12.0, 17.0, 10.0, 19.0, 24.0, 20.0, 26.0, 27.0, 30.0, 38.0, 33.0, 49.0, 36.0, 38.0, 33.0, 44.0, 44.0, 39.0, 46.0, 54.0, 29.0, 30.0, 43.0, 32.0, 38.0, 32.0, 21.0, 25.0, 12.0, 18.0, 9.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.564239501953125, -0.54400634765625, -0.523773193359375, -0.5035400390625, -0.483306884765625, -0.46307373046875, -0.442840576171875, -0.422607421875, -0.402374267578125, -0.38214111328125, -0.361907958984375, -0.3416748046875, -0.321441650390625, -0.30120849609375, -0.280975341796875, -0.2607421875, -0.240509033203125, -0.22027587890625, -0.200042724609375, -0.1798095703125, -0.159576416015625, -0.13934326171875, -0.119110107421875, -0.098876953125, -0.078643798828125, -0.05841064453125, -0.038177490234375, -0.0179443359375, 0.002288818359375, 0.02252197265625, 0.042755126953125, 0.06298828125, 0.083221435546875, 0.10345458984375, 0.123687744140625, 0.1439208984375, 0.164154052734375, 0.18438720703125, 0.204620361328125, 0.224853515625, 0.245086669921875, 0.26531982421875, 0.285552978515625, 0.3057861328125, 0.326019287109375, 0.34625244140625, 0.366485595703125, 0.38671875, 0.406951904296875, 0.42718505859375, 0.447418212890625, 0.4676513671875, 0.487884521484375, 0.50811767578125, 0.528350830078125, 0.548583984375, 0.568817138671875, 0.58905029296875, 0.609283447265625, 0.6295166015625, 0.649749755859375, 0.66998291015625, 0.690216064453125, 0.71044921875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 13.0, 12.0, 14.0, 27.0, 39.0, 43.0, 58.0, 68.0, 106.0, 170.0, 261.0, 397.0, 545.0, 929.0, 1562.0, 2933.0, 5552.0, 11637.0, 25315.0, 65332.0, 209239.0, 435103.0, 184307.0, 58648.0, 23569.0, 10702.0, 5239.0, 2786.0, 1510.0, 890.0, 538.0, 353.0, 198.0, 131.0, 88.0, 67.0, 57.0, 40.0, 14.0, 22.0, 8.0, 6.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.162109375, -1.1273651123046875, -1.092620849609375, -1.0578765869140625, -1.02313232421875, -0.9883880615234375, -0.953643798828125, -0.9188995361328125, -0.8841552734375, -0.8494110107421875, -0.814666748046875, -0.7799224853515625, -0.74517822265625, -0.7104339599609375, -0.675689697265625, -0.6409454345703125, -0.606201171875, -0.5714569091796875, -0.536712646484375, -0.5019683837890625, -0.46722412109375, -0.4324798583984375, -0.397735595703125, -0.3629913330078125, -0.3282470703125, -0.2935028076171875, -0.258758544921875, -0.2240142822265625, -0.18927001953125, -0.1545257568359375, -0.119781494140625, -0.0850372314453125, -0.05029296875, -0.0155487060546875, 0.019195556640625, 0.0539398193359375, 0.08868408203125, 0.1234283447265625, 0.158172607421875, 0.1929168701171875, 0.2276611328125, 0.2624053955078125, 0.297149658203125, 0.3318939208984375, 0.36663818359375, 0.4013824462890625, 0.436126708984375, 0.4708709716796875, 0.505615234375, 0.5403594970703125, 0.575103759765625, 0.6098480224609375, 0.64459228515625, 0.6793365478515625, 0.714080810546875, 0.7488250732421875, 0.7835693359375, 0.8183135986328125, 0.853057861328125, 0.8878021240234375, 0.92254638671875, 0.9572906494140625, 0.992034912109375, 1.0267791748046875, 1.0615234375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 15.0, 12.0, 6.0, 10.0, 18.0, 25.0, 25.0, 29.0, 25.0, 33.0, 40.0, 51.0, 70.0, 66.0, 125.0, 232.0, 1346.0, 253.0, 154.0, 89.0, 68.0, 46.0, 45.0, 40.0, 37.0, 37.0, 32.0, 13.0, 16.0, 16.0, 8.0, 8.0, 7.0, 10.0, 5.0, 3.0, 1.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.04296875, -1.9823760986328125, -1.921783447265625, -1.8611907958984375, -1.80059814453125, -1.7400054931640625, -1.679412841796875, -1.6188201904296875, -1.5582275390625, -1.4976348876953125, -1.437042236328125, -1.3764495849609375, -1.31585693359375, -1.2552642822265625, -1.194671630859375, -1.1340789794921875, -1.073486328125, -1.0128936767578125, -0.952301025390625, -0.8917083740234375, -0.83111572265625, -0.7705230712890625, -0.709930419921875, -0.6493377685546875, -0.5887451171875, -0.5281524658203125, -0.467559814453125, -0.4069671630859375, -0.34637451171875, -0.2857818603515625, -0.225189208984375, -0.1645965576171875, -0.10400390625, -0.0434112548828125, 0.017181396484375, 0.0777740478515625, 0.13836669921875, 0.1989593505859375, 0.259552001953125, 0.3201446533203125, 0.3807373046875, 0.4413299560546875, 0.501922607421875, 0.5625152587890625, 0.62310791015625, 0.6837005615234375, 0.744293212890625, 0.8048858642578125, 0.865478515625, 0.9260711669921875, 0.986663818359375, 1.0472564697265625, 1.10784912109375, 1.1684417724609375, 1.229034423828125, 1.2896270751953125, 1.3502197265625, 1.4108123779296875, 1.471405029296875, 1.5319976806640625, 1.59259033203125, 1.6531829833984375, 1.713775634765625, 1.7743682861328125, 1.8349609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 11.0, 6.0, 3.0, 5.0, 9.0, 16.0, 16.0, 15.0, 37.0, 41.0, 45.0, 65.0, 84.0, 96.0, 185.0, 278.0, 651.0, 2047.0, 7909.0, 50405.0, 1110432.0, 1888096.0, 70688.0, 10304.0, 2483.0, 755.0, 354.0, 180.0, 128.0, 83.0, 53.0, 50.0, 38.0, 32.0, 15.0, 17.0, 19.0, 11.0, 8.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.6671142578125, -2.568603515625, -2.4700927734375, -2.37158203125, -2.2730712890625, -2.174560546875, -2.0760498046875, -1.9775390625, -1.8790283203125, -1.780517578125, -1.6820068359375, -1.58349609375, -1.4849853515625, -1.386474609375, -1.2879638671875, -1.189453125, -1.0909423828125, -0.992431640625, -0.8939208984375, -0.79541015625, -0.6968994140625, -0.598388671875, -0.4998779296875, -0.4013671875, -0.3028564453125, -0.204345703125, -0.1058349609375, -0.00732421875, 0.0911865234375, 0.189697265625, 0.2882080078125, 0.38671875, 0.4852294921875, 0.583740234375, 0.6822509765625, 0.78076171875, 0.8792724609375, 0.977783203125, 1.0762939453125, 1.1748046875, 1.2733154296875, 1.371826171875, 1.4703369140625, 1.56884765625, 1.6673583984375, 1.765869140625, 1.8643798828125, 1.962890625, 2.0614013671875, 2.159912109375, 2.2584228515625, 2.35693359375, 2.4554443359375, 2.553955078125, 2.6524658203125, 2.7509765625, 2.8494873046875, 2.947998046875, 3.0465087890625, 3.14501953125, 3.2435302734375, 3.342041015625, 3.4405517578125, 3.5390625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 179.0, 724.0, 101.0, 2.0], "bins": [-63.521244049072266, -62.486572265625, -61.451904296875, -60.417232513427734, -59.38256072998047, -58.3478889465332, -57.3132209777832, -56.27854919433594, -55.24387741088867, -54.209205627441406, -53.174537658691406, -52.13986587524414, -51.105194091796875, -50.07052230834961, -49.03585433959961, -48.001182556152344, -46.966514587402344, -45.93184280395508, -44.89717483520508, -43.86250305175781, -42.82783126831055, -41.79315948486328, -40.75849151611328, -39.723819732666016, -38.68914794921875, -37.654476165771484, -36.619808197021484, -35.58513641357422, -34.55046463012695, -33.51579284667969, -32.48112487792969, -31.446453094482422, -30.41178321838379, -29.377113342285156, -28.34244155883789, -27.307771682739258, -26.273099899291992, -25.23843002319336, -24.203758239746094, -23.16908836364746, -22.134418487548828, -21.099748611450195, -20.06507682800293, -19.030406951904297, -17.99573516845703, -16.9610652923584, -15.92639446258545, -14.8917236328125, -13.85705280303955, -12.822381973266602, -11.787711143493652, -10.753040313720703, -9.71837043762207, -8.683698654174805, -7.649028778076172, -6.614357948303223, -5.579687118530273, -4.545016288757324, -3.510345697402954, -2.475675106048584, -1.4410042762756348, -0.40633344650268555, 0.6283369064331055, 1.6630077362060547, 2.697678804397583]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 11.0, 6.0, 7.0, 13.0, 11.0, 14.0, 15.0, 21.0, 21.0, 15.0, 24.0, 22.0, 31.0, 26.0, 27.0, 26.0, 36.0, 34.0, 40.0, 40.0, 38.0, 40.0, 37.0, 28.0, 39.0, 29.0, 24.0, 24.0, 40.0, 29.0, 30.0, 30.0, 15.0, 15.0, 20.0, 15.0, 20.0, 16.0, 13.0, 12.0, 7.0, 9.0, 8.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-4.0352935791015625, -3.9008164405822754, -3.766339063644409, -3.631861925125122, -3.497384786605835, -3.3629074096679688, -3.2284302711486816, -3.0939531326293945, -2.9594759941101074, -2.8249988555908203, -2.690521478652954, -2.556044340133667, -2.42156720161438, -2.2870898246765137, -2.1526126861572266, -2.0181355476379395, -1.8836581707000732, -1.7491809129714966, -1.6147037744522095, -1.4802265167236328, -1.3457493782043457, -1.211272120475769, -1.0767948627471924, -0.9423176646232605, -0.8078404664993286, -0.6733632683753967, -0.5388860702514648, -0.4044088125228882, -0.2699316143989563, -0.13545441627502441, -0.000977158546447754, 0.13350003957748413, 0.267977237701416, 0.4024544358253479, 0.5369316339492798, 0.6714088916778564, 0.8058860898017883, 0.9403632879257202, 1.0748405456542969, 1.209317684173584, 1.3437949419021606, 1.4782721996307373, 1.6127493381500244, 1.747226595878601, 1.8817038536071777, 2.016180992126465, 2.150658130645752, 2.285135507583618, 2.4196126461029053, 2.5540897846221924, 2.6885671615600586, 2.8230443000793457, 2.957521438598633, 3.09199857711792, 3.226475954055786, 3.3609530925750732, 3.4954304695129395, 3.6299076080322266, 3.7643849849700928, 3.89886212348938, 4.033339500427246, 4.167816638946533, 4.30229377746582, 4.436770915985107, 4.5712480545043945]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 13.0, 14.0, 14.0, 20.0, 18.0, 24.0, 33.0, 24.0, 24.0, 27.0, 29.0, 27.0, 39.0, 44.0, 43.0, 35.0, 42.0, 45.0, 43.0, 50.0, 36.0, 36.0, 32.0, 39.0, 27.0, 25.0, 28.0, 19.0, 26.0, 25.0, 13.0, 8.0, 12.0, 12.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.72412109375, -0.702667236328125, -0.68121337890625, -0.659759521484375, -0.6383056640625, -0.616851806640625, -0.59539794921875, -0.573944091796875, -0.552490234375, -0.531036376953125, -0.50958251953125, -0.488128662109375, -0.4666748046875, -0.445220947265625, -0.42376708984375, -0.402313232421875, -0.380859375, -0.359405517578125, -0.33795166015625, -0.316497802734375, -0.2950439453125, -0.273590087890625, -0.25213623046875, -0.230682373046875, -0.209228515625, -0.187774658203125, -0.16632080078125, -0.144866943359375, -0.1234130859375, -0.101959228515625, -0.08050537109375, -0.059051513671875, -0.03759765625, -0.016143798828125, 0.00531005859375, 0.026763916015625, 0.0482177734375, 0.069671630859375, 0.09112548828125, 0.112579345703125, 0.134033203125, 0.155487060546875, 0.17694091796875, 0.198394775390625, 0.2198486328125, 0.241302490234375, 0.26275634765625, 0.284210205078125, 0.3056640625, 0.327117919921875, 0.34857177734375, 0.370025634765625, 0.3914794921875, 0.412933349609375, 0.43438720703125, 0.455841064453125, 0.477294921875, 0.498748779296875, 0.52020263671875, 0.541656494140625, 0.5631103515625, 0.584564208984375, 0.60601806640625, 0.627471923828125, 0.64892578125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 3.0, 11.0, 14.0, 15.0, 25.0, 32.0, 43.0, 53.0, 77.0, 126.0, 133.0, 234.0, 328.0, 535.0, 844.0, 1307.0, 2239.0, 3840.0, 6695.0, 12660.0, 27755.0, 78907.0, 328424.0, 1612354.0, 1632644.0, 343467.0, 83584.0, 28932.0, 12959.0, 6802.0, 3654.0, 2150.0, 1293.0, 778.0, 470.0, 304.0, 194.0, 130.0, 105.0, 54.0, 33.0, 27.0, 13.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2041015625, -1.169708251953125, -1.13531494140625, -1.100921630859375, -1.0665283203125, -1.032135009765625, -0.99774169921875, -0.963348388671875, -0.928955078125, -0.894561767578125, -0.86016845703125, -0.825775146484375, -0.7913818359375, -0.756988525390625, -0.72259521484375, -0.688201904296875, -0.65380859375, -0.619415283203125, -0.58502197265625, -0.550628662109375, -0.5162353515625, -0.481842041015625, -0.44744873046875, -0.413055419921875, -0.378662109375, -0.344268798828125, -0.30987548828125, -0.275482177734375, -0.2410888671875, -0.206695556640625, -0.17230224609375, -0.137908935546875, -0.103515625, -0.069122314453125, -0.03472900390625, -0.000335693359375, 0.0340576171875, 0.068450927734375, 0.10284423828125, 0.137237548828125, 0.171630859375, 0.206024169921875, 0.24041748046875, 0.274810791015625, 0.3092041015625, 0.343597412109375, 0.37799072265625, 0.412384033203125, 0.44677734375, 0.481170654296875, 0.51556396484375, 0.549957275390625, 0.5843505859375, 0.618743896484375, 0.65313720703125, 0.687530517578125, 0.721923828125, 0.756317138671875, 0.79071044921875, 0.825103759765625, 0.8594970703125, 0.893890380859375, 0.92828369140625, 0.962677001953125, 0.9970703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 3.0, 11.0, 7.0, 12.0, 15.0, 29.0, 34.0, 54.0, 61.0, 88.0, 104.0, 187.0, 318.0, 446.0, 613.0, 691.0, 454.0, 333.0, 191.0, 115.0, 95.0, 52.0, 36.0, 31.0, 28.0, 11.0, 11.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34765625, -1.3043212890625, -1.260986328125, -1.2176513671875, -1.17431640625, -1.1309814453125, -1.087646484375, -1.0443115234375, -1.0009765625, -0.9576416015625, -0.914306640625, -0.8709716796875, -0.82763671875, -0.7843017578125, -0.740966796875, -0.6976318359375, -0.654296875, -0.6109619140625, -0.567626953125, -0.5242919921875, -0.48095703125, -0.4376220703125, -0.394287109375, -0.3509521484375, -0.3076171875, -0.2642822265625, -0.220947265625, -0.1776123046875, -0.13427734375, -0.0909423828125, -0.047607421875, -0.0042724609375, 0.0390625, 0.0823974609375, 0.125732421875, 0.1690673828125, 0.21240234375, 0.2557373046875, 0.299072265625, 0.3424072265625, 0.3857421875, 0.4290771484375, 0.472412109375, 0.5157470703125, 0.55908203125, 0.6024169921875, 0.645751953125, 0.6890869140625, 0.732421875, 0.7757568359375, 0.819091796875, 0.8624267578125, 0.90576171875, 0.9490966796875, 0.992431640625, 1.0357666015625, 1.0791015625, 1.1224365234375, 1.165771484375, 1.2091064453125, 1.25244140625, 1.2957763671875, 1.339111328125, 1.3824462890625, 1.42578125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 11.0, 3.0, 10.0, 19.0, 12.0, 20.0, 24.0, 46.0, 108.0, 146.0, 330.0, 572.0, 1375.0, 3355.0, 10433.0, 46510.0, 524606.0, 3351374.0, 214891.0, 28270.0, 7280.0, 2589.0, 1053.0, 535.0, 253.0, 183.0, 86.0, 51.0, 35.0, 24.0, 15.0, 9.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.061248779296875, -2.96038818359375, -2.859527587890625, -2.7586669921875, -2.657806396484375, -2.55694580078125, -2.456085205078125, -2.355224609375, -2.254364013671875, -2.15350341796875, -2.052642822265625, -1.9517822265625, -1.850921630859375, -1.75006103515625, -1.649200439453125, -1.54833984375, -1.447479248046875, -1.34661865234375, -1.245758056640625, -1.1448974609375, -1.044036865234375, -0.94317626953125, -0.842315673828125, -0.741455078125, -0.640594482421875, -0.53973388671875, -0.438873291015625, -0.3380126953125, -0.237152099609375, -0.13629150390625, -0.035430908203125, 0.0654296875, 0.166290283203125, 0.26715087890625, 0.368011474609375, 0.4688720703125, 0.569732666015625, 0.67059326171875, 0.771453857421875, 0.872314453125, 0.973175048828125, 1.07403564453125, 1.174896240234375, 1.2757568359375, 1.376617431640625, 1.47747802734375, 1.578338623046875, 1.67919921875, 1.780059814453125, 1.88092041015625, 1.981781005859375, 2.0826416015625, 2.183502197265625, 2.28436279296875, 2.385223388671875, 2.486083984375, 2.586944580078125, 2.68780517578125, 2.788665771484375, 2.8895263671875, 2.990386962890625, 3.09124755859375, 3.192108154296875, 3.29296875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 62.0, 524.0, 391.0, 35.0, 2.0, 0.0, 0.0, 2.0], "bins": [-70.52743530273438, -69.30968475341797, -68.09193420410156, -66.87417602539062, -65.65642547607422, -64.43867492675781, -63.22092056274414, -62.003170013427734, -60.78541564941406, -59.567665100097656, -58.349910736083984, -57.13216018676758, -55.914405822753906, -54.6966552734375, -53.47890090942383, -52.26115036010742, -51.043399810791016, -49.82564926147461, -48.60789489746094, -47.39014434814453, -46.17238998413086, -44.95463943481445, -43.73688507080078, -42.519134521484375, -41.30138397216797, -40.08363342285156, -38.86587905883789, -37.648128509521484, -36.43037414550781, -35.212623596191406, -33.994869232177734, -32.77711868286133, -31.559362411499023, -30.341609954833984, -29.123857498168945, -27.906105041503906, -26.6883544921875, -25.470600128173828, -24.252849578857422, -23.035097122192383, -21.817344665527344, -20.599592208862305, -19.381839752197266, -18.164087295532227, -16.946334838867188, -15.728583335876465, -14.510831832885742, -13.293079376220703, -12.075326919555664, -10.857574462890625, -9.639822006225586, -8.422070503234863, -7.204318046569824, -5.986565589904785, -4.768813610076904, -3.5510616302490234, -2.3333096504211426, -1.1155574321746826, 0.10219478607177734, 1.3199470043182373, 2.5376992225646973, 3.7554516792297363, 4.973203659057617, 6.190955638885498, 7.408708095550537]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 3.0, 6.0, 9.0, 6.0, 16.0, 17.0, 18.0, 30.0, 21.0, 30.0, 36.0, 34.0, 30.0, 33.0, 47.0, 36.0, 47.0, 46.0, 43.0, 43.0, 39.0, 47.0, 43.0, 30.0, 35.0, 25.0, 29.0, 28.0, 25.0, 21.0, 17.0, 20.0, 13.0, 11.0, 18.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.678386688232422, -4.540285110473633, -4.4021830558776855, -4.2640814781188965, -4.125979900360107, -3.98787784576416, -3.849776268005371, -3.711674451828003, -3.5735726356506348, -3.4354708194732666, -3.2973692417144775, -3.1592674255371094, -3.021165609359741, -2.883063793182373, -2.744962215423584, -2.606860399246216, -2.4687588214874268, -2.3306570053100586, -2.1925554275512695, -2.0544536113739014, -1.9163517951965332, -1.7782500982284546, -1.640148401260376, -1.5020465850830078, -1.3639448881149292, -1.2258431911468506, -1.0877413749694824, -0.9496396780014038, -0.8115379214286804, -0.673436164855957, -0.5353344678878784, -0.39723271131515503, -0.25913095474243164, -0.12102921307086945, 0.01707252860069275, 0.15517425537109375, 0.29327601194381714, 0.4313777685165405, 0.5694794654846191, 0.7075812220573425, 0.8456829786300659, 0.9837847352027893, 1.1218864917755127, 1.2599881887435913, 1.39808988571167, 1.536191701889038, 1.6742933988571167, 1.8123950958251953, 1.9504969120025635, 2.0885987281799316, 2.2267003059387207, 2.364802122116089, 2.502903938293457, 2.641005516052246, 2.7791073322296143, 2.9172091484069824, 3.0553107261657715, 3.1934125423431396, 3.3315141201019287, 3.469615936279297, 3.607717752456665, 3.745819568634033, 3.8839211463928223, 4.022022724151611, 4.160124778747559]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 6.0, 8.0, 4.0, 7.0, 10.0, 15.0, 14.0, 13.0, 10.0, 17.0, 24.0, 19.0, 18.0, 33.0, 34.0, 36.0, 28.0, 32.0, 36.0, 29.0, 49.0, 41.0, 41.0, 33.0, 46.0, 37.0, 34.0, 31.0, 25.0, 32.0, 35.0, 24.0, 25.0, 22.0, 22.0, 16.0, 14.0, 15.0, 12.0, 7.0, 9.0, 7.0, 4.0, 5.0, 6.0, 1.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.63623046875, -0.6169891357421875, -0.597747802734375, -0.5785064697265625, -0.55926513671875, -0.5400238037109375, -0.520782470703125, -0.5015411376953125, -0.4822998046875, -0.4630584716796875, -0.443817138671875, -0.4245758056640625, -0.40533447265625, -0.3860931396484375, -0.366851806640625, -0.3476104736328125, -0.328369140625, -0.3091278076171875, -0.289886474609375, -0.2706451416015625, -0.25140380859375, -0.2321624755859375, -0.212921142578125, -0.1936798095703125, -0.1744384765625, -0.1551971435546875, -0.135955810546875, -0.1167144775390625, -0.09747314453125, -0.0782318115234375, -0.058990478515625, -0.0397491455078125, -0.0205078125, -0.0012664794921875, 0.017974853515625, 0.0372161865234375, 0.05645751953125, 0.0756988525390625, 0.094940185546875, 0.1141815185546875, 0.1334228515625, 0.1526641845703125, 0.171905517578125, 0.1911468505859375, 0.21038818359375, 0.2296295166015625, 0.248870849609375, 0.2681121826171875, 0.287353515625, 0.3065948486328125, 0.325836181640625, 0.3450775146484375, 0.36431884765625, 0.3835601806640625, 0.402801513671875, 0.4220428466796875, 0.4412841796875, 0.4605255126953125, 0.479766845703125, 0.4990081787109375, 0.51824951171875, 0.5374908447265625, 0.556732177734375, 0.5759735107421875, 0.59521484375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 7.0, 5.0, 8.0, 22.0, 30.0, 35.0, 56.0, 96.0, 128.0, 198.0, 241.0, 415.0, 542.0, 890.0, 1202.0, 1683.0, 2584.0, 3568.0, 5512.0, 8179.0, 12292.0, 18777.0, 29345.0, 47022.0, 76653.0, 122603.0, 177505.0, 183197.0, 131219.0, 82572.0, 50470.0, 31687.0, 20126.0, 12990.0, 8502.0, 5773.0, 3900.0, 2659.0, 1818.0, 1257.0, 907.0, 590.0, 424.0, 280.0, 199.0, 143.0, 84.0, 53.0, 41.0, 24.0, 21.0, 10.0, 10.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06591796875, -0.06386280059814453, -0.06180763244628906, -0.059752464294433594, -0.057697296142578125, -0.055642127990722656, -0.05358695983886719, -0.05153179168701172, -0.04947662353515625, -0.04742145538330078, -0.04536628723144531, -0.043311119079589844, -0.041255950927734375, -0.039200782775878906, -0.03714561462402344, -0.03509044647216797, -0.0330352783203125, -0.03098011016845703, -0.028924942016601562, -0.026869773864746094, -0.024814605712890625, -0.022759437561035156, -0.020704269409179688, -0.01864910125732422, -0.01659393310546875, -0.014538764953613281, -0.012483596801757812, -0.010428428649902344, -0.008373260498046875, -0.006318092346191406, -0.0042629241943359375, -0.0022077560424804688, -0.000152587890625, 0.0019025802612304688, 0.0039577484130859375, 0.006012916564941406, 0.008068084716796875, 0.010123252868652344, 0.012178421020507812, 0.014233589172363281, 0.01628875732421875, 0.01834392547607422, 0.020399093627929688, 0.022454261779785156, 0.024509429931640625, 0.026564598083496094, 0.028619766235351562, 0.03067493438720703, 0.0327301025390625, 0.03478527069091797, 0.03684043884277344, 0.038895606994628906, 0.040950775146484375, 0.043005943298339844, 0.04506111145019531, 0.04711627960205078, 0.04917144775390625, 0.05122661590576172, 0.05328178405761719, 0.055336952209472656, 0.057392120361328125, 0.059447288513183594, 0.06150245666503906, 0.06355762481689453, 0.06561279296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 7.0, 7.0, 17.0, 14.0, 17.0, 23.0, 23.0, 22.0, 22.0, 25.0, 32.0, 31.0, 42.0, 38.0, 29.0, 44.0, 26.0, 49.0, 1060.0, 35.0, 45.0, 42.0, 34.0, 40.0, 27.0, 33.0, 26.0, 29.0, 28.0, 26.0, 14.0, 10.0, 20.0, 9.0, 8.0, 17.0, 5.0, 7.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5447120666503906, -0.5283889770507812, -0.5120658874511719, -0.4957427978515625, -0.4794197082519531, -0.46309661865234375, -0.4467735290527344, -0.430450439453125, -0.4141273498535156, -0.39780426025390625, -0.3814811706542969, -0.3651580810546875, -0.3488349914550781, -0.33251190185546875, -0.3161888122558594, -0.29986572265625, -0.2835426330566406, -0.26721954345703125, -0.2508964538574219, -0.2345733642578125, -0.21825027465820312, -0.20192718505859375, -0.18560409545898438, -0.169281005859375, -0.15295791625976562, -0.13663482666015625, -0.12031173706054688, -0.1039886474609375, -0.08766555786132812, -0.07134246826171875, -0.055019378662109375, -0.0386962890625, -0.022373199462890625, -0.00605010986328125, 0.010272979736328125, 0.0265960693359375, 0.042919158935546875, 0.05924224853515625, 0.07556533813476562, 0.091888427734375, 0.10821151733398438, 0.12453460693359375, 0.14085769653320312, 0.1571807861328125, 0.17350387573242188, 0.18982696533203125, 0.20615005493164062, 0.22247314453125, 0.23879623413085938, 0.25511932373046875, 0.2714424133300781, 0.2877655029296875, 0.3040885925292969, 0.32041168212890625, 0.3367347717285156, 0.353057861328125, 0.3693809509277344, 0.38570404052734375, 0.4020271301269531, 0.4183502197265625, 0.4346733093261719, 0.45099639892578125, 0.4673194885253906, 0.483642578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 5.0, 11.0, 13.0, 22.0, 26.0, 47.0, 49.0, 85.0, 126.0, 148.0, 220.0, 310.0, 479.0, 688.0, 1008.0, 1436.0, 2200.0, 3324.0, 5168.0, 8589.0, 15990.0, 38673.0, 330939.0, 1585899.0, 55402.0, 19048.0, 10060.0, 5900.0, 3763.0, 2401.0, 1593.0, 1075.0, 718.0, 490.0, 390.0, 255.0, 164.0, 116.0, 89.0, 56.0, 38.0, 39.0, 31.0, 15.0, 8.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1375732421875, -0.13300704956054688, -0.12844085693359375, -0.12387466430664062, -0.1193084716796875, -0.11474227905273438, -0.11017608642578125, -0.10560989379882812, -0.101043701171875, -0.09647750854492188, -0.09191131591796875, -0.08734512329101562, -0.0827789306640625, -0.07821273803710938, -0.07364654541015625, -0.06908035278320312, -0.06451416015625, -0.059947967529296875, -0.05538177490234375, -0.050815582275390625, -0.0462493896484375, -0.041683197021484375, -0.03711700439453125, -0.032550811767578125, -0.027984619140625, -0.023418426513671875, -0.01885223388671875, -0.014286041259765625, -0.0097198486328125, -0.005153656005859375, -0.00058746337890625, 0.003978729248046875, 0.008544921875, 0.013111114501953125, 0.01767730712890625, 0.022243499755859375, 0.0268096923828125, 0.031375885009765625, 0.03594207763671875, 0.040508270263671875, 0.045074462890625, 0.049640655517578125, 0.05420684814453125, 0.058773040771484375, 0.0633392333984375, 0.06790542602539062, 0.07247161865234375, 0.07703781127929688, 0.08160400390625, 0.08617019653320312, 0.09073638916015625, 0.09530258178710938, 0.0998687744140625, 0.10443496704101562, 0.10900115966796875, 0.11356735229492188, 0.118133544921875, 0.12269973754882812, 0.12726593017578125, 0.13183212280273438, 0.1363983154296875, 0.14096450805664062, 0.14553070068359375, 0.15009689331054688, 0.1546630859375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 5.0, 13.0, 13.0, 20.0, 14.0, 24.0, 29.0, 28.0, 28.0, 31.0, 26.0, 33.0, 24.0, 40.0, 33.0, 25.0, 29.0, 35.0, 21.0, 21.0, 35.0, 40.0, 30.0, 43.0, 34.0, 31.0, 38.0, 34.0, 39.0, 26.0, 12.0, 22.0, 18.0, 13.0, 13.0, 11.0, 8.0, 4.0, 8.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.006526947021484375, -0.00631183385848999, -0.0060967206954956055, -0.005881607532501221, -0.005666494369506836, -0.005451381206512451, -0.005236268043518066, -0.005021154880523682, -0.004806041717529297, -0.004590928554534912, -0.004375815391540527, -0.004160702228546143, -0.003945589065551758, -0.003730475902557373, -0.0035153627395629883, -0.0033002495765686035, -0.0030851364135742188, -0.002870023250579834, -0.0026549100875854492, -0.0024397969245910645, -0.0022246837615966797, -0.002009570598602295, -0.0017944574356079102, -0.0015793442726135254, -0.0013642311096191406, -0.0011491179466247559, -0.0009340047836303711, -0.0007188916206359863, -0.0005037784576416016, -0.0002886652946472168, -7.355213165283203e-05, 0.00014156103134155273, 0.0003566741943359375, 0.0005717873573303223, 0.000786900520324707, 0.0010020136833190918, 0.0012171268463134766, 0.0014322400093078613, 0.001647353172302246, 0.0018624663352966309, 0.0020775794982910156, 0.0022926926612854004, 0.002507805824279785, 0.00272291898727417, 0.0029380321502685547, 0.0031531453132629395, 0.0033682584762573242, 0.003583371639251709, 0.0037984848022460938, 0.0040135979652404785, 0.004228711128234863, 0.004443824291229248, 0.004658937454223633, 0.004874050617218018, 0.005089163780212402, 0.005304276943206787, 0.005519390106201172, 0.005734503269195557, 0.005949616432189941, 0.006164729595184326, 0.006379842758178711, 0.006594955921173096, 0.0068100690841674805, 0.007025182247161865, 0.00724029541015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 3.0, 11.0, 7.0, 10.0, 21.0, 21.0, 27.0, 30.0, 36.0, 70.0, 70.0, 91.0, 108.0, 152.0, 208.0, 305.0, 620.0, 3911.0, 899064.0, 140867.0, 1382.0, 465.0, 260.0, 173.0, 135.0, 100.0, 73.0, 61.0, 43.0, 42.0, 33.0, 34.0, 20.0, 19.0, 7.0, 12.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.14892578125, -0.14452171325683594, -0.14011764526367188, -0.1357135772705078, -0.13130950927734375, -0.1269054412841797, -0.12250137329101562, -0.11809730529785156, -0.1136932373046875, -0.10928916931152344, -0.10488510131835938, -0.10048103332519531, -0.09607696533203125, -0.09167289733886719, -0.08726882934570312, -0.08286476135253906, -0.078460693359375, -0.07405662536621094, -0.06965255737304688, -0.06524848937988281, -0.06084442138671875, -0.05644035339355469, -0.052036285400390625, -0.04763221740722656, -0.0432281494140625, -0.03882408142089844, -0.034420013427734375, -0.030015945434570312, -0.02561187744140625, -0.021207809448242188, -0.016803741455078125, -0.012399673461914062, -0.00799560546875, -0.0035915374755859375, 0.000812530517578125, 0.0052165985107421875, 0.00962066650390625, 0.014024734497070312, 0.018428802490234375, 0.022832870483398438, 0.0272369384765625, 0.03164100646972656, 0.036045074462890625, 0.04044914245605469, 0.04485321044921875, 0.04925727844238281, 0.053661346435546875, 0.05806541442871094, 0.062469482421875, 0.06687355041503906, 0.07127761840820312, 0.07568168640136719, 0.08008575439453125, 0.08448982238769531, 0.08889389038085938, 0.09329795837402344, 0.0977020263671875, 0.10210609436035156, 0.10651016235351562, 0.11091423034667969, 0.11531829833984375, 0.11972236633300781, 0.12412643432617188, 0.12853050231933594, 0.1329345703125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 41.0, 847.0, 113.0, 7.0], "bins": [-0.3019552230834961, -0.2970576584339142, -0.2921600937843323, -0.287262499332428, -0.28236493468284607, -0.27746737003326416, -0.27256980538368225, -0.26767224073410034, -0.26277464628219604, -0.25787708163261414, -0.2529795169830322, -0.24808193743228912, -0.24318435788154602, -0.2382867932319641, -0.233389213681221, -0.2284916490316391, -0.2235940843820572, -0.21869651973247528, -0.21379894018173218, -0.20890137553215027, -0.20400379598140717, -0.19910623133182526, -0.19420865178108215, -0.18931108713150024, -0.18441352248191833, -0.17951595783233643, -0.17461837828159332, -0.1697208136320114, -0.1648232340812683, -0.1599256694316864, -0.1550280898809433, -0.1501305252313614, -0.14523296058177948, -0.14033539593219757, -0.13543781638145447, -0.13054025173187256, -0.12564267218112946, -0.12074510753154755, -0.11584753543138504, -0.11094996333122253, -0.10605238378047943, -0.10115481168031693, -0.09625723958015442, -0.09135966747999191, -0.0864620953798294, -0.0815645307302475, -0.07666695863008499, -0.07176938652992249, -0.06687181442975998, -0.06197424232959747, -0.05707667022943497, -0.05217910185456276, -0.04728152975440025, -0.04238395765423775, -0.03748638927936554, -0.03258881717920303, -0.027691245079040527, -0.02279367297887802, -0.017896102741360664, -0.012998531572520733, -0.008100960403680801, -0.0032033883035182953, 0.0016941819339990616, 0.0065917521715164185, 0.01148932334035635]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 13.0, 14.0, 22.0, 16.0, 32.0, 26.0, 29.0, 33.0, 36.0, 45.0, 54.0, 51.0, 50.0, 54.0, 55.0, 56.0, 50.0, 51.0, 40.0, 37.0, 39.0, 27.0, 24.0, 33.0, 13.0, 21.0, 15.0, 10.0, 12.0, 9.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.032409489154815674, -0.03155674785375595, -0.030704006552696228, -0.029851265251636505, -0.028998523950576782, -0.02814578264951706, -0.027293041348457336, -0.026440300047397614, -0.02558755874633789, -0.024734817445278168, -0.023882076144218445, -0.023029334843158722, -0.022176593542099, -0.021323852241039276, -0.020471110939979553, -0.01961836963891983, -0.018765628337860107, -0.017912887036800385, -0.01706014573574066, -0.01620740443468094, -0.015354663133621216, -0.014501921832561493, -0.01364918053150177, -0.012796439230442047, -0.011943697929382324, -0.011090956628322601, -0.010238215327262878, -0.009385474026203156, -0.008532732725143433, -0.00767999142408371, -0.006827250123023987, -0.005974508821964264, -0.005121767520904541, -0.004269026219844818, -0.003416284918785095, -0.0025635436177253723, -0.0017108023166656494, -0.0008580610156059265, -5.319714546203613e-06, 0.0008474215865135193, 0.0017001628875732422, 0.002552904188632965, 0.003405645489692688, 0.004258386790752411, 0.005111128091812134, 0.005963869392871857, 0.00681661069393158, 0.0076693519949913025, 0.008522093296051025, 0.009374834597110748, 0.010227575898170471, 0.011080317199230194, 0.011933058500289917, 0.01278579980134964, 0.013638541102409363, 0.014491282403469086, 0.015344023704528809, 0.01619676500558853, 0.017049506306648254, 0.017902247607707977, 0.0187549889087677, 0.019607730209827423, 0.020460471510887146, 0.02131321281194687, 0.022165954113006592]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 9.0, 4.0, 7.0, 10.0, 15.0, 15.0, 12.0, 10.0, 16.0, 27.0, 17.0, 18.0, 32.0, 36.0, 36.0, 28.0, 31.0, 36.0, 30.0, 49.0, 42.0, 41.0, 34.0, 45.0, 35.0, 35.0, 31.0, 25.0, 32.0, 35.0, 24.0, 24.0, 22.0, 21.0, 17.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 4.0, 6.0, 1.0, 6.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6165008544921875, -0.597259521484375, -0.5780181884765625, -0.55877685546875, -0.5395355224609375, -0.520294189453125, -0.5010528564453125, -0.4818115234375, -0.4625701904296875, -0.443328857421875, -0.4240875244140625, -0.40484619140625, -0.3856048583984375, -0.366363525390625, -0.3471221923828125, -0.327880859375, -0.3086395263671875, -0.289398193359375, -0.2701568603515625, -0.25091552734375, -0.2316741943359375, -0.212432861328125, -0.1931915283203125, -0.1739501953125, -0.1547088623046875, -0.135467529296875, -0.1162261962890625, -0.09698486328125, -0.0777435302734375, -0.058502197265625, -0.0392608642578125, -0.02001953125, -0.0007781982421875, 0.018463134765625, 0.0377044677734375, 0.05694580078125, 0.0761871337890625, 0.095428466796875, 0.1146697998046875, 0.1339111328125, 0.1531524658203125, 0.172393798828125, 0.1916351318359375, 0.21087646484375, 0.2301177978515625, 0.249359130859375, 0.2686004638671875, 0.287841796875, 0.3070831298828125, 0.326324462890625, 0.3455657958984375, 0.36480712890625, 0.3840484619140625, 0.403289794921875, 0.4225311279296875, 0.4417724609375, 0.4610137939453125, 0.480255126953125, 0.4994964599609375, 0.51873779296875, 0.5379791259765625, 0.557220458984375, 0.5764617919921875, 0.595703125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 20.0, 16.0, 12.0, 34.0, 28.0, 43.0, 44.0, 57.0, 79.0, 118.0, 175.0, 260.0, 475.0, 811.0, 1533.0, 2948.0, 5995.0, 13609.0, 36865.0, 139401.0, 591460.0, 181025.0, 44005.0, 15631.0, 6608.0, 3207.0, 1709.0, 899.0, 505.0, 283.0, 190.0, 114.0, 88.0, 61.0, 44.0, 46.0, 27.0, 22.0, 26.0, 23.0, 11.0, 6.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5244903564453125, -1.477691650390625, -1.4308929443359375, -1.38409423828125, -1.3372955322265625, -1.290496826171875, -1.2436981201171875, -1.1968994140625, -1.1501007080078125, -1.103302001953125, -1.0565032958984375, -1.00970458984375, -0.9629058837890625, -0.916107177734375, -0.8693084716796875, -0.822509765625, -0.7757110595703125, -0.728912353515625, -0.6821136474609375, -0.63531494140625, -0.5885162353515625, -0.541717529296875, -0.4949188232421875, -0.4481201171875, -0.4013214111328125, -0.354522705078125, -0.3077239990234375, -0.26092529296875, -0.2141265869140625, -0.167327880859375, -0.1205291748046875, -0.07373046875, -0.0269317626953125, 0.019866943359375, 0.0666656494140625, 0.11346435546875, 0.1602630615234375, 0.207061767578125, 0.2538604736328125, 0.3006591796875, 0.3474578857421875, 0.394256591796875, 0.4410552978515625, 0.48785400390625, 0.5346527099609375, 0.581451416015625, 0.6282501220703125, 0.675048828125, 0.7218475341796875, 0.768646240234375, 0.8154449462890625, 0.86224365234375, 0.9090423583984375, 0.955841064453125, 1.0026397705078125, 1.0494384765625, 1.0962371826171875, 1.143035888671875, 1.1898345947265625, 1.23663330078125, 1.2834320068359375, 1.330230712890625, 1.3770294189453125, 1.423828125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 8.0, 7.0, 7.0, 13.0, 12.0, 12.0, 22.0, 21.0, 32.0, 29.0, 43.0, 49.0, 57.0, 73.0, 77.0, 167.0, 1444.0, 333.0, 157.0, 82.0, 63.0, 56.0, 52.0, 46.0, 44.0, 30.0, 19.0, 28.0, 16.0, 15.0, 8.0, 13.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.363006591796875, -2.28656005859375, -2.210113525390625, -2.1336669921875, -2.057220458984375, -1.98077392578125, -1.904327392578125, -1.827880859375, -1.751434326171875, -1.67498779296875, -1.598541259765625, -1.5220947265625, -1.445648193359375, -1.36920166015625, -1.292755126953125, -1.21630859375, -1.139862060546875, -1.06341552734375, -0.986968994140625, -0.9105224609375, -0.834075927734375, -0.75762939453125, -0.681182861328125, -0.604736328125, -0.528289794921875, -0.45184326171875, -0.375396728515625, -0.2989501953125, -0.222503662109375, -0.14605712890625, -0.069610595703125, 0.0068359375, 0.083282470703125, 0.15972900390625, 0.236175537109375, 0.3126220703125, 0.389068603515625, 0.46551513671875, 0.541961669921875, 0.618408203125, 0.694854736328125, 0.77130126953125, 0.847747802734375, 0.9241943359375, 1.000640869140625, 1.07708740234375, 1.153533935546875, 1.22998046875, 1.306427001953125, 1.38287353515625, 1.459320068359375, 1.5357666015625, 1.612213134765625, 1.68865966796875, 1.765106201171875, 1.841552734375, 1.917999267578125, 1.99444580078125, 2.070892333984375, 2.1473388671875, 2.223785400390625, 2.30023193359375, 2.376678466796875, 2.453125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 13.0, 6.0, 19.0, 14.0, 20.0, 21.0, 36.0, 52.0, 58.0, 95.0, 159.0, 267.0, 574.0, 1567.0, 5672.0, 47744.0, 2751431.0, 319537.0, 13877.0, 2727.0, 863.0, 366.0, 194.0, 113.0, 70.0, 49.0, 29.0, 31.0, 18.0, 19.0, 18.0, 11.0, 13.0, 5.0, 3.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.271240234375, -4.13232421875, -3.993408203125, -3.8544921875, -3.715576171875, -3.57666015625, -3.437744140625, -3.298828125, -3.159912109375, -3.02099609375, -2.882080078125, -2.7431640625, -2.604248046875, -2.46533203125, -2.326416015625, -2.1875, -2.048583984375, -1.90966796875, -1.770751953125, -1.6318359375, -1.492919921875, -1.35400390625, -1.215087890625, -1.076171875, -0.937255859375, -0.79833984375, -0.659423828125, -0.5205078125, -0.381591796875, -0.24267578125, -0.103759765625, 0.03515625, 0.174072265625, 0.31298828125, 0.451904296875, 0.5908203125, 0.729736328125, 0.86865234375, 1.007568359375, 1.146484375, 1.285400390625, 1.42431640625, 1.563232421875, 1.7021484375, 1.841064453125, 1.97998046875, 2.118896484375, 2.2578125, 2.396728515625, 2.53564453125, 2.674560546875, 2.8134765625, 2.952392578125, 3.09130859375, 3.230224609375, 3.369140625, 3.508056640625, 3.64697265625, 3.785888671875, 3.9248046875, 4.063720703125, 4.20263671875, 4.341552734375, 4.48046875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [6.0, 42.0, 285.0, 520.0, 150.0, 12.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.979235291481018, -1.3747215270996094, -0.7702078819274902, -0.16569411754608154, 0.4388195276260376, 1.0433331727981567, 1.647847056388855, 2.2523608207702637, 2.856874465942383, 3.461388111114502, 4.065901756286621, 4.670415878295898, 5.274929046630859, 5.879443168640137, 6.483956813812256, 7.088470458984375, 7.692984104156494, 8.297497749328613, 8.90201187133789, 9.506525039672852, 10.111039161682129, 10.71555233001709, 11.320066452026367, 11.924579620361328, 12.529093742370605, 13.133607864379883, 13.738121032714844, 14.342635154724121, 14.947148323059082, 15.55166244506836, 16.15617561340332, 16.76068878173828, 17.365201950073242, 17.969715118408203, 18.574230194091797, 19.178743362426758, 19.78325653076172, 20.38776969909668, 20.992284774780273, 21.596797943115234, 22.201311111450195, 22.805824279785156, 23.41033935546875, 24.01485252380371, 24.619365692138672, 25.223878860473633, 25.828393936157227, 26.432907104492188, 27.03742218017578, 27.641935348510742, 28.246450424194336, 28.850963592529297, 29.455476760864258, 30.05998992919922, 30.664505004882812, 31.269018173217773, 31.873531341552734, 32.47804641723633, 33.082557678222656, 33.68707275390625, 34.291587829589844, 34.89609909057617, 35.500614166259766, 36.105125427246094, 36.70964050292969]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 4.0, 15.0, 13.0, 18.0, 19.0, 15.0, 16.0, 28.0, 20.0, 23.0, 24.0, 34.0, 35.0, 43.0, 48.0, 34.0, 32.0, 46.0, 45.0, 40.0, 44.0, 46.0, 33.0, 37.0, 30.0, 31.0, 23.0, 25.0, 25.0, 25.0, 17.0, 11.0, 16.0, 11.0, 6.0, 10.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.257637023925781, -5.094078540802002, -4.930520057678223, -4.766962051391602, -4.603403568267822, -4.439845085144043, -4.276286602020264, -4.112728118896484, -3.949169635772705, -3.785611152648926, -3.6220529079437256, -3.4584944248199463, -3.294935941696167, -3.131377696990967, -2.9678192138671875, -2.804260730743408, -2.640702486038208, -2.4771440029144287, -2.3135857582092285, -2.150027275085449, -1.98646879196167, -1.8229104280471802, -1.6593520641326904, -1.4957935810089111, -1.3322352170944214, -1.1686768531799316, -1.0051183700561523, -0.8415600061416626, -0.6780015826225281, -0.5144431591033936, -0.3508847951889038, -0.1873263120651245, -0.023767948150634766, 0.13979046046733856, 0.3033488690853119, 0.466907262802124, 0.6304656863212585, 0.7940241098403931, 0.9575824737548828, 1.121140956878662, 1.2846993207931519, 1.4482576847076416, 1.611816167831421, 1.7753745317459106, 1.9389328956604004, 2.1024913787841797, 2.266049861907959, 2.4296083450317383, 2.5931665897369385, 2.7567250728607178, 2.920283317565918, 3.0838418006896973, 3.2474002838134766, 3.410958766937256, 3.574517011642456, 3.7380754947662354, 3.9016337394714355, 4.065192222595215, 4.228750705718994, 4.392309188842773, 4.5558671951293945, 4.719425678253174, 4.882984161376953, 5.046542644500732, 5.210101127624512]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 8.0, 8.0, 4.0, 13.0, 9.0, 15.0, 10.0, 19.0, 22.0, 16.0, 17.0, 28.0, 27.0, 27.0, 27.0, 30.0, 38.0, 32.0, 32.0, 37.0, 40.0, 50.0, 38.0, 37.0, 32.0, 49.0, 43.0, 30.0, 23.0, 22.0, 30.0, 21.0, 21.0, 16.0, 19.0, 17.0, 17.0, 9.0, 7.0, 11.0, 8.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.6455078125, -0.6255722045898438, -0.6056365966796875, -0.5857009887695312, -0.565765380859375, -0.5458297729492188, -0.5258941650390625, -0.5059585571289062, -0.48602294921875, -0.46608734130859375, -0.4461517333984375, -0.42621612548828125, -0.406280517578125, -0.38634490966796875, -0.3664093017578125, -0.34647369384765625, -0.3265380859375, -0.30660247802734375, -0.2866668701171875, -0.26673126220703125, -0.246795654296875, -0.22686004638671875, -0.2069244384765625, -0.18698883056640625, -0.16705322265625, -0.14711761474609375, -0.1271820068359375, -0.10724639892578125, -0.087310791015625, -0.06737518310546875, -0.0474395751953125, -0.02750396728515625, -0.007568359375, 0.01236724853515625, 0.0323028564453125, 0.05223846435546875, 0.072174072265625, 0.09210968017578125, 0.1120452880859375, 0.13198089599609375, 0.15191650390625, 0.17185211181640625, 0.1917877197265625, 0.21172332763671875, 0.231658935546875, 0.25159454345703125, 0.2715301513671875, 0.29146575927734375, 0.3114013671875, 0.33133697509765625, 0.3512725830078125, 0.37120819091796875, 0.391143798828125, 0.41107940673828125, 0.4310150146484375, 0.45095062255859375, 0.47088623046875, 0.49082183837890625, 0.5107574462890625, 0.5306930541992188, 0.550628662109375, 0.5705642700195312, 0.5904998779296875, 0.6104354858398438, 0.63037109375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 5.0, 13.0, 13.0, 15.0, 21.0, 34.0, 36.0, 59.0, 91.0, 121.0, 140.0, 199.0, 289.0, 331.0, 458.0, 713.0, 996.0, 1414.0, 2065.0, 3247.0, 5285.0, 9199.0, 17419.0, 39406.0, 111287.0, 420636.0, 1683053.0, 1393117.0, 337396.0, 94853.0, 34362.0, 15617.0, 8494.0, 4825.0, 2963.0, 1902.0, 1226.0, 861.0, 614.0, 427.0, 297.0, 211.0, 159.0, 110.0, 78.0, 72.0, 39.0, 32.0, 28.0, 17.0, 16.0, 12.0, 11.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.9914016723632812, -0.9603424072265625, -0.9292831420898438, -0.898223876953125, -0.8671646118164062, -0.8361053466796875, -0.8050460815429688, -0.77398681640625, -0.7429275512695312, -0.7118682861328125, -0.6808090209960938, -0.649749755859375, -0.6186904907226562, -0.5876312255859375, -0.5565719604492188, -0.5255126953125, -0.49445343017578125, -0.4633941650390625, -0.43233489990234375, -0.401275634765625, -0.37021636962890625, -0.3391571044921875, -0.30809783935546875, -0.27703857421875, -0.24597930908203125, -0.2149200439453125, -0.18386077880859375, -0.152801513671875, -0.12174224853515625, -0.0906829833984375, -0.05962371826171875, -0.028564453125, 0.00249481201171875, 0.0335540771484375, 0.06461334228515625, 0.095672607421875, 0.12673187255859375, 0.1577911376953125, 0.18885040283203125, 0.21990966796875, 0.25096893310546875, 0.2820281982421875, 0.31308746337890625, 0.344146728515625, 0.37520599365234375, 0.4062652587890625, 0.43732452392578125, 0.4683837890625, 0.49944305419921875, 0.5305023193359375, 0.5615615844726562, 0.592620849609375, 0.6236801147460938, 0.6547393798828125, 0.6857986450195312, 0.71685791015625, 0.7479171752929688, 0.7789764404296875, 0.8100357055664062, 0.841094970703125, 0.8721542358398438, 0.9032135009765625, 0.9342727661132812, 0.96533203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 6.0, 5.0, 4.0, 11.0, 7.0, 8.0, 14.0, 21.0, 30.0, 36.0, 52.0, 67.0, 93.0, 151.0, 249.0, 347.0, 556.0, 658.0, 584.0, 377.0, 269.0, 149.0, 111.0, 63.0, 56.0, 31.0, 33.0, 12.0, 22.0, 11.0, 8.0, 4.0, 13.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4825592041015625, -1.439727783203125, -1.3968963623046875, -1.35406494140625, -1.3112335205078125, -1.268402099609375, -1.2255706787109375, -1.1827392578125, -1.1399078369140625, -1.097076416015625, -1.0542449951171875, -1.01141357421875, -0.9685821533203125, -0.925750732421875, -0.8829193115234375, -0.840087890625, -0.7972564697265625, -0.754425048828125, -0.7115936279296875, -0.66876220703125, -0.6259307861328125, -0.583099365234375, -0.5402679443359375, -0.4974365234375, -0.4546051025390625, -0.411773681640625, -0.3689422607421875, -0.32611083984375, -0.2832794189453125, -0.240447998046875, -0.1976165771484375, -0.15478515625, -0.1119537353515625, -0.069122314453125, -0.0262908935546875, 0.01654052734375, 0.0593719482421875, 0.102203369140625, 0.1450347900390625, 0.1878662109375, 0.2306976318359375, 0.273529052734375, 0.3163604736328125, 0.35919189453125, 0.4020233154296875, 0.444854736328125, 0.4876861572265625, 0.530517578125, 0.5733489990234375, 0.616180419921875, 0.6590118408203125, 0.70184326171875, 0.7446746826171875, 0.787506103515625, 0.8303375244140625, 0.8731689453125, 0.9160003662109375, 0.958831787109375, 1.0016632080078125, 1.04449462890625, 1.0873260498046875, 1.130157470703125, 1.1729888916015625, 1.2158203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 13.0, 15.0, 18.0, 17.0, 30.0, 47.0, 59.0, 109.0, 264.0, 676.0, 2048.0, 6989.0, 32872.0, 417560.0, 3545342.0, 160922.0, 20043.0, 4728.0, 1483.0, 518.0, 208.0, 115.0, 64.0, 38.0, 27.0, 17.0, 11.0, 15.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.65667724609375, -3.5321044921875, -3.40753173828125, -3.282958984375, -3.15838623046875, -3.0338134765625, -2.90924072265625, -2.78466796875, -2.66009521484375, -2.5355224609375, -2.41094970703125, -2.286376953125, -2.16180419921875, -2.0372314453125, -1.91265869140625, -1.7880859375, -1.66351318359375, -1.5389404296875, -1.41436767578125, -1.289794921875, -1.16522216796875, -1.0406494140625, -0.91607666015625, -0.79150390625, -0.66693115234375, -0.5423583984375, -0.41778564453125, -0.293212890625, -0.16864013671875, -0.0440673828125, 0.08050537109375, 0.205078125, 0.32965087890625, 0.4542236328125, 0.57879638671875, 0.703369140625, 0.82794189453125, 0.9525146484375, 1.07708740234375, 1.20166015625, 1.32623291015625, 1.4508056640625, 1.57537841796875, 1.699951171875, 1.82452392578125, 1.9490966796875, 2.07366943359375, 2.1982421875, 2.32281494140625, 2.4473876953125, 2.57196044921875, 2.696533203125, 2.82110595703125, 2.9456787109375, 3.07025146484375, 3.19482421875, 3.31939697265625, 3.4439697265625, 3.56854248046875, 3.693115234375, 3.81768798828125, 3.9422607421875, 4.06683349609375, 4.19140625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 21.0, 33.0, 60.0, 61.0, 102.0, 119.0, 148.0, 144.0, 105.0, 73.0, 45.0, 32.0, 16.0, 15.0, 11.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.012527942657471, -6.792513370513916, -6.572498798370361, -6.352484226226807, -6.132469654083252, -5.912455081939697, -5.692440032958984, -5.47242546081543, -5.252410888671875, -5.03239631652832, -4.812381744384766, -4.592367172241211, -4.372352600097656, -4.152338027954102, -3.9323232173919678, -3.712308645248413, -3.4922943115234375, -3.272279739379883, -3.052265167236328, -2.8322505950927734, -2.6122360229492188, -2.392221450805664, -2.1722066402435303, -1.9521920680999756, -1.732177495956421, -1.5121629238128662, -1.2921483516693115, -1.0721336603164673, -0.8521190881729126, -0.6321045160293579, -0.41208982467651367, -0.19207525253295898, 0.0279388427734375, 0.24795344471931458, 0.46796804666519165, 0.6879826784133911, 0.9079972505569458, 1.1280118227005005, 1.3480265140533447, 1.5680410861968994, 1.788055658340454, 2.008070230484009, 2.2280848026275635, 2.4480996131896973, 2.668114185333252, 2.8881287574768066, 3.1081433296203613, 3.328157901763916, 3.5481724739074707, 3.7681870460510254, 3.98820161819458, 4.208216190338135, 4.4282307624816895, 4.648245334625244, 4.868260383605957, 5.088274955749512, 5.308289527893066, 5.528304100036621, 5.748318672180176, 5.9683332443237305, 6.188347816467285, 6.40836238861084, 6.6283769607543945, 6.848391532897949, 7.068406105041504]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 7.0, 4.0, 5.0, 11.0, 12.0, 7.0, 16.0, 13.0, 18.0, 23.0, 24.0, 24.0, 28.0, 23.0, 31.0, 33.0, 37.0, 42.0, 45.0, 36.0, 52.0, 33.0, 52.0, 39.0, 46.0, 43.0, 31.0, 32.0, 38.0, 29.0, 24.0, 18.0, 17.0, 13.0, 17.0, 14.0, 12.0, 12.0, 6.0, 7.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.694469451904297, -3.575237512588501, -3.456005811691284, -3.3367738723754883, -3.2175421714782715, -3.0983102321624756, -2.979078531265259, -2.859846591949463, -2.740614891052246, -2.62138295173645, -2.5021512508392334, -2.3829193115234375, -2.2636876106262207, -2.144455671310425, -2.025223970413208, -1.905992031097412, -1.7867602109909058, -1.6675283908843994, -1.548296570777893, -1.4290647506713867, -1.3098329305648804, -1.190601110458374, -1.0713691711425781, -0.9521374106407166, -0.8329055905342102, -0.7136737704277039, -0.5944419503211975, -0.4752101004123688, -0.3559782803058624, -0.2367464303970337, -0.11751461029052734, 0.001717209815979004, 0.12094902992248535, 0.2401808500289917, 0.35941267013549805, 0.4786445200443268, 0.5978763103485107, 0.7171081900596619, 0.8363400101661682, 0.9555718302726746, 1.0748035907745361, 1.1940354108810425, 1.3132672309875488, 1.4324990510940552, 1.5517308712005615, 1.6709628105163574, 1.7901945114135742, 1.9094264507293701, 2.028658390045166, 2.147890329360962, 2.2671220302581787, 2.3863539695739746, 2.5055856704711914, 2.6248176097869873, 2.744049310684204, 2.86328125, 2.982512950897217, 3.1017448902130127, 3.2209765911102295, 3.3402085304260254, 3.459440231323242, 3.578672170639038, 3.697903871536255, 3.817135810852051, 3.9363675117492676]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 4.0, 4.0, 11.0, 8.0, 11.0, 8.0, 19.0, 15.0, 11.0, 23.0, 22.0, 19.0, 22.0, 30.0, 25.0, 28.0, 33.0, 38.0, 36.0, 37.0, 44.0, 35.0, 38.0, 38.0, 46.0, 31.0, 42.0, 36.0, 38.0, 37.0, 27.0, 25.0, 19.0, 29.0, 13.0, 23.0, 9.0, 12.0, 14.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.70458984375, -0.6832656860351562, -0.6619415283203125, -0.6406173706054688, -0.619293212890625, -0.5979690551757812, -0.5766448974609375, -0.5553207397460938, -0.53399658203125, -0.5126724243164062, -0.4913482666015625, -0.47002410888671875, -0.448699951171875, -0.42737579345703125, -0.4060516357421875, -0.38472747802734375, -0.3634033203125, -0.34207916259765625, -0.3207550048828125, -0.29943084716796875, -0.278106689453125, -0.25678253173828125, -0.2354583740234375, -0.21413421630859375, -0.19281005859375, -0.17148590087890625, -0.1501617431640625, -0.12883758544921875, -0.107513427734375, -0.08618927001953125, -0.0648651123046875, -0.04354095458984375, -0.022216796875, -0.00089263916015625, 0.0204315185546875, 0.04175567626953125, 0.063079833984375, 0.08440399169921875, 0.1057281494140625, 0.12705230712890625, 0.14837646484375, 0.16970062255859375, 0.1910247802734375, 0.21234893798828125, 0.233673095703125, 0.25499725341796875, 0.2763214111328125, 0.29764556884765625, 0.3189697265625, 0.34029388427734375, 0.3616180419921875, 0.38294219970703125, 0.404266357421875, 0.42559051513671875, 0.4469146728515625, 0.46823883056640625, 0.48956298828125, 0.5108871459960938, 0.5322113037109375, 0.5535354614257812, 0.574859619140625, 0.5961837768554688, 0.6175079345703125, 0.6388320922851562, 0.66015625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 6.0, 11.0, 12.0, 13.0, 33.0, 37.0, 59.0, 83.0, 110.0, 150.0, 243.0, 302.0, 503.0, 708.0, 1139.0, 1529.0, 2395.0, 3724.0, 5732.0, 8755.0, 13695.0, 21522.0, 35152.0, 60037.0, 104330.0, 176630.0, 220309.0, 159373.0, 92009.0, 53032.0, 31835.0, 19546.0, 12473.0, 7820.0, 5090.0, 3282.0, 2215.0, 1466.0, 1023.0, 733.0, 467.0, 312.0, 232.0, 121.0, 83.0, 74.0, 45.0, 30.0, 31.0, 18.0, 11.0, 6.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06853008270263672, -0.06619834899902344, -0.06386661529541016, -0.061534881591796875, -0.059203147888183594, -0.05687141418457031, -0.05453968048095703, -0.05220794677734375, -0.04987621307373047, -0.04754447937011719, -0.045212745666503906, -0.042881011962890625, -0.040549278259277344, -0.03821754455566406, -0.03588581085205078, -0.0335540771484375, -0.03122234344482422, -0.028890609741210938, -0.026558876037597656, -0.024227142333984375, -0.021895408630371094, -0.019563674926757812, -0.01723194122314453, -0.01490020751953125, -0.012568473815917969, -0.010236740112304688, -0.007905006408691406, -0.005573272705078125, -0.0032415390014648438, -0.0009098052978515625, 0.0014219284057617188, 0.003753662109375, 0.006085395812988281, 0.008417129516601562, 0.010748863220214844, 0.013080596923828125, 0.015412330627441406, 0.017744064331054688, 0.02007579803466797, 0.02240753173828125, 0.02473926544189453, 0.027070999145507812, 0.029402732849121094, 0.031734466552734375, 0.034066200256347656, 0.03639793395996094, 0.03872966766357422, 0.0410614013671875, 0.04339313507080078, 0.04572486877441406, 0.048056602478027344, 0.050388336181640625, 0.052720069885253906, 0.05505180358886719, 0.05738353729248047, 0.05971527099609375, 0.06204700469970703, 0.06437873840332031, 0.0667104721069336, 0.06904220581054688, 0.07137393951416016, 0.07370567321777344, 0.07603740692138672, 0.078369140625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 5.0, 7.0, 7.0, 5.0, 7.0, 10.0, 20.0, 11.0, 12.0, 20.0, 24.0, 26.0, 21.0, 22.0, 32.0, 40.0, 42.0, 37.0, 41.0, 51.0, 1059.0, 42.0, 40.0, 31.0, 43.0, 38.0, 34.0, 31.0, 36.0, 27.0, 27.0, 15.0, 21.0, 20.0, 23.0, 20.0, 12.0, 13.0, 8.0, 8.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.59521484375, -0.5769882202148438, -0.5587615966796875, -0.5405349731445312, -0.522308349609375, -0.5040817260742188, -0.4858551025390625, -0.46762847900390625, -0.44940185546875, -0.43117523193359375, -0.4129486083984375, -0.39472198486328125, -0.376495361328125, -0.35826873779296875, -0.3400421142578125, -0.32181549072265625, -0.3035888671875, -0.28536224365234375, -0.2671356201171875, -0.24890899658203125, -0.230682373046875, -0.21245574951171875, -0.1942291259765625, -0.17600250244140625, -0.15777587890625, -0.13954925537109375, -0.1213226318359375, -0.10309600830078125, -0.084869384765625, -0.06664276123046875, -0.0484161376953125, -0.03018951416015625, -0.011962890625, 0.00626373291015625, 0.0244903564453125, 0.04271697998046875, 0.060943603515625, 0.07917022705078125, 0.0973968505859375, 0.11562347412109375, 0.13385009765625, 0.15207672119140625, 0.1703033447265625, 0.18852996826171875, 0.206756591796875, 0.22498321533203125, 0.2432098388671875, 0.26143646240234375, 0.2796630859375, 0.29788970947265625, 0.3161163330078125, 0.33434295654296875, 0.352569580078125, 0.37079620361328125, 0.3890228271484375, 0.40724945068359375, 0.42547607421875, 0.44370269775390625, 0.4619293212890625, 0.48015594482421875, 0.498382568359375, 0.5166091918945312, 0.5348358154296875, 0.5530624389648438, 0.5712890625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 12.0, 22.0, 18.0, 39.0, 52.0, 66.0, 105.0, 132.0, 191.0, 245.0, 361.0, 519.0, 782.0, 1140.0, 1666.0, 2504.0, 3897.0, 6220.0, 10717.0, 22191.0, 77269.0, 1760465.0, 146496.0, 28908.0, 12821.0, 7192.0, 4340.0, 2787.0, 1821.0, 1257.0, 848.0, 591.0, 427.0, 307.0, 188.0, 148.0, 110.0, 77.0, 56.0, 31.0, 25.0, 25.0, 13.0, 11.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.1627044677734375, -0.157562255859375, -0.1524200439453125, -0.14727783203125, -0.1421356201171875, -0.136993408203125, -0.1318511962890625, -0.126708984375, -0.1215667724609375, -0.116424560546875, -0.1112823486328125, -0.10614013671875, -0.1009979248046875, -0.095855712890625, -0.0907135009765625, -0.0855712890625, -0.0804290771484375, -0.075286865234375, -0.0701446533203125, -0.06500244140625, -0.0598602294921875, -0.054718017578125, -0.0495758056640625, -0.04443359375, -0.0392913818359375, -0.034149169921875, -0.0290069580078125, -0.02386474609375, -0.0187225341796875, -0.013580322265625, -0.0084381103515625, -0.0032958984375, 0.0018463134765625, 0.006988525390625, 0.0121307373046875, 0.01727294921875, 0.0224151611328125, 0.027557373046875, 0.0326995849609375, 0.037841796875, 0.0429840087890625, 0.048126220703125, 0.0532684326171875, 0.05841064453125, 0.0635528564453125, 0.068695068359375, 0.0738372802734375, 0.0789794921875, 0.0841217041015625, 0.089263916015625, 0.0944061279296875, 0.09954833984375, 0.1046905517578125, 0.109832763671875, 0.1149749755859375, 0.1201171875, 0.1252593994140625, 0.130401611328125, 0.1355438232421875, 0.14068603515625, 0.1458282470703125, 0.150970458984375, 0.1561126708984375, 0.1612548828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 15.0, 16.0, 15.0, 19.0, 20.0, 23.0, 32.0, 28.0, 36.0, 27.0, 40.0, 36.0, 51.0, 39.0, 46.0, 48.0, 51.0, 51.0, 41.0, 49.0, 43.0, 32.0, 33.0, 27.0, 22.0, 17.0, 16.0, 19.0, 10.0, 7.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00556182861328125, -0.005371749401092529, -0.005181670188903809, -0.004991590976715088, -0.004801511764526367, -0.0046114325523376465, -0.004421353340148926, -0.004231274127960205, -0.004041194915771484, -0.0038511157035827637, -0.003661036491394043, -0.0034709572792053223, -0.0032808780670166016, -0.003090798854827881, -0.00290071964263916, -0.0027106404304504395, -0.0025205612182617188, -0.002330482006072998, -0.0021404027938842773, -0.0019503235816955566, -0.001760244369506836, -0.0015701651573181152, -0.0013800859451293945, -0.0011900067329406738, -0.0009999275207519531, -0.0008098483085632324, -0.0006197690963745117, -0.000429689884185791, -0.0002396106719970703, -4.953145980834961e-05, 0.0001405477523803711, 0.0003306269645690918, 0.0005207061767578125, 0.0007107853889465332, 0.0009008646011352539, 0.0010909438133239746, 0.0012810230255126953, 0.001471102237701416, 0.0016611814498901367, 0.0018512606620788574, 0.002041339874267578, 0.002231419086456299, 0.0024214982986450195, 0.0026115775108337402, 0.002801656723022461, 0.0029917359352111816, 0.0031818151473999023, 0.003371894359588623, 0.0035619735717773438, 0.0037520527839660645, 0.003942131996154785, 0.004132211208343506, 0.0043222904205322266, 0.004512369632720947, 0.004702448844909668, 0.004892528057098389, 0.005082607269287109, 0.00527268648147583, 0.005462765693664551, 0.0056528449058532715, 0.005842924118041992, 0.006033003330230713, 0.006223082542419434, 0.006413161754608154, 0.006603240966796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 9.0, 8.0, 9.0, 12.0, 14.0, 13.0, 22.0, 28.0, 26.0, 38.0, 53.0, 63.0, 91.0, 137.0, 163.0, 268.0, 522.0, 2450.0, 833113.0, 208949.0, 1227.0, 435.0, 228.0, 142.0, 100.0, 88.0, 77.0, 49.0, 40.0, 34.0, 23.0, 25.0, 18.0, 16.0, 16.0, 5.0, 7.0, 5.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.13037109375, -0.1266326904296875, -0.122894287109375, -0.1191558837890625, -0.11541748046875, -0.1116790771484375, -0.107940673828125, -0.1042022705078125, -0.1004638671875, -0.0967254638671875, -0.092987060546875, -0.0892486572265625, -0.08551025390625, -0.0817718505859375, -0.078033447265625, -0.0742950439453125, -0.070556640625, -0.0668182373046875, -0.063079833984375, -0.0593414306640625, -0.05560302734375, -0.0518646240234375, -0.048126220703125, -0.0443878173828125, -0.0406494140625, -0.0369110107421875, -0.033172607421875, -0.0294342041015625, -0.02569580078125, -0.0219573974609375, -0.018218994140625, -0.0144805908203125, -0.0107421875, -0.0070037841796875, -0.003265380859375, 0.0004730224609375, 0.00421142578125, 0.0079498291015625, 0.011688232421875, 0.0154266357421875, 0.0191650390625, 0.0229034423828125, 0.026641845703125, 0.0303802490234375, 0.03411865234375, 0.0378570556640625, 0.041595458984375, 0.0453338623046875, 0.049072265625, 0.0528106689453125, 0.056549072265625, 0.0602874755859375, 0.06402587890625, 0.0677642822265625, 0.071502685546875, 0.0752410888671875, 0.0789794921875, 0.0827178955078125, 0.086456298828125, 0.0901947021484375, 0.09393310546875, 0.0976715087890625, 0.101409912109375, 0.1051483154296875, 0.10888671875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 44.0, 783.0, 178.0, 7.0, 1.0], "bins": [-0.18664827942848206, -0.18357637524604797, -0.1805044710636139, -0.177432581782341, -0.17436067759990692, -0.17128877341747284, -0.16821688413619995, -0.16514497995376587, -0.1620730757713318, -0.1590011715888977, -0.15592926740646362, -0.15285737812519073, -0.14978547394275665, -0.14671356976032257, -0.14364168047904968, -0.1405697762966156, -0.13749787211418152, -0.13442596793174744, -0.13135406374931335, -0.12828217446804047, -0.12521027028560638, -0.1221383661031723, -0.11906646937131882, -0.11599457263946533, -0.11292266845703125, -0.10985076427459717, -0.10677886754274368, -0.1037069708108902, -0.10063506662845612, -0.09756316244602203, -0.09449126571416855, -0.09141936898231506, -0.08834746479988098, -0.0852755606174469, -0.08220366388559341, -0.07913176715373993, -0.07605986297130585, -0.07298795878887177, -0.06991606205701828, -0.0668441653251648, -0.06377226114273071, -0.06070036068558693, -0.057628460228443146, -0.05455655977129936, -0.05148465931415558, -0.048412758857011795, -0.04534085839986801, -0.04226895794272423, -0.039197057485580444, -0.03612515702843666, -0.03305325657129288, -0.029981356114149094, -0.02690945565700531, -0.023837555199861526, -0.020765654742717743, -0.01769375428557396, -0.014621851965785027, -0.011549951508641243, -0.00847805105149746, -0.005406150594353676, -0.0023342501372098923, 0.0007376503199338913, 0.003809550777077675, 0.0068814512342214584, 0.009953351691365242]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 11.0, 18.0, 28.0, 17.0, 34.0, 29.0, 35.0, 32.0, 35.0, 41.0, 58.0, 45.0, 66.0, 50.0, 59.0, 38.0, 47.0, 56.0, 35.0, 39.0, 31.0, 23.0, 23.0, 31.0, 22.0, 17.0, 21.0, 10.0, 1.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.017871081829071045, -0.01736886240541935, -0.016866642981767654, -0.01636442355811596, -0.015862204134464264, -0.015359984710812569, -0.014857765287160873, -0.014355545863509178, -0.013853326439857483, -0.013351107016205788, -0.012848887592554092, -0.012346668168902397, -0.011844448745250702, -0.011342229321599007, -0.010840009897947311, -0.010337790474295616, -0.009835571050643921, -0.009333351626992226, -0.00883113220334053, -0.008328912779688835, -0.00782669335603714, -0.007324473932385445, -0.006822254508733749, -0.006320035085082054, -0.005817815661430359, -0.005315596237778664, -0.004813376814126968, -0.004311157390475273, -0.003808937966823578, -0.0033067185431718826, -0.0028044991195201874, -0.002302279695868492, -0.0018000602722167969, -0.0012978408485651016, -0.0007956214249134064, -0.0002934020012617111, 0.00020881742238998413, 0.0007110368460416794, 0.0012132562696933746, 0.0017154756933450699, 0.002217695116996765, 0.0027199145406484604, 0.0032221339643001556, 0.003724353387951851, 0.004226572811603546, 0.004728792235255241, 0.005231011658906937, 0.005733231082558632, 0.006235450506210327, 0.006737669929862022, 0.007239889353513718, 0.007742108777165413, 0.008244328200817108, 0.008746547624468803, 0.009248767048120499, 0.009750986471772194, 0.01025320589542389, 0.010755425319075584, 0.01125764474272728, 0.011759864166378975, 0.01226208359003067, 0.012764303013682365, 0.01326652243733406, 0.013768741860985756, 0.014270961284637451]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 5.0, 3.0, 12.0, 8.0, 11.0, 8.0, 17.0, 17.0, 10.0, 22.0, 22.0, 21.0, 22.0, 29.0, 24.0, 30.0, 32.0, 37.0, 38.0, 36.0, 43.0, 37.0, 37.0, 38.0, 47.0, 29.0, 43.0, 35.0, 40.0, 37.0, 27.0, 24.0, 20.0, 29.0, 12.0, 24.0, 9.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.70556640625, -0.684234619140625, -0.66290283203125, -0.641571044921875, -0.6202392578125, -0.598907470703125, -0.57757568359375, -0.556243896484375, -0.534912109375, -0.513580322265625, -0.49224853515625, -0.470916748046875, -0.4495849609375, -0.428253173828125, -0.40692138671875, -0.385589599609375, -0.3642578125, -0.342926025390625, -0.32159423828125, -0.300262451171875, -0.2789306640625, -0.257598876953125, -0.23626708984375, -0.214935302734375, -0.193603515625, -0.172271728515625, -0.15093994140625, -0.129608154296875, -0.1082763671875, -0.086944580078125, -0.06561279296875, -0.044281005859375, -0.02294921875, -0.001617431640625, 0.01971435546875, 0.041046142578125, 0.0623779296875, 0.083709716796875, 0.10504150390625, 0.126373291015625, 0.147705078125, 0.169036865234375, 0.19036865234375, 0.211700439453125, 0.2330322265625, 0.254364013671875, 0.27569580078125, 0.297027587890625, 0.318359375, 0.339691162109375, 0.36102294921875, 0.382354736328125, 0.4036865234375, 0.425018310546875, 0.44635009765625, 0.467681884765625, 0.489013671875, 0.510345458984375, 0.53167724609375, 0.553009033203125, 0.5743408203125, 0.595672607421875, 0.61700439453125, 0.638336181640625, 0.65966796875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 13.0, 11.0, 35.0, 45.0, 47.0, 56.0, 101.0, 169.0, 257.0, 410.0, 697.0, 1091.0, 2029.0, 3589.0, 6749.0, 13582.0, 30912.0, 89931.0, 312904.0, 393775.0, 118908.0, 39300.0, 16404.0, 7803.0, 4092.0, 2253.0, 1309.0, 751.0, 492.0, 276.0, 179.0, 112.0, 74.0, 58.0, 45.0, 22.0, 17.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.375, -1.335845947265625, -1.29669189453125, -1.257537841796875, -1.2183837890625, -1.179229736328125, -1.14007568359375, -1.100921630859375, -1.061767578125, -1.022613525390625, -0.98345947265625, -0.944305419921875, -0.9051513671875, -0.865997314453125, -0.82684326171875, -0.787689208984375, -0.74853515625, -0.709381103515625, -0.67022705078125, -0.631072998046875, -0.5919189453125, -0.552764892578125, -0.51361083984375, -0.474456787109375, -0.435302734375, -0.396148681640625, -0.35699462890625, -0.317840576171875, -0.2786865234375, -0.239532470703125, -0.20037841796875, -0.161224365234375, -0.1220703125, -0.082916259765625, -0.04376220703125, -0.004608154296875, 0.0345458984375, 0.073699951171875, 0.11285400390625, 0.152008056640625, 0.191162109375, 0.230316162109375, 0.26947021484375, 0.308624267578125, 0.3477783203125, 0.386932373046875, 0.42608642578125, 0.465240478515625, 0.50439453125, 0.543548583984375, 0.58270263671875, 0.621856689453125, 0.6610107421875, 0.700164794921875, 0.73931884765625, 0.778472900390625, 0.817626953125, 0.856781005859375, 0.89593505859375, 0.935089111328125, 0.9742431640625, 1.013397216796875, 1.05255126953125, 1.091705322265625, 1.130859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 3.0, 9.0, 7.0, 9.0, 12.0, 15.0, 18.0, 22.0, 21.0, 14.0, 22.0, 22.0, 23.0, 27.0, 23.0, 39.0, 39.0, 48.0, 62.0, 98.0, 194.0, 1404.0, 292.0, 148.0, 68.0, 45.0, 49.0, 40.0, 36.0, 34.0, 20.0, 27.0, 27.0, 15.0, 17.0, 16.0, 16.0, 3.0, 6.0, 15.0, 6.0, 7.0, 7.0, 4.0, 8.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.986328125, -1.9275665283203125, -1.868804931640625, -1.8100433349609375, -1.75128173828125, -1.6925201416015625, -1.633758544921875, -1.5749969482421875, -1.5162353515625, -1.4574737548828125, -1.398712158203125, -1.3399505615234375, -1.28118896484375, -1.2224273681640625, -1.163665771484375, -1.1049041748046875, -1.046142578125, -0.9873809814453125, -0.928619384765625, -0.8698577880859375, -0.81109619140625, -0.7523345947265625, -0.693572998046875, -0.6348114013671875, -0.5760498046875, -0.5172882080078125, -0.458526611328125, -0.3997650146484375, -0.34100341796875, -0.2822418212890625, -0.223480224609375, -0.1647186279296875, -0.10595703125, -0.0471954345703125, 0.011566162109375, 0.0703277587890625, 0.12908935546875, 0.1878509521484375, 0.246612548828125, 0.3053741455078125, 0.3641357421875, 0.4228973388671875, 0.481658935546875, 0.5404205322265625, 0.59918212890625, 0.6579437255859375, 0.716705322265625, 0.7754669189453125, 0.834228515625, 0.8929901123046875, 0.951751708984375, 1.0105133056640625, 1.06927490234375, 1.1280364990234375, 1.186798095703125, 1.2455596923828125, 1.3043212890625, 1.3630828857421875, 1.421844482421875, 1.4806060791015625, 1.53936767578125, 1.5981292724609375, 1.656890869140625, 1.7156524658203125, 1.7744140625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 5.0, 6.0, 13.0, 20.0, 13.0, 28.0, 34.0, 55.0, 80.0, 107.0, 160.0, 245.0, 530.0, 1238.0, 3125.0, 10350.0, 46917.0, 689091.0, 2262604.0, 105185.0, 17565.0, 4905.0, 1710.0, 699.0, 381.0, 224.0, 135.0, 69.0, 52.0, 35.0, 31.0, 19.0, 14.0, 11.0, 6.0, 9.0, 3.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.302642822265625, -2.22637939453125, -2.150115966796875, -2.0738525390625, -1.997589111328125, -1.92132568359375, -1.845062255859375, -1.768798828125, -1.692535400390625, -1.61627197265625, -1.540008544921875, -1.4637451171875, -1.387481689453125, -1.31121826171875, -1.234954833984375, -1.15869140625, -1.082427978515625, -1.00616455078125, -0.929901123046875, -0.8536376953125, -0.777374267578125, -0.70111083984375, -0.624847412109375, -0.548583984375, -0.472320556640625, -0.39605712890625, -0.319793701171875, -0.2435302734375, -0.167266845703125, -0.09100341796875, -0.014739990234375, 0.0615234375, 0.137786865234375, 0.21405029296875, 0.290313720703125, 0.3665771484375, 0.442840576171875, 0.51910400390625, 0.595367431640625, 0.671630859375, 0.747894287109375, 0.82415771484375, 0.900421142578125, 0.9766845703125, 1.052947998046875, 1.12921142578125, 1.205474853515625, 1.28173828125, 1.358001708984375, 1.43426513671875, 1.510528564453125, 1.5867919921875, 1.663055419921875, 1.73931884765625, 1.815582275390625, 1.891845703125, 1.968109130859375, 2.04437255859375, 2.120635986328125, 2.1968994140625, 2.273162841796875, 2.34942626953125, 2.425689697265625, 2.501953125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [34.0, 546.0, 411.0, 28.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5845626592636108, -0.7517861127853394, 0.08099043369293213, 0.9137669801712036, 1.746543526649475, 2.579319953918457, 3.4120965003967285, 4.244873046875, 5.0776495933532715, 5.910426139831543, 6.7432026863098145, 7.575979232788086, 8.408756256103516, 9.241532325744629, 10.074308395385742, 10.907085418701172, 11.739862442016602, 12.572639465332031, 13.405415534973145, 14.238191604614258, 15.070968627929688, 15.903745651245117, 16.736522674560547, 17.569297790527344, 18.402074813842773, 19.234851837158203, 20.067626953125, 20.90040397644043, 21.73318099975586, 22.56595802307129, 23.39873504638672, 24.231510162353516, 25.064285278320312, 25.897062301635742, 26.729839324951172, 27.56261444091797, 28.3953914642334, 29.228168487548828, 30.060943603515625, 30.893720626831055, 31.726497650146484, 32.55927276611328, 33.392051696777344, 34.22482681274414, 35.05760192871094, 35.890380859375, 36.7231559753418, 37.55593490600586, 38.388710021972656, 39.22148513793945, 40.054264068603516, 40.88703918457031, 41.719818115234375, 42.55259323120117, 43.38536834716797, 44.21814727783203, 45.05092239379883, 45.883697509765625, 46.71647644042969, 47.549251556396484, 48.38202667236328, 49.214805603027344, 50.04758071899414, 50.8803596496582, 51.713134765625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 3.0, 3.0, 5.0, 6.0, 12.0, 4.0, 19.0, 8.0, 17.0, 21.0, 24.0, 16.0, 17.0, 17.0, 26.0, 30.0, 23.0, 25.0, 30.0, 37.0, 36.0, 35.0, 39.0, 33.0, 37.0, 36.0, 37.0, 36.0, 40.0, 25.0, 35.0, 35.0, 32.0, 28.0, 23.0, 21.0, 16.0, 18.0, 19.0, 17.0, 16.0, 7.0, 5.0, 7.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.2147932052612305, -4.082930564880371, -3.9510679244995117, -3.8192055225372314, -3.687342882156372, -3.5554802417755127, -3.4236178398132324, -3.291755199432373, -3.1598925590515137, -3.0280299186706543, -2.896167278289795, -2.7643048763275146, -2.6324422359466553, -2.500579595565796, -2.3687171936035156, -2.2368545532226562, -2.104991912841797, -1.9731292724609375, -1.8412667512893677, -1.7094042301177979, -1.5775415897369385, -1.445678949356079, -1.3138164281845093, -1.1819539070129395, -1.05009126663208, -0.9182286858558655, -0.7863661050796509, -0.6545035243034363, -0.5226409435272217, -0.3907783627510071, -0.2589157819747925, -0.12705320119857788, 0.004809379577636719, 0.13667196035385132, 0.2685345411300659, 0.4003971219062805, 0.5322597026824951, 0.6641222834587097, 0.7959848642349243, 0.9278474450111389, 1.0597100257873535, 1.191572666168213, 1.3234351873397827, 1.4552977085113525, 1.587160348892212, 1.7190229892730713, 1.8508855104446411, 1.982748031616211, 2.1146106719970703, 2.2464733123779297, 2.378335952758789, 2.5101983547210693, 2.6420609951019287, 2.773923635482788, 2.9057860374450684, 3.0376486778259277, 3.169511318206787, 3.3013739585876465, 3.433236598968506, 3.565099000930786, 3.6969616413116455, 3.828824281692505, 3.960686683654785, 4.0925493240356445, 4.224411964416504]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 5.0, 13.0, 13.0, 21.0, 18.0, 23.0, 30.0, 22.0, 29.0, 23.0, 33.0, 39.0, 27.0, 37.0, 42.0, 43.0, 30.0, 42.0, 39.0, 54.0, 45.0, 46.0, 34.0, 28.0, 35.0, 36.0, 33.0, 23.0, 15.0, 20.0, 19.0, 14.0, 12.0, 5.0, 9.0, 7.0, 8.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7333984375, -0.70989990234375, -0.6864013671875, -0.66290283203125, -0.639404296875, -0.61590576171875, -0.5924072265625, -0.56890869140625, -0.54541015625, -0.52191162109375, -0.4984130859375, -0.47491455078125, -0.451416015625, -0.42791748046875, -0.4044189453125, -0.38092041015625, -0.357421875, -0.33392333984375, -0.3104248046875, -0.28692626953125, -0.263427734375, -0.23992919921875, -0.2164306640625, -0.19293212890625, -0.16943359375, -0.14593505859375, -0.1224365234375, -0.09893798828125, -0.075439453125, -0.05194091796875, -0.0284423828125, -0.00494384765625, 0.0185546875, 0.04205322265625, 0.0655517578125, 0.08905029296875, 0.112548828125, 0.13604736328125, 0.1595458984375, 0.18304443359375, 0.20654296875, 0.23004150390625, 0.2535400390625, 0.27703857421875, 0.300537109375, 0.32403564453125, 0.3475341796875, 0.37103271484375, 0.39453125, 0.41802978515625, 0.4415283203125, 0.46502685546875, 0.488525390625, 0.51202392578125, 0.5355224609375, 0.55902099609375, 0.58251953125, 0.60601806640625, 0.6295166015625, 0.65301513671875, 0.676513671875, 0.70001220703125, 0.7235107421875, 0.74700927734375, 0.7705078125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 2.0, 10.0, 9.0, 19.0, 21.0, 29.0, 42.0, 60.0, 86.0, 102.0, 148.0, 206.0, 305.0, 438.0, 664.0, 951.0, 1430.0, 2254.0, 3372.0, 5836.0, 10758.0, 22971.0, 62206.0, 245335.0, 1305299.0, 1963226.0, 412446.0, 93412.0, 30818.0, 13380.0, 7207.0, 4013.0, 2510.0, 1534.0, 1049.0, 711.0, 422.0, 314.0, 222.0, 122.0, 89.0, 81.0, 56.0, 28.0, 29.0, 16.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.095703125, -1.0616302490234375, -1.027557373046875, -0.9934844970703125, -0.95941162109375, -0.9253387451171875, -0.891265869140625, -0.8571929931640625, -0.8231201171875, -0.7890472412109375, -0.754974365234375, -0.7209014892578125, -0.68682861328125, -0.6527557373046875, -0.618682861328125, -0.5846099853515625, -0.550537109375, -0.5164642333984375, -0.482391357421875, -0.4483184814453125, -0.41424560546875, -0.3801727294921875, -0.346099853515625, -0.3120269775390625, -0.2779541015625, -0.2438812255859375, -0.209808349609375, -0.1757354736328125, -0.14166259765625, -0.1075897216796875, -0.073516845703125, -0.0394439697265625, -0.00537109375, 0.0287017822265625, 0.062774658203125, 0.0968475341796875, 0.13092041015625, 0.1649932861328125, 0.199066162109375, 0.2331390380859375, 0.2672119140625, 0.3012847900390625, 0.335357666015625, 0.3694305419921875, 0.40350341796875, 0.4375762939453125, 0.471649169921875, 0.5057220458984375, 0.539794921875, 0.5738677978515625, 0.607940673828125, 0.6420135498046875, 0.67608642578125, 0.7101593017578125, 0.744232177734375, 0.7783050537109375, 0.8123779296875, 0.8464508056640625, 0.880523681640625, 0.9145965576171875, 0.94866943359375, 0.9827423095703125, 1.016815185546875, 1.0508880615234375, 1.0849609375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 9.0, 11.0, 13.0, 24.0, 31.0, 64.0, 96.0, 183.0, 270.0, 651.0, 1082.0, 759.0, 391.0, 181.0, 87.0, 75.0, 47.0, 29.0, 18.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.478515625, -1.41845703125, -1.3583984375, -1.29833984375, -1.23828125, -1.17822265625, -1.1181640625, -1.05810546875, -0.998046875, -0.93798828125, -0.8779296875, -0.81787109375, -0.7578125, -0.69775390625, -0.6376953125, -0.57763671875, -0.517578125, -0.45751953125, -0.3974609375, -0.33740234375, -0.27734375, -0.21728515625, -0.1572265625, -0.09716796875, -0.037109375, 0.02294921875, 0.0830078125, 0.14306640625, 0.203125, 0.26318359375, 0.3232421875, 0.38330078125, 0.443359375, 0.50341796875, 0.5634765625, 0.62353515625, 0.68359375, 0.74365234375, 0.8037109375, 0.86376953125, 0.923828125, 0.98388671875, 1.0439453125, 1.10400390625, 1.1640625, 1.22412109375, 1.2841796875, 1.34423828125, 1.404296875, 1.46435546875, 1.5244140625, 1.58447265625, 1.64453125, 1.70458984375, 1.7646484375, 1.82470703125, 1.884765625, 1.94482421875, 2.0048828125, 2.06494140625, 2.125, 2.18505859375, 2.2451171875, 2.30517578125, 2.365234375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 17.0, 24.0, 29.0, 63.0, 98.0, 188.0, 372.0, 849.0, 2276.0, 7559.0, 37990.0, 608809.0, 3405818.0, 108748.0, 15085.0, 3828.0, 1383.0, 564.0, 247.0, 133.0, 77.0, 45.0, 30.0, 9.0, 16.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.901763916015625, -2.78204345703125, -2.662322998046875, -2.5426025390625, -2.422882080078125, -2.30316162109375, -2.183441162109375, -2.063720703125, -1.944000244140625, -1.82427978515625, -1.704559326171875, -1.5848388671875, -1.465118408203125, -1.34539794921875, -1.225677490234375, -1.10595703125, -0.986236572265625, -0.86651611328125, -0.746795654296875, -0.6270751953125, -0.507354736328125, -0.38763427734375, -0.267913818359375, -0.148193359375, -0.028472900390625, 0.09124755859375, 0.210968017578125, 0.3306884765625, 0.450408935546875, 0.57012939453125, 0.689849853515625, 0.8095703125, 0.929290771484375, 1.04901123046875, 1.168731689453125, 1.2884521484375, 1.408172607421875, 1.52789306640625, 1.647613525390625, 1.767333984375, 1.887054443359375, 2.00677490234375, 2.126495361328125, 2.2462158203125, 2.365936279296875, 2.48565673828125, 2.605377197265625, 2.72509765625, 2.844818115234375, 2.96453857421875, 3.084259033203125, 3.2039794921875, 3.323699951171875, 3.44342041015625, 3.563140869140625, 3.682861328125, 3.802581787109375, 3.92230224609375, 4.042022705078125, 4.1617431640625, 4.281463623046875, 4.40118408203125, 4.520904541015625, 4.640625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 31.0, 93.0, 196.0, 285.0, 241.0, 105.0, 31.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-24.625186920166016, -24.173757553100586, -23.722328186035156, -23.27090072631836, -22.81947135925293, -22.3680419921875, -21.91661262512207, -21.46518325805664, -21.01375389099121, -20.56232452392578, -20.11089515686035, -19.659465789794922, -19.208038330078125, -18.756608963012695, -18.305179595947266, -17.853750228881836, -17.402320861816406, -16.950891494750977, -16.499462127685547, -16.04803466796875, -15.596604347229004, -15.14517593383789, -14.693746566772461, -14.242317199707031, -13.790889739990234, -13.339460372924805, -12.888031959533691, -12.436602592468262, -11.985173225402832, -11.533744812011719, -11.082315444946289, -10.63088607788086, -10.179455757141113, -9.728026390075684, -9.27659797668457, -8.82516860961914, -8.373739242553711, -7.9223103523254395, -7.470881462097168, -7.019452095031738, -6.568023204803467, -6.116594314575195, -5.665164947509766, -5.213736057281494, -4.762307167053223, -4.310877799987793, -3.8594489097595215, -3.408019781112671, -2.9565906524658203, -2.5051615238189697, -2.053732395172119, -1.6023035049438477, -1.150874376296997, -0.6994452476501465, -0.248016357421875, 0.20341277122497559, 0.6548418998718262, 1.1062710285186768, 1.5577000379562378, 2.009129047393799, 2.4605581760406494, 2.9119873046875, 3.3634161949157715, 3.814845323562622, 4.266274452209473]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 10.0, 12.0, 9.0, 13.0, 13.0, 20.0, 19.0, 16.0, 25.0, 30.0, 29.0, 19.0, 27.0, 32.0, 38.0, 43.0, 49.0, 42.0, 39.0, 41.0, 41.0, 38.0, 36.0, 41.0, 36.0, 38.0, 23.0, 20.0, 26.0, 29.0, 18.0, 19.0, 15.0, 11.0, 18.0, 17.0, 10.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.710777997970581, -3.586059331893921, -3.4613404273986816, -3.3366217613220215, -3.2119030952453613, -3.087184429168701, -2.962465524673462, -2.8377468585968018, -2.7130279541015625, -2.5883092880249023, -2.463590383529663, -2.338871717453003, -2.2141530513763428, -2.0894341468811035, -1.9647154808044434, -1.8399968147277832, -1.715278148651123, -1.5905593633651733, -1.4658406972885132, -1.3411219120025635, -1.2164032459259033, -1.0916844606399536, -0.9669656753540039, -0.842246949672699, -0.717528223991394, -0.5928094983100891, -0.4680907428264618, -0.3433719873428345, -0.21865326166152954, -0.09393453598022461, 0.030784249305725098, 0.15550297498703003, 0.28022193908691406, 0.404940664768219, 0.5296593904495239, 0.6543781757354736, 0.7790969014167786, 0.9038156270980835, 1.0285344123840332, 1.1532530784606934, 1.277971863746643, 1.4026906490325928, 1.527409315109253, 1.6521281003952026, 1.7768468856811523, 1.9015655517578125, 2.0262842178344727, 2.151003122329712, 2.275721788406372, 2.4004404544830322, 2.5251593589782715, 2.6498780250549316, 2.774596691131592, 2.899315357208252, 3.024034261703491, 3.1487529277801514, 3.2734718322753906, 3.398190498352051, 3.52290940284729, 3.64762806892395, 3.7723467350006104, 3.8970656394958496, 4.02178430557251, 4.14650297164917, 4.27122163772583]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 6.0, 16.0, 8.0, 16.0, 11.0, 19.0, 16.0, 19.0, 26.0, 26.0, 35.0, 40.0, 32.0, 39.0, 50.0, 45.0, 38.0, 42.0, 36.0, 36.0, 45.0, 49.0, 39.0, 38.0, 36.0, 24.0, 30.0, 27.0, 27.0, 19.0, 23.0, 16.0, 11.0, 8.0, 11.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.73095703125, -0.7067031860351562, -0.6824493408203125, -0.6581954956054688, -0.633941650390625, -0.6096878051757812, -0.5854339599609375, -0.5611801147460938, -0.53692626953125, -0.5126724243164062, -0.4884185791015625, -0.46416473388671875, -0.439910888671875, -0.41565704345703125, -0.3914031982421875, -0.36714935302734375, -0.3428955078125, -0.31864166259765625, -0.2943878173828125, -0.27013397216796875, -0.245880126953125, -0.22162628173828125, -0.1973724365234375, -0.17311859130859375, -0.14886474609375, -0.12461090087890625, -0.1003570556640625, -0.07610321044921875, -0.051849365234375, -0.02759552001953125, -0.0033416748046875, 0.02091217041015625, 0.045166015625, 0.06941986083984375, 0.0936737060546875, 0.11792755126953125, 0.142181396484375, 0.16643524169921875, 0.1906890869140625, 0.21494293212890625, 0.23919677734375, 0.26345062255859375, 0.2877044677734375, 0.31195831298828125, 0.336212158203125, 0.36046600341796875, 0.3847198486328125, 0.40897369384765625, 0.4332275390625, 0.45748138427734375, 0.4817352294921875, 0.5059890747070312, 0.530242919921875, 0.5544967651367188, 0.5787506103515625, 0.6030044555664062, 0.62725830078125, 0.6515121459960938, 0.6757659912109375, 0.7000198364257812, 0.724273681640625, 0.7485275268554688, 0.7727813720703125, 0.7970352172851562, 0.8212890625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 15.0, 25.0, 18.0, 29.0, 51.0, 77.0, 130.0, 174.0, 257.0, 384.0, 637.0, 979.0, 1451.0, 2339.0, 3463.0, 5492.0, 8953.0, 14559.0, 23997.0, 42197.0, 77167.0, 146128.0, 245097.0, 211424.0, 115339.0, 61610.0, 34071.0, 19802.0, 11875.0, 7436.0, 4872.0, 2957.0, 1938.0, 1259.0, 774.0, 509.0, 358.0, 237.0, 144.0, 117.0, 76.0, 40.0, 48.0, 22.0, 10.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08807373046875, -0.08521556854248047, -0.08235740661621094, -0.0794992446899414, -0.07664108276367188, -0.07378292083740234, -0.07092475891113281, -0.06806659698486328, -0.06520843505859375, -0.06235027313232422, -0.05949211120605469, -0.056633949279785156, -0.053775787353515625, -0.050917625427246094, -0.04805946350097656, -0.04520130157470703, -0.0423431396484375, -0.03948497772216797, -0.03662681579589844, -0.033768653869628906, -0.030910491943359375, -0.028052330017089844, -0.025194168090820312, -0.02233600616455078, -0.01947784423828125, -0.01661968231201172, -0.013761520385742188, -0.010903358459472656, -0.008045196533203125, -0.005187034606933594, -0.0023288726806640625, 0.0005292892456054688, 0.003387451171875, 0.006245613098144531, 0.009103775024414062, 0.011961936950683594, 0.014820098876953125, 0.017678260803222656, 0.020536422729492188, 0.02339458465576172, 0.02625274658203125, 0.02911090850830078, 0.03196907043457031, 0.034827232360839844, 0.037685394287109375, 0.040543556213378906, 0.04340171813964844, 0.04625988006591797, 0.0491180419921875, 0.05197620391845703, 0.05483436584472656, 0.057692527770996094, 0.060550689697265625, 0.06340885162353516, 0.06626701354980469, 0.06912517547607422, 0.07198333740234375, 0.07484149932861328, 0.07769966125488281, 0.08055782318115234, 0.08341598510742188, 0.0862741470336914, 0.08913230895996094, 0.09199047088623047, 0.0948486328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 10.0, 12.0, 18.0, 10.0, 19.0, 25.0, 17.0, 22.0, 29.0, 25.0, 30.0, 24.0, 34.0, 31.0, 41.0, 34.0, 39.0, 1070.0, 37.0, 46.0, 36.0, 35.0, 40.0, 47.0, 29.0, 29.0, 28.0, 21.0, 22.0, 14.0, 16.0, 26.0, 10.0, 14.0, 8.0, 11.0, 6.0, 4.0, 9.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.59228515625, -0.5735855102539062, -0.5548858642578125, -0.5361862182617188, -0.517486572265625, -0.49878692626953125, -0.4800872802734375, -0.46138763427734375, -0.44268798828125, -0.42398834228515625, -0.4052886962890625, -0.38658905029296875, -0.367889404296875, -0.34918975830078125, -0.3304901123046875, -0.31179046630859375, -0.2930908203125, -0.27439117431640625, -0.2556915283203125, -0.23699188232421875, -0.218292236328125, -0.19959259033203125, -0.1808929443359375, -0.16219329833984375, -0.14349365234375, -0.12479400634765625, -0.1060943603515625, -0.08739471435546875, -0.068695068359375, -0.04999542236328125, -0.0312957763671875, -0.01259613037109375, 0.006103515625, 0.02480316162109375, 0.0435028076171875, 0.06220245361328125, 0.080902099609375, 0.09960174560546875, 0.1183013916015625, 0.13700103759765625, 0.15570068359375, 0.17440032958984375, 0.1930999755859375, 0.21179962158203125, 0.230499267578125, 0.24919891357421875, 0.2678985595703125, 0.28659820556640625, 0.3052978515625, 0.32399749755859375, 0.3426971435546875, 0.36139678955078125, 0.380096435546875, 0.39879608154296875, 0.4174957275390625, 0.43619537353515625, 0.45489501953125, 0.47359466552734375, 0.4922943115234375, 0.5109939575195312, 0.529693603515625, 0.5483932495117188, 0.5670928955078125, 0.5857925415039062, 0.6044921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 10.0, 9.0, 19.0, 18.0, 38.0, 49.0, 69.0, 94.0, 155.0, 180.0, 297.0, 369.0, 566.0, 852.0, 1247.0, 1931.0, 2834.0, 4410.0, 7455.0, 13670.0, 31853.0, 189961.0, 1726658.0, 67022.0, 20621.0, 10172.0, 5853.0, 3551.0, 2325.0, 1493.0, 1047.0, 691.0, 476.0, 345.0, 224.0, 174.0, 124.0, 79.0, 60.0, 32.0, 24.0, 22.0, 15.0, 13.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.184326171875, -0.17894744873046875, -0.1735687255859375, -0.16819000244140625, -0.162811279296875, -0.15743255615234375, -0.1520538330078125, -0.14667510986328125, -0.14129638671875, -0.13591766357421875, -0.1305389404296875, -0.12516021728515625, -0.119781494140625, -0.11440277099609375, -0.1090240478515625, -0.10364532470703125, -0.0982666015625, -0.09288787841796875, -0.0875091552734375, -0.08213043212890625, -0.076751708984375, -0.07137298583984375, -0.0659942626953125, -0.06061553955078125, -0.05523681640625, -0.04985809326171875, -0.0444793701171875, -0.03910064697265625, -0.033721923828125, -0.02834320068359375, -0.0229644775390625, -0.01758575439453125, -0.01220703125, -0.00682830810546875, -0.0014495849609375, 0.00392913818359375, 0.009307861328125, 0.01468658447265625, 0.0200653076171875, 0.02544403076171875, 0.03082275390625, 0.03620147705078125, 0.0415802001953125, 0.04695892333984375, 0.052337646484375, 0.05771636962890625, 0.0630950927734375, 0.06847381591796875, 0.0738525390625, 0.07923126220703125, 0.0846099853515625, 0.08998870849609375, 0.095367431640625, 0.10074615478515625, 0.1061248779296875, 0.11150360107421875, 0.11688232421875, 0.12226104736328125, 0.1276397705078125, 0.13301849365234375, 0.138397216796875, 0.14377593994140625, 0.1491546630859375, 0.15453338623046875, 0.159912109375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 4.0, 13.0, 10.0, 11.0, 13.0, 11.0, 20.0, 18.0, 25.0, 29.0, 22.0, 27.0, 33.0, 37.0, 34.0, 41.0, 37.0, 41.0, 48.0, 39.0, 43.0, 41.0, 39.0, 37.0, 32.0, 33.0, 32.0, 23.0, 32.0, 24.0, 23.0, 17.0, 13.0, 12.0, 10.0, 9.0, 16.0, 2.0, 8.0, 11.0, 2.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.005939483642578125, -0.005738317966461182, -0.005537152290344238, -0.005335986614227295, -0.0051348209381103516, -0.004933655261993408, -0.004732489585876465, -0.0045313239097595215, -0.004330158233642578, -0.004128992557525635, -0.003927826881408691, -0.003726661205291748, -0.0035254955291748047, -0.0033243298530578613, -0.003123164176940918, -0.0029219985008239746, -0.0027208328247070312, -0.002519667148590088, -0.0023185014724731445, -0.002117335796356201, -0.0019161701202392578, -0.0017150044441223145, -0.001513838768005371, -0.0013126730918884277, -0.0011115074157714844, -0.000910341739654541, -0.0007091760635375977, -0.0005080103874206543, -0.00030684471130371094, -0.00010567903518676758, 9.548664093017578e-05, 0.00029665231704711914, 0.0004978179931640625, 0.0006989836692810059, 0.0009001493453979492, 0.0011013150215148926, 0.001302480697631836, 0.0015036463737487793, 0.0017048120498657227, 0.001905977725982666, 0.0021071434020996094, 0.0023083090782165527, 0.002509474754333496, 0.0027106404304504395, 0.002911806106567383, 0.003112971782684326, 0.0033141374588012695, 0.003515303134918213, 0.0037164688110351562, 0.0039176344871521, 0.004118800163269043, 0.004319965839385986, 0.00452113151550293, 0.004722297191619873, 0.004923462867736816, 0.00512462854385376, 0.005325794219970703, 0.0055269598960876465, 0.00572812557220459, 0.005929291248321533, 0.0061304569244384766, 0.00633162260055542, 0.006532788276672363, 0.006733953952789307, 0.00693511962890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 9.0, 5.0, 6.0, 11.0, 13.0, 12.0, 11.0, 25.0, 16.0, 26.0, 43.0, 46.0, 57.0, 58.0, 86.0, 98.0, 140.0, 217.0, 333.0, 771.0, 9816.0, 982368.0, 51798.0, 1134.0, 450.0, 245.0, 156.0, 114.0, 82.0, 77.0, 60.0, 51.0, 38.0, 33.0, 31.0, 25.0, 11.0, 14.0, 12.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.1275634765625, -0.1236572265625, -0.1197509765625, -0.1158447265625, -0.1119384765625, -0.1080322265625, -0.1041259765625, -0.1002197265625, -0.0963134765625, -0.0924072265625, -0.0885009765625, -0.0845947265625, -0.0806884765625, -0.0767822265625, -0.0728759765625, -0.0689697265625, -0.0650634765625, -0.0611572265625, -0.0572509765625, -0.0533447265625, -0.0494384765625, -0.0455322265625, -0.0416259765625, -0.0377197265625, -0.0338134765625, -0.0299072265625, -0.0260009765625, -0.0220947265625, -0.0181884765625, -0.0142822265625, -0.0103759765625, -0.0064697265625, -0.0025634765625, 0.0013427734375, 0.0052490234375, 0.0091552734375, 0.0130615234375, 0.0169677734375, 0.0208740234375, 0.0247802734375, 0.0286865234375, 0.0325927734375, 0.0364990234375, 0.0404052734375, 0.0443115234375, 0.0482177734375, 0.0521240234375, 0.0560302734375, 0.0599365234375, 0.0638427734375, 0.0677490234375, 0.0716552734375, 0.0755615234375, 0.0794677734375, 0.0833740234375, 0.0872802734375, 0.0911865234375, 0.0950927734375, 0.0989990234375, 0.1029052734375, 0.1068115234375, 0.1107177734375, 0.1146240234375, 0.1185302734375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 19.0, 170.0, 763.0, 49.0, 10.0, 1.0], "bins": [-0.1980019360780716, -0.19472168385982513, -0.19144143164157867, -0.1881611943244934, -0.18488094210624695, -0.1816006898880005, -0.17832043766975403, -0.17504018545150757, -0.1717599481344223, -0.16847969591617584, -0.16519944369792938, -0.16191920638084412, -0.15863895416259766, -0.1553587019443512, -0.15207844972610474, -0.14879819750785828, -0.14551794528961182, -0.14223769307136536, -0.1389574408531189, -0.13567720353603363, -0.13239695131778717, -0.1291166990995407, -0.12583644688129425, -0.12255620211362839, -0.11927595734596252, -0.11599570512771606, -0.1127154603600502, -0.10943520814180374, -0.10615496337413788, -0.10287471115589142, -0.09959445893764496, -0.0963142141699791, -0.09303396195173264, -0.08975370973348618, -0.08647346496582031, -0.08319321274757385, -0.07991296797990799, -0.07663271576166153, -0.07335247099399567, -0.0700722187757492, -0.06679196655750275, -0.06351171433925629, -0.060231469571590424, -0.056951217353343964, -0.0536709688603878, -0.05039072036743164, -0.04711047187447548, -0.04383022338151932, -0.040549974888563156, -0.037269726395606995, -0.03398947790265083, -0.030709227547049522, -0.02742897719144821, -0.02414872869849205, -0.02086848020553589, -0.017588229849934578, -0.014307981356978416, -0.01102773193269968, -0.0077474829740822315, -0.004467234015464783, -0.0011869845911860466, 0.0020932648330926895, 0.005373513326048851, 0.008653763681650162, 0.011934012174606323]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 10.0, 15.0, 22.0, 9.0, 32.0, 28.0, 28.0, 40.0, 38.0, 41.0, 45.0, 51.0, 54.0, 53.0, 52.0, 56.0, 55.0, 45.0, 38.0, 43.0, 35.0, 27.0, 31.0, 32.0, 20.0, 15.0, 17.0, 16.0, 13.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020380795001983643, -0.01980174146592617, -0.019222687929868698, -0.018643634393811226, -0.018064580857753754, -0.01748552732169628, -0.01690647378563881, -0.016327420249581337, -0.015748366713523865, -0.015169313177466393, -0.01459025964140892, -0.014011206105351448, -0.013432152569293976, -0.012853099033236504, -0.012274045497179031, -0.01169499196112156, -0.011115938425064087, -0.010536884889006615, -0.009957831352949142, -0.00937877781689167, -0.008799724280834198, -0.008220670744776726, -0.0076416172087192535, -0.007062563672661781, -0.006483510136604309, -0.005904456600546837, -0.005325403064489365, -0.004746349528431892, -0.00416729599237442, -0.003588242456316948, -0.0030091889202594757, -0.0024301353842020035, -0.0018510818481445312, -0.001272028312087059, -0.0006929747760295868, -0.00011392123997211456, 0.00046513229608535767, 0.00104418583214283, 0.0016232393682003021, 0.0022022929042577744, 0.0027813464403152466, 0.003360399976372719, 0.003939453512430191, 0.004518507048487663, 0.0050975605845451355, 0.005676614120602608, 0.00625566765666008, 0.006834721192717552, 0.007413774728775024, 0.007992828264832497, 0.008571881800889969, 0.009150935336947441, 0.009729988873004913, 0.010309042409062386, 0.010888095945119858, 0.01146714948117733, 0.012046203017234802, 0.012625256553292274, 0.013204310089349747, 0.013783363625407219, 0.014362417161464691, 0.014941470697522163, 0.015520524233579636, 0.016099577769637108, 0.01667863130569458]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 5.0, 17.0, 8.0, 15.0, 13.0, 15.0, 19.0, 19.0, 26.0, 25.0, 35.0, 41.0, 32.0, 38.0, 48.0, 48.0, 38.0, 42.0, 36.0, 37.0, 43.0, 49.0, 40.0, 36.0, 38.0, 23.0, 31.0, 29.0, 25.0, 19.0, 22.0, 17.0, 11.0, 8.0, 11.0, 10.0, 3.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.73193359375, -0.7076568603515625, -0.683380126953125, -0.6591033935546875, -0.63482666015625, -0.6105499267578125, -0.586273193359375, -0.5619964599609375, -0.5377197265625, -0.5134429931640625, -0.489166259765625, -0.4648895263671875, -0.44061279296875, -0.4163360595703125, -0.392059326171875, -0.3677825927734375, -0.343505859375, -0.3192291259765625, -0.294952392578125, -0.2706756591796875, -0.24639892578125, -0.2221221923828125, -0.197845458984375, -0.1735687255859375, -0.1492919921875, -0.1250152587890625, -0.100738525390625, -0.0764617919921875, -0.05218505859375, -0.0279083251953125, -0.003631591796875, 0.0206451416015625, 0.044921875, 0.0691986083984375, 0.093475341796875, 0.1177520751953125, 0.14202880859375, 0.1663055419921875, 0.190582275390625, 0.2148590087890625, 0.2391357421875, 0.2634124755859375, 0.287689208984375, 0.3119659423828125, 0.33624267578125, 0.3605194091796875, 0.384796142578125, 0.4090728759765625, 0.433349609375, 0.4576263427734375, 0.481903076171875, 0.5061798095703125, 0.53045654296875, 0.5547332763671875, 0.579010009765625, 0.6032867431640625, 0.6275634765625, 0.6518402099609375, 0.676116943359375, 0.7003936767578125, 0.72467041015625, 0.7489471435546875, 0.773223876953125, 0.7975006103515625, 0.82177734375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 10.0, 6.0, 11.0, 14.0, 28.0, 22.0, 44.0, 51.0, 65.0, 103.0, 162.0, 250.0, 434.0, 890.0, 1603.0, 3103.0, 6909.0, 16322.0, 43993.0, 152776.0, 478139.0, 241583.0, 62676.0, 21889.0, 9052.0, 4014.0, 1931.0, 991.0, 549.0, 308.0, 203.0, 114.0, 88.0, 59.0, 35.0, 21.0, 27.0, 15.0, 15.0, 12.0, 9.0, 7.0, 1.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.4541015625, -1.409576416015625, -1.36505126953125, -1.320526123046875, -1.2760009765625, -1.231475830078125, -1.18695068359375, -1.142425537109375, -1.097900390625, -1.053375244140625, -1.00885009765625, -0.964324951171875, -0.9197998046875, -0.875274658203125, -0.83074951171875, -0.786224365234375, -0.74169921875, -0.697174072265625, -0.65264892578125, -0.608123779296875, -0.5635986328125, -0.519073486328125, -0.47454833984375, -0.430023193359375, -0.385498046875, -0.340972900390625, -0.29644775390625, -0.251922607421875, -0.2073974609375, -0.162872314453125, -0.11834716796875, -0.073822021484375, -0.029296875, 0.015228271484375, 0.05975341796875, 0.104278564453125, 0.1488037109375, 0.193328857421875, 0.23785400390625, 0.282379150390625, 0.326904296875, 0.371429443359375, 0.41595458984375, 0.460479736328125, 0.5050048828125, 0.549530029296875, 0.59405517578125, 0.638580322265625, 0.68310546875, 0.727630615234375, 0.77215576171875, 0.816680908203125, 0.8612060546875, 0.905731201171875, 0.95025634765625, 0.994781494140625, 1.039306640625, 1.083831787109375, 1.12835693359375, 1.172882080078125, 1.2174072265625, 1.261932373046875, 1.30645751953125, 1.350982666015625, 1.3955078125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 1.0, 5.0, 4.0, 4.0, 13.0, 10.0, 17.0, 22.0, 22.0, 29.0, 31.0, 34.0, 36.0, 38.0, 58.0, 58.0, 85.0, 166.0, 277.0, 1408.0, 196.0, 128.0, 63.0, 58.0, 41.0, 42.0, 40.0, 28.0, 19.0, 25.0, 19.0, 17.0, 12.0, 4.0, 4.0, 12.0, 4.0, 4.0, 3.0, 1.0, 5.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.2829437255859375, -2.216278076171875, -2.1496124267578125, -2.08294677734375, -2.0162811279296875, -1.949615478515625, -1.8829498291015625, -1.8162841796875, -1.7496185302734375, -1.682952880859375, -1.6162872314453125, -1.54962158203125, -1.4829559326171875, -1.416290283203125, -1.3496246337890625, -1.282958984375, -1.2162933349609375, -1.149627685546875, -1.0829620361328125, -1.01629638671875, -0.9496307373046875, -0.882965087890625, -0.8162994384765625, -0.7496337890625, -0.6829681396484375, -0.616302490234375, -0.5496368408203125, -0.48297119140625, -0.4163055419921875, -0.349639892578125, -0.2829742431640625, -0.21630859375, -0.1496429443359375, -0.082977294921875, -0.0163116455078125, 0.05035400390625, 0.1170196533203125, 0.183685302734375, 0.2503509521484375, 0.3170166015625, 0.3836822509765625, 0.450347900390625, 0.5170135498046875, 0.58367919921875, 0.6503448486328125, 0.717010498046875, 0.7836761474609375, 0.850341796875, 0.9170074462890625, 0.983673095703125, 1.0503387451171875, 1.11700439453125, 1.1836700439453125, 1.250335693359375, 1.3170013427734375, 1.3836669921875, 1.4503326416015625, 1.516998291015625, 1.5836639404296875, 1.65032958984375, 1.7169952392578125, 1.783660888671875, 1.8503265380859375, 1.9169921875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 10.0, 19.0, 27.0, 23.0, 35.0, 43.0, 72.0, 79.0, 116.0, 182.0, 271.0, 493.0, 1009.0, 2957.0, 11619.0, 65920.0, 1536222.0, 1446216.0, 63777.0, 11289.0, 2858.0, 1047.0, 471.0, 272.0, 167.0, 133.0, 81.0, 55.0, 40.0, 40.0, 38.0, 19.0, 19.0, 17.0, 21.0, 4.0, 4.0, 6.0, 1.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.66015625, -2.57952880859375, -2.4989013671875, -2.41827392578125, -2.337646484375, -2.25701904296875, -2.1763916015625, -2.09576416015625, -2.01513671875, -1.93450927734375, -1.8538818359375, -1.77325439453125, -1.692626953125, -1.61199951171875, -1.5313720703125, -1.45074462890625, -1.3701171875, -1.28948974609375, -1.2088623046875, -1.12823486328125, -1.047607421875, -0.96697998046875, -0.8863525390625, -0.80572509765625, -0.72509765625, -0.64447021484375, -0.5638427734375, -0.48321533203125, -0.402587890625, -0.32196044921875, -0.2413330078125, -0.16070556640625, -0.080078125, 0.00054931640625, 0.0811767578125, 0.16180419921875, 0.242431640625, 0.32305908203125, 0.4036865234375, 0.48431396484375, 0.56494140625, 0.64556884765625, 0.7261962890625, 0.80682373046875, 0.887451171875, 0.96807861328125, 1.0487060546875, 1.12933349609375, 1.2099609375, 1.29058837890625, 1.3712158203125, 1.45184326171875, 1.532470703125, 1.61309814453125, 1.6937255859375, 1.77435302734375, 1.85498046875, 1.93560791015625, 2.0162353515625, 2.09686279296875, 2.177490234375, 2.25811767578125, 2.3387451171875, 2.41937255859375, 2.5]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 120.0, 839.0, 56.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.475202560424805, -24.090402603149414, -22.70560073852539, -21.32080078125, -19.93600082397461, -18.55120086669922, -17.166399002075195, -15.781599044799805, -14.396798133850098, -13.01199722290039, -11.627197265625, -10.242396354675293, -8.857595443725586, -7.472795486450195, -6.087994575500488, -4.703194618225098, -3.3183937072753906, -1.9335931539535522, -0.5487926006317139, 0.8360080718994141, 2.220808506011963, 3.6056089401245117, 4.990409851074219, 6.375209808349609, 7.760010719299316, 9.144811630249023, 10.529611587524414, 11.914412498474121, 13.299213409423828, 14.684013366699219, 16.06881332397461, 17.45361328125, 18.83841323852539, 20.22321319580078, 21.608015060424805, 22.992815017700195, 24.377614974975586, 25.76241683959961, 27.147216796875, 28.53201675415039, 29.91681671142578, 31.301616668701172, 32.68641662597656, 34.07122039794922, 35.45602035522461, 36.8408203125, 38.22562026977539, 39.61042022705078, 40.99522399902344, 42.38002395629883, 43.76482391357422, 45.149627685546875, 46.534427642822266, 47.919227600097656, 49.30402755737305, 50.68882751464844, 52.07362747192383, 53.45842742919922, 54.84322738647461, 56.22802734375, 57.612831115722656, 58.99763107299805, 60.38243103027344, 61.76723098754883, 63.15203094482422]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 9.0, 3.0, 6.0, 10.0, 8.0, 19.0, 10.0, 25.0, 18.0, 27.0, 20.0, 27.0, 27.0, 26.0, 21.0, 33.0, 39.0, 32.0, 44.0, 32.0, 40.0, 38.0, 43.0, 51.0, 39.0, 37.0, 39.0, 26.0, 33.0, 24.0, 29.0, 20.0, 23.0, 20.0, 16.0, 17.0, 7.0, 15.0, 13.0, 3.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.157461166381836, -5.008908748626709, -4.86035680770874, -4.711804389953613, -4.563251972198486, -4.414699554443359, -4.266147613525391, -4.117595195770264, -3.9690427780151367, -3.820490598678589, -3.671938180923462, -3.523386001586914, -3.374833583831787, -3.2262814044952393, -3.0777292251586914, -2.9291768074035645, -2.7806246280670166, -2.6320724487304688, -2.483520030975342, -2.334967851638794, -2.186415433883667, -2.037863254547119, -1.8893109560012817, -1.7407586574554443, -1.592206358909607, -1.4436540603637695, -1.2951017618179321, -1.1465494632720947, -0.9979972243309021, -0.8494449257850647, -0.7008926868438721, -0.5523403882980347, -0.40378808975219727, -0.25523579120635986, -0.10668352246284485, 0.041868746280670166, 0.19042104482650757, 0.33897334337234497, 0.4875255823135376, 0.636077880859375, 0.7846301794052124, 0.9331824779510498, 1.0817347764968872, 1.2302870750427246, 1.3788392543792725, 1.5273916721343994, 1.6759438514709473, 1.8244961500167847, 1.973048448562622, 2.12160062789917, 2.270153045654297, 2.4187052249908447, 2.5672576427459717, 2.7158098220825195, 2.8643622398376465, 3.0129144191741943, 3.161466598510742, 3.31001877784729, 3.458571195602417, 3.607123374938965, 3.755675792694092, 3.9042279720306396, 4.0527801513671875, 4.2013325691223145, 4.349884986877441]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 5.0, 6.0, 9.0, 16.0, 12.0, 18.0, 16.0, 21.0, 24.0, 26.0, 19.0, 41.0, 35.0, 37.0, 41.0, 47.0, 41.0, 39.0, 45.0, 46.0, 34.0, 46.0, 43.0, 29.0, 33.0, 34.0, 33.0, 27.0, 35.0, 27.0, 18.0, 15.0, 14.0, 14.0, 11.0, 10.0, 6.0, 11.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77490234375, -0.7497177124023438, -0.7245330810546875, -0.6993484497070312, -0.674163818359375, -0.6489791870117188, -0.6237945556640625, -0.5986099243164062, -0.57342529296875, -0.5482406616210938, -0.5230560302734375, -0.49787139892578125, -0.472686767578125, -0.44750213623046875, -0.4223175048828125, -0.39713287353515625, -0.3719482421875, -0.34676361083984375, -0.3215789794921875, -0.29639434814453125, -0.271209716796875, -0.24602508544921875, -0.2208404541015625, -0.19565582275390625, -0.17047119140625, -0.14528656005859375, -0.1201019287109375, -0.09491729736328125, -0.069732666015625, -0.04454803466796875, -0.0193634033203125, 0.00582122802734375, 0.031005859375, 0.05619049072265625, 0.0813751220703125, 0.10655975341796875, 0.131744384765625, 0.15692901611328125, 0.1821136474609375, 0.20729827880859375, 0.23248291015625, 0.25766754150390625, 0.2828521728515625, 0.30803680419921875, 0.333221435546875, 0.35840606689453125, 0.3835906982421875, 0.40877532958984375, 0.4339599609375, 0.45914459228515625, 0.4843292236328125, 0.5095138549804688, 0.534698486328125, 0.5598831176757812, 0.5850677490234375, 0.6102523803710938, 0.63543701171875, 0.6606216430664062, 0.6858062744140625, 0.7109909057617188, 0.736175537109375, 0.7613601684570312, 0.7865447998046875, 0.8117294311523438, 0.8369140625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 10.0, 8.0, 10.0, 11.0, 18.0, 11.0, 21.0, 21.0, 39.0, 42.0, 54.0, 63.0, 85.0, 157.0, 222.0, 356.0, 869.0, 4276.0, 134534.0, 4024988.0, 24952.0, 2036.0, 552.0, 287.0, 182.0, 102.0, 79.0, 62.0, 57.0, 38.0, 32.0, 22.0, 14.0, 15.0, 19.0, 10.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.28350830078125, -5.0748291015625, -4.86614990234375, -4.657470703125, -4.44879150390625, -4.2401123046875, -4.03143310546875, -3.82275390625, -3.61407470703125, -3.4053955078125, -3.19671630859375, -2.988037109375, -2.77935791015625, -2.5706787109375, -2.36199951171875, -2.1533203125, -1.94464111328125, -1.7359619140625, -1.52728271484375, -1.318603515625, -1.10992431640625, -0.9012451171875, -0.69256591796875, -0.48388671875, -0.27520751953125, -0.0665283203125, 0.14215087890625, 0.350830078125, 0.55950927734375, 0.7681884765625, 0.97686767578125, 1.185546875, 1.39422607421875, 1.6029052734375, 1.81158447265625, 2.020263671875, 2.22894287109375, 2.4376220703125, 2.64630126953125, 2.85498046875, 3.06365966796875, 3.2723388671875, 3.48101806640625, 3.689697265625, 3.89837646484375, 4.1070556640625, 4.31573486328125, 4.5244140625, 4.73309326171875, 4.9417724609375, 5.15045166015625, 5.359130859375, 5.56781005859375, 5.7764892578125, 5.98516845703125, 6.19384765625, 6.40252685546875, 6.6112060546875, 6.81988525390625, 7.028564453125, 7.23724365234375, 7.4459228515625, 7.65460205078125, 7.86328125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 9.0, 12.0, 11.0, 20.0, 27.0, 53.0, 67.0, 121.0, 185.0, 330.0, 764.0, 1087.0, 661.0, 309.0, 162.0, 92.0, 46.0, 34.0, 21.0, 19.0, 6.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.349609375, -1.292022705078125, -1.23443603515625, -1.176849365234375, -1.1192626953125, -1.061676025390625, -1.00408935546875, -0.946502685546875, -0.888916015625, -0.831329345703125, -0.77374267578125, -0.716156005859375, -0.6585693359375, -0.600982666015625, -0.54339599609375, -0.485809326171875, -0.42822265625, -0.370635986328125, -0.31304931640625, -0.255462646484375, -0.1978759765625, -0.140289306640625, -0.08270263671875, -0.025115966796875, 0.032470703125, 0.090057373046875, 0.14764404296875, 0.205230712890625, 0.2628173828125, 0.320404052734375, 0.37799072265625, 0.435577392578125, 0.4931640625, 0.550750732421875, 0.60833740234375, 0.665924072265625, 0.7235107421875, 0.781097412109375, 0.83868408203125, 0.896270751953125, 0.953857421875, 1.011444091796875, 1.06903076171875, 1.126617431640625, 1.1842041015625, 1.241790771484375, 1.29937744140625, 1.356964111328125, 1.41455078125, 1.472137451171875, 1.52972412109375, 1.587310791015625, 1.6448974609375, 1.702484130859375, 1.76007080078125, 1.817657470703125, 1.875244140625, 1.932830810546875, 1.99041748046875, 2.048004150390625, 2.1055908203125, 2.163177490234375, 2.22076416015625, 2.278350830078125, 2.3359375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 10.0, 21.0, 33.0, 35.0, 63.0, 135.0, 249.0, 566.0, 1257.0, 3659.0, 12932.0, 102285.0, 3650768.0, 388471.0, 24654.0, 5595.0, 1968.0, 766.0, 359.0, 157.0, 99.0, 62.0, 45.0, 24.0, 16.0, 15.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -2.98345947265625, -2.8575439453125, -2.73162841796875, -2.605712890625, -2.47979736328125, -2.3538818359375, -2.22796630859375, -2.10205078125, -1.97613525390625, -1.8502197265625, -1.72430419921875, -1.598388671875, -1.47247314453125, -1.3465576171875, -1.22064208984375, -1.0947265625, -0.96881103515625, -0.8428955078125, -0.71697998046875, -0.591064453125, -0.46514892578125, -0.3392333984375, -0.21331787109375, -0.08740234375, 0.03851318359375, 0.1644287109375, 0.29034423828125, 0.416259765625, 0.54217529296875, 0.6680908203125, 0.79400634765625, 0.919921875, 1.04583740234375, 1.1717529296875, 1.29766845703125, 1.423583984375, 1.54949951171875, 1.6754150390625, 1.80133056640625, 1.92724609375, 2.05316162109375, 2.1790771484375, 2.30499267578125, 2.430908203125, 2.55682373046875, 2.6827392578125, 2.80865478515625, 2.9345703125, 3.06048583984375, 3.1864013671875, 3.31231689453125, 3.438232421875, 3.56414794921875, 3.6900634765625, 3.81597900390625, 3.94189453125, 4.06781005859375, 4.1937255859375, 4.31964111328125, 4.445556640625, 4.57147216796875, 4.6973876953125, 4.82330322265625, 4.94921875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 8.0, 8.0, 31.0, 96.0, 277.0, 326.0, 178.0, 51.0, 26.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.201010227203369, -3.7501463890075684, -3.2992827892303467, -2.848418951034546, -2.397555351257324, -1.9466915130615234, -1.4958276748657227, -1.044964075088501, -0.5941002368927002, -0.14323648810386658, 0.30762726068496704, 0.758491039276123, 1.2093547582626343, 1.6602184772491455, 2.1110823154449463, 2.561945915222168, 3.0128097534179688, 3.4636735916137695, 3.914537191390991, 4.365401268005371, 4.816264629364014, 5.2671284675598145, 5.717992305755615, 6.168855667114258, 6.619719505310059, 7.070583343505859, 7.52144718170166, 7.972311019897461, 8.423174858093262, 8.874038696289062, 9.324901580810547, 9.775765419006348, 10.226630210876465, 10.677494049072266, 11.128357887268066, 11.579221725463867, 12.030085563659668, 12.480949401855469, 12.931812286376953, 13.382676124572754, 13.833539962768555, 14.284403800964355, 14.735267639160156, 15.186131477355957, 15.636995315551758, 16.087858200073242, 16.53872299194336, 16.989585876464844, 17.44045066833496, 17.891313552856445, 18.342178344726562, 18.793041229248047, 19.243906021118164, 19.69476890563965, 20.145633697509766, 20.59649658203125, 21.047359466552734, 21.49822235107422, 21.949087142944336, 22.39995002746582, 22.850814819335938, 23.301677703857422, 23.75254249572754, 24.203405380249023, 24.65427017211914]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 7.0, 6.0, 14.0, 11.0, 17.0, 24.0, 25.0, 21.0, 40.0, 28.0, 46.0, 26.0, 40.0, 47.0, 41.0, 41.0, 45.0, 39.0, 44.0, 51.0, 46.0, 31.0, 37.0, 36.0, 20.0, 33.0, 25.0, 19.0, 18.0, 22.0, 17.0, 13.0, 13.0, 8.0, 7.0, 10.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.342362642288208, -3.2243616580963135, -3.106360912322998, -2.9883599281311035, -2.870358943939209, -2.7523581981658936, -2.634357213973999, -2.5163564682006836, -2.398355484008789, -2.2803544998168945, -2.162353754043579, -2.0443527698516846, -1.9263519048690796, -1.8083510398864746, -1.69035005569458, -1.572349190711975, -1.4543483257293701, -1.3363474607467651, -1.2183465957641602, -1.1003456115722656, -0.9823447465896606, -0.8643438816070557, -0.7463429570198059, -0.6283420324325562, -0.5103411674499512, -0.3923402726650238, -0.27433937788009644, -0.15633848309516907, -0.0383375883102417, 0.07966327667236328, 0.19766420125961304, 0.3156651258468628, 0.43366575241088867, 0.5516666173934937, 0.6696675419807434, 0.7876684665679932, 0.9056693315505981, 1.0236701965332031, 1.1416711807250977, 1.2596720457077026, 1.3776729106903076, 1.4956737756729126, 1.6136746406555176, 1.731675624847412, 1.849676489830017, 1.967677354812622, 2.0856783390045166, 2.203679084777832, 2.3216800689697266, 2.439681053161621, 2.5576817989349365, 2.675682783126831, 2.7936835289001465, 2.911684513092041, 3.0296854972839355, 3.14768648147583, 3.2656872272491455, 3.38368821144104, 3.5016889572143555, 3.61968994140625, 3.7376909255981445, 3.85569167137146, 3.9736926555633545, 4.09169340133667, 4.2096943855285645]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 3.0, 7.0, 3.0, 10.0, 2.0, 13.0, 21.0, 11.0, 12.0, 23.0, 24.0, 32.0, 33.0, 27.0, 38.0, 29.0, 33.0, 29.0, 36.0, 50.0, 44.0, 33.0, 31.0, 33.0, 45.0, 22.0, 35.0, 37.0, 40.0, 27.0, 30.0, 21.0, 16.0, 19.0, 16.0, 12.0, 18.0, 14.0, 7.0, 13.0, 7.0, 12.0, 3.0, 3.0, 0.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.71142578125, -0.6900558471679688, -0.6686859130859375, -0.6473159790039062, -0.625946044921875, -0.6045761108398438, -0.5832061767578125, -0.5618362426757812, -0.54046630859375, -0.5190963745117188, -0.4977264404296875, -0.47635650634765625, -0.454986572265625, -0.43361663818359375, -0.4122467041015625, -0.39087677001953125, -0.3695068359375, -0.34813690185546875, -0.3267669677734375, -0.30539703369140625, -0.284027099609375, -0.26265716552734375, -0.2412872314453125, -0.21991729736328125, -0.19854736328125, -0.17717742919921875, -0.1558074951171875, -0.13443756103515625, -0.113067626953125, -0.09169769287109375, -0.0703277587890625, -0.04895782470703125, -0.027587890625, -0.00621795654296875, 0.0151519775390625, 0.03652191162109375, 0.057891845703125, 0.07926177978515625, 0.1006317138671875, 0.12200164794921875, 0.14337158203125, 0.16474151611328125, 0.1861114501953125, 0.20748138427734375, 0.228851318359375, 0.25022125244140625, 0.2715911865234375, 0.29296112060546875, 0.3143310546875, 0.33570098876953125, 0.3570709228515625, 0.37844085693359375, 0.399810791015625, 0.42118072509765625, 0.4425506591796875, 0.46392059326171875, 0.48529052734375, 0.5066604614257812, 0.5280303955078125, 0.5494003295898438, 0.570770263671875, 0.5921401977539062, 0.6135101318359375, 0.6348800659179688, 0.65625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 14.0, 10.0, 17.0, 44.0, 42.0, 69.0, 95.0, 162.0, 221.0, 352.0, 497.0, 782.0, 1113.0, 1638.0, 2579.0, 4104.0, 6392.0, 10390.0, 17381.0, 29680.0, 51501.0, 93069.0, 166781.0, 236712.0, 182058.0, 103164.0, 57320.0, 32282.0, 19028.0, 11379.0, 7036.0, 4341.0, 2767.0, 1903.0, 1206.0, 771.0, 559.0, 373.0, 228.0, 151.0, 111.0, 76.0, 53.0, 36.0, 24.0, 20.0, 9.0, 9.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.081207275390625, -0.07855224609375, -0.075897216796875, -0.0732421875, -0.070587158203125, -0.06793212890625, -0.065277099609375, -0.0626220703125, -0.059967041015625, -0.05731201171875, -0.054656982421875, -0.052001953125, -0.049346923828125, -0.04669189453125, -0.044036865234375, -0.0413818359375, -0.038726806640625, -0.03607177734375, -0.033416748046875, -0.03076171875, -0.028106689453125, -0.02545166015625, -0.022796630859375, -0.0201416015625, -0.017486572265625, -0.01483154296875, -0.012176513671875, -0.009521484375, -0.006866455078125, -0.00421142578125, -0.001556396484375, 0.0010986328125, 0.003753662109375, 0.00640869140625, 0.009063720703125, 0.01171875, 0.014373779296875, 0.01702880859375, 0.019683837890625, 0.0223388671875, 0.024993896484375, 0.02764892578125, 0.030303955078125, 0.032958984375, 0.035614013671875, 0.03826904296875, 0.040924072265625, 0.0435791015625, 0.046234130859375, 0.04888916015625, 0.051544189453125, 0.05419921875, 0.056854248046875, 0.05950927734375, 0.062164306640625, 0.0648193359375, 0.067474365234375, 0.07012939453125, 0.072784423828125, 0.075439453125, 0.078094482421875, 0.08074951171875, 0.083404541015625, 0.0860595703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 7.0, 5.0, 17.0, 11.0, 16.0, 19.0, 21.0, 23.0, 22.0, 26.0, 32.0, 25.0, 32.0, 36.0, 30.0, 39.0, 47.0, 42.0, 41.0, 1057.0, 56.0, 35.0, 41.0, 29.0, 28.0, 28.0, 36.0, 26.0, 21.0, 20.0, 22.0, 15.0, 16.0, 20.0, 15.0, 13.0, 9.0, 8.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.70751953125, -0.6869125366210938, -0.6663055419921875, -0.6456985473632812, -0.625091552734375, -0.6044845581054688, -0.5838775634765625, -0.5632705688476562, -0.54266357421875, -0.5220565795898438, -0.5014495849609375, -0.48084259033203125, -0.460235595703125, -0.43962860107421875, -0.4190216064453125, -0.39841461181640625, -0.3778076171875, -0.35720062255859375, -0.3365936279296875, -0.31598663330078125, -0.295379638671875, -0.27477264404296875, -0.2541656494140625, -0.23355865478515625, -0.21295166015625, -0.19234466552734375, -0.1717376708984375, -0.15113067626953125, -0.130523681640625, -0.10991668701171875, -0.0893096923828125, -0.06870269775390625, -0.048095703125, -0.02748870849609375, -0.0068817138671875, 0.01372528076171875, 0.034332275390625, 0.05493927001953125, 0.0755462646484375, 0.09615325927734375, 0.11676025390625, 0.13736724853515625, 0.1579742431640625, 0.17858123779296875, 0.199188232421875, 0.21979522705078125, 0.2404022216796875, 0.26100921630859375, 0.2816162109375, 0.30222320556640625, 0.3228302001953125, 0.34343719482421875, 0.364044189453125, 0.38465118408203125, 0.4052581787109375, 0.42586517333984375, 0.44647216796875, 0.46707916259765625, 0.4876861572265625, 0.5082931518554688, 0.528900146484375, 0.5495071411132812, 0.5701141357421875, 0.5907211303710938, 0.611328125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 23.0, 31.0, 29.0, 58.0, 73.0, 93.0, 117.0, 191.0, 234.0, 369.0, 499.0, 704.0, 1013.0, 1513.0, 2106.0, 3061.0, 4620.0, 7381.0, 12597.0, 27357.0, 113160.0, 1747847.0, 111860.0, 27293.0, 12692.0, 7406.0, 4603.0, 3098.0, 2061.0, 1512.0, 1043.0, 700.0, 491.0, 349.0, 257.0, 184.0, 137.0, 115.0, 70.0, 50.0, 31.0, 24.0, 19.0, 13.0, 13.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1533203125, -0.14812278747558594, -0.14292526245117188, -0.1377277374267578, -0.13253021240234375, -0.1273326873779297, -0.12213516235351562, -0.11693763732910156, -0.1117401123046875, -0.10654258728027344, -0.10134506225585938, -0.09614753723144531, -0.09095001220703125, -0.08575248718261719, -0.08055496215820312, -0.07535743713378906, -0.070159912109375, -0.06496238708496094, -0.059764862060546875, -0.05456733703613281, -0.04936981201171875, -0.04417228698730469, -0.038974761962890625, -0.03377723693847656, -0.0285797119140625, -0.023382186889648438, -0.018184661865234375, -0.012987136840820312, -0.00778961181640625, -0.0025920867919921875, 0.002605438232421875, 0.0078029632568359375, 0.01300048828125, 0.018198013305664062, 0.023395538330078125, 0.028593063354492188, 0.03379058837890625, 0.03898811340332031, 0.044185638427734375, 0.04938316345214844, 0.0545806884765625, 0.05977821350097656, 0.06497573852539062, 0.07017326354980469, 0.07537078857421875, 0.08056831359863281, 0.08576583862304688, 0.09096336364746094, 0.096160888671875, 0.10135841369628906, 0.10655593872070312, 0.11175346374511719, 0.11695098876953125, 0.12214851379394531, 0.12734603881835938, 0.13254356384277344, 0.1377410888671875, 0.14293861389160156, 0.14813613891601562, 0.1533336639404297, 0.15853118896484375, 0.1637287139892578, 0.16892623901367188, 0.17412376403808594, 0.1793212890625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 4.0, 2.0, 4.0, 6.0, 3.0, 7.0, 7.0, 5.0, 9.0, 10.0, 13.0, 22.0, 18.0, 28.0, 20.0, 20.0, 25.0, 34.0, 33.0, 33.0, 38.0, 35.0, 34.0, 50.0, 42.0, 48.0, 43.0, 46.0, 40.0, 29.0, 23.0, 32.0, 23.0, 30.0, 23.0, 27.0, 24.0, 21.0, 21.0, 18.0, 7.0, 6.0, 7.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00787353515625, -0.007646322250366211, -0.007419109344482422, -0.007191896438598633, -0.006964683532714844, -0.006737470626831055, -0.006510257720947266, -0.0062830448150634766, -0.0060558319091796875, -0.0058286190032958984, -0.005601406097412109, -0.00537419319152832, -0.005146980285644531, -0.004919767379760742, -0.004692554473876953, -0.004465341567993164, -0.004238128662109375, -0.004010915756225586, -0.003783702850341797, -0.003556489944458008, -0.0033292770385742188, -0.0031020641326904297, -0.0028748512268066406, -0.0026476383209228516, -0.0024204254150390625, -0.0021932125091552734, -0.0019659996032714844, -0.0017387866973876953, -0.0015115737915039062, -0.0012843608856201172, -0.0010571479797363281, -0.0008299350738525391, -0.00060272216796875, -0.00037550926208496094, -0.00014829635620117188, 7.891654968261719e-05, 0.00030612945556640625, 0.0005333423614501953, 0.0007605552673339844, 0.0009877681732177734, 0.0012149810791015625, 0.0014421939849853516, 0.0016694068908691406, 0.0018966197967529297, 0.0021238327026367188, 0.002351045608520508, 0.002578258514404297, 0.002805471420288086, 0.003032684326171875, 0.003259897232055664, 0.003487110137939453, 0.003714323043823242, 0.003941535949707031, 0.00416874885559082, 0.004395961761474609, 0.0046231746673583984, 0.0048503875732421875, 0.0050776004791259766, 0.005304813385009766, 0.005532026290893555, 0.005759239196777344, 0.005986452102661133, 0.006213665008544922, 0.006440877914428711, 0.0066680908203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 5.0, 14.0, 9.0, 22.0, 29.0, 36.0, 39.0, 38.0, 52.0, 55.0, 71.0, 81.0, 130.0, 153.0, 203.0, 383.0, 813.0, 7861.0, 979026.0, 56742.0, 1204.0, 456.0, 260.0, 168.0, 144.0, 125.0, 77.0, 59.0, 41.0, 43.0, 38.0, 23.0, 29.0, 20.0, 22.0, 10.0, 5.0, 7.0, 4.0, 9.0, 3.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12261962890625, -0.11834430694580078, -0.11406898498535156, -0.10979366302490234, -0.10551834106445312, -0.1012430191040039, -0.09696769714355469, -0.09269237518310547, -0.08841705322265625, -0.08414173126220703, -0.07986640930175781, -0.0755910873413086, -0.07131576538085938, -0.06704044342041016, -0.06276512145996094, -0.05848979949951172, -0.0542144775390625, -0.04993915557861328, -0.04566383361816406, -0.041388511657714844, -0.037113189697265625, -0.032837867736816406, -0.028562545776367188, -0.02428722381591797, -0.02001190185546875, -0.01573657989501953, -0.011461257934570312, -0.007185935974121094, -0.002910614013671875, 0.0013647079467773438, 0.0056400299072265625, 0.009915351867675781, 0.014190673828125, 0.01846599578857422, 0.022741317749023438, 0.027016639709472656, 0.031291961669921875, 0.035567283630371094, 0.03984260559082031, 0.04411792755126953, 0.04839324951171875, 0.05266857147216797, 0.05694389343261719, 0.061219215393066406, 0.06549453735351562, 0.06976985931396484, 0.07404518127441406, 0.07832050323486328, 0.0825958251953125, 0.08687114715576172, 0.09114646911621094, 0.09542179107666016, 0.09969711303710938, 0.1039724349975586, 0.10824775695800781, 0.11252307891845703, 0.11679840087890625, 0.12107372283935547, 0.1253490447998047, 0.1296243667602539, 0.13389968872070312, 0.13817501068115234, 0.14245033264160156, 0.14672565460205078, 0.1510009765625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 42.0, 872.0, 96.0, 1.0, 2.0], "bins": [-0.34811604022979736, -0.34237784147262573, -0.3366396427154541, -0.33090144395828247, -0.32516324520111084, -0.3194250464439392, -0.3136868476867676, -0.30794861912727356, -0.30221042037010193, -0.2964722216129303, -0.29073402285575867, -0.28499582409858704, -0.2792576253414154, -0.2735193967819214, -0.26778119802474976, -0.2620429992675781, -0.2563048005104065, -0.25056660175323486, -0.24482840299606323, -0.2390902042388916, -0.23335199058055878, -0.22761379182338715, -0.22187559306621552, -0.21613739430904388, -0.21039921045303345, -0.20466101169586182, -0.19892281293869019, -0.19318461418151855, -0.18744640052318573, -0.1817082017660141, -0.17597000300884247, -0.17023180425167084, -0.164493590593338, -0.15875539183616638, -0.15301719307899475, -0.14727899432182312, -0.1415407806634903, -0.13580258190631866, -0.13006438314914703, -0.1243261843919754, -0.11858798563480377, -0.11284978687763214, -0.10711158066987991, -0.10137338191270828, -0.09563517570495605, -0.08989697694778442, -0.08415877819061279, -0.07842057943344116, -0.07268237322568893, -0.0669441744685173, -0.061205968260765076, -0.055467769503593445, -0.049729567021131516, -0.043991364538669586, -0.038253165781497955, -0.032514963299036026, -0.026776758953928947, -0.021038558334112167, -0.015300355851650238, -0.009562155231833458, -0.0038239527493715286, 0.0019142497330904007, 0.0076524484902620316, 0.013390650972723961, 0.01912885345518589]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 14.0, 15.0, 19.0, 19.0, 24.0, 30.0, 26.0, 39.0, 34.0, 44.0, 39.0, 33.0, 45.0, 38.0, 43.0, 40.0, 44.0, 34.0, 36.0, 43.0, 41.0, 37.0, 31.0, 26.0, 20.0, 24.0, 17.0, 10.0, 23.0, 10.0, 14.0, 14.0, 14.0, 12.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.02403157949447632, -0.023369699716567993, -0.022707819938659668, -0.022045940160751343, -0.021384060382843018, -0.020722180604934692, -0.020060300827026367, -0.019398421049118042, -0.018736541271209717, -0.01807466149330139, -0.017412781715393066, -0.01675090193748474, -0.016089022159576416, -0.01542714238166809, -0.014765262603759766, -0.01410338282585144, -0.013441503047943115, -0.01277962327003479, -0.012117743492126465, -0.01145586371421814, -0.010793983936309814, -0.01013210415840149, -0.009470224380493164, -0.008808344602584839, -0.008146464824676514, -0.0074845850467681885, -0.006822705268859863, -0.006160825490951538, -0.005498945713043213, -0.004837065935134888, -0.0041751861572265625, -0.0035133063793182373, -0.002851426601409912, -0.002189546823501587, -0.0015276670455932617, -0.0008657872676849365, -0.00020390748977661133, 0.00045797228813171387, 0.001119852066040039, 0.0017817318439483643, 0.0024436116218566895, 0.0031054913997650146, 0.00376737117767334, 0.004429250955581665, 0.00509113073348999, 0.005753010511398315, 0.006414890289306641, 0.007076770067214966, 0.007738649845123291, 0.008400529623031616, 0.009062409400939941, 0.009724289178848267, 0.010386168956756592, 0.011048048734664917, 0.011709928512573242, 0.012371808290481567, 0.013033688068389893, 0.013695567846298218, 0.014357447624206543, 0.015019327402114868, 0.015681207180023193, 0.01634308695793152, 0.017004966735839844, 0.01766684651374817, 0.018328726291656494]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 8.0, 3.0, 5.0, 5.0, 10.0, 2.0, 13.0, 19.0, 14.0, 12.0, 21.0, 24.0, 32.0, 35.0, 27.0, 37.0, 29.0, 33.0, 29.0, 39.0, 45.0, 45.0, 33.0, 32.0, 33.0, 45.0, 22.0, 38.0, 36.0, 38.0, 27.0, 31.0, 20.0, 16.0, 23.0, 12.0, 13.0, 17.0, 14.0, 5.0, 15.0, 8.0, 12.0, 2.0, 3.0, 0.0, 2.0, 7.0, 0.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.7119140625, -0.6905288696289062, -0.6691436767578125, -0.6477584838867188, -0.626373291015625, -0.6049880981445312, -0.5836029052734375, -0.5622177124023438, -0.54083251953125, -0.5194473266601562, -0.4980621337890625, -0.47667694091796875, -0.455291748046875, -0.43390655517578125, -0.4125213623046875, -0.39113616943359375, -0.3697509765625, -0.34836578369140625, -0.3269805908203125, -0.30559539794921875, -0.284210205078125, -0.26282501220703125, -0.2414398193359375, -0.22005462646484375, -0.19866943359375, -0.17728424072265625, -0.1558990478515625, -0.13451385498046875, -0.113128662109375, -0.09174346923828125, -0.0703582763671875, -0.04897308349609375, -0.027587890625, -0.00620269775390625, 0.0151824951171875, 0.03656768798828125, 0.057952880859375, 0.07933807373046875, 0.1007232666015625, 0.12210845947265625, 0.14349365234375, 0.16487884521484375, 0.1862640380859375, 0.20764923095703125, 0.229034423828125, 0.25041961669921875, 0.2718048095703125, 0.29319000244140625, 0.3145751953125, 0.33596038818359375, 0.3573455810546875, 0.37873077392578125, 0.400115966796875, 0.42150115966796875, 0.4428863525390625, 0.46427154541015625, 0.48565673828125, 0.5070419311523438, 0.5284271240234375, 0.5498123168945312, 0.571197509765625, 0.5925827026367188, 0.6139678955078125, 0.6353530883789062, 0.65673828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 10.0, 18.0, 11.0, 22.0, 38.0, 40.0, 61.0, 81.0, 97.0, 129.0, 179.0, 218.0, 328.0, 492.0, 678.0, 950.0, 1553.0, 2482.0, 4082.0, 7133.0, 13875.0, 28053.0, 58426.0, 129152.0, 285714.0, 275992.0, 124223.0, 56564.0, 26562.0, 13217.0, 7051.0, 3946.0, 2357.0, 1460.0, 958.0, 675.0, 460.0, 321.0, 268.0, 148.0, 142.0, 110.0, 66.0, 54.0, 44.0, 31.0, 15.0, 17.0, 11.0, 11.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.90576171875, -0.8765182495117188, -0.8472747802734375, -0.8180313110351562, -0.788787841796875, -0.7595443725585938, -0.7303009033203125, -0.7010574340820312, -0.67181396484375, -0.6425704956054688, -0.6133270263671875, -0.5840835571289062, -0.554840087890625, -0.5255966186523438, -0.4963531494140625, -0.46710968017578125, -0.4378662109375, -0.40862274169921875, -0.3793792724609375, -0.35013580322265625, -0.320892333984375, -0.29164886474609375, -0.2624053955078125, -0.23316192626953125, -0.20391845703125, -0.17467498779296875, -0.1454315185546875, -0.11618804931640625, -0.086944580078125, -0.05770111083984375, -0.0284576416015625, 0.00078582763671875, 0.030029296875, 0.05927276611328125, 0.0885162353515625, 0.11775970458984375, 0.147003173828125, 0.17624664306640625, 0.2054901123046875, 0.23473358154296875, 0.26397705078125, 0.29322052001953125, 0.3224639892578125, 0.35170745849609375, 0.380950927734375, 0.41019439697265625, 0.4394378662109375, 0.46868133544921875, 0.4979248046875, 0.5271682739257812, 0.5564117431640625, 0.5856552124023438, 0.614898681640625, 0.6441421508789062, 0.6733856201171875, 0.7026290893554688, 0.73187255859375, 0.7611160278320312, 0.7903594970703125, 0.8196029663085938, 0.848846435546875, 0.8780899047851562, 0.9073333740234375, 0.9365768432617188, 0.9658203125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 7.0, 14.0, 10.0, 12.0, 26.0, 28.0, 33.0, 38.0, 39.0, 35.0, 53.0, 74.0, 121.0, 318.0, 1490.0, 274.0, 100.0, 68.0, 60.0, 44.0, 46.0, 30.0, 23.0, 22.0, 17.0, 13.0, 9.0, 10.0, 5.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.003997802734375, -1.93572998046875, -1.867462158203125, -1.7991943359375, -1.730926513671875, -1.66265869140625, -1.594390869140625, -1.526123046875, -1.457855224609375, -1.38958740234375, -1.321319580078125, -1.2530517578125, -1.184783935546875, -1.11651611328125, -1.048248291015625, -0.97998046875, -0.911712646484375, -0.84344482421875, -0.775177001953125, -0.7069091796875, -0.638641357421875, -0.57037353515625, -0.502105712890625, -0.433837890625, -0.365570068359375, -0.29730224609375, -0.229034423828125, -0.1607666015625, -0.092498779296875, -0.02423095703125, 0.044036865234375, 0.1123046875, 0.180572509765625, 0.24884033203125, 0.317108154296875, 0.3853759765625, 0.453643798828125, 0.52191162109375, 0.590179443359375, 0.658447265625, 0.726715087890625, 0.79498291015625, 0.863250732421875, 0.9315185546875, 0.999786376953125, 1.06805419921875, 1.136322021484375, 1.20458984375, 1.272857666015625, 1.34112548828125, 1.409393310546875, 1.4776611328125, 1.545928955078125, 1.61419677734375, 1.682464599609375, 1.750732421875, 1.819000244140625, 1.88726806640625, 1.955535888671875, 2.0238037109375, 2.092071533203125, 2.16033935546875, 2.228607177734375, 2.296875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 16.0, 18.0, 20.0, 30.0, 49.0, 56.0, 71.0, 122.0, 119.0, 195.0, 244.0, 430.0, 608.0, 1500.0, 15033.0, 2902552.0, 217890.0, 4134.0, 945.0, 485.0, 319.0, 212.0, 156.0, 107.0, 79.0, 64.0, 56.0, 41.0, 26.0, 25.0, 15.0, 20.0, 8.0, 10.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.10833740234375, -3.9549560546875, -3.80157470703125, -3.648193359375, -3.49481201171875, -3.3414306640625, -3.18804931640625, -3.03466796875, -2.88128662109375, -2.7279052734375, -2.57452392578125, -2.421142578125, -2.26776123046875, -2.1143798828125, -1.96099853515625, -1.8076171875, -1.65423583984375, -1.5008544921875, -1.34747314453125, -1.194091796875, -1.04071044921875, -0.8873291015625, -0.73394775390625, -0.58056640625, -0.42718505859375, -0.2738037109375, -0.12042236328125, 0.032958984375, 0.18634033203125, 0.3397216796875, 0.49310302734375, 0.646484375, 0.79986572265625, 0.9532470703125, 1.10662841796875, 1.260009765625, 1.41339111328125, 1.5667724609375, 1.72015380859375, 1.87353515625, 2.02691650390625, 2.1802978515625, 2.33367919921875, 2.487060546875, 2.64044189453125, 2.7938232421875, 2.94720458984375, 3.1005859375, 3.25396728515625, 3.4073486328125, 3.56072998046875, 3.714111328125, 3.86749267578125, 4.0208740234375, 4.17425537109375, 4.32763671875, 4.48101806640625, 4.6343994140625, 4.78778076171875, 4.941162109375, 5.09454345703125, 5.2479248046875, 5.40130615234375, 5.5546875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 54.0, 212.0, 446.0, 225.0, 62.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.196987152099609, -5.697972774505615, -5.198958873748779, -4.699944496154785, -4.200930595397949, -3.701916217803955, -3.202901840209961, -2.703887701034546, -2.204873561859131, -1.7058594226837158, -1.2068451642990112, -0.7078309059143066, -0.2088167667388916, 0.29019737243652344, 0.7892117500305176, 1.2882258892059326, 1.7872400283813477, 2.2862541675567627, 2.7852683067321777, 3.284282684326172, 3.783296823501587, 4.282310962677002, 4.781325340270996, 5.280339241027832, 5.779353618621826, 6.27836799621582, 6.777381896972656, 7.27639627456665, 7.7754106521606445, 8.27442455291748, 8.773439407348633, 9.272453308105469, 9.771467208862305, 10.27048110961914, 10.769495964050293, 11.268509864807129, 11.767523765563965, 12.266538619995117, 12.765552520751953, 13.264566421508789, 13.763580322265625, 14.262594223022461, 14.761609077453613, 15.26062297821045, 15.759636878967285, 16.258651733398438, 16.757665634155273, 17.25667953491211, 17.755695343017578, 18.254709243774414, 18.75372314453125, 19.25273895263672, 19.751752853393555, 20.25076675415039, 20.749780654907227, 21.248794555664062, 21.7478084564209, 22.246822357177734, 22.74583625793457, 23.244850158691406, 23.743865966796875, 24.24287986755371, 24.741893768310547, 25.240907669067383, 25.73992156982422]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 7.0, 6.0, 8.0, 11.0, 15.0, 11.0, 19.0, 22.0, 18.0, 27.0, 20.0, 28.0, 28.0, 48.0, 38.0, 42.0, 33.0, 37.0, 43.0, 41.0, 49.0, 39.0, 46.0, 33.0, 34.0, 28.0, 28.0, 25.0, 26.0, 35.0, 31.0, 23.0, 9.0, 18.0, 8.0, 9.0, 9.0, 18.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0], "bins": [-5.955723285675049, -5.805081844329834, -5.654439926147461, -5.503798484802246, -5.353157043457031, -5.202515125274658, -5.051873683929443, -4.90123176574707, -4.7505903244018555, -4.599948883056641, -4.449306964874268, -4.298665523529053, -4.14802360534668, -3.997382164001465, -3.84674072265625, -3.696099042892456, -3.545457363128662, -3.394815683364868, -3.244174003601074, -3.0935325622558594, -2.9428908824920654, -2.7922492027282715, -2.6416077613830566, -2.4909660816192627, -2.3403244018554688, -2.189682722091675, -2.039041042327881, -1.888399600982666, -1.737757921218872, -1.5871162414550781, -1.4364746809005737, -1.2858331203460693, -1.1351919174194336, -0.9845502972602844, -0.8339086771011353, -0.6832670569419861, -0.5326254367828369, -0.38198381662368774, -0.23134219646453857, -0.08070063591003418, 0.06994104385375977, 0.22058266401290894, 0.3712242841720581, 0.5218659043312073, 0.6725075244903564, 0.8231491446495056, 0.9737907648086548, 1.1244323253631592, 1.2750740051269531, 1.425715684890747, 1.5763572454452515, 1.7269988059997559, 1.8776404857635498, 2.0282821655273438, 2.1789236068725586, 2.3295652866363525, 2.4802069664001465, 2.6308486461639404, 2.7814903259277344, 2.932131767272949, 3.082773447036743, 3.233415126800537, 3.384056568145752, 3.534698247909546, 3.68533992767334]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 4.0, 12.0, 12.0, 7.0, 19.0, 23.0, 16.0, 21.0, 33.0, 27.0, 33.0, 35.0, 30.0, 44.0, 27.0, 28.0, 37.0, 33.0, 31.0, 37.0, 28.0, 32.0, 37.0, 44.0, 37.0, 28.0, 25.0, 31.0, 21.0, 28.0, 16.0, 13.0, 20.0, 18.0, 9.0, 12.0, 12.0, 9.0, 11.0, 5.0, 6.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.7275390625, -0.7065048217773438, -0.6854705810546875, -0.6644363403320312, -0.643402099609375, -0.6223678588867188, -0.6013336181640625, -0.5802993774414062, -0.55926513671875, -0.5382308959960938, -0.5171966552734375, -0.49616241455078125, -0.475128173828125, -0.45409393310546875, -0.4330596923828125, -0.41202545166015625, -0.3909912109375, -0.36995697021484375, -0.3489227294921875, -0.32788848876953125, -0.306854248046875, -0.28582000732421875, -0.2647857666015625, -0.24375152587890625, -0.22271728515625, -0.20168304443359375, -0.1806488037109375, -0.15961456298828125, -0.138580322265625, -0.11754608154296875, -0.0965118408203125, -0.07547760009765625, -0.054443359375, -0.03340911865234375, -0.0123748779296875, 0.00865936279296875, 0.029693603515625, 0.05072784423828125, 0.0717620849609375, 0.09279632568359375, 0.11383056640625, 0.13486480712890625, 0.1558990478515625, 0.17693328857421875, 0.197967529296875, 0.21900177001953125, 0.2400360107421875, 0.26107025146484375, 0.2821044921875, 0.30313873291015625, 0.3241729736328125, 0.34520721435546875, 0.366241455078125, 0.38727569580078125, 0.4083099365234375, 0.42934417724609375, 0.45037841796875, 0.47141265869140625, 0.4924468994140625, 0.5134811401367188, 0.534515380859375, 0.5555496215820312, 0.5765838623046875, 0.5976181030273438, 0.61865234375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 10.0, 11.0, 13.0, 10.0, 27.0, 30.0, 37.0, 60.0, 89.0, 93.0, 146.0, 249.0, 386.0, 626.0, 1072.0, 1916.0, 3675.0, 8254.0, 23862.0, 168135.0, 1890492.0, 1883948.0, 169928.0, 24376.0, 8382.0, 3780.0, 1916.0, 1031.0, 591.0, 380.0, 229.0, 166.0, 105.0, 61.0, 49.0, 40.0, 37.0, 18.0, 11.0, 7.0, 12.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.90234375, -1.847991943359375, -1.79364013671875, -1.739288330078125, -1.6849365234375, -1.630584716796875, -1.57623291015625, -1.521881103515625, -1.467529296875, -1.413177490234375, -1.35882568359375, -1.304473876953125, -1.2501220703125, -1.195770263671875, -1.14141845703125, -1.087066650390625, -1.03271484375, -0.978363037109375, -0.92401123046875, -0.869659423828125, -0.8153076171875, -0.760955810546875, -0.70660400390625, -0.652252197265625, -0.597900390625, -0.543548583984375, -0.48919677734375, -0.434844970703125, -0.3804931640625, -0.326141357421875, -0.27178955078125, -0.217437744140625, -0.1630859375, -0.108734130859375, -0.05438232421875, -3.0517578125e-05, 0.0543212890625, 0.108673095703125, 0.16302490234375, 0.217376708984375, 0.271728515625, 0.326080322265625, 0.38043212890625, 0.434783935546875, 0.4891357421875, 0.543487548828125, 0.59783935546875, 0.652191162109375, 0.70654296875, 0.760894775390625, 0.81524658203125, 0.869598388671875, 0.9239501953125, 0.978302001953125, 1.03265380859375, 1.087005615234375, 1.141357421875, 1.195709228515625, 1.25006103515625, 1.304412841796875, 1.3587646484375, 1.413116455078125, 1.46746826171875, 1.521820068359375, 1.576171875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 6.0, 18.0, 20.0, 21.0, 44.0, 50.0, 86.0, 122.0, 176.0, 291.0, 430.0, 669.0, 713.0, 474.0, 314.0, 200.0, 133.0, 83.0, 60.0, 34.0, 30.0, 13.0, 19.0, 6.0, 3.0, 6.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.13275146484375, -1.0858154296875, -1.03887939453125, -0.991943359375, -0.94500732421875, -0.8980712890625, -0.85113525390625, -0.80419921875, -0.75726318359375, -0.7103271484375, -0.66339111328125, -0.616455078125, -0.56951904296875, -0.5225830078125, -0.47564697265625, -0.4287109375, -0.38177490234375, -0.3348388671875, -0.28790283203125, -0.240966796875, -0.19403076171875, -0.1470947265625, -0.10015869140625, -0.05322265625, -0.00628662109375, 0.0406494140625, 0.08758544921875, 0.134521484375, 0.18145751953125, 0.2283935546875, 0.27532958984375, 0.322265625, 0.36920166015625, 0.4161376953125, 0.46307373046875, 0.510009765625, 0.55694580078125, 0.6038818359375, 0.65081787109375, 0.69775390625, 0.74468994140625, 0.7916259765625, 0.83856201171875, 0.885498046875, 0.93243408203125, 0.9793701171875, 1.02630615234375, 1.0732421875, 1.12017822265625, 1.1671142578125, 1.21405029296875, 1.260986328125, 1.30792236328125, 1.3548583984375, 1.40179443359375, 1.44873046875, 1.49566650390625, 1.5426025390625, 1.58953857421875, 1.636474609375, 1.68341064453125, 1.7303466796875, 1.77728271484375, 1.82421875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 9.0, 13.0, 7.0, 15.0, 26.0, 34.0, 67.0, 108.0, 204.0, 434.0, 992.0, 2728.0, 9830.0, 54617.0, 1637985.0, 2405688.0, 65328.0, 10989.0, 3129.0, 1071.0, 482.0, 241.0, 125.0, 62.0, 30.0, 27.0, 13.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.6011962890625, -2.497314453125, -2.3934326171875, -2.28955078125, -2.1856689453125, -2.081787109375, -1.9779052734375, -1.8740234375, -1.7701416015625, -1.666259765625, -1.5623779296875, -1.45849609375, -1.3546142578125, -1.250732421875, -1.1468505859375, -1.04296875, -0.9390869140625, -0.835205078125, -0.7313232421875, -0.62744140625, -0.5235595703125, -0.419677734375, -0.3157958984375, -0.2119140625, -0.1080322265625, -0.004150390625, 0.0997314453125, 0.20361328125, 0.3074951171875, 0.411376953125, 0.5152587890625, 0.619140625, 0.7230224609375, 0.826904296875, 0.9307861328125, 1.03466796875, 1.1385498046875, 1.242431640625, 1.3463134765625, 1.4501953125, 1.5540771484375, 1.657958984375, 1.7618408203125, 1.86572265625, 1.9696044921875, 2.073486328125, 2.1773681640625, 2.28125, 2.3851318359375, 2.489013671875, 2.5928955078125, 2.69677734375, 2.8006591796875, 2.904541015625, 3.0084228515625, 3.1123046875, 3.2161865234375, 3.320068359375, 3.4239501953125, 3.52783203125, 3.6317138671875, 3.735595703125, 3.8394775390625, 3.943359375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 17.0, 163.0, 515.0, 259.0, 43.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.529300689697266, -29.696321487426758, -28.86334228515625, -28.030364990234375, -27.197385787963867, -26.36440658569336, -25.531429290771484, -24.698450088500977, -23.86547088623047, -23.03249168395996, -22.199512481689453, -21.366535186767578, -20.53355598449707, -19.700576782226562, -18.867599487304688, -18.03462028503418, -17.201641082763672, -16.368661880493164, -15.535683631896973, -14.702705383300781, -13.869726181030273, -13.036746978759766, -12.203768730163574, -11.370790481567383, -10.537811279296875, -9.704832077026367, -8.871853828430176, -8.038875579833984, -7.205896377563477, -6.372917652130127, -5.539938926696777, -4.706960201263428, -3.873981475830078, -3.0410027503967285, -2.208024024963379, -1.3750452995300293, -0.5420665740966797, 0.2909121513366699, 1.1238908767700195, 1.9568696022033691, 2.7898483276367188, 3.6228270530700684, 4.455805778503418, 5.288784503936768, 6.121763229370117, 6.954741954803467, 7.787720680236816, 8.620698928833008, 9.453678131103516, 10.286657333374023, 11.119635581970215, 11.952613830566406, 12.785593032836914, 13.618572235107422, 14.451550483703613, 15.284528732299805, 16.117507934570312, 16.95048713684082, 17.783466339111328, 18.616443634033203, 19.44942283630371, 20.28240203857422, 21.115379333496094, 21.9483585357666, 22.78133773803711]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 1.0, 4.0, 9.0, 5.0, 13.0, 17.0, 17.0, 18.0, 27.0, 21.0, 24.0, 29.0, 44.0, 43.0, 40.0, 37.0, 39.0, 36.0, 44.0, 46.0, 44.0, 39.0, 42.0, 38.0, 39.0, 32.0, 29.0, 29.0, 27.0, 35.0, 23.0, 12.0, 16.0, 7.0, 14.0, 13.0, 11.0, 9.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.385064125061035, -4.243892669677734, -4.102721214294434, -3.961549758911133, -3.820378065109253, -3.679206609725952, -3.5380351543426514, -3.3968636989593506, -3.2556920051574707, -3.11452054977417, -2.973349094390869, -2.8321776390075684, -2.6910059452056885, -2.5498344898223877, -2.408663034439087, -2.267491579055786, -2.1263201236724854, -1.9851486682891846, -1.8439770936965942, -1.7028056383132935, -1.5616340637207031, -1.4204626083374023, -1.2792911529541016, -1.1381196975708008, -0.9969481229782104, -0.8557766079902649, -0.7146050930023193, -0.5734336376190186, -0.432262122631073, -0.29109060764312744, -0.14991915225982666, -0.008747637271881104, 0.13242387771606445, 0.27359539270401, 0.4147668778896332, 0.5559383630752563, 0.6971098780632019, 0.8382813930511475, 0.9794528484344482, 1.120624303817749, 1.2617958784103394, 1.4029673337936401, 1.5441389083862305, 1.6853103637695312, 1.826481819152832, 1.9676533937454224, 2.1088247299194336, 2.2499964237213135, 2.3911678791046143, 2.532339334487915, 2.673510789871216, 2.8146824836730957, 2.9558539390563965, 3.0970253944396973, 3.238196849822998, 3.379368305206299, 3.5205397605895996, 3.6617112159729004, 3.802882671356201, 3.944054126739502, 4.085225582122803, 4.226397514343262, 4.3675689697265625, 4.508740425109863, 4.649911880493164]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 13.0, 13.0, 17.0, 20.0, 21.0, 18.0, 33.0, 25.0, 23.0, 23.0, 31.0, 35.0, 42.0, 32.0, 37.0, 41.0, 48.0, 45.0, 44.0, 36.0, 37.0, 37.0, 37.0, 37.0, 33.0, 28.0, 29.0, 22.0, 13.0, 14.0, 10.0, 17.0, 8.0, 9.0, 7.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67724609375, -0.6556167602539062, -0.6339874267578125, -0.6123580932617188, -0.590728759765625, -0.5690994262695312, -0.5474700927734375, -0.5258407592773438, -0.50421142578125, -0.48258209228515625, -0.4609527587890625, -0.43932342529296875, -0.417694091796875, -0.39606475830078125, -0.3744354248046875, -0.35280609130859375, -0.3311767578125, -0.30954742431640625, -0.2879180908203125, -0.26628875732421875, -0.244659423828125, -0.22303009033203125, -0.2014007568359375, -0.17977142333984375, -0.15814208984375, -0.13651275634765625, -0.1148834228515625, -0.09325408935546875, -0.071624755859375, -0.04999542236328125, -0.0283660888671875, -0.00673675537109375, 0.014892578125, 0.03652191162109375, 0.0581512451171875, 0.07978057861328125, 0.101409912109375, 0.12303924560546875, 0.1446685791015625, 0.16629791259765625, 0.18792724609375, 0.20955657958984375, 0.2311859130859375, 0.25281524658203125, 0.274444580078125, 0.29607391357421875, 0.3177032470703125, 0.33933258056640625, 0.3609619140625, 0.38259124755859375, 0.4042205810546875, 0.42584991455078125, 0.447479248046875, 0.46910858154296875, 0.4907379150390625, 0.5123672485351562, 0.53399658203125, 0.5556259155273438, 0.5772552490234375, 0.5988845825195312, 0.620513916015625, 0.6421432495117188, 0.6637725830078125, 0.6854019165039062, 0.70703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 18.0, 13.0, 34.0, 36.0, 73.0, 112.0, 150.0, 253.0, 390.0, 586.0, 933.0, 1487.0, 2390.0, 3815.0, 6701.0, 11672.0, 20918.0, 39081.0, 76131.0, 149877.0, 253930.0, 223930.0, 121088.0, 60954.0, 32380.0, 17314.0, 9704.0, 5598.0, 3400.0, 2020.0, 1262.0, 807.0, 499.0, 319.0, 232.0, 149.0, 106.0, 59.0, 35.0, 30.0, 28.0, 11.0, 5.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.092529296875, -0.08979511260986328, -0.08706092834472656, -0.08432674407958984, -0.08159255981445312, -0.0788583755493164, -0.07612419128417969, -0.07339000701904297, -0.07065582275390625, -0.06792163848876953, -0.06518745422363281, -0.062453269958496094, -0.059719085693359375, -0.056984901428222656, -0.05425071716308594, -0.05151653289794922, -0.0487823486328125, -0.04604816436767578, -0.04331398010253906, -0.040579795837402344, -0.037845611572265625, -0.035111427307128906, -0.03237724304199219, -0.02964305877685547, -0.02690887451171875, -0.02417469024658203, -0.021440505981445312, -0.018706321716308594, -0.015972137451171875, -0.013237953186035156, -0.010503768920898438, -0.007769584655761719, -0.005035400390625, -0.0023012161254882812, 0.0004329681396484375, 0.0031671524047851562, 0.005901336669921875, 0.008635520935058594, 0.011369705200195312, 0.014103889465332031, 0.01683807373046875, 0.01957225799560547, 0.022306442260742188, 0.025040626525878906, 0.027774810791015625, 0.030508995056152344, 0.03324317932128906, 0.03597736358642578, 0.0387115478515625, 0.04144573211669922, 0.04417991638183594, 0.046914100646972656, 0.049648284912109375, 0.052382469177246094, 0.05511665344238281, 0.05785083770751953, 0.06058502197265625, 0.06331920623779297, 0.06605339050292969, 0.0687875747680664, 0.07152175903320312, 0.07425594329833984, 0.07699012756347656, 0.07972431182861328, 0.08245849609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 15.0, 15.0, 9.0, 14.0, 16.0, 27.0, 20.0, 26.0, 20.0, 30.0, 30.0, 32.0, 41.0, 39.0, 35.0, 27.0, 48.0, 1071.0, 29.0, 34.0, 36.0, 27.0, 27.0, 53.0, 38.0, 21.0, 29.0, 29.0, 17.0, 15.0, 19.0, 15.0, 15.0, 13.0, 14.0, 16.0, 10.0, 8.0, 3.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.55810546875, -0.5404281616210938, -0.5227508544921875, -0.5050735473632812, -0.487396240234375, -0.46971893310546875, -0.4520416259765625, -0.43436431884765625, -0.41668701171875, -0.39900970458984375, -0.3813323974609375, -0.36365509033203125, -0.345977783203125, -0.32830047607421875, -0.3106231689453125, -0.29294586181640625, -0.2752685546875, -0.25759124755859375, -0.2399139404296875, -0.22223663330078125, -0.204559326171875, -0.18688201904296875, -0.1692047119140625, -0.15152740478515625, -0.13385009765625, -0.11617279052734375, -0.0984954833984375, -0.08081817626953125, -0.063140869140625, -0.04546356201171875, -0.0277862548828125, -0.01010894775390625, 0.007568359375, 0.02524566650390625, 0.0429229736328125, 0.06060028076171875, 0.078277587890625, 0.09595489501953125, 0.1136322021484375, 0.13130950927734375, 0.14898681640625, 0.16666412353515625, 0.1843414306640625, 0.20201873779296875, 0.219696044921875, 0.23737335205078125, 0.2550506591796875, 0.27272796630859375, 0.2904052734375, 0.30808258056640625, 0.3257598876953125, 0.34343719482421875, 0.361114501953125, 0.37879180908203125, 0.3964691162109375, 0.41414642333984375, 0.43182373046875, 0.44950103759765625, 0.4671783447265625, 0.48485565185546875, 0.502532958984375, 0.5202102661132812, 0.5378875732421875, 0.5555648803710938, 0.5732421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 11.0, 24.0, 24.0, 39.0, 53.0, 73.0, 112.0, 125.0, 165.0, 241.0, 312.0, 482.0, 660.0, 874.0, 1274.0, 1818.0, 2647.0, 3879.0, 6237.0, 10381.0, 19734.0, 56323.0, 1417023.0, 481997.0, 46870.0, 18056.0, 9712.0, 5824.0, 3730.0, 2473.0, 1662.0, 1158.0, 875.0, 581.0, 455.0, 350.0, 231.0, 168.0, 138.0, 89.0, 65.0, 42.0, 37.0, 26.0, 19.0, 17.0, 11.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.1378173828125, -0.13363265991210938, -0.12944793701171875, -0.12526321411132812, -0.1210784912109375, -0.11689376831054688, -0.11270904541015625, -0.10852432250976562, -0.104339599609375, -0.10015487670898438, -0.09597015380859375, -0.09178543090820312, -0.0876007080078125, -0.08341598510742188, -0.07923126220703125, -0.07504653930664062, -0.07086181640625, -0.06667709350585938, -0.06249237060546875, -0.058307647705078125, -0.0541229248046875, -0.049938201904296875, -0.04575347900390625, -0.041568756103515625, -0.037384033203125, -0.033199310302734375, -0.02901458740234375, -0.024829864501953125, -0.0206451416015625, -0.016460418701171875, -0.01227569580078125, -0.008090972900390625, -0.00390625, 0.000278472900390625, 0.00446319580078125, 0.008647918701171875, 0.0128326416015625, 0.017017364501953125, 0.02120208740234375, 0.025386810302734375, 0.029571533203125, 0.033756256103515625, 0.03794097900390625, 0.042125701904296875, 0.0463104248046875, 0.050495147705078125, 0.05467987060546875, 0.058864593505859375, 0.06304931640625, 0.06723403930664062, 0.07141876220703125, 0.07560348510742188, 0.0797882080078125, 0.08397293090820312, 0.08815765380859375, 0.09234237670898438, 0.096527099609375, 0.10071182250976562, 0.10489654541015625, 0.10908126831054688, 0.1132659912109375, 0.11745071411132812, 0.12163543701171875, 0.12582015991210938, 0.1300048828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 10.0, 5.0, 6.0, 6.0, 8.0, 13.0, 25.0, 30.0, 23.0, 37.0, 39.0, 39.0, 41.0, 49.0, 52.0, 33.0, 45.0, 57.0, 51.0, 48.0, 46.0, 51.0, 44.0, 37.0, 29.0, 37.0, 32.0, 21.0, 20.0, 11.0, 15.0, 9.0, 13.0, 8.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00957489013671875, -0.009250998497009277, -0.008927106857299805, -0.008603215217590332, -0.00827932357788086, -0.007955431938171387, -0.007631540298461914, -0.007307648658752441, -0.006983757019042969, -0.006659865379333496, -0.0063359737396240234, -0.006012082099914551, -0.005688190460205078, -0.0053642988204956055, -0.005040407180786133, -0.00471651554107666, -0.0043926239013671875, -0.004068732261657715, -0.003744840621948242, -0.0034209489822387695, -0.003097057342529297, -0.0027731657028198242, -0.0024492740631103516, -0.002125382423400879, -0.0018014907836914062, -0.0014775991439819336, -0.001153707504272461, -0.0008298158645629883, -0.0005059242248535156, -0.00018203258514404297, 0.0001418590545654297, 0.00046575069427490234, 0.000789642333984375, 0.0011135339736938477, 0.0014374256134033203, 0.001761317253112793, 0.0020852088928222656, 0.0024091005325317383, 0.002732992172241211, 0.0030568838119506836, 0.0033807754516601562, 0.003704667091369629, 0.0040285587310791016, 0.004352450370788574, 0.004676342010498047, 0.0050002336502075195, 0.005324125289916992, 0.005648016929626465, 0.0059719085693359375, 0.00629580020904541, 0.006619691848754883, 0.0069435834884643555, 0.007267475128173828, 0.007591366767883301, 0.007915258407592773, 0.008239150047302246, 0.008563041687011719, 0.008886933326721191, 0.009210824966430664, 0.009534716606140137, 0.00985860824584961, 0.010182499885559082, 0.010506391525268555, 0.010830283164978027, 0.0111541748046875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 17.0, 15.0, 10.0, 15.0, 18.0, 28.0, 50.0, 64.0, 64.0, 80.0, 121.0, 180.0, 238.0, 413.0, 1003.0, 35333.0, 1004387.0, 4655.0, 700.0, 315.0, 210.0, 159.0, 119.0, 94.0, 66.0, 43.0, 38.0, 36.0, 26.0, 11.0, 9.0, 4.0, 8.0, 8.0, 9.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2069091796875, -0.2008800506591797, -0.19485092163085938, -0.18882179260253906, -0.18279266357421875, -0.17676353454589844, -0.17073440551757812, -0.1647052764892578, -0.1586761474609375, -0.1526470184326172, -0.14661788940429688, -0.14058876037597656, -0.13455963134765625, -0.12853050231933594, -0.12250137329101562, -0.11647224426269531, -0.110443115234375, -0.10441398620605469, -0.09838485717773438, -0.09235572814941406, -0.08632659912109375, -0.08029747009277344, -0.07426834106445312, -0.06823921203613281, -0.0622100830078125, -0.05618095397949219, -0.050151824951171875, -0.04412269592285156, -0.03809356689453125, -0.03206443786621094, -0.026035308837890625, -0.020006179809570312, -0.01397705078125, -0.007947921752929688, -0.001918792724609375, 0.0041103363037109375, 0.01013946533203125, 0.016168594360351562, 0.022197723388671875, 0.028226852416992188, 0.0342559814453125, 0.04028511047363281, 0.046314239501953125, 0.05234336853027344, 0.05837249755859375, 0.06440162658691406, 0.07043075561523438, 0.07645988464355469, 0.082489013671875, 0.08851814270019531, 0.09454727172851562, 0.10057640075683594, 0.10660552978515625, 0.11263465881347656, 0.11866378784179688, 0.12469291687011719, 0.1307220458984375, 0.1367511749267578, 0.14278030395507812, 0.14880943298339844, 0.15483856201171875, 0.16086769104003906, 0.16689682006835938, 0.1729259490966797, 0.178955078125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 16.0, 153.0, 786.0, 56.0, 2.0, 2.0, 1.0], "bins": [-0.28487062454223633, -0.28007587790489197, -0.27528116106987, -0.27048641443252563, -0.26569169759750366, -0.2608969509601593, -0.25610220432281494, -0.25130748748779297, -0.2465127557516098, -0.24171802401542664, -0.23692329227924347, -0.2321285605430603, -0.22733381390571594, -0.22253908216953278, -0.2177443504333496, -0.21294961869716644, -0.20815488696098328, -0.2033601552248001, -0.19856542348861694, -0.19377067685127258, -0.18897594511508942, -0.18418121337890625, -0.17938648164272308, -0.17459174990653992, -0.16979700326919556, -0.1650022715330124, -0.16020753979682922, -0.15541279315948486, -0.1506180614233017, -0.14582332968711853, -0.14102859795093536, -0.1362338662147522, -0.13143913447856903, -0.12664440274238586, -0.1218496635556221, -0.11705493181943893, -0.11226020008325577, -0.107465460896492, -0.10267072916030884, -0.09787599742412567, -0.09308125823736191, -0.08828652650117874, -0.08349178731441498, -0.07869705557823181, -0.07390232384204865, -0.06910759210586548, -0.06431285291910172, -0.05951812118291855, -0.054723381996154785, -0.04992864653468132, -0.045133914798498154, -0.04033917933702469, -0.03554444760084152, -0.030749712139368057, -0.025954976677894592, -0.021160244941711426, -0.01636551134288311, -0.011570777744054794, -0.006776043213903904, -0.0019813086837530136, 0.002813424915075302, 0.007608158513903618, 0.012402893975377083, 0.01719762571156025, 0.021992361173033714]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 5.0, 9.0, 10.0, 16.0, 17.0, 17.0, 24.0, 18.0, 26.0, 27.0, 31.0, 28.0, 33.0, 45.0, 36.0, 28.0, 46.0, 48.0, 42.0, 46.0, 39.0, 40.0, 37.0, 44.0, 34.0, 32.0, 33.0, 23.0, 23.0, 25.0, 17.0, 10.0, 12.0, 17.0, 10.0, 5.0, 7.0, 1.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.024955391883850098, -0.02417573519051075, -0.023396078497171402, -0.022616421803832054, -0.021836765110492706, -0.02105710841715336, -0.02027745172381401, -0.019497795030474663, -0.018718138337135315, -0.017938481643795967, -0.01715882495045662, -0.01637916825711727, -0.015599511563777924, -0.014819854870438576, -0.014040198177099228, -0.01326054148375988, -0.012480884790420532, -0.011701228097081184, -0.010921571403741837, -0.010141914710402489, -0.009362258017063141, -0.008582601323723793, -0.007802944630384445, -0.007023287937045097, -0.0062436312437057495, -0.005463974550366402, -0.004684317857027054, -0.003904661163687706, -0.003125004470348358, -0.0023453477770090103, -0.0015656910836696625, -0.0007860343903303146, -6.377696990966797e-06, 0.000773278996348381, 0.0015529356896877289, 0.0023325923830270767, 0.0031122490763664246, 0.0038919057697057724, 0.00467156246304512, 0.005451219156384468, 0.006230875849723816, 0.007010532543063164, 0.007790189236402512, 0.00856984592974186, 0.009349502623081207, 0.010129159316420555, 0.010908816009759903, 0.01168847270309925, 0.012468129396438599, 0.013247786089777946, 0.014027442783117294, 0.014807099476456642, 0.01558675616979599, 0.016366412863135338, 0.017146069556474686, 0.017925726249814034, 0.01870538294315338, 0.01948503963649273, 0.020264696329832077, 0.021044353023171425, 0.021824009716510773, 0.02260366640985012, 0.02338332310318947, 0.024162979796528816, 0.024942636489868164]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 14.0, 12.0, 17.0, 20.0, 22.0, 18.0, 32.0, 25.0, 24.0, 20.0, 33.0, 34.0, 43.0, 33.0, 37.0, 42.0, 44.0, 48.0, 41.0, 37.0, 39.0, 34.0, 39.0, 35.0, 34.0, 28.0, 29.0, 20.0, 16.0, 13.0, 12.0, 16.0, 7.0, 10.0, 7.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6767578125, -0.6551513671875, -0.633544921875, -0.6119384765625, -0.59033203125, -0.5687255859375, -0.547119140625, -0.5255126953125, -0.50390625, -0.4822998046875, -0.460693359375, -0.4390869140625, -0.41748046875, -0.3958740234375, -0.374267578125, -0.3526611328125, -0.3310546875, -0.3094482421875, -0.287841796875, -0.2662353515625, -0.24462890625, -0.2230224609375, -0.201416015625, -0.1798095703125, -0.158203125, -0.1365966796875, -0.114990234375, -0.0933837890625, -0.07177734375, -0.0501708984375, -0.028564453125, -0.0069580078125, 0.0146484375, 0.0362548828125, 0.057861328125, 0.0794677734375, 0.10107421875, 0.1226806640625, 0.144287109375, 0.1658935546875, 0.1875, 0.2091064453125, 0.230712890625, 0.2523193359375, 0.27392578125, 0.2955322265625, 0.317138671875, 0.3387451171875, 0.3603515625, 0.3819580078125, 0.403564453125, 0.4251708984375, 0.44677734375, 0.4683837890625, 0.489990234375, 0.5115966796875, 0.533203125, 0.5548095703125, 0.576416015625, 0.5980224609375, 0.61962890625, 0.6412353515625, 0.662841796875, 0.6844482421875, 0.7060546875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 27.0, 36.0, 47.0, 72.0, 76.0, 132.0, 136.0, 227.0, 317.0, 481.0, 748.0, 1201.0, 2020.0, 3712.0, 7468.0, 17735.0, 50109.0, 171471.0, 542407.0, 166811.0, 49216.0, 17534.0, 7489.0, 3559.0, 1974.0, 1127.0, 763.0, 483.0, 365.0, 224.0, 139.0, 102.0, 85.0, 57.0, 40.0, 35.0, 22.0, 13.0, 22.0, 12.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2566375732421875, -1.215423583984375, -1.1742095947265625, -1.13299560546875, -1.0917816162109375, -1.050567626953125, -1.0093536376953125, -0.9681396484375, -0.9269256591796875, -0.885711669921875, -0.8444976806640625, -0.80328369140625, -0.7620697021484375, -0.720855712890625, -0.6796417236328125, -0.638427734375, -0.5972137451171875, -0.555999755859375, -0.5147857666015625, -0.47357177734375, -0.4323577880859375, -0.391143798828125, -0.3499298095703125, -0.3087158203125, -0.2675018310546875, -0.226287841796875, -0.1850738525390625, -0.14385986328125, -0.1026458740234375, -0.061431884765625, -0.0202178955078125, 0.02099609375, 0.0622100830078125, 0.103424072265625, 0.1446380615234375, 0.18585205078125, 0.2270660400390625, 0.268280029296875, 0.3094940185546875, 0.3507080078125, 0.3919219970703125, 0.433135986328125, 0.4743499755859375, 0.51556396484375, 0.5567779541015625, 0.597991943359375, 0.6392059326171875, 0.680419921875, 0.7216339111328125, 0.762847900390625, 0.8040618896484375, 0.84527587890625, 0.8864898681640625, 0.927703857421875, 0.9689178466796875, 1.0101318359375, 1.0513458251953125, 1.092559814453125, 1.1337738037109375, 1.17498779296875, 1.2162017822265625, 1.257415771484375, 1.2986297607421875, 1.33984375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 7.0, 12.0, 14.0, 19.0, 17.0, 21.0, 26.0, 34.0, 31.0, 30.0, 48.0, 60.0, 59.0, 96.0, 204.0, 1433.0, 318.0, 169.0, 91.0, 55.0, 56.0, 44.0, 41.0, 34.0, 23.0, 20.0, 16.0, 12.0, 13.0, 13.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.033203125, -1.9749755859375, -1.916748046875, -1.8585205078125, -1.80029296875, -1.7420654296875, -1.683837890625, -1.6256103515625, -1.5673828125, -1.5091552734375, -1.450927734375, -1.3927001953125, -1.33447265625, -1.2762451171875, -1.218017578125, -1.1597900390625, -1.1015625, -1.0433349609375, -0.985107421875, -0.9268798828125, -0.86865234375, -0.8104248046875, -0.752197265625, -0.6939697265625, -0.6357421875, -0.5775146484375, -0.519287109375, -0.4610595703125, -0.40283203125, -0.3446044921875, -0.286376953125, -0.2281494140625, -0.169921875, -0.1116943359375, -0.053466796875, 0.0047607421875, 0.06298828125, 0.1212158203125, 0.179443359375, 0.2376708984375, 0.2958984375, 0.3541259765625, 0.412353515625, 0.4705810546875, 0.52880859375, 0.5870361328125, 0.645263671875, 0.7034912109375, 0.76171875, 0.8199462890625, 0.878173828125, 0.9364013671875, 0.99462890625, 1.0528564453125, 1.111083984375, 1.1693115234375, 1.2275390625, 1.2857666015625, 1.343994140625, 1.4022216796875, 1.46044921875, 1.5186767578125, 1.576904296875, 1.6351318359375, 1.693359375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 3.0, 13.0, 16.0, 23.0, 19.0, 37.0, 57.0, 84.0, 108.0, 152.0, 202.0, 300.0, 521.0, 1021.0, 2675.0, 43261.0, 3070558.0, 22006.0, 2262.0, 876.0, 499.0, 303.0, 215.0, 133.0, 103.0, 66.0, 48.0, 34.0, 24.0, 21.0, 22.0, 9.0, 9.0, 4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45098876953125, -4.2886962890625, -4.12640380859375, -3.964111328125, -3.80181884765625, -3.6395263671875, -3.47723388671875, -3.31494140625, -3.15264892578125, -2.9903564453125, -2.82806396484375, -2.665771484375, -2.50347900390625, -2.3411865234375, -2.17889404296875, -2.0166015625, -1.85430908203125, -1.6920166015625, -1.52972412109375, -1.367431640625, -1.20513916015625, -1.0428466796875, -0.88055419921875, -0.71826171875, -0.55596923828125, -0.3936767578125, -0.23138427734375, -0.069091796875, 0.09320068359375, 0.2554931640625, 0.41778564453125, 0.580078125, 0.74237060546875, 0.9046630859375, 1.06695556640625, 1.229248046875, 1.39154052734375, 1.5538330078125, 1.71612548828125, 1.87841796875, 2.04071044921875, 2.2030029296875, 2.36529541015625, 2.527587890625, 2.68988037109375, 2.8521728515625, 3.01446533203125, 3.1767578125, 3.33905029296875, 3.5013427734375, 3.66363525390625, 3.825927734375, 3.98822021484375, 4.1505126953125, 4.31280517578125, 4.47509765625, 4.63739013671875, 4.7996826171875, 4.96197509765625, 5.124267578125, 5.28656005859375, 5.4488525390625, 5.61114501953125, 5.7734375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 22.0, 88.0, 320.0, 412.0, 141.0, 24.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.477821350097656, -12.838793754577637, -12.199766159057617, -11.560738563537598, -10.921710968017578, -10.282684326171875, -9.643656730651855, -9.004629135131836, -8.365601539611816, -7.726573944091797, -7.087546348571777, -6.448519229888916, -5.8094916343688965, -5.170464038848877, -4.531436920166016, -3.892409324645996, -3.2533817291259766, -2.614354133605957, -1.9753267765045166, -1.3362993001937866, -0.6972718238830566, -0.05824422836303711, 0.5807831287384033, 1.2198104858398438, 1.8588380813598633, 2.497865676879883, 3.1368930339813232, 3.7759203910827637, 4.414947986602783, 5.053975582122803, 5.693002700805664, 6.332030296325684, 6.971059799194336, 7.6100873947143555, 8.249114990234375, 8.888142585754395, 9.527170181274414, 10.166196823120117, 10.805224418640137, 11.444252014160156, 12.083279609680176, 12.722307205200195, 13.361334800720215, 14.000362396240234, 14.639389038085938, 15.278417587280273, 15.917444229125977, 16.556472778320312, 17.195499420166016, 17.83452606201172, 18.473554611206055, 19.112581253051758, 19.751609802246094, 20.390636444091797, 21.029664993286133, 21.668691635131836, 22.307720184326172, 22.946746826171875, 23.58577537536621, 24.224802017211914, 24.86383056640625, 25.502857208251953, 26.14188575744629, 26.780912399291992, 27.419939041137695]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 2.0, 7.0, 9.0, 14.0, 8.0, 11.0, 9.0, 12.0, 17.0, 23.0, 27.0, 24.0, 22.0, 40.0, 24.0, 33.0, 31.0, 41.0, 38.0, 33.0, 34.0, 44.0, 40.0, 38.0, 41.0, 44.0, 35.0, 38.0, 35.0, 27.0, 30.0, 26.0, 26.0, 19.0, 18.0, 18.0, 11.0, 14.0, 11.0, 2.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.012927532196045, -4.857840538024902, -4.702754020690918, -4.547667026519775, -4.392580509185791, -4.237493515014648, -4.082406997680664, -3.9273200035095215, -3.772233486175537, -3.6171467304229736, -3.46205997467041, -3.3069732189178467, -3.151886463165283, -2.9967997074127197, -2.8417129516601562, -2.6866259574890137, -2.53153920173645, -2.3764524459838867, -2.2213656902313232, -2.0662789344787598, -1.9111921787261963, -1.7561054229736328, -1.6010185480117798, -1.4459317922592163, -1.2908450365066528, -1.1357582807540894, -0.9806715250015259, -0.8255847096443176, -0.6704979538917542, -0.5154111981391907, -0.3603243827819824, -0.20523762702941895, -0.05015087127685547, 0.1049358993768692, 0.26002267003059387, 0.41510945558547974, 0.5701962113380432, 0.7252829670906067, 0.8803697824478149, 1.0354565382003784, 1.190543293952942, 1.3456300497055054, 1.5007168054580688, 1.6558036804199219, 1.8108904361724854, 1.9659771919250488, 2.1210639476776123, 2.276150703430176, 2.4312374591827393, 2.5863242149353027, 2.741410970687866, 2.8964977264404297, 3.051584482192993, 3.2066712379455566, 3.361758232116699, 3.5168447494506836, 3.671931743621826, 3.8270184993743896, 3.982105255126953, 4.137192249298096, 4.29227876663208, 4.447365760803223, 4.602452278137207, 4.75753927230835, 4.912625789642334]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 5.0, 9.0, 9.0, 7.0, 10.0, 15.0, 18.0, 23.0, 16.0, 24.0, 21.0, 17.0, 31.0, 23.0, 31.0, 38.0, 29.0, 35.0, 30.0, 29.0, 32.0, 37.0, 53.0, 37.0, 43.0, 35.0, 31.0, 31.0, 37.0, 27.0, 26.0, 34.0, 25.0, 18.0, 20.0, 12.0, 12.0, 12.0, 10.0, 12.0, 5.0, 6.0, 7.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6867523193359375, -0.665496826171875, -0.6442413330078125, -0.62298583984375, -0.6017303466796875, -0.580474853515625, -0.5592193603515625, -0.5379638671875, -0.5167083740234375, -0.495452880859375, -0.4741973876953125, -0.45294189453125, -0.4316864013671875, -0.410430908203125, -0.3891754150390625, -0.367919921875, -0.3466644287109375, -0.325408935546875, -0.3041534423828125, -0.28289794921875, -0.2616424560546875, -0.240386962890625, -0.2191314697265625, -0.1978759765625, -0.1766204833984375, -0.155364990234375, -0.1341094970703125, -0.11285400390625, -0.0915985107421875, -0.070343017578125, -0.0490875244140625, -0.02783203125, -0.0065765380859375, 0.014678955078125, 0.0359344482421875, 0.05718994140625, 0.0784454345703125, 0.099700927734375, 0.1209564208984375, 0.1422119140625, 0.1634674072265625, 0.184722900390625, 0.2059783935546875, 0.22723388671875, 0.2484893798828125, 0.269744873046875, 0.2910003662109375, 0.312255859375, 0.3335113525390625, 0.354766845703125, 0.3760223388671875, 0.39727783203125, 0.4185333251953125, 0.439788818359375, 0.4610443115234375, 0.4822998046875, 0.5035552978515625, 0.524810791015625, 0.5460662841796875, 0.56732177734375, 0.5885772705078125, 0.609832763671875, 0.6310882568359375, 0.65234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 12.0, 10.0, 16.0, 30.0, 31.0, 49.0, 49.0, 97.0, 154.0, 183.0, 300.0, 489.0, 725.0, 1207.0, 2006.0, 3631.0, 7272.0, 17188.0, 63233.0, 474760.0, 2501654.0, 953956.0, 121997.0, 25042.0, 9620.0, 4426.0, 2379.0, 1349.0, 796.0, 503.0, 358.0, 242.0, 147.0, 95.0, 72.0, 39.0, 39.0, 29.0, 22.0, 11.0, 15.0, 9.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.41796875, -1.371734619140625, -1.32550048828125, -1.279266357421875, -1.2330322265625, -1.186798095703125, -1.14056396484375, -1.094329833984375, -1.048095703125, -1.001861572265625, -0.95562744140625, -0.909393310546875, -0.8631591796875, -0.816925048828125, -0.77069091796875, -0.724456787109375, -0.67822265625, -0.631988525390625, -0.58575439453125, -0.539520263671875, -0.4932861328125, -0.447052001953125, -0.40081787109375, -0.354583740234375, -0.308349609375, -0.262115478515625, -0.21588134765625, -0.169647216796875, -0.1234130859375, -0.077178955078125, -0.03094482421875, 0.015289306640625, 0.0615234375, 0.107757568359375, 0.15399169921875, 0.200225830078125, 0.2464599609375, 0.292694091796875, 0.33892822265625, 0.385162353515625, 0.431396484375, 0.477630615234375, 0.52386474609375, 0.570098876953125, 0.6163330078125, 0.662567138671875, 0.70880126953125, 0.755035400390625, 0.80126953125, 0.847503662109375, 0.89373779296875, 0.939971923828125, 0.9862060546875, 1.032440185546875, 1.07867431640625, 1.124908447265625, 1.171142578125, 1.217376708984375, 1.26361083984375, 1.309844970703125, 1.3560791015625, 1.402313232421875, 1.44854736328125, 1.494781494140625, 1.541015625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 16.0, 27.0, 23.0, 41.0, 62.0, 69.0, 98.0, 151.0, 194.0, 264.0, 397.0, 493.0, 609.0, 450.0, 361.0, 230.0, 163.0, 104.0, 72.0, 55.0, 43.0, 40.0, 27.0, 12.0, 11.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.28515625, -1.24774169921875, -1.2103271484375, -1.17291259765625, -1.135498046875, -1.09808349609375, -1.0606689453125, -1.02325439453125, -0.98583984375, -0.94842529296875, -0.9110107421875, -0.87359619140625, -0.836181640625, -0.79876708984375, -0.7613525390625, -0.72393798828125, -0.6865234375, -0.64910888671875, -0.6116943359375, -0.57427978515625, -0.536865234375, -0.49945068359375, -0.4620361328125, -0.42462158203125, -0.38720703125, -0.34979248046875, -0.3123779296875, -0.27496337890625, -0.237548828125, -0.20013427734375, -0.1627197265625, -0.12530517578125, -0.087890625, -0.05047607421875, -0.0130615234375, 0.02435302734375, 0.061767578125, 0.09918212890625, 0.1365966796875, 0.17401123046875, 0.21142578125, 0.24884033203125, 0.2862548828125, 0.32366943359375, 0.361083984375, 0.39849853515625, 0.4359130859375, 0.47332763671875, 0.5107421875, 0.54815673828125, 0.5855712890625, 0.62298583984375, 0.660400390625, 0.69781494140625, 0.7352294921875, 0.77264404296875, 0.81005859375, 0.84747314453125, 0.8848876953125, 0.92230224609375, 0.959716796875, 0.99713134765625, 1.0345458984375, 1.07196044921875, 1.109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 21.0, 20.0, 47.0, 44.0, 85.0, 142.0, 254.0, 484.0, 914.0, 2145.0, 5105.0, 14353.0, 56524.0, 461005.0, 3207193.0, 373649.0, 50235.0, 13359.0, 4617.0, 2007.0, 936.0, 464.0, 242.0, 156.0, 94.0, 49.0, 37.0, 17.0, 18.0, 12.0, 9.0, 3.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8837890625, -1.8219451904296875, -1.760101318359375, -1.6982574462890625, -1.63641357421875, -1.5745697021484375, -1.512725830078125, -1.4508819580078125, -1.3890380859375, -1.3271942138671875, -1.265350341796875, -1.2035064697265625, -1.14166259765625, -1.0798187255859375, -1.017974853515625, -0.9561309814453125, -0.894287109375, -0.8324432373046875, -0.770599365234375, -0.7087554931640625, -0.64691162109375, -0.5850677490234375, -0.523223876953125, -0.4613800048828125, -0.3995361328125, -0.3376922607421875, -0.275848388671875, -0.2140045166015625, -0.15216064453125, -0.0903167724609375, -0.028472900390625, 0.0333709716796875, 0.09521484375, 0.1570587158203125, 0.218902587890625, 0.2807464599609375, 0.34259033203125, 0.4044342041015625, 0.466278076171875, 0.5281219482421875, 0.5899658203125, 0.6518096923828125, 0.713653564453125, 0.7754974365234375, 0.83734130859375, 0.8991851806640625, 0.961029052734375, 1.0228729248046875, 1.084716796875, 1.1465606689453125, 1.208404541015625, 1.2702484130859375, 1.33209228515625, 1.3939361572265625, 1.455780029296875, 1.5176239013671875, 1.5794677734375, 1.6413116455078125, 1.703155517578125, 1.7649993896484375, 1.82684326171875, 1.8886871337890625, 1.950531005859375, 2.0123748779296875, 2.07421875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 12.0, 28.0, 116.0, 329.0, 357.0, 120.0, 35.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.94904899597168, -17.353107452392578, -16.757165908813477, -16.161224365234375, -15.565281867980957, -14.969340324401855, -14.373397827148438, -13.777456283569336, -13.181514739990234, -12.585573196411133, -11.989631652832031, -11.393689155578613, -10.797747611999512, -10.20180606842041, -9.605863571166992, -9.00992202758789, -8.413980484008789, -7.8180389404296875, -7.222096920013428, -6.626154899597168, -6.030213356018066, -5.434271812438965, -4.838329792022705, -4.242387771606445, -3.6464462280273438, -3.050504446029663, -2.4545626640319824, -1.8586208820343018, -1.262679100036621, -0.6667373180389404, -0.07079553604125977, 0.525146484375, 1.1210899353027344, 1.717031717300415, 2.3129734992980957, 2.9089152812957764, 3.504857063293457, 4.100798606872559, 4.696740627288818, 5.292682647705078, 5.88862419128418, 6.484565734863281, 7.080507755279541, 7.676449775695801, 8.272391319274902, 8.868332862854004, 9.464275360107422, 10.060216903686523, 10.656158447265625, 11.252099990844727, 11.848041534423828, 12.443984031677246, 13.039925575256348, 13.63586711883545, 14.231809616088867, 14.827751159667969, 15.42369270324707, 16.019634246826172, 16.615575790405273, 17.211517333984375, 17.80746078491211, 18.40340232849121, 18.999343872070312, 19.595285415649414, 20.191226959228516]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 8.0, 11.0, 16.0, 17.0, 27.0, 38.0, 30.0, 38.0, 42.0, 43.0, 63.0, 54.0, 66.0, 62.0, 52.0, 61.0, 41.0, 48.0, 53.0, 39.0, 35.0, 32.0, 27.0, 14.0, 15.0, 12.0, 14.0, 10.0, 3.0, 9.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.929605484008789, -5.752139091491699, -5.574672698974609, -5.3972063064575195, -5.21973991394043, -5.04227352142334, -4.86480712890625, -4.68734073638916, -4.50987434387207, -4.3324079513549805, -4.154941558837891, -3.977475166320801, -3.800008773803711, -3.622542381286621, -3.4450762271881104, -3.2676098346710205, -3.0901436805725098, -2.91267728805542, -2.73521089553833, -2.5577445030212402, -2.3802781105041504, -2.2028117179870605, -2.02534556388855, -1.84787917137146, -1.6704127788543701, -1.4929463863372803, -1.3154799938201904, -1.1380137205123901, -0.9605473279953003, -0.7830809354782104, -0.6056146621704102, -0.4281482696533203, -0.25068140029907227, -0.07321503758430481, 0.10425132513046265, 0.2817176580429077, 0.45918405055999756, 0.6366504430770874, 0.8141167163848877, 0.9915831089019775, 1.1690495014190674, 1.3465158939361572, 1.523982286453247, 1.7014485597610474, 1.8789149522781372, 2.0563812255859375, 2.2338476181030273, 2.411314010620117, 2.588780403137207, 2.766246795654297, 2.9437131881713867, 3.1211795806884766, 3.2986459732055664, 3.4761123657226562, 3.653578519821167, 3.831044912338257, 4.008511543273926, 4.185977935791016, 4.3634443283081055, 4.540910720825195, 4.718377113342285, 4.895843505859375, 5.073309898376465, 5.250776290893555, 5.428242206573486]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 7.0, 5.0, 6.0, 8.0, 11.0, 14.0, 21.0, 16.0, 21.0, 18.0, 18.0, 31.0, 25.0, 33.0, 24.0, 30.0, 32.0, 34.0, 39.0, 37.0, 45.0, 47.0, 37.0, 43.0, 31.0, 31.0, 27.0, 32.0, 23.0, 31.0, 27.0, 21.0, 22.0, 18.0, 17.0, 18.0, 18.0, 12.0, 19.0, 17.0, 6.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.599609375, -0.5804595947265625, -0.561309814453125, -0.5421600341796875, -0.52301025390625, -0.5038604736328125, -0.484710693359375, -0.4655609130859375, -0.4464111328125, -0.4272613525390625, -0.408111572265625, -0.3889617919921875, -0.36981201171875, -0.3506622314453125, -0.331512451171875, -0.3123626708984375, -0.293212890625, -0.2740631103515625, -0.254913330078125, -0.2357635498046875, -0.21661376953125, -0.1974639892578125, -0.178314208984375, -0.1591644287109375, -0.1400146484375, -0.1208648681640625, -0.101715087890625, -0.0825653076171875, -0.06341552734375, -0.0442657470703125, -0.025115966796875, -0.0059661865234375, 0.01318359375, 0.0323333740234375, 0.051483154296875, 0.0706329345703125, 0.08978271484375, 0.1089324951171875, 0.128082275390625, 0.1472320556640625, 0.1663818359375, 0.1855316162109375, 0.204681396484375, 0.2238311767578125, 0.24298095703125, 0.2621307373046875, 0.281280517578125, 0.3004302978515625, 0.319580078125, 0.3387298583984375, 0.357879638671875, 0.3770294189453125, 0.39617919921875, 0.4153289794921875, 0.434478759765625, 0.4536285400390625, 0.4727783203125, 0.4919281005859375, 0.511077880859375, 0.5302276611328125, 0.54937744140625, 0.5685272216796875, 0.587677001953125, 0.6068267822265625, 0.6259765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 8.0, 10.0, 7.0, 20.0, 25.0, 33.0, 50.0, 85.0, 105.0, 153.0, 233.0, 286.0, 473.0, 686.0, 979.0, 1493.0, 2341.0, 3556.0, 5649.0, 9010.0, 14585.0, 24048.0, 41182.0, 72079.0, 132126.0, 222143.0, 217501.0, 127806.0, 70208.0, 39292.0, 23642.0, 14090.0, 8797.0, 5497.0, 3560.0, 2239.0, 1509.0, 923.0, 664.0, 401.0, 327.0, 206.0, 159.0, 127.0, 68.0, 45.0, 38.0, 25.0, 17.0, 10.0, 11.0, 5.0, 3.0, 5.0, 7.0, 1.0, 3.0, 2.0], "bins": [-0.06817626953125, -0.06604385375976562, -0.06391143798828125, -0.061779022216796875, -0.0596466064453125, -0.057514190673828125, -0.05538177490234375, -0.053249359130859375, -0.051116943359375, -0.048984527587890625, -0.04685211181640625, -0.044719696044921875, -0.0425872802734375, -0.040454864501953125, -0.03832244873046875, -0.036190032958984375, -0.0340576171875, -0.031925201416015625, -0.02979278564453125, -0.027660369873046875, -0.0255279541015625, -0.023395538330078125, -0.02126312255859375, -0.019130706787109375, -0.016998291015625, -0.014865875244140625, -0.01273345947265625, -0.010601043701171875, -0.0084686279296875, -0.006336212158203125, -0.00420379638671875, -0.002071380615234375, 6.103515625e-05, 0.002193450927734375, 0.00432586669921875, 0.006458282470703125, 0.0085906982421875, 0.010723114013671875, 0.01285552978515625, 0.014987945556640625, 0.017120361328125, 0.019252777099609375, 0.02138519287109375, 0.023517608642578125, 0.0256500244140625, 0.027782440185546875, 0.02991485595703125, 0.032047271728515625, 0.0341796875, 0.036312103271484375, 0.03844451904296875, 0.040576934814453125, 0.0427093505859375, 0.044841766357421875, 0.04697418212890625, 0.049106597900390625, 0.051239013671875, 0.053371429443359375, 0.05550384521484375, 0.057636260986328125, 0.0597686767578125, 0.061901092529296875, 0.06403350830078125, 0.06616592407226562, 0.06829833984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 15.0, 13.0, 21.0, 18.0, 23.0, 22.0, 29.0, 27.0, 39.0, 38.0, 38.0, 40.0, 47.0, 31.0, 49.0, 32.0, 1063.0, 47.0, 34.0, 34.0, 38.0, 34.0, 33.0, 29.0, 36.0, 27.0, 23.0, 17.0, 16.0, 16.0, 13.0, 11.0, 10.0, 7.0, 10.0, 5.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5517578125, -0.533477783203125, -0.51519775390625, -0.496917724609375, -0.4786376953125, -0.460357666015625, -0.44207763671875, -0.423797607421875, -0.405517578125, -0.387237548828125, -0.36895751953125, -0.350677490234375, -0.3323974609375, -0.314117431640625, -0.29583740234375, -0.277557373046875, -0.25927734375, -0.240997314453125, -0.22271728515625, -0.204437255859375, -0.1861572265625, -0.167877197265625, -0.14959716796875, -0.131317138671875, -0.113037109375, -0.094757080078125, -0.07647705078125, -0.058197021484375, -0.0399169921875, -0.021636962890625, -0.00335693359375, 0.014923095703125, 0.033203125, 0.051483154296875, 0.06976318359375, 0.088043212890625, 0.1063232421875, 0.124603271484375, 0.14288330078125, 0.161163330078125, 0.179443359375, 0.197723388671875, 0.21600341796875, 0.234283447265625, 0.2525634765625, 0.270843505859375, 0.28912353515625, 0.307403564453125, 0.32568359375, 0.343963623046875, 0.36224365234375, 0.380523681640625, 0.3988037109375, 0.417083740234375, 0.43536376953125, 0.453643798828125, 0.471923828125, 0.490203857421875, 0.50848388671875, 0.526763916015625, 0.5450439453125, 0.563323974609375, 0.58160400390625, 0.599884033203125, 0.6181640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 7.0, 14.0, 21.0, 26.0, 47.0, 80.0, 107.0, 154.0, 220.0, 338.0, 541.0, 798.0, 1411.0, 2171.0, 3607.0, 6425.0, 12371.0, 30498.0, 239290.0, 1711759.0, 50684.0, 16612.0, 8227.0, 4583.0, 2637.0, 1633.0, 1011.0, 620.0, 427.0, 257.0, 178.0, 114.0, 87.0, 52.0, 30.0, 25.0, 17.0, 15.0, 9.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1917724609375, -0.18616294860839844, -0.18055343627929688, -0.1749439239501953, -0.16933441162109375, -0.1637248992919922, -0.15811538696289062, -0.15250587463378906, -0.1468963623046875, -0.14128684997558594, -0.13567733764648438, -0.1300678253173828, -0.12445831298828125, -0.11884880065917969, -0.11323928833007812, -0.10762977600097656, -0.102020263671875, -0.09641075134277344, -0.09080123901367188, -0.08519172668457031, -0.07958221435546875, -0.07397270202636719, -0.06836318969726562, -0.06275367736816406, -0.0571441650390625, -0.05153465270996094, -0.045925140380859375, -0.04031562805175781, -0.03470611572265625, -0.029096603393554688, -0.023487091064453125, -0.017877578735351562, -0.01226806640625, -0.0066585540771484375, -0.001049041748046875, 0.0045604705810546875, 0.01016998291015625, 0.015779495239257812, 0.021389007568359375, 0.026998519897460938, 0.0326080322265625, 0.03821754455566406, 0.043827056884765625, 0.04943656921386719, 0.05504608154296875, 0.06065559387207031, 0.06626510620117188, 0.07187461853027344, 0.077484130859375, 0.08309364318847656, 0.08870315551757812, 0.09431266784667969, 0.09992218017578125, 0.10553169250488281, 0.11114120483398438, 0.11675071716308594, 0.1223602294921875, 0.12796974182128906, 0.13357925415039062, 0.1391887664794922, 0.14479827880859375, 0.1504077911376953, 0.15601730346679688, 0.16162681579589844, 0.167236328125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 7.0, 5.0, 6.0, 6.0, 11.0, 19.0, 9.0, 17.0, 22.0, 19.0, 28.0, 20.0, 30.0, 29.0, 42.0, 48.0, 45.0, 35.0, 35.0, 28.0, 44.0, 41.0, 21.0, 28.0, 45.0, 40.0, 34.0, 30.0, 31.0, 39.0, 30.0, 29.0, 20.0, 18.0, 13.0, 20.0, 13.0, 6.0, 4.0, 8.0, 7.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00519561767578125, -0.005035281181335449, -0.0048749446868896484, -0.004714608192443848, -0.004554271697998047, -0.004393935203552246, -0.004233598709106445, -0.0040732622146606445, -0.003912925720214844, -0.003752589225769043, -0.003592252731323242, -0.0034319162368774414, -0.0032715797424316406, -0.00311124324798584, -0.002950906753540039, -0.0027905702590942383, -0.0026302337646484375, -0.0024698972702026367, -0.002309560775756836, -0.002149224281311035, -0.0019888877868652344, -0.0018285512924194336, -0.0016682147979736328, -0.001507878303527832, -0.0013475418090820312, -0.0011872053146362305, -0.0010268688201904297, -0.0008665323257446289, -0.0007061958312988281, -0.0005458593368530273, -0.00038552284240722656, -0.00022518634796142578, -6.4849853515625e-05, 9.548664093017578e-05, 0.00025582313537597656, 0.00041615962982177734, 0.0005764961242675781, 0.0007368326187133789, 0.0008971691131591797, 0.0010575056076049805, 0.0012178421020507812, 0.001378178596496582, 0.0015385150909423828, 0.0016988515853881836, 0.0018591880798339844, 0.002019524574279785, 0.002179861068725586, 0.0023401975631713867, 0.0025005340576171875, 0.0026608705520629883, 0.002821207046508789, 0.00298154354095459, 0.0031418800354003906, 0.0033022165298461914, 0.003462553024291992, 0.003622889518737793, 0.0037832260131835938, 0.0039435625076293945, 0.004103899002075195, 0.004264235496520996, 0.004424571990966797, 0.004584908485412598, 0.0047452449798583984, 0.004905581474304199, 0.00506591796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 7.0, 12.0, 9.0, 12.0, 18.0, 25.0, 24.0, 37.0, 53.0, 59.0, 82.0, 79.0, 107.0, 136.0, 159.0, 261.0, 347.0, 515.0, 1006.0, 15502.0, 962213.0, 64188.0, 1588.0, 559.0, 415.0, 259.0, 209.0, 144.0, 90.0, 86.0, 82.0, 48.0, 47.0, 33.0, 32.0, 29.0, 17.0, 13.0, 9.0, 7.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08465576171875, -0.08198070526123047, -0.07930564880371094, -0.0766305923461914, -0.07395553588867188, -0.07128047943115234, -0.06860542297363281, -0.06593036651611328, -0.06325531005859375, -0.06058025360107422, -0.05790519714355469, -0.055230140686035156, -0.052555084228515625, -0.049880027770996094, -0.04720497131347656, -0.04452991485595703, -0.0418548583984375, -0.03917980194091797, -0.03650474548339844, -0.033829689025878906, -0.031154632568359375, -0.028479576110839844, -0.025804519653320312, -0.02312946319580078, -0.02045440673828125, -0.01777935028076172, -0.015104293823242188, -0.012429237365722656, -0.009754180908203125, -0.007079124450683594, -0.0044040679931640625, -0.0017290115356445312, 0.000946044921875, 0.0036211013793945312, 0.0062961578369140625, 0.008971214294433594, 0.011646270751953125, 0.014321327209472656, 0.016996383666992188, 0.01967144012451172, 0.02234649658203125, 0.02502155303955078, 0.027696609497070312, 0.030371665954589844, 0.033046722412109375, 0.035721778869628906, 0.03839683532714844, 0.04107189178466797, 0.0437469482421875, 0.04642200469970703, 0.04909706115722656, 0.051772117614746094, 0.054447174072265625, 0.057122230529785156, 0.05979728698730469, 0.06247234344482422, 0.06514739990234375, 0.06782245635986328, 0.07049751281738281, 0.07317256927490234, 0.07584762573242188, 0.0785226821899414, 0.08119773864746094, 0.08387279510498047, 0.0865478515625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 27.0, 329.0, 617.0, 36.0, 1.0], "bins": [-0.17205320298671722, -0.16923828423023224, -0.16642335057258606, -0.16360843181610107, -0.1607935130596161, -0.1579785794019699, -0.15516366064548492, -0.15234872698783875, -0.14953380823135376, -0.14671888947486877, -0.1439039558172226, -0.1410890370607376, -0.13827410340309143, -0.13545918464660645, -0.13264426589012146, -0.12982933223247528, -0.1270144134759903, -0.12419948726892471, -0.12138456106185913, -0.11856964230537415, -0.11575471609830856, -0.11293978989124298, -0.110124871134758, -0.10730994492769241, -0.10449501872062683, -0.10168009251356125, -0.09886516630649567, -0.09605024755001068, -0.0932353213429451, -0.09042039513587952, -0.08760547637939453, -0.08479055017232895, -0.08197562396526337, -0.07916069775819778, -0.0763457715511322, -0.07353085279464722, -0.07071592658758163, -0.06790100038051605, -0.06508608162403107, -0.062271155416965485, -0.0594562329351902, -0.05664131045341492, -0.053826384246349335, -0.05101145803928375, -0.04819653555750847, -0.045381613075733185, -0.0425666868686676, -0.03975176066160202, -0.036936838179826736, -0.03412191569805145, -0.03130698949098587, -0.028492065146565437, -0.025677140802145004, -0.02286221645772457, -0.020047292113304138, -0.017232367768883705, -0.014417442493140697, -0.011602518148720264, -0.008787593804299831, -0.005972669459879398, -0.0031577451154589653, -0.00034282077103853226, 0.002472103573381901, 0.005287027917802334, 0.008101952262222767]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 2.0, 8.0, 13.0, 14.0, 27.0, 17.0, 23.0, 17.0, 25.0, 30.0, 35.0, 41.0, 34.0, 25.0, 42.0, 33.0, 44.0, 39.0, 46.0, 42.0, 31.0, 38.0, 41.0, 46.0, 37.0, 37.0, 23.0, 36.0, 17.0, 21.0, 19.0, 13.0, 14.0, 12.0, 8.0, 10.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.012272179126739502, -0.011850595474243164, -0.011429011821746826, -0.011007428169250488, -0.01058584451675415, -0.010164260864257812, -0.009742677211761475, -0.009321093559265137, -0.008899509906768799, -0.008477926254272461, -0.008056342601776123, -0.007634758949279785, -0.007213175296783447, -0.006791591644287109, -0.0063700079917907715, -0.005948424339294434, -0.005526840686798096, -0.005105257034301758, -0.00468367338180542, -0.004262089729309082, -0.003840506076812744, -0.0034189224243164062, -0.0029973387718200684, -0.0025757551193237305, -0.0021541714668273926, -0.0017325878143310547, -0.0013110041618347168, -0.0008894205093383789, -0.000467836856842041, -4.6253204345703125e-05, 0.00037533044815063477, 0.0007969141006469727, 0.0012184977531433105, 0.0016400814056396484, 0.0020616650581359863, 0.0024832487106323242, 0.002904832363128662, 0.003326416015625, 0.003747999668121338, 0.004169583320617676, 0.004591166973114014, 0.0050127506256103516, 0.0054343342781066895, 0.005855917930603027, 0.006277501583099365, 0.006699085235595703, 0.007120668888092041, 0.007542252540588379, 0.007963836193084717, 0.008385419845581055, 0.008807003498077393, 0.00922858715057373, 0.009650170803070068, 0.010071754455566406, 0.010493338108062744, 0.010914921760559082, 0.01133650541305542, 0.011758089065551758, 0.012179672718048096, 0.012601256370544434, 0.013022840023040771, 0.01344442367553711, 0.013866007328033447, 0.014287590980529785, 0.014709174633026123]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 0.0, 3.0, 7.0, 7.0, 5.0, 6.0, 8.0, 11.0, 15.0, 20.0, 16.0, 21.0, 17.0, 20.0, 30.0, 25.0, 33.0, 24.0, 31.0, 31.0, 34.0, 38.0, 39.0, 45.0, 46.0, 37.0, 43.0, 32.0, 31.0, 26.0, 32.0, 23.0, 32.0, 26.0, 21.0, 22.0, 18.0, 17.0, 18.0, 18.0, 11.0, 20.0, 16.0, 7.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5795135498046875, -0.560394287109375, -0.5412750244140625, -0.52215576171875, -0.5030364990234375, -0.483917236328125, -0.4647979736328125, -0.4456787109375, -0.4265594482421875, -0.407440185546875, -0.3883209228515625, -0.36920166015625, -0.3500823974609375, -0.330963134765625, -0.3118438720703125, -0.292724609375, -0.2736053466796875, -0.254486083984375, -0.2353668212890625, -0.21624755859375, -0.1971282958984375, -0.178009033203125, -0.1588897705078125, -0.1397705078125, -0.1206512451171875, -0.101531982421875, -0.0824127197265625, -0.06329345703125, -0.0441741943359375, -0.025054931640625, -0.0059356689453125, 0.01318359375, 0.0323028564453125, 0.051422119140625, 0.0705413818359375, 0.08966064453125, 0.1087799072265625, 0.127899169921875, 0.1470184326171875, 0.1661376953125, 0.1852569580078125, 0.204376220703125, 0.2234954833984375, 0.24261474609375, 0.2617340087890625, 0.280853271484375, 0.2999725341796875, 0.319091796875, 0.3382110595703125, 0.357330322265625, 0.3764495849609375, 0.39556884765625, 0.4146881103515625, 0.433807373046875, 0.4529266357421875, 0.4720458984375, 0.4911651611328125, 0.510284423828125, 0.5294036865234375, 0.54852294921875, 0.5676422119140625, 0.586761474609375, 0.6058807373046875, 0.625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 5.0, 20.0, 21.0, 27.0, 34.0, 53.0, 59.0, 101.0, 144.0, 203.0, 285.0, 383.0, 528.0, 801.0, 1284.0, 1923.0, 3332.0, 5485.0, 10389.0, 21305.0, 50833.0, 153686.0, 445903.0, 225015.0, 69524.0, 27197.0, 12748.0, 6820.0, 3744.0, 2231.0, 1373.0, 987.0, 602.0, 420.0, 272.0, 232.0, 146.0, 127.0, 76.0, 56.0, 48.0, 33.0, 19.0, 22.0, 8.0, 8.0, 6.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.83056640625, -0.8058853149414062, -0.7812042236328125, -0.7565231323242188, -0.731842041015625, -0.7071609497070312, -0.6824798583984375, -0.6577987670898438, -0.63311767578125, -0.6084365844726562, -0.5837554931640625, -0.5590744018554688, -0.534393310546875, -0.5097122192382812, -0.4850311279296875, -0.46035003662109375, -0.4356689453125, -0.41098785400390625, -0.3863067626953125, -0.36162567138671875, -0.336944580078125, -0.31226348876953125, -0.2875823974609375, -0.26290130615234375, -0.23822021484375, -0.21353912353515625, -0.1888580322265625, -0.16417694091796875, -0.139495849609375, -0.11481475830078125, -0.0901336669921875, -0.06545257568359375, -0.040771484375, -0.01609039306640625, 0.0085906982421875, 0.03327178955078125, 0.057952880859375, 0.08263397216796875, 0.1073150634765625, 0.13199615478515625, 0.15667724609375, 0.18135833740234375, 0.2060394287109375, 0.23072052001953125, 0.255401611328125, 0.28008270263671875, 0.3047637939453125, 0.32944488525390625, 0.3541259765625, 0.37880706787109375, 0.4034881591796875, 0.42816925048828125, 0.452850341796875, 0.47753143310546875, 0.5022125244140625, 0.5268936157226562, 0.55157470703125, 0.5762557983398438, 0.6009368896484375, 0.6256179809570312, 0.650299072265625, 0.6749801635742188, 0.6996612548828125, 0.7243423461914062, 0.7490234375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 6.0, 7.0, 12.0, 10.0, 24.0, 19.0, 26.0, 33.0, 38.0, 28.0, 52.0, 74.0, 81.0, 210.0, 1443.0, 365.0, 156.0, 89.0, 65.0, 54.0, 47.0, 35.0, 32.0, 25.0, 17.0, 19.0, 10.0, 10.0, 11.0, 12.0, 7.0, 7.0, 3.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5092010498046875, -1.452972412109375, -1.3967437744140625, -1.34051513671875, -1.2842864990234375, -1.228057861328125, -1.1718292236328125, -1.1156005859375, -1.0593719482421875, -1.003143310546875, -0.9469146728515625, -0.89068603515625, -0.8344573974609375, -0.778228759765625, -0.7220001220703125, -0.665771484375, -0.6095428466796875, -0.553314208984375, -0.4970855712890625, -0.44085693359375, -0.3846282958984375, -0.328399658203125, -0.2721710205078125, -0.2159423828125, -0.1597137451171875, -0.103485107421875, -0.0472564697265625, 0.00897216796875, 0.0652008056640625, 0.121429443359375, 0.1776580810546875, 0.23388671875, 0.2901153564453125, 0.346343994140625, 0.4025726318359375, 0.45880126953125, 0.5150299072265625, 0.571258544921875, 0.6274871826171875, 0.6837158203125, 0.7399444580078125, 0.796173095703125, 0.8524017333984375, 0.90863037109375, 0.9648590087890625, 1.021087646484375, 1.0773162841796875, 1.133544921875, 1.1897735595703125, 1.246002197265625, 1.3022308349609375, 1.35845947265625, 1.4146881103515625, 1.470916748046875, 1.5271453857421875, 1.5833740234375, 1.6396026611328125, 1.695831298828125, 1.7520599365234375, 1.80828857421875, 1.8645172119140625, 1.920745849609375, 1.9769744873046875, 2.033203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 6.0, 8.0, 10.0, 17.0, 23.0, 21.0, 19.0, 26.0, 32.0, 40.0, 74.0, 104.0, 133.0, 192.0, 333.0, 716.0, 2518.0, 47893.0, 3024339.0, 64729.0, 2730.0, 685.0, 358.0, 181.0, 129.0, 95.0, 66.0, 52.0, 29.0, 38.0, 19.0, 17.0, 14.0, 6.0, 12.0, 6.0, 9.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.052734375, -2.961700439453125, -2.87066650390625, -2.779632568359375, -2.6885986328125, -2.597564697265625, -2.50653076171875, -2.415496826171875, -2.324462890625, -2.233428955078125, -2.14239501953125, -2.051361083984375, -1.9603271484375, -1.869293212890625, -1.77825927734375, -1.687225341796875, -1.59619140625, -1.505157470703125, -1.41412353515625, -1.323089599609375, -1.2320556640625, -1.141021728515625, -1.04998779296875, -0.958953857421875, -0.867919921875, -0.776885986328125, -0.68585205078125, -0.594818115234375, -0.5037841796875, -0.412750244140625, -0.32171630859375, -0.230682373046875, -0.1396484375, -0.048614501953125, 0.04241943359375, 0.133453369140625, 0.2244873046875, 0.315521240234375, 0.40655517578125, 0.497589111328125, 0.588623046875, 0.679656982421875, 0.77069091796875, 0.861724853515625, 0.9527587890625, 1.043792724609375, 1.13482666015625, 1.225860595703125, 1.31689453125, 1.407928466796875, 1.49896240234375, 1.589996337890625, 1.6810302734375, 1.772064208984375, 1.86309814453125, 1.954132080078125, 2.045166015625, 2.136199951171875, 2.22723388671875, 2.318267822265625, 2.4093017578125, 2.500335693359375, 2.59136962890625, 2.682403564453125, 2.7734375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 21.0, 301.0, 599.0, 91.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.105854034423828, -30.49928092956543, -29.8927059173584, -29.2861328125, -28.67955780029297, -28.07298469543457, -27.466411590576172, -26.85983657836914, -26.253263473510742, -25.646690368652344, -25.040115356445312, -24.433542251586914, -23.826969146728516, -23.220394134521484, -22.613821029663086, -22.007247924804688, -21.400672912597656, -20.794099807739258, -20.187524795532227, -19.580951690673828, -18.974376678466797, -18.3678035736084, -17.76123046875, -17.15465545654297, -16.54808235168457, -15.941508293151855, -15.33493423461914, -14.728361129760742, -14.121787071228027, -13.515213012695312, -12.908639907836914, -12.3020658493042, -11.695490837097168, -11.088916778564453, -10.482343673706055, -9.87576961517334, -9.269195556640625, -8.66262149810791, -8.056047439575195, -7.449474334716797, -6.842900276184082, -6.236326217651367, -5.6297526359558105, -5.023179054260254, -4.416604995727539, -3.8100311756134033, -3.2034573554992676, -2.596883773803711, -1.990309715270996, -1.3837358951568604, -0.7771620750427246, -0.17058825492858887, 0.4359855651855469, 1.0425593852996826, 1.6491332054138184, 2.255706787109375, 2.86228084564209, 3.4688546657562256, 4.075428485870361, 4.682002067565918, 5.288576126098633, 5.895150184631348, 6.501723766326904, 7.108297348022461, 7.714871406555176]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 8.0, 7.0, 9.0, 10.0, 14.0, 13.0, 5.0, 9.0, 14.0, 20.0, 24.0, 29.0, 22.0, 28.0, 33.0, 27.0, 40.0, 39.0, 36.0, 40.0, 39.0, 46.0, 45.0, 38.0, 38.0, 36.0, 50.0, 44.0, 35.0, 22.0, 28.0, 20.0, 23.0, 21.0, 14.0, 12.0, 4.0, 17.0, 6.0, 6.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.18989896774292, -3.082162857055664, -2.9744269847869873, -2.8666908740997314, -2.7589550018310547, -2.651218891143799, -2.543482780456543, -2.435746669769287, -2.3280107975006104, -2.2202746868133545, -2.1125388145446777, -2.004802703857422, -1.8970667123794556, -1.7893307209014893, -1.6815946102142334, -1.573858618736267, -1.4661226272583008, -1.3583866357803345, -1.2506506443023682, -1.1429145336151123, -1.035178542137146, -0.9274425506591797, -0.8197064995765686, -0.7119704484939575, -0.6042344570159912, -0.4964984357357025, -0.3887624144554138, -0.2810263931751251, -0.17329037189483643, -0.06555438041687012, 0.04218167066574097, 0.14991772174835205, 0.25765395164489746, 0.36538997292518616, 0.47312599420547485, 0.5808620452880859, 0.6885980367660522, 0.7963340282440186, 0.9040700793266296, 1.0118061304092407, 1.119542121887207, 1.2272781133651733, 1.3350141048431396, 1.4427502155303955, 1.5504862070083618, 1.6582221984863281, 1.765958309173584, 1.8736943006515503, 1.9814302921295166, 2.0891664028167725, 2.196902275085449, 2.304638385772705, 2.412374496459961, 2.5201103687286377, 2.6278464794158936, 2.7355823516845703, 2.843318462371826, 2.951054573059082, 3.058790445327759, 3.1665265560150146, 3.2742624282836914, 3.3819985389709473, 3.489734649658203, 3.597470760345459, 3.7052066326141357]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 7.0, 10.0, 5.0, 10.0, 12.0, 9.0, 20.0, 19.0, 18.0, 13.0, 26.0, 32.0, 27.0, 36.0, 34.0, 31.0, 39.0, 36.0, 39.0, 26.0, 39.0, 36.0, 35.0, 41.0, 39.0, 27.0, 36.0, 29.0, 28.0, 25.0, 25.0, 23.0, 21.0, 14.0, 16.0, 14.0, 19.0, 10.0, 11.0, 11.0, 8.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.60986328125, -0.5893096923828125, -0.568756103515625, -0.5482025146484375, -0.52764892578125, -0.5070953369140625, -0.486541748046875, -0.4659881591796875, -0.4454345703125, -0.4248809814453125, -0.404327392578125, -0.3837738037109375, -0.36322021484375, -0.3426666259765625, -0.322113037109375, -0.3015594482421875, -0.281005859375, -0.2604522705078125, -0.239898681640625, -0.2193450927734375, -0.19879150390625, -0.1782379150390625, -0.157684326171875, -0.1371307373046875, -0.1165771484375, -0.0960235595703125, -0.075469970703125, -0.0549163818359375, -0.03436279296875, -0.0138092041015625, 0.006744384765625, 0.0272979736328125, 0.0478515625, 0.0684051513671875, 0.088958740234375, 0.1095123291015625, 0.13006591796875, 0.1506195068359375, 0.171173095703125, 0.1917266845703125, 0.2122802734375, 0.2328338623046875, 0.253387451171875, 0.2739410400390625, 0.29449462890625, 0.3150482177734375, 0.335601806640625, 0.3561553955078125, 0.376708984375, 0.3972625732421875, 0.417816162109375, 0.4383697509765625, 0.45892333984375, 0.4794769287109375, 0.500030517578125, 0.5205841064453125, 0.5411376953125, 0.5616912841796875, 0.582244873046875, 0.6027984619140625, 0.62335205078125, 0.6439056396484375, 0.664459228515625, 0.6850128173828125, 0.70556640625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 5.0, 9.0, 9.0, 17.0, 20.0, 24.0, 22.0, 33.0, 59.0, 51.0, 98.0, 128.0, 199.0, 347.0, 488.0, 928.0, 1708.0, 3265.0, 6779.0, 14954.0, 39232.0, 153473.0, 1569728.0, 2105933.0, 217779.0, 47236.0, 16676.0, 7183.0, 3485.0, 1736.0, 961.0, 562.0, 378.0, 221.0, 146.0, 114.0, 92.0, 46.0, 31.0, 24.0, 33.0, 18.0, 13.0, 9.0, 13.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.515625, -2.4320068359375, -2.348388671875, -2.2647705078125, -2.18115234375, -2.0975341796875, -2.013916015625, -1.9302978515625, -1.8466796875, -1.7630615234375, -1.679443359375, -1.5958251953125, -1.51220703125, -1.4285888671875, -1.344970703125, -1.2613525390625, -1.177734375, -1.0941162109375, -1.010498046875, -0.9268798828125, -0.84326171875, -0.7596435546875, -0.676025390625, -0.5924072265625, -0.5087890625, -0.4251708984375, -0.341552734375, -0.2579345703125, -0.17431640625, -0.0906982421875, -0.007080078125, 0.0765380859375, 0.16015625, 0.2437744140625, 0.327392578125, 0.4110107421875, 0.49462890625, 0.5782470703125, 0.661865234375, 0.7454833984375, 0.8291015625, 0.9127197265625, 0.996337890625, 1.0799560546875, 1.16357421875, 1.2471923828125, 1.330810546875, 1.4144287109375, 1.498046875, 1.5816650390625, 1.665283203125, 1.7489013671875, 1.83251953125, 1.9161376953125, 1.999755859375, 2.0833740234375, 2.1669921875, 2.2506103515625, 2.334228515625, 2.4178466796875, 2.50146484375, 2.5850830078125, 2.668701171875, 2.7523193359375, 2.8359375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 9.0, 8.0, 18.0, 19.0, 25.0, 50.0, 51.0, 83.0, 116.0, 178.0, 266.0, 447.0, 625.0, 659.0, 470.0, 337.0, 217.0, 137.0, 114.0, 73.0, 47.0, 35.0, 21.0, 17.0, 15.0, 9.0, 3.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.078125, -2.997467041015625, -2.91680908203125, -2.836151123046875, -2.7554931640625, -2.674835205078125, -2.59417724609375, -2.513519287109375, -2.432861328125, -2.352203369140625, -2.27154541015625, -2.190887451171875, -2.1102294921875, -2.029571533203125, -1.94891357421875, -1.868255615234375, -1.78759765625, -1.706939697265625, -1.62628173828125, -1.545623779296875, -1.4649658203125, -1.384307861328125, -1.30364990234375, -1.222991943359375, -1.142333984375, -1.061676025390625, -0.98101806640625, -0.900360107421875, -0.8197021484375, -0.739044189453125, -0.65838623046875, -0.577728271484375, -0.4970703125, -0.416412353515625, -0.33575439453125, -0.255096435546875, -0.1744384765625, -0.093780517578125, -0.01312255859375, 0.067535400390625, 0.148193359375, 0.228851318359375, 0.30950927734375, 0.390167236328125, 0.4708251953125, 0.551483154296875, 0.63214111328125, 0.712799072265625, 0.79345703125, 0.874114990234375, 0.95477294921875, 1.035430908203125, 1.1160888671875, 1.196746826171875, 1.27740478515625, 1.358062744140625, 1.438720703125, 1.519378662109375, 1.60003662109375, 1.680694580078125, 1.7613525390625, 1.842010498046875, 1.92266845703125, 2.003326416015625, 2.083984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 13.0, 23.0, 28.0, 34.0, 34.0, 61.0, 87.0, 120.0, 249.0, 394.0, 543.0, 890.0, 1617.0, 3191.0, 6091.0, 12711.0, 28704.0, 73939.0, 243128.0, 1330966.0, 1969578.0, 357381.0, 96213.0, 36613.0, 15861.0, 7327.0, 3592.0, 2075.0, 1096.0, 651.0, 363.0, 233.0, 150.0, 88.0, 78.0, 54.0, 29.0, 27.0, 13.0, 15.0, 5.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.9130859375, -1.8586273193359375, -1.804168701171875, -1.7497100830078125, -1.69525146484375, -1.6407928466796875, -1.586334228515625, -1.5318756103515625, -1.4774169921875, -1.4229583740234375, -1.368499755859375, -1.3140411376953125, -1.25958251953125, -1.2051239013671875, -1.150665283203125, -1.0962066650390625, -1.041748046875, -0.9872894287109375, -0.932830810546875, -0.8783721923828125, -0.82391357421875, -0.7694549560546875, -0.714996337890625, -0.6605377197265625, -0.6060791015625, -0.5516204833984375, -0.497161865234375, -0.4427032470703125, -0.38824462890625, -0.3337860107421875, -0.279327392578125, -0.2248687744140625, -0.17041015625, -0.1159515380859375, -0.061492919921875, -0.0070343017578125, 0.04742431640625, 0.1018829345703125, 0.156341552734375, 0.2108001708984375, 0.2652587890625, 0.3197174072265625, 0.374176025390625, 0.4286346435546875, 0.48309326171875, 0.5375518798828125, 0.592010498046875, 0.6464691162109375, 0.700927734375, 0.7553863525390625, 0.809844970703125, 0.8643035888671875, 0.91876220703125, 0.9732208251953125, 1.027679443359375, 1.0821380615234375, 1.1365966796875, 1.1910552978515625, 1.245513916015625, 1.2999725341796875, 1.35443115234375, 1.4088897705078125, 1.463348388671875, 1.5178070068359375, 1.572265625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 12.0, 2.0, 11.0, 12.0, 15.0, 14.0, 15.0, 24.0, 44.0, 34.0, 64.0, 67.0, 69.0, 83.0, 104.0, 77.0, 63.0, 62.0, 45.0, 36.0, 25.0, 22.0, 20.0, 12.0, 13.0, 13.0, 8.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.795857429504395, -11.386923789978027, -10.97799015045166, -10.569056510925293, -10.160122871398926, -9.751189231872559, -9.342255592346191, -8.933321952819824, -8.524388313293457, -8.11545467376709, -7.706521034240723, -7.2975873947143555, -6.888653755187988, -6.479720115661621, -6.070786476135254, -5.661852836608887, -5.2529191970825195, -4.843985557556152, -4.435051918029785, -4.026118278503418, -3.617184638977051, -3.2082509994506836, -2.7993173599243164, -2.390383720397949, -1.981450080871582, -1.5725164413452148, -1.1635828018188477, -0.7546491622924805, -0.3457155227661133, 0.0632181167602539, 0.4721517562866211, 0.8810853958129883, 1.290018081665039, 1.6989517211914062, 2.1078853607177734, 2.5168190002441406, 2.925752639770508, 3.334686279296875, 3.743619918823242, 4.152553558349609, 4.561487197875977, 4.970420837402344, 5.379354476928711, 5.788288116455078, 6.197221755981445, 6.6061553955078125, 7.01508903503418, 7.424022674560547, 7.832956314086914, 8.241889953613281, 8.650823593139648, 9.059757232666016, 9.468690872192383, 9.87762451171875, 10.286558151245117, 10.695491790771484, 11.104425430297852, 11.513359069824219, 11.922292709350586, 12.331226348876953, 12.74015998840332, 13.149093627929688, 13.558027267456055, 13.966960906982422, 14.375894546508789]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 17.0, 11.0, 15.0, 13.0, 14.0, 17.0, 22.0, 17.0, 35.0, 27.0, 35.0, 43.0, 32.0, 42.0, 46.0, 29.0, 47.0, 44.0, 38.0, 38.0, 34.0, 23.0, 44.0, 38.0, 24.0, 27.0, 24.0, 35.0, 22.0, 19.0, 14.0, 11.0, 18.0, 12.0, 13.0, 8.0, 4.0, 3.0, 7.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.22474479675293, -8.941580772399902, -8.658416748046875, -8.375252723693848, -8.09208869934082, -7.808924674987793, -7.525760173797607, -7.24259614944458, -6.959432125091553, -6.676268100738525, -6.393104076385498, -6.109940052032471, -5.826775550842285, -5.543611526489258, -5.2604475021362305, -4.977283477783203, -4.694119453430176, -4.410955429077148, -4.127791404724121, -3.8446271419525146, -3.5614631175994873, -3.27829909324646, -2.9951348304748535, -2.711970806121826, -2.428806781768799, -2.1456427574157715, -1.8624786138534546, -1.5793144702911377, -1.2961504459381104, -1.012986421585083, -0.7298222780227661, -0.4466581344604492, -0.16349506378173828, 0.11966902017593384, 0.40283310413360596, 0.6859971880912781, 0.9691612720489502, 1.2523252964019775, 1.5354894399642944, 1.8186535835266113, 2.1018176078796387, 2.384981632232666, 2.6681456565856934, 2.9513099193573, 3.234473943710327, 3.5176379680633545, 3.800802230834961, 4.083966255187988, 4.367130279541016, 4.650294303894043, 4.93345832824707, 5.216622352600098, 5.499786376953125, 5.782950401306152, 6.066114902496338, 6.349278926849365, 6.632442951202393, 6.91560697555542, 7.198770999908447, 7.481935024261475, 7.76509952545166, 8.048263549804688, 8.331427574157715, 8.614591598510742, 8.89775562286377]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 15.0, 12.0, 17.0, 26.0, 16.0, 24.0, 40.0, 32.0, 28.0, 46.0, 38.0, 40.0, 45.0, 48.0, 41.0, 47.0, 43.0, 38.0, 33.0, 45.0, 35.0, 27.0, 28.0, 29.0, 20.0, 25.0, 15.0, 16.0, 15.0, 15.0, 9.0, 12.0, 4.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-18.15625, -17.599609375, -17.04296875, -16.486328125, -15.9296875, -15.373046875, -14.81640625, -14.259765625, -13.703125, -13.146484375, -12.58984375, -12.033203125, -11.4765625, -10.919921875, -10.36328125, -9.806640625, -9.25, -8.693359375, -8.13671875, -7.580078125, -7.0234375, -6.466796875, -5.91015625, -5.353515625, -4.796875, -4.240234375, -3.68359375, -3.126953125, -2.5703125, -2.013671875, -1.45703125, -0.900390625, -0.34375, 0.212890625, 0.76953125, 1.326171875, 1.8828125, 2.439453125, 2.99609375, 3.552734375, 4.109375, 4.666015625, 5.22265625, 5.779296875, 6.3359375, 6.892578125, 7.44921875, 8.005859375, 8.5625, 9.119140625, 9.67578125, 10.232421875, 10.7890625, 11.345703125, 11.90234375, 12.458984375, 13.015625, 13.572265625, 14.12890625, 14.685546875, 15.2421875, 15.798828125, 16.35546875, 16.912109375, 17.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 30.0, 45.0, 46.0, 65.0, 81.0, 114.0, 200.0, 259.0, 338.0, 521.0, 731.0, 1071.0, 1566.0, 2282.0, 3397.0, 5139.0, 7782.0, 12078.0, 18591.0, 30735.0, 53100.0, 101517.0, 217882.0, 278453.0, 139530.0, 69006.0, 38188.0, 23145.0, 14386.0, 9354.0, 6179.0, 4046.0, 2714.0, 1820.0, 1272.0, 800.0, 592.0, 459.0, 283.0, 208.0, 148.0, 107.0, 73.0, 45.0, 43.0, 33.0, 20.0, 18.0, 7.0, 12.0, 4.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.88671875, -0.85919189453125, -0.8316650390625, -0.80413818359375, -0.776611328125, -0.74908447265625, -0.7215576171875, -0.69403076171875, -0.66650390625, -0.63897705078125, -0.6114501953125, -0.58392333984375, -0.556396484375, -0.52886962890625, -0.5013427734375, -0.47381591796875, -0.4462890625, -0.41876220703125, -0.3912353515625, -0.36370849609375, -0.336181640625, -0.30865478515625, -0.2811279296875, -0.25360107421875, -0.22607421875, -0.19854736328125, -0.1710205078125, -0.14349365234375, -0.115966796875, -0.08843994140625, -0.0609130859375, -0.03338623046875, -0.005859375, 0.02166748046875, 0.0491943359375, 0.07672119140625, 0.104248046875, 0.13177490234375, 0.1593017578125, 0.18682861328125, 0.21435546875, 0.24188232421875, 0.2694091796875, 0.29693603515625, 0.324462890625, 0.35198974609375, 0.3795166015625, 0.40704345703125, 0.4345703125, 0.46209716796875, 0.4896240234375, 0.51715087890625, 0.544677734375, 0.57220458984375, 0.5997314453125, 0.62725830078125, 0.65478515625, 0.68231201171875, 0.7098388671875, 0.73736572265625, 0.764892578125, 0.79241943359375, 0.8199462890625, 0.84747314453125, 0.875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 7.0, 9.0, 12.0, 18.0, 15.0, 23.0, 17.0, 25.0, 25.0, 30.0, 27.0, 33.0, 44.0, 44.0, 35.0, 40.0, 48.0, 1065.0, 38.0, 38.0, 46.0, 37.0, 39.0, 39.0, 36.0, 36.0, 22.0, 20.0, 26.0, 23.0, 24.0, 14.0, 13.0, 7.0, 10.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7806396484375, -10.428466796875, -10.0762939453125, -9.72412109375, -9.3719482421875, -9.019775390625, -8.6676025390625, -8.3154296875, -7.9632568359375, -7.611083984375, -7.2589111328125, -6.90673828125, -6.5545654296875, -6.202392578125, -5.8502197265625, -5.498046875, -5.1458740234375, -4.793701171875, -4.4415283203125, -4.08935546875, -3.7371826171875, -3.385009765625, -3.0328369140625, -2.6806640625, -2.3284912109375, -1.976318359375, -1.6241455078125, -1.27197265625, -0.9197998046875, -0.567626953125, -0.2154541015625, 0.13671875, 0.4888916015625, 0.841064453125, 1.1932373046875, 1.54541015625, 1.8975830078125, 2.249755859375, 2.6019287109375, 2.9541015625, 3.3062744140625, 3.658447265625, 4.0106201171875, 4.36279296875, 4.7149658203125, 5.067138671875, 5.4193115234375, 5.771484375, 6.1236572265625, 6.475830078125, 6.8280029296875, 7.18017578125, 7.5323486328125, 7.884521484375, 8.2366943359375, 8.5888671875, 8.9410400390625, 9.293212890625, 9.6453857421875, 9.99755859375, 10.3497314453125, 10.701904296875, 11.0540771484375, 11.40625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 14.0, 15.0, 23.0, 27.0, 52.0, 65.0, 75.0, 115.0, 187.0, 240.0, 374.0, 560.0, 858.0, 1258.0, 1932.0, 2982.0, 4817.0, 8499.0, 17248.0, 50022.0, 917019.0, 1001647.0, 49818.0, 17120.0, 8522.0, 4856.0, 3003.0, 1864.0, 1272.0, 832.0, 559.0, 394.0, 281.0, 171.0, 139.0, 80.0, 52.0, 30.0, 29.0, 18.0, 15.0, 14.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.240234375, -2.174346923828125, -2.10845947265625, -2.042572021484375, -1.9766845703125, -1.910797119140625, -1.84490966796875, -1.779022216796875, -1.713134765625, -1.647247314453125, -1.58135986328125, -1.515472412109375, -1.4495849609375, -1.383697509765625, -1.31781005859375, -1.251922607421875, -1.18603515625, -1.120147705078125, -1.05426025390625, -0.988372802734375, -0.9224853515625, -0.856597900390625, -0.79071044921875, -0.724822998046875, -0.658935546875, -0.593048095703125, -0.52716064453125, -0.461273193359375, -0.3953857421875, -0.329498291015625, -0.26361083984375, -0.197723388671875, -0.1318359375, -0.065948486328125, -6.103515625e-05, 0.065826416015625, 0.1317138671875, 0.197601318359375, 0.26348876953125, 0.329376220703125, 0.395263671875, 0.461151123046875, 0.52703857421875, 0.592926025390625, 0.6588134765625, 0.724700927734375, 0.79058837890625, 0.856475830078125, 0.92236328125, 0.988250732421875, 1.05413818359375, 1.120025634765625, 1.1859130859375, 1.251800537109375, 1.31768798828125, 1.383575439453125, 1.449462890625, 1.515350341796875, 1.58123779296875, 1.647125244140625, 1.7130126953125, 1.778900146484375, 1.84478759765625, 1.910675048828125, 1.9765625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 8.0, 8.0, 13.0, 5.0, 11.0, 14.0, 22.0, 29.0, 28.0, 35.0, 36.0, 50.0, 54.0, 63.0, 71.0, 72.0, 64.0, 70.0, 58.0, 47.0, 44.0, 41.0, 37.0, 19.0, 17.0, 20.0, 14.0, 9.0, 12.0, 14.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.02572941780090332, -0.02477121353149414, -0.02381300926208496, -0.02285480499267578, -0.0218966007232666, -0.020938396453857422, -0.019980192184448242, -0.019021987915039062, -0.018063783645629883, -0.017105579376220703, -0.016147375106811523, -0.015189170837402344, -0.014230966567993164, -0.013272762298583984, -0.012314558029174805, -0.011356353759765625, -0.010398149490356445, -0.009439945220947266, -0.008481740951538086, -0.007523536682128906, -0.0065653324127197266, -0.005607128143310547, -0.004648923873901367, -0.0036907196044921875, -0.002732515335083008, -0.0017743110656738281, -0.0008161067962646484, 0.00014209747314453125, 0.001100301742553711, 0.0020585060119628906, 0.0030167102813720703, 0.00397491455078125, 0.00493311882019043, 0.005891323089599609, 0.006849527359008789, 0.007807731628417969, 0.008765935897827148, 0.009724140167236328, 0.010682344436645508, 0.011640548706054688, 0.012598752975463867, 0.013556957244873047, 0.014515161514282227, 0.015473365783691406, 0.016431570053100586, 0.017389774322509766, 0.018347978591918945, 0.019306182861328125, 0.020264387130737305, 0.021222591400146484, 0.022180795669555664, 0.023138999938964844, 0.024097204208374023, 0.025055408477783203, 0.026013612747192383, 0.026971817016601562, 0.027930021286010742, 0.028888225555419922, 0.0298464298248291, 0.03080463409423828, 0.03176283836364746, 0.03272104263305664, 0.03367924690246582, 0.034637451171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 10.0, 11.0, 10.0, 12.0, 20.0, 31.0, 51.0, 82.0, 150.0, 217.0, 342.0, 651.0, 1092.0, 1978.0, 3815.0, 7864.0, 17430.0, 40621.0, 101633.0, 255802.0, 339936.0, 163649.0, 63905.0, 26120.0, 11514.0, 5350.0, 2766.0, 1503.0, 807.0, 456.0, 262.0, 187.0, 89.0, 81.0, 39.0, 21.0, 13.0, 10.0, 10.0, 8.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.10805225372314453, -0.10422706604003906, -0.1004018783569336, -0.09657669067382812, -0.09275150299072266, -0.08892631530761719, -0.08510112762451172, -0.08127593994140625, -0.07745075225830078, -0.07362556457519531, -0.06980037689208984, -0.06597518920898438, -0.062150001525878906, -0.05832481384277344, -0.05449962615966797, -0.0506744384765625, -0.04684925079345703, -0.04302406311035156, -0.039198875427246094, -0.035373687744140625, -0.031548500061035156, -0.027723312377929688, -0.02389812469482422, -0.02007293701171875, -0.01624774932861328, -0.012422561645507812, -0.008597373962402344, -0.004772186279296875, -0.0009469985961914062, 0.0028781890869140625, 0.006703376770019531, 0.010528564453125, 0.014353752136230469, 0.018178939819335938, 0.022004127502441406, 0.025829315185546875, 0.029654502868652344, 0.03347969055175781, 0.03730487823486328, 0.04113006591796875, 0.04495525360107422, 0.04878044128417969, 0.052605628967285156, 0.056430816650390625, 0.060256004333496094, 0.06408119201660156, 0.06790637969970703, 0.0717315673828125, 0.07555675506591797, 0.07938194274902344, 0.0832071304321289, 0.08703231811523438, 0.09085750579833984, 0.09468269348144531, 0.09850788116455078, 0.10233306884765625, 0.10615825653076172, 0.10998344421386719, 0.11380863189697266, 0.11763381958007812, 0.1214590072631836, 0.12528419494628906, 0.12910938262939453, 0.1329345703125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 8.0, 4.0, 5.0, 8.0, 11.0, 5.0, 16.0, 12.0, 19.0, 21.0, 39.0, 46.0, 60.0, 68.0, 99.0, 102.0, 110.0, 87.0, 82.0, 47.0, 41.0, 26.0, 25.0, 21.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-0.08136045187711716, -0.0797160193324089, -0.07807158678770065, -0.0764271467924118, -0.07478271424770355, -0.0731382817029953, -0.07149384915828705, -0.0698494091629982, -0.06820497661828995, -0.0665605440735817, -0.06491611152887344, -0.0632716715335846, -0.06162723898887634, -0.05998280644416809, -0.05833837017416954, -0.05669393762946129, -0.05504950135946274, -0.053405068814754486, -0.051760632544755936, -0.050116200000047684, -0.04847176373004913, -0.04682733118534088, -0.04518289491534233, -0.04353846237063408, -0.04189402982592583, -0.040249597281217575, -0.038605161011219025, -0.03696072846651077, -0.03531629219651222, -0.03367185965180397, -0.03202742338180542, -0.030382990837097168, -0.02873855270445347, -0.027094118297100067, -0.025449683889746666, -0.023805249482393265, -0.022160815075039864, -0.020516380667686462, -0.01887194812297821, -0.01722751185297966, -0.015583078376948833, -0.013938643969595432, -0.012294209562242031, -0.010649776086211205, -0.009005341678857803, -0.007360907271504402, -0.005716472864151001, -0.0040720384567976, -0.0024276040494441986, -0.0007831697585061193, 0.0008612645324319601, 0.0025056987069547176, 0.004150133114308119, 0.005794567056000233, 0.007439001463353634, 0.009083435870707035, 0.010727870278060436, 0.012372304685413837, 0.014016739092767239, 0.015661172568798065, 0.017305606976151466, 0.018950041383504868, 0.02059447579085827, 0.02223891019821167, 0.02388334460556507]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 14.0, 7.0, 12.0, 9.0, 14.0, 19.0, 22.0, 16.0, 20.0, 18.0, 39.0, 23.0, 28.0, 27.0, 27.0, 38.0, 33.0, 33.0, 36.0, 30.0, 41.0, 41.0, 41.0, 23.0, 24.0, 23.0, 27.0, 28.0, 31.0, 30.0, 28.0, 26.0, 12.0, 25.0, 15.0, 19.0, 18.0, 12.0, 13.0, 12.0, 11.0, 7.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.03300124406814575, -0.0319954939186573, -0.030989741906523705, -0.029983989894390106, -0.028978239744901657, -0.027972489595413208, -0.02696673758327961, -0.02596098557114601, -0.024955235421657562, -0.023949485272169113, -0.022943733260035515, -0.021937981247901917, -0.020932231098413467, -0.01992648094892502, -0.01892072893679142, -0.01791497692465782, -0.016909226775169373, -0.015903476625680923, -0.014897724613547325, -0.013891973532736301, -0.012886222451925278, -0.011880471371114254, -0.01087472029030323, -0.009868969209492207, -0.008863218128681183, -0.00785746704787016, -0.0068517159670591354, -0.005845964886248112, -0.004840213805437088, -0.0038344627246260643, -0.0028287116438150406, -0.0018229605630040169, -0.0008172094821929932, 0.00018854159861803055, 0.0011942926794290543, 0.002200043760240078, 0.0032057948410511017, 0.004211545921862125, 0.005217297002673149, 0.006223048083484173, 0.0072287991642951965, 0.00823455024510622, 0.009240301325917244, 0.010246052406728268, 0.011251803487539291, 0.012257554568350315, 0.013263305649161339, 0.014269056729972363, 0.015274807810783386, 0.016280557960271835, 0.017286309972405434, 0.018292061984539032, 0.01929781213402748, 0.02030356228351593, 0.02130931429564953, 0.022315066307783127, 0.023320816457271576, 0.024326566606760025, 0.025332318618893623, 0.02633807063102722, 0.02734382078051567, 0.02834957093000412, 0.029355322942137718, 0.030361074954271317, 0.031366825103759766]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 12.0, 8.0, 13.0, 15.0, 12.0, 19.0, 25.0, 15.0, 26.0, 38.0, 32.0, 28.0, 45.0, 37.0, 39.0, 46.0, 46.0, 46.0, 46.0, 42.0, 38.0, 34.0, 43.0, 39.0, 25.0, 27.0, 28.0, 24.0, 24.0, 16.0, 14.0, 17.0, 12.0, 10.0, 13.0, 4.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-18.234375, -17.676025390625, -17.11767578125, -16.559326171875, -16.0009765625, -15.442626953125, -14.88427734375, -14.325927734375, -13.767578125, -13.209228515625, -12.65087890625, -12.092529296875, -11.5341796875, -10.975830078125, -10.41748046875, -9.859130859375, -9.30078125, -8.742431640625, -8.18408203125, -7.625732421875, -7.0673828125, -6.509033203125, -5.95068359375, -5.392333984375, -4.833984375, -4.275634765625, -3.71728515625, -3.158935546875, -2.6005859375, -2.042236328125, -1.48388671875, -0.925537109375, -0.3671875, 0.191162109375, 0.74951171875, 1.307861328125, 1.8662109375, 2.424560546875, 2.98291015625, 3.541259765625, 4.099609375, 4.657958984375, 5.21630859375, 5.774658203125, 6.3330078125, 6.891357421875, 7.44970703125, 8.008056640625, 8.56640625, 9.124755859375, 9.68310546875, 10.241455078125, 10.7998046875, 11.358154296875, 11.91650390625, 12.474853515625, 13.033203125, 13.591552734375, 14.14990234375, 14.708251953125, 15.2666015625, 15.824951171875, 16.38330078125, 16.941650390625, 17.5]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 5.0, 7.0, 7.0, 8.0, 13.0, 12.0, 15.0, 14.0, 21.0, 42.0, 46.0, 62.0, 94.0, 166.0, 214.0, 351.0, 717.0, 1640.0, 5511.0, 25069.0, 217419.0, 701077.0, 77950.0, 12386.0, 3150.0, 1120.0, 534.0, 272.0, 194.0, 120.0, 83.0, 50.0, 45.0, 25.0, 29.0, 18.0, 20.0, 14.0, 7.0, 3.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.84375, -3.724700927734375, -3.60565185546875, -3.486602783203125, -3.3675537109375, -3.248504638671875, -3.12945556640625, -3.010406494140625, -2.891357421875, -2.772308349609375, -2.65325927734375, -2.534210205078125, -2.4151611328125, -2.296112060546875, -2.17706298828125, -2.058013916015625, -1.93896484375, -1.819915771484375, -1.70086669921875, -1.581817626953125, -1.4627685546875, -1.343719482421875, -1.22467041015625, -1.105621337890625, -0.986572265625, -0.867523193359375, -0.74847412109375, -0.629425048828125, -0.5103759765625, -0.391326904296875, -0.27227783203125, -0.153228759765625, -0.0341796875, 0.084869384765625, 0.20391845703125, 0.322967529296875, 0.4420166015625, 0.561065673828125, 0.68011474609375, 0.799163818359375, 0.918212890625, 1.037261962890625, 1.15631103515625, 1.275360107421875, 1.3944091796875, 1.513458251953125, 1.63250732421875, 1.751556396484375, 1.87060546875, 1.989654541015625, 2.10870361328125, 2.227752685546875, 2.3468017578125, 2.465850830078125, 2.58489990234375, 2.703948974609375, 2.822998046875, 2.942047119140625, 3.06109619140625, 3.180145263671875, 3.2991943359375, 3.418243408203125, 3.53729248046875, 3.656341552734375, 3.775390625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 16.0, 13.0, 13.0, 22.0, 16.0, 22.0, 31.0, 25.0, 43.0, 42.0, 56.0, 42.0, 42.0, 61.0, 59.0, 2107.0, 42.0, 51.0, 40.0, 54.0, 43.0, 32.0, 34.0, 26.0, 21.0, 27.0, 17.0, 18.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.630126953125, -21.77587890625, -20.921630859375, -20.0673828125, -19.213134765625, -18.35888671875, -17.504638671875, -16.650390625, -15.796142578125, -14.94189453125, -14.087646484375, -13.2333984375, -12.379150390625, -11.52490234375, -10.670654296875, -9.81640625, -8.962158203125, -8.10791015625, -7.253662109375, -6.3994140625, -5.545166015625, -4.69091796875, -3.836669921875, -2.982421875, -2.128173828125, -1.27392578125, -0.419677734375, 0.4345703125, 1.288818359375, 2.14306640625, 2.997314453125, 3.8515625, 4.705810546875, 5.56005859375, 6.414306640625, 7.2685546875, 8.122802734375, 8.97705078125, 9.831298828125, 10.685546875, 11.539794921875, 12.39404296875, 13.248291015625, 14.1025390625, 14.956787109375, 15.81103515625, 16.665283203125, 17.51953125, 18.373779296875, 19.22802734375, 20.082275390625, 20.9365234375, 21.790771484375, 22.64501953125, 23.499267578125, 24.353515625, 25.207763671875, 26.06201171875, 26.916259765625, 27.7705078125, 28.624755859375, 29.47900390625, 30.333251953125, 31.1875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 5.0, 4.0, 4.0, 7.0, 9.0, 13.0, 14.0, 28.0, 30.0, 51.0, 64.0, 115.0, 200.0, 504.0, 1663.0, 9005.0, 97080.0, 2938766.0, 87102.0, 8418.0, 1569.0, 494.0, 195.0, 105.0, 77.0, 43.0, 35.0, 24.0, 26.0, 17.0, 7.0, 4.0, 9.0, 5.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.46484375, -4.335357666015625, -4.20587158203125, -4.076385498046875, -3.9468994140625, -3.817413330078125, -3.68792724609375, -3.558441162109375, -3.428955078125, -3.299468994140625, -3.16998291015625, -3.040496826171875, -2.9110107421875, -2.781524658203125, -2.65203857421875, -2.522552490234375, -2.39306640625, -2.263580322265625, -2.13409423828125, -2.004608154296875, -1.8751220703125, -1.745635986328125, -1.61614990234375, -1.486663818359375, -1.357177734375, -1.227691650390625, -1.09820556640625, -0.968719482421875, -0.8392333984375, -0.709747314453125, -0.58026123046875, -0.450775146484375, -0.3212890625, -0.191802978515625, -0.06231689453125, 0.067169189453125, 0.1966552734375, 0.326141357421875, 0.45562744140625, 0.585113525390625, 0.714599609375, 0.844085693359375, 0.97357177734375, 1.103057861328125, 1.2325439453125, 1.362030029296875, 1.49151611328125, 1.621002197265625, 1.75048828125, 1.879974365234375, 2.00946044921875, 2.138946533203125, 2.2684326171875, 2.397918701171875, 2.52740478515625, 2.656890869140625, 2.786376953125, 2.915863037109375, 3.04534912109375, 3.174835205078125, 3.3043212890625, 3.433807373046875, 3.56329345703125, 3.692779541015625, 3.822265625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 5.0, 12.0, 12.0, 31.0, 38.0, 45.0, 94.0, 131.0, 171.0, 137.0, 98.0, 64.0, 32.0, 27.0, 21.0, 12.0, 10.0, 13.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.203628540039062, -22.123918533325195, -21.044206619262695, -19.964496612548828, -18.884784698486328, -17.80507469177246, -16.725364685058594, -15.645652770996094, -14.56594181060791, -13.486230850219727, -12.406519889831543, -11.32680892944336, -10.247098922729492, -9.167387008666992, -8.087677001953125, -7.007966041564941, -5.928255081176758, -4.848544120788574, -3.7688333988189697, -2.6891226768493652, -1.6094117164611816, -0.529700756072998, 0.5500097274780273, 1.629720687866211, 2.7094316482543945, 3.789142608642578, 4.868853569030762, 5.948564052581787, 7.028275012969971, 8.107986450195312, 9.18769645690918, 10.267407417297363, 11.347118377685547, 12.42682933807373, 13.506540298461914, 14.586250305175781, 15.665962219238281, 16.74567222595215, 17.825382232666016, 18.905094146728516, 19.984806060791016, 21.064516067504883, 22.144227981567383, 23.22393798828125, 24.30364990234375, 25.383359909057617, 26.463069915771484, 27.542781829833984, 28.62249183654785, 29.70220184326172, 30.78191375732422, 31.861623764038086, 32.94133377075195, 34.02104568481445, 35.10075759887695, 36.18046569824219, 37.26017761230469, 38.33988952636719, 39.41959762573242, 40.49930953979492, 41.57902145385742, 42.65873336791992, 43.738441467285156, 44.818153381347656, 45.897865295410156]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 10.0, 16.0, 15.0, 19.0, 15.0, 37.0, 24.0, 30.0, 31.0, 27.0, 39.0, 38.0, 48.0, 54.0, 53.0, 55.0, 36.0, 49.0, 44.0, 36.0, 24.0, 36.0, 30.0, 29.0, 30.0, 26.0, 11.0, 20.0, 11.0, 15.0, 13.0, 4.0, 5.0, 5.0, 4.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.56686782836914, -32.4387092590332, -31.310546875, -30.18238639831543, -29.05422592163086, -27.926067352294922, -26.79790687561035, -25.66974639892578, -24.54158592224121, -23.41342544555664, -22.28526496887207, -21.1571044921875, -20.028945922851562, -18.90078353881836, -17.772624969482422, -16.64446449279785, -15.516304016113281, -14.388143539428711, -13.25998306274414, -12.131823539733887, -11.003663063049316, -9.875502586364746, -8.747343063354492, -7.619182586669922, -6.491022109985352, -5.362861633300781, -4.234701633453369, -3.106541395187378, -1.9783811569213867, -0.8502206802368164, 0.2779393196105957, 1.4060993194580078, 2.5342559814453125, 3.6624162197113037, 4.790576457977295, 5.918736457824707, 7.046896934509277, 8.175057411193848, 9.303216934204102, 10.431377410888672, 11.559537887573242, 12.687698364257812, 13.815858840942383, 14.944018363952637, 16.07217788696289, 17.200340270996094, 18.32849884033203, 19.4566593170166, 20.584819793701172, 21.712980270385742, 22.841140747070312, 23.969301223754883, 25.097461700439453, 26.22562026977539, 27.35378074645996, 28.48194122314453, 29.6101016998291, 30.738262176513672, 31.866422653198242, 32.99458312988281, 34.12274169921875, 35.25090408325195, 36.37906265258789, 37.507225036621094, 38.63538360595703]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 7.0, 5.0, 13.0, 11.0, 7.0, 16.0, 20.0, 16.0, 30.0, 28.0, 24.0, 27.0, 51.0, 73.0, 103.0, 179.0, 445.0, 1598.0, 9670.0, 1029629.0, 4783.0, 926.0, 342.0, 145.0, 83.0, 48.0, 38.0, 45.0, 24.0, 22.0, 20.0, 18.0, 16.0, 14.0, 11.0, 11.0, 8.0, 7.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.872523307800293, -13.4148588180542, -12.957194328308105, -12.499528884887695, -12.041864395141602, -11.584199905395508, -11.126535415649414, -10.66887092590332, -10.211206436157227, -9.753541946411133, -9.295877456665039, -8.838212966918945, -8.380547523498535, -7.922883033752441, -7.465218544006348, -7.007554054260254, -6.549889087677002, -6.092224597930908, -5.634559631347656, -5.1768951416015625, -4.719230651855469, -4.261566162109375, -3.803901195526123, -3.3462367057800293, -2.8885719776153564, -2.4309072494506836, -1.9732427597045898, -1.515578031539917, -1.0579134225845337, -0.6002488136291504, -0.14258408546447754, 0.3150804042816162, 0.7727451324462891, 1.2304097414016724, 1.6880743503570557, 2.1457390785217285, 2.6034035682678223, 3.061068296432495, 3.518733024597168, 3.9763975143432617, 4.4340620040893555, 4.891726493835449, 5.349391460418701, 5.807055950164795, 6.264720439910889, 6.722385406494141, 7.180049896240234, 7.637714385986328, 8.095378875732422, 8.553043365478516, 9.01070785522461, 9.468372344970703, 9.926037788391113, 10.383702278137207, 10.8413667678833, 11.299031257629395, 11.756696701049805, 12.214361190795898, 12.672025680541992, 13.129690170288086, 13.587355613708496, 14.04502010345459, 14.502684593200684, 14.960349082946777, 15.418013572692871]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 20.0, 316.0, 51459800.0, 2898.0, 92.0, 12.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.65272521972656, -214.3427734375, -206.03282165527344, -197.72286987304688, -189.4129180908203, -181.10296630859375, -172.79302978515625, -164.48306274414062, -156.17312622070312, -147.86317443847656, -139.55322265625, -131.24327087402344, -122.93331909179688, -114.62336730957031, -106.31342315673828, -98.00347137451172, -89.69351196289062, -81.38356018066406, -73.0736083984375, -64.76365661621094, -56.45370864868164, -48.14375686645508, -39.83380889892578, -31.52385711669922, -23.213905334472656, -14.90395450592041, -6.594003677368164, 1.7159461975097656, 10.025897979736328, 18.33584976196289, 26.645797729492188, 34.95574951171875, 43.265716552734375, 51.57566833496094, 59.8856201171875, 68.19557189941406, 76.50552368164062, 84.81547546386719, 93.12541961669922, 101.43537139892578, 109.74532318115234, 118.0552749633789, 126.36522674560547, 134.6751708984375, 142.98512268066406, 151.29507446289062, 159.6050262451172, 167.91497802734375, 176.2249298095703, 184.53488159179688, 192.84483337402344, 201.15478515625, 209.46473693847656, 217.77468872070312, 226.08462524414062, 234.39459228515625, 242.70452880859375, 251.0144805908203, 259.3244323730469, 267.6343688964844, 275.9443359375, 284.2542724609375, 292.5642395019531, 300.8741760253906, 309.18414306640625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 13.0, 16.0, 27.0, 41.0, 66.0, 102.0, 150.0, 185.0, 137.0, 88.0, 61.0, 40.0, 22.0, 10.0, 9.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37734031677246, -17.655338287353516, -16.93333625793457, -16.211334228515625, -15.48933219909668, -14.767330169677734, -14.045328140258789, -13.323326110839844, -12.601324081420898, -11.879322052001953, -11.157320022583008, -10.435317993164062, -9.713315963745117, -8.991313934326172, -8.269311904907227, -7.547309875488281, -6.825307846069336, -6.103305816650391, -5.381303787231445, -4.6593017578125, -3.9372997283935547, -3.2152976989746094, -2.493295669555664, -1.7712936401367188, -1.0492916107177734, -0.3272895812988281, 0.3947124481201172, 1.1167144775390625, 1.8387165069580078, 2.560718536376953, 3.2827205657958984, 4.004722595214844, 4.726726531982422, 5.448728561401367, 6.1707305908203125, 6.892732620239258, 7.614734649658203, 8.336736679077148, 9.058738708496094, 9.780740737915039, 10.502742767333984, 11.22474479675293, 11.946746826171875, 12.66874885559082, 13.390750885009766, 14.112752914428711, 14.834754943847656, 15.556756973266602, 16.278759002685547, 17.000761032104492, 17.722763061523438, 18.444765090942383, 19.166767120361328, 19.888769149780273, 20.61077117919922, 21.332773208618164, 22.05477523803711, 22.776777267456055, 23.498779296875, 24.220781326293945, 24.94278335571289, 25.664785385131836, 26.38678741455078, 27.108789443969727, 27.830791473388672]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 2.0, 5.0, 5.0, 9.0, 12.0, 13.0, 21.0, 22.0, 26.0, 31.0, 30.0, 35.0, 30.0, 34.0, 53.0, 43.0, 49.0, 54.0, 51.0, 58.0, 41.0, 42.0, 39.0, 39.0, 30.0, 28.0, 25.0, 27.0, 16.0, 28.0, 13.0, 21.0, 5.0, 11.0, 9.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-15.704792022705078, -15.232220649719238, -14.759649276733398, -14.287077903747559, -13.814506530761719, -13.341935157775879, -12.869363784790039, -12.3967924118042, -11.92422103881836, -11.45164966583252, -10.97907829284668, -10.50650691986084, -10.033935546875, -9.56136417388916, -9.08879280090332, -8.61622142791748, -8.14365005493164, -7.671078681945801, -7.198507308959961, -6.725935935974121, -6.253364562988281, -5.780793190002441, -5.308221817016602, -4.835650444030762, -4.3630781173706055, -3.8905067443847656, -3.417935371398926, -2.945363998413086, -2.472792625427246, -2.000221014022827, -1.5276496410369873, -1.0550782680511475, -0.5825071334838867, -0.10993573069572449, 0.36263567209243774, 0.8352071046829224, 1.3077784776687622, 1.7803499698638916, 2.2529213428497314, 2.7254927158355713, 3.198064088821411, 3.670635461807251, 4.14320707321167, 4.61577844619751, 5.08834981918335, 5.5609211921691895, 6.033492565155029, 6.506063938140869, 6.978635311126709, 7.451206684112549, 7.923778057098389, 8.396349906921387, 8.868921279907227, 9.341492652893066, 9.814064025878906, 10.286635398864746, 10.759206771850586, 11.231778144836426, 11.704349517822266, 12.176920890808105, 12.649492263793945, 13.122063636779785, 13.594635009765625, 14.067206382751465, 14.539777755737305]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 13.0, 16.0, 13.0, 28.0, 51.0, 74.0, 121.0, 210.0, 359.0, 538.0, 972.0, 1586.0, 2748.0, 4897.0, 9202.0, 18623.0, 45246.0, 173286.0, 3114053.0, 654057.0, 98195.0, 34420.0, 16443.0, 8342.0, 4677.0, 2631.0, 1412.0, 820.0, 436.0, 295.0, 185.0, 109.0, 72.0, 43.0, 32.0, 17.0, 23.0, 6.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.56689453125, -0.5490798950195312, -0.5312652587890625, -0.5134506225585938, -0.495635986328125, -0.47782135009765625, -0.4600067138671875, -0.44219207763671875, -0.42437744140625, -0.40656280517578125, -0.3887481689453125, -0.37093353271484375, -0.353118896484375, -0.33530426025390625, -0.3174896240234375, -0.29967498779296875, -0.2818603515625, -0.26404571533203125, -0.2462310791015625, -0.22841644287109375, -0.210601806640625, -0.19278717041015625, -0.1749725341796875, -0.15715789794921875, -0.13934326171875, -0.12152862548828125, -0.1037139892578125, -0.08589935302734375, -0.068084716796875, -0.05027008056640625, -0.0324554443359375, -0.01464080810546875, 0.003173828125, 0.02098846435546875, 0.0388031005859375, 0.05661773681640625, 0.074432373046875, 0.09224700927734375, 0.1100616455078125, 0.12787628173828125, 0.14569091796875, 0.16350555419921875, 0.1813201904296875, 0.19913482666015625, 0.216949462890625, 0.23476409912109375, 0.2525787353515625, 0.27039337158203125, 0.2882080078125, 0.30602264404296875, 0.3238372802734375, 0.34165191650390625, 0.359466552734375, 0.37728118896484375, 0.3950958251953125, 0.41291046142578125, 0.43072509765625, 0.44853973388671875, 0.4663543701171875, 0.48416900634765625, 0.501983642578125, 0.5197982788085938, 0.5376129150390625, 0.5554275512695312, 0.5732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 2.0, 5.0, 3.0, 5.0, 10.0, 8.0, 11.0, 7.0, 19.0, 32.0, 63.0, 122.0, 154.0, 179.0, 112.0, 92.0, 46.0, 35.0, 13.0, 12.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 9.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05584716796875, -0.05365180969238281, -0.051456451416015625, -0.04926109313964844, -0.04706573486328125, -0.04487037658691406, -0.042675018310546875, -0.04047966003417969, -0.0382843017578125, -0.03608894348144531, -0.033893585205078125, -0.03169822692871094, -0.02950286865234375, -0.027307510375976562, -0.025112152099609375, -0.022916793823242188, -0.020721435546875, -0.018526077270507812, -0.016330718994140625, -0.014135360717773438, -0.01194000244140625, -0.009744644165039062, -0.007549285888671875, -0.0053539276123046875, -0.0031585693359375, -0.0009632110595703125, 0.001232147216796875, 0.0034275054931640625, 0.00562286376953125, 0.007818222045898438, 0.010013580322265625, 0.012208938598632812, 0.014404296875, 0.016599655151367188, 0.018795013427734375, 0.020990371704101562, 0.02318572998046875, 0.025381088256835938, 0.027576446533203125, 0.029771804809570312, 0.0319671630859375, 0.03416252136230469, 0.036357879638671875, 0.03855323791503906, 0.04074859619140625, 0.04294395446777344, 0.045139312744140625, 0.04733467102050781, 0.049530029296875, 0.05172538757324219, 0.053920745849609375, 0.05611610412597656, 0.05831146240234375, 0.06050682067871094, 0.06270217895507812, 0.06489753723144531, 0.0670928955078125, 0.06928825378417969, 0.07148361206054688, 0.07367897033691406, 0.07587432861328125, 0.07806968688964844, 0.08026504516601562, 0.08246040344238281, 0.08465576171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 24.0, 33.0, 40.0, 73.0, 85.0, 134.0, 271.0, 396.0, 770.0, 1425.0, 2849.0, 5808.0, 13084.0, 32330.0, 91647.0, 311577.0, 2337124.0, 1054886.0, 224281.0, 70501.0, 25943.0, 10779.0, 4896.0, 2391.0, 1217.0, 670.0, 404.0, 229.0, 134.0, 94.0, 46.0, 37.0, 29.0, 13.0, 13.0, 5.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3504638671875, -0.337890625, -0.3253173828125, -0.312744140625, -0.3001708984375, -0.28759765625, -0.2750244140625, -0.262451171875, -0.2498779296875, -0.2373046875, -0.2247314453125, -0.212158203125, -0.1995849609375, -0.18701171875, -0.1744384765625, -0.161865234375, -0.1492919921875, -0.13671875, -0.1241455078125, -0.111572265625, -0.0989990234375, -0.08642578125, -0.0738525390625, -0.061279296875, -0.0487060546875, -0.0361328125, -0.0235595703125, -0.010986328125, 0.0015869140625, 0.01416015625, 0.0267333984375, 0.039306640625, 0.0518798828125, 0.064453125, 0.0770263671875, 0.089599609375, 0.1021728515625, 0.11474609375, 0.1273193359375, 0.139892578125, 0.1524658203125, 0.1650390625, 0.1776123046875, 0.190185546875, 0.2027587890625, 0.21533203125, 0.2279052734375, 0.240478515625, 0.2530517578125, 0.265625, 0.2781982421875, 0.290771484375, 0.3033447265625, 0.31591796875, 0.3284912109375, 0.341064453125, 0.3536376953125, 0.3662109375, 0.3787841796875, 0.391357421875, 0.4039306640625, 0.41650390625, 0.4290771484375, 0.441650390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 15.0, 6.0, 7.0, 24.0, 13.0, 23.0, 31.0, 44.0, 66.0, 77.0, 87.0, 111.0, 158.0, 185.0, 202.0, 358.0, 856.0, 488.0, 299.0, 223.0, 155.0, 130.0, 125.0, 78.0, 68.0, 58.0, 37.0, 34.0, 22.0, 17.0, 11.0, 10.0, 14.0, 6.0, 2.0, 8.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08978271484375, -0.08676719665527344, -0.08375167846679688, -0.08073616027832031, -0.07772064208984375, -0.07470512390136719, -0.07168960571289062, -0.06867408752441406, -0.0656585693359375, -0.06264305114746094, -0.059627532958984375, -0.05661201477050781, -0.05359649658203125, -0.05058097839355469, -0.047565460205078125, -0.04454994201660156, -0.041534423828125, -0.03851890563964844, -0.035503387451171875, -0.03248786926269531, -0.02947235107421875, -0.026456832885742188, -0.023441314697265625, -0.020425796508789062, -0.0174102783203125, -0.014394760131835938, -0.011379241943359375, -0.008363723754882812, -0.00534820556640625, -0.0023326873779296875, 0.000682830810546875, 0.0036983489990234375, 0.0067138671875, 0.009729385375976562, 0.012744903564453125, 0.015760421752929688, 0.01877593994140625, 0.021791458129882812, 0.024806976318359375, 0.027822494506835938, 0.0308380126953125, 0.03385353088378906, 0.036869049072265625, 0.03988456726074219, 0.04290008544921875, 0.04591560363769531, 0.048931121826171875, 0.05194664001464844, 0.054962158203125, 0.05797767639160156, 0.060993194580078125, 0.06400871276855469, 0.06702423095703125, 0.07003974914550781, 0.07305526733398438, 0.07607078552246094, 0.0790863037109375, 0.08210182189941406, 0.08511734008789062, 0.08813285827636719, 0.09114837646484375, 0.09416389465332031, 0.09717941284179688, 0.10019493103027344, 0.10321044921875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 8.0, 10.0, 14.0, 30.0, 32.0, 51.0, 87.0, 121.0, 117.0, 111.0, 120.0, 89.0, 52.0, 47.0, 27.0, 24.0, 11.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.088911771774292, -1.0484071969985962, -1.00790274143219, -0.9673981666564941, -0.9268935918807983, -0.8863890767097473, -0.8458845615386963, -0.8053799867630005, -0.7648754715919495, -0.7243709564208984, -0.6838663816452026, -0.6433618664741516, -0.6028573513031006, -0.5623527765274048, -0.5218482613563538, -0.48134371638298035, -0.44083917140960693, -0.4003346264362335, -0.3598300814628601, -0.3193255662918091, -0.27882102131843567, -0.23831647634506226, -0.19781194627285004, -0.15730741620063782, -0.1168028712272644, -0.07629833370447159, -0.03579379618167877, 0.004710741341114044, 0.04521527886390686, 0.08571982383728027, 0.1262243539094925, 0.1667288839817047, 0.20723342895507812, 0.24773797392845154, 0.28824251890182495, 0.328747034072876, 0.3692515790462494, 0.4097561240196228, 0.45026063919067383, 0.49076518416404724, 0.5312697291374207, 0.5717742443084717, 0.6122788190841675, 0.6527833342552185, 0.6932878494262695, 0.7337924242019653, 0.7742969393730164, 0.8148014545440674, 0.8553060293197632, 0.8958105444908142, 0.93631511926651, 0.976819634437561, 1.0173242092132568, 1.057828664779663, 1.0983332395553589, 1.1388378143310547, 1.179342269897461, 1.2198468446731567, 1.260351300239563, 1.3008558750152588, 1.3413604497909546, 1.3818650245666504, 1.4223694801330566, 1.4628740549087524, 1.5033786296844482]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 12.0, 6.0, 7.0, 13.0, 12.0, 17.0, 15.0, 16.0, 22.0, 21.0, 23.0, 24.0, 39.0, 44.0, 42.0, 38.0, 34.0, 50.0, 55.0, 47.0, 55.0, 40.0, 43.0, 46.0, 35.0, 29.0, 32.0, 20.0, 23.0, 17.0, 22.0, 19.0, 14.0, 11.0, 13.0, 5.0, 6.0, 11.0, 1.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5396407246589661, -0.5225182175636292, -0.5053956508636475, -0.48827314376831055, -0.47115063667297363, -0.45402809977531433, -0.43690556287765503, -0.4197830557823181, -0.4026605486869812, -0.3855380117893219, -0.368415504693985, -0.3512929677963257, -0.33417046070098877, -0.31704792380332947, -0.29992538690567017, -0.28280287981033325, -0.26568034291267395, -0.24855782091617584, -0.23143529891967773, -0.21431276202201843, -0.19719025492668152, -0.18006771802902222, -0.1629451960325241, -0.145822674036026, -0.1287001520395279, -0.11157763004302979, -0.09445510804653168, -0.07733257859945297, -0.060210056602954865, -0.04308753460645676, -0.025965005159378052, -0.008842483162879944, 0.008280038833618164, 0.02540256269276142, 0.04252508655190468, 0.059647612273693085, 0.07677013427019119, 0.0938926562666893, 0.111015185713768, 0.1281377077102661, 0.14526022970676422, 0.16238275170326233, 0.17950527369976044, 0.19662779569625854, 0.21375033259391785, 0.23087283968925476, 0.24799537658691406, 0.265117883682251, 0.2822404205799103, 0.2993629574775696, 0.3164854645729065, 0.3336080014705658, 0.3507305085659027, 0.367853045463562, 0.3849755525588989, 0.4020980894565582, 0.41922062635421753, 0.43634316325187683, 0.45346567034721375, 0.47058820724487305, 0.48771071434020996, 0.5048332214355469, 0.5219557881355286, 0.5390782952308655, 0.5562008023262024]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 6.0, 5.0, 11.0, 17.0, 21.0, 25.0, 42.0, 76.0, 93.0, 144.0, 209.0, 284.0, 496.0, 713.0, 1090.0, 1532.0, 2484.0, 3602.0, 5887.0, 9493.0, 16696.0, 33393.0, 81133.0, 236613.0, 380910.0, 155997.0, 56810.0, 25198.0, 13327.0, 7772.0, 5015.0, 3187.0, 2074.0, 1302.0, 947.0, 605.0, 439.0, 274.0, 201.0, 144.0, 84.0, 51.0, 41.0, 33.0, 22.0, 15.0, 8.0, 14.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.255615234375, -0.2474517822265625, -0.239288330078125, -0.2311248779296875, -0.22296142578125, -0.2147979736328125, -0.206634521484375, -0.1984710693359375, -0.1903076171875, -0.1821441650390625, -0.173980712890625, -0.1658172607421875, -0.15765380859375, -0.1494903564453125, -0.141326904296875, -0.1331634521484375, -0.125, -0.1168365478515625, -0.108673095703125, -0.1005096435546875, -0.09234619140625, -0.0841827392578125, -0.076019287109375, -0.0678558349609375, -0.0596923828125, -0.0515289306640625, -0.043365478515625, -0.0352020263671875, -0.02703857421875, -0.0188751220703125, -0.010711669921875, -0.0025482177734375, 0.005615234375, 0.0137786865234375, 0.021942138671875, 0.0301055908203125, 0.03826904296875, 0.0464324951171875, 0.054595947265625, 0.0627593994140625, 0.0709228515625, 0.0790863037109375, 0.087249755859375, 0.0954132080078125, 0.10357666015625, 0.1117401123046875, 0.119903564453125, 0.1280670166015625, 0.13623046875, 0.1443939208984375, 0.152557373046875, 0.1607208251953125, 0.16888427734375, 0.1770477294921875, 0.185211181640625, 0.1933746337890625, 0.2015380859375, 0.2097015380859375, 0.217864990234375, 0.2260284423828125, 0.23419189453125, 0.2423553466796875, 0.250518798828125, 0.2586822509765625, 0.266845703125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 2.0, 5.0, 5.0, 6.0, 9.0, 14.0, 12.0, 19.0, 43.0, 77.0, 100.0, 130.0, 153.0, 131.0, 79.0, 61.0, 44.0, 23.0, 16.0, 9.0, 7.0, 7.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059322357177734375, -0.05699920654296875, -0.054676055908203125, -0.0523529052734375, -0.050029754638671875, -0.04770660400390625, -0.045383453369140625, -0.043060302734375, -0.040737152099609375, -0.03841400146484375, -0.036090850830078125, -0.0337677001953125, -0.031444549560546875, -0.02912139892578125, -0.026798248291015625, -0.02447509765625, -0.022151947021484375, -0.01982879638671875, -0.017505645751953125, -0.0151824951171875, -0.012859344482421875, -0.01053619384765625, -0.008213043212890625, -0.005889892578125, -0.003566741943359375, -0.00124359130859375, 0.001079559326171875, 0.0034027099609375, 0.005725860595703125, 0.00804901123046875, 0.010372161865234375, 0.0126953125, 0.015018463134765625, 0.01734161376953125, 0.019664764404296875, 0.0219879150390625, 0.024311065673828125, 0.02663421630859375, 0.028957366943359375, 0.031280517578125, 0.033603668212890625, 0.03592681884765625, 0.038249969482421875, 0.0405731201171875, 0.042896270751953125, 0.04521942138671875, 0.047542572021484375, 0.04986572265625, 0.052188873291015625, 0.05451202392578125, 0.056835174560546875, 0.0591583251953125, 0.061481475830078125, 0.06380462646484375, 0.06612777709960938, 0.068450927734375, 0.07077407836914062, 0.07309722900390625, 0.07542037963867188, 0.0777435302734375, 0.08006668090820312, 0.08238983154296875, 0.08471298217773438, 0.0870361328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 9.0, 16.0, 18.0, 16.0, 23.0, 36.0, 46.0, 72.0, 106.0, 197.0, 324.0, 530.0, 938.0, 1620.0, 3072.0, 5988.0, 13278.0, 37347.0, 172295.0, 562633.0, 183843.0, 39308.0, 13579.0, 6165.0, 3104.0, 1672.0, 901.0, 491.0, 325.0, 180.0, 133.0, 79.0, 59.0, 44.0, 23.0, 13.0, 14.0, 13.0, 9.0, 4.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0], "bins": [-0.396240234375, -0.3844184875488281, -0.37259674072265625, -0.3607749938964844, -0.3489532470703125, -0.3371315002441406, -0.32530975341796875, -0.3134880065917969, -0.301666259765625, -0.2898445129394531, -0.27802276611328125, -0.2662010192871094, -0.2543792724609375, -0.24255752563476562, -0.23073577880859375, -0.21891403198242188, -0.20709228515625, -0.19527053833007812, -0.18344879150390625, -0.17162704467773438, -0.1598052978515625, -0.14798355102539062, -0.13616180419921875, -0.12434005737304688, -0.112518310546875, -0.10069656372070312, -0.08887481689453125, -0.07705307006835938, -0.0652313232421875, -0.053409576416015625, -0.04158782958984375, -0.029766082763671875, -0.0179443359375, -0.006122589111328125, 0.00569915771484375, 0.017520904541015625, 0.0293426513671875, 0.041164398193359375, 0.05298614501953125, 0.06480789184570312, 0.076629638671875, 0.08845138549804688, 0.10027313232421875, 0.11209487915039062, 0.1239166259765625, 0.13573837280273438, 0.14756011962890625, 0.15938186645507812, 0.17120361328125, 0.18302536010742188, 0.19484710693359375, 0.20666885375976562, 0.2184906005859375, 0.23031234741210938, 0.24213409423828125, 0.2539558410644531, 0.265777587890625, 0.2775993347167969, 0.28942108154296875, 0.3012428283691406, 0.3130645751953125, 0.3248863220214844, 0.33670806884765625, 0.3485298156738281, 0.3603515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 1.0, 2.0, 10.0, 6.0, 14.0, 10.0, 11.0, 14.0, 13.0, 22.0, 21.0, 33.0, 28.0, 31.0, 43.0, 45.0, 56.0, 34.0, 44.0, 49.0, 40.0, 56.0, 41.0, 47.0, 42.0, 31.0, 32.0, 41.0, 30.0, 24.0, 30.0, 23.0, 18.0, 15.0, 9.0, 9.0, 8.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.2713661193847656, -0.26270294189453125, -0.2540397644042969, -0.2453765869140625, -0.23671340942382812, -0.22805023193359375, -0.21938705444335938, -0.210723876953125, -0.20206069946289062, -0.19339752197265625, -0.18473434448242188, -0.1760711669921875, -0.16740798950195312, -0.15874481201171875, -0.15008163452148438, -0.14141845703125, -0.13275527954101562, -0.12409210205078125, -0.11542892456054688, -0.1067657470703125, -0.09810256958007812, -0.08943939208984375, -0.08077621459960938, -0.072113037109375, -0.06344985961914062, -0.05478668212890625, -0.046123504638671875, -0.0374603271484375, -0.028797149658203125, -0.02013397216796875, -0.011470794677734375, -0.0028076171875, 0.005855560302734375, 0.01451873779296875, 0.023181915283203125, 0.0318450927734375, 0.040508270263671875, 0.04917144775390625, 0.057834625244140625, 0.066497802734375, 0.07516098022460938, 0.08382415771484375, 0.09248733520507812, 0.1011505126953125, 0.10981369018554688, 0.11847686767578125, 0.12714004516601562, 0.13580322265625, 0.14446640014648438, 0.15312957763671875, 0.16179275512695312, 0.1704559326171875, 0.17911911010742188, 0.18778228759765625, 0.19644546508789062, 0.205108642578125, 0.21377182006835938, 0.22243499755859375, 0.23109817504882812, 0.2397613525390625, 0.24842453002929688, 0.25708770751953125, 0.2657508850097656, 0.2744140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 11.0, 14.0, 15.0, 18.0, 26.0, 24.0, 46.0, 55.0, 80.0, 130.0, 185.0, 295.0, 454.0, 723.0, 1181.0, 2146.0, 4083.0, 8923.0, 24114.0, 105770.0, 638995.0, 201741.0, 36079.0, 11843.0, 5191.0, 2642.0, 1390.0, 832.0, 494.0, 336.0, 201.0, 147.0, 96.0, 78.0, 43.0, 33.0, 34.0, 21.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4560546875, -0.4425048828125, -0.428955078125, -0.4154052734375, -0.40185546875, -0.3883056640625, -0.374755859375, -0.3612060546875, -0.34765625, -0.3341064453125, -0.320556640625, -0.3070068359375, -0.29345703125, -0.2799072265625, -0.266357421875, -0.2528076171875, -0.2392578125, -0.2257080078125, -0.212158203125, -0.1986083984375, -0.18505859375, -0.1715087890625, -0.157958984375, -0.1444091796875, -0.130859375, -0.1173095703125, -0.103759765625, -0.0902099609375, -0.07666015625, -0.0631103515625, -0.049560546875, -0.0360107421875, -0.0224609375, -0.0089111328125, 0.004638671875, 0.0181884765625, 0.03173828125, 0.0452880859375, 0.058837890625, 0.0723876953125, 0.0859375, 0.0994873046875, 0.113037109375, 0.1265869140625, 0.14013671875, 0.1536865234375, 0.167236328125, 0.1807861328125, 0.1943359375, 0.2078857421875, 0.221435546875, 0.2349853515625, 0.24853515625, 0.2620849609375, 0.275634765625, 0.2891845703125, 0.302734375, 0.3162841796875, 0.329833984375, 0.3433837890625, 0.35693359375, 0.3704833984375, 0.384033203125, 0.3975830078125, 0.4111328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 17.0, 12.0, 19.0, 28.0, 22.0, 38.0, 43.0, 66.0, 79.0, 113.0, 111.0, 90.0, 78.0, 57.0, 49.0, 36.0, 27.0, 21.0, 16.0, 9.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00037789344787597656, -0.0003672093152999878, -0.000356525182723999, -0.00034584105014801025, -0.0003351569175720215, -0.0003244727849960327, -0.00031378865242004395, -0.0003031045198440552, -0.0002924203872680664, -0.00028173625469207764, -0.00027105212211608887, -0.0002603679895401001, -0.00024968385696411133, -0.00023899972438812256, -0.0002283155918121338, -0.00021763145923614502, -0.00020694732666015625, -0.00019626319408416748, -0.0001855790615081787, -0.00017489492893218994, -0.00016421079635620117, -0.0001535266637802124, -0.00014284253120422363, -0.00013215839862823486, -0.0001214742660522461, -0.00011079013347625732, -0.00010010600090026855, -8.942186832427979e-05, -7.873773574829102e-05, -6.805360317230225e-05, -5.7369470596313477e-05, -4.668533802032471e-05, -3.600120544433594e-05, -2.5317072868347168e-05, -1.4632940292358398e-05, -3.948807716369629e-06, 6.735324859619141e-06, 1.741945743560791e-05, 2.810359001159668e-05, 3.878772258758545e-05, 4.947185516357422e-05, 6.015598773956299e-05, 7.084012031555176e-05, 8.152425289154053e-05, 9.22083854675293e-05, 0.00010289251804351807, 0.00011357665061950684, 0.0001242607831954956, 0.00013494491577148438, 0.00014562904834747314, 0.00015631318092346191, 0.00016699731349945068, 0.00017768144607543945, 0.00018836557865142822, 0.000199049711227417, 0.00020973384380340576, 0.00022041797637939453, 0.0002311021089553833, 0.00024178624153137207, 0.00025247037410736084, 0.0002631545066833496, 0.0002738386392593384, 0.00028452277183532715, 0.0002952069044113159, 0.0003058910369873047]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 14.0, 13.0, 12.0, 17.0, 38.0, 40.0, 58.0, 86.0, 134.0, 212.0, 327.0, 556.0, 888.0, 1552.0, 3026.0, 5873.0, 12749.0, 33479.0, 125403.0, 528658.0, 246931.0, 53440.0, 18294.0, 7840.0, 3914.0, 1977.0, 1152.0, 717.0, 379.0, 255.0, 176.0, 102.0, 75.0, 46.0, 30.0, 28.0, 22.0, 5.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311279296875, -0.29962158203125, -0.2879638671875, -0.27630615234375, -0.2646484375, -0.25299072265625, -0.2413330078125, -0.22967529296875, -0.218017578125, -0.20635986328125, -0.1947021484375, -0.18304443359375, -0.17138671875, -0.15972900390625, -0.1480712890625, -0.13641357421875, -0.124755859375, -0.11309814453125, -0.1014404296875, -0.08978271484375, -0.078125, -0.06646728515625, -0.0548095703125, -0.04315185546875, -0.031494140625, -0.01983642578125, -0.0081787109375, 0.00347900390625, 0.01513671875, 0.02679443359375, 0.0384521484375, 0.05010986328125, 0.061767578125, 0.07342529296875, 0.0850830078125, 0.09674072265625, 0.1083984375, 0.12005615234375, 0.1317138671875, 0.14337158203125, 0.155029296875, 0.16668701171875, 0.1783447265625, 0.19000244140625, 0.20166015625, 0.21331787109375, 0.2249755859375, 0.23663330078125, 0.248291015625, 0.25994873046875, 0.2716064453125, 0.28326416015625, 0.294921875, 0.30657958984375, 0.3182373046875, 0.32989501953125, 0.341552734375, 0.35321044921875, 0.3648681640625, 0.37652587890625, 0.38818359375, 0.39984130859375, 0.4114990234375, 0.42315673828125, 0.434814453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 6.0, 4.0, 15.0, 15.0, 17.0, 15.0, 16.0, 21.0, 19.0, 37.0, 45.0, 41.0, 55.0, 81.0, 78.0, 76.0, 67.0, 72.0, 69.0, 47.0, 45.0, 36.0, 30.0, 15.0, 18.0, 17.0, 11.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.241943359375, -0.23418426513671875, -0.2264251708984375, -0.21866607666015625, -0.210906982421875, -0.20314788818359375, -0.1953887939453125, -0.18762969970703125, -0.17987060546875, -0.17211151123046875, -0.1643524169921875, -0.15659332275390625, -0.148834228515625, -0.14107513427734375, -0.1333160400390625, -0.12555694580078125, -0.1177978515625, -0.11003875732421875, -0.1022796630859375, -0.09452056884765625, -0.086761474609375, -0.07900238037109375, -0.0712432861328125, -0.06348419189453125, -0.05572509765625, -0.04796600341796875, -0.0402069091796875, -0.03244781494140625, -0.024688720703125, -0.01692962646484375, -0.0091705322265625, -0.00141143798828125, 0.00634765625, 0.01410675048828125, 0.0218658447265625, 0.02962493896484375, 0.037384033203125, 0.04514312744140625, 0.0529022216796875, 0.06066131591796875, 0.06842041015625, 0.07617950439453125, 0.0839385986328125, 0.09169769287109375, 0.099456787109375, 0.10721588134765625, 0.1149749755859375, 0.12273406982421875, 0.1304931640625, 0.13825225830078125, 0.1460113525390625, 0.15377044677734375, 0.161529541015625, 0.16928863525390625, 0.1770477294921875, 0.18480682373046875, 0.19256591796875, 0.20032501220703125, 0.2080841064453125, 0.21584320068359375, 0.223602294921875, 0.23136138916015625, 0.2391204833984375, 0.24687957763671875, 0.254638671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 9.0, 17.0, 36.0, 135.0, 330.0, 259.0, 97.0, 32.0, 31.0, 13.0, 5.0, 8.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7828826904296875, -7.581912994384766, -7.380943775177002, -7.17997407913208, -6.979004859924316, -6.7780351638793945, -6.577065944671631, -6.376096248626709, -6.175127029418945, -5.974157333374023, -5.77318811416626, -5.572218418121338, -5.371249198913574, -5.170279502868652, -4.969310283660889, -4.768340587615967, -4.567371368408203, -4.366401672363281, -4.165432453155518, -3.964462995529175, -3.763493537902832, -3.56252384185791, -3.3615546226501465, -3.1605849266052246, -2.9596152305603027, -2.75864577293396, -2.557676315307617, -2.3567068576812744, -2.1557374000549316, -1.9547678232192993, -1.7537983655929565, -1.5528289079666138, -1.3518595695495605, -1.1508901119232178, -0.949920654296875, -0.7489511370658875, -0.5479816794395447, -0.34701216220855713, -0.14604270458221436, 0.05492675304412842, 0.2558962106704712, 0.45686566829681396, 0.6578351259231567, 0.8588046431541443, 1.0597741603851318, 1.2607436180114746, 1.4617130756378174, 1.6626825332641602, 1.863651990890503, 2.0646214485168457, 2.2655909061431885, 2.4665603637695312, 2.667529821395874, 2.868499279022217, 3.0694689750671387, 3.2704381942749023, 3.471407890319824, 3.672377347946167, 3.8733468055725098, 4.074316501617432, 4.275285720825195, 4.476255416870117, 4.677224636077881, 4.878194332122803, 5.079163551330566]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 5.0, 4.0, 4.0, 6.0, 15.0, 19.0, 39.0, 66.0, 104.0, 147.0, 182.0, 153.0, 92.0, 59.0, 31.0, 13.0, 15.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.01859188079834, -7.829758644104004, -7.640925407409668, -7.452092170715332, -7.263258934020996, -7.07442569732666, -6.885592460632324, -6.6967597007751465, -6.5079264640808105, -6.319093227386475, -6.130259990692139, -5.941426753997803, -5.752593517303467, -5.563760757446289, -5.374927520751953, -5.186094284057617, -4.997261047363281, -4.808427810668945, -4.619594573974609, -4.430761337280273, -4.2419281005859375, -4.053094863891602, -3.8642618656158447, -3.675428867340088, -3.4865951538085938, -3.297761917114258, -3.108928680419922, -2.920095443725586, -2.731262445449829, -2.542429208755493, -2.3535959720611572, -2.1647629737854004, -1.9759297370910645, -1.7870965003967285, -1.5982633829116821, -1.4094301462173462, -1.2205970287322998, -1.0317637920379639, -0.8429305553436279, -0.6540974378585815, -0.4652642011642456, -0.27643102407455444, -0.0875978171825409, 0.10123538970947266, 0.2900685667991638, 0.478901743888855, 0.6677349805831909, 0.8565680980682373, 1.0454013347625732, 1.2342345714569092, 1.4230676889419556, 1.6119009256362915, 1.800734043121338, 1.9895672798156738, 2.1784005165100098, 2.3672337532043457, 2.5560669898986816, 2.7449002265930176, 2.9337334632873535, 3.1225666999816895, 3.3113996982574463, 3.5002329349517822, 3.689066171646118, 3.877899169921875, 4.066732406616211]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 13.0, 22.0, 28.0, 58.0, 80.0, 146.0, 223.0, 407.0, 834.0, 2115.0, 5902.0, 24461.0, 367509.0, 3738105.0, 41467.0, 8294.0, 2486.0, 1022.0, 461.0, 258.0, 146.0, 84.0, 39.0, 29.0, 14.0, 13.0, 7.0, 8.0, 3.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4970703125, -1.4456939697265625, -1.394317626953125, -1.3429412841796875, -1.29156494140625, -1.2401885986328125, -1.188812255859375, -1.1374359130859375, -1.0860595703125, -1.0346832275390625, -0.983306884765625, -0.9319305419921875, -0.88055419921875, -0.8291778564453125, -0.777801513671875, -0.7264251708984375, -0.675048828125, -0.6236724853515625, -0.572296142578125, -0.5209197998046875, -0.46954345703125, -0.4181671142578125, -0.366790771484375, -0.3154144287109375, -0.2640380859375, -0.2126617431640625, -0.161285400390625, -0.1099090576171875, -0.05853271484375, -0.0071563720703125, 0.044219970703125, 0.0955963134765625, 0.14697265625, 0.1983489990234375, 0.249725341796875, 0.3011016845703125, 0.35247802734375, 0.4038543701171875, 0.455230712890625, 0.5066070556640625, 0.5579833984375, 0.6093597412109375, 0.660736083984375, 0.7121124267578125, 0.76348876953125, 0.8148651123046875, 0.866241455078125, 0.9176177978515625, 0.968994140625, 1.0203704833984375, 1.071746826171875, 1.1231231689453125, 1.17449951171875, 1.2258758544921875, 1.277252197265625, 1.3286285400390625, 1.3800048828125, 1.4313812255859375, 1.482757568359375, 1.5341339111328125, 1.58551025390625, 1.6368865966796875, 1.688262939453125, 1.7396392822265625, 1.791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 2.0, 16.0, 18.0, 14.0, 34.0, 64.0, 62.0, 81.0, 101.0, 123.0, 116.0, 90.0, 60.0, 51.0, 29.0, 28.0, 18.0, 12.0, 8.0, 7.0, 7.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06376266479492188, -0.06166839599609375, -0.059574127197265625, -0.0574798583984375, -0.055385589599609375, -0.05329132080078125, -0.051197052001953125, -0.049102783203125, -0.047008514404296875, -0.04491424560546875, -0.042819976806640625, -0.0407257080078125, -0.038631439208984375, -0.03653717041015625, -0.034442901611328125, -0.0323486328125, -0.030254364013671875, -0.02816009521484375, -0.026065826416015625, -0.0239715576171875, -0.021877288818359375, -0.01978302001953125, -0.017688751220703125, -0.015594482421875, -0.013500213623046875, -0.01140594482421875, -0.009311676025390625, -0.0072174072265625, -0.005123138427734375, -0.00302886962890625, -0.000934600830078125, 0.00115966796875, 0.003253936767578125, 0.00534820556640625, 0.007442474365234375, 0.0095367431640625, 0.011631011962890625, 0.01372528076171875, 0.015819549560546875, 0.017913818359375, 0.020008087158203125, 0.02210235595703125, 0.024196624755859375, 0.0262908935546875, 0.028385162353515625, 0.03047943115234375, 0.032573699951171875, 0.03466796875, 0.036762237548828125, 0.03885650634765625, 0.040950775146484375, 0.0430450439453125, 0.045139312744140625, 0.04723358154296875, 0.049327850341796875, 0.051422119140625, 0.053516387939453125, 0.05561065673828125, 0.057704925537109375, 0.0597991943359375, 0.061893463134765625, 0.06398773193359375, 0.06608200073242188, 0.06817626953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 8.0, 11.0, 26.0, 28.0, 44.0, 97.0, 157.0, 342.0, 678.0, 1563.0, 4103.0, 12907.0, 52073.0, 414394.0, 3554112.0, 118125.0, 23866.0, 6977.0, 2578.0, 1080.0, 504.0, 244.0, 149.0, 78.0, 41.0, 36.0, 20.0, 10.0, 10.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9405670166015625, -0.909454345703125, -0.8783416748046875, -0.84722900390625, -0.8161163330078125, -0.785003662109375, -0.7538909912109375, -0.7227783203125, -0.6916656494140625, -0.660552978515625, -0.6294403076171875, -0.59832763671875, -0.5672149658203125, -0.536102294921875, -0.5049896240234375, -0.473876953125, -0.4427642822265625, -0.411651611328125, -0.3805389404296875, -0.34942626953125, -0.3183135986328125, -0.287200927734375, -0.2560882568359375, -0.2249755859375, -0.1938629150390625, -0.162750244140625, -0.1316375732421875, -0.10052490234375, -0.0694122314453125, -0.038299560546875, -0.0071868896484375, 0.02392578125, 0.0550384521484375, 0.086151123046875, 0.1172637939453125, 0.14837646484375, 0.1794891357421875, 0.210601806640625, 0.2417144775390625, 0.2728271484375, 0.3039398193359375, 0.335052490234375, 0.3661651611328125, 0.39727783203125, 0.4283905029296875, 0.459503173828125, 0.4906158447265625, 0.521728515625, 0.5528411865234375, 0.583953857421875, 0.6150665283203125, 0.64617919921875, 0.6772918701171875, 0.708404541015625, 0.7395172119140625, 0.7706298828125, 0.8017425537109375, 0.832855224609375, 0.8639678955078125, 0.89508056640625, 0.9261932373046875, 0.957305908203125, 0.9884185791015625, 1.01953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 12.0, 7.0, 19.0, 22.0, 37.0, 40.0, 71.0, 105.0, 175.0, 445.0, 2148.0, 391.0, 198.0, 109.0, 83.0, 66.0, 38.0, 29.0, 20.0, 12.0, 11.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.0894479751586914, -0.08545112609863281, -0.08145427703857422, -0.07745742797851562, -0.07346057891845703, -0.06946372985839844, -0.06546688079833984, -0.06147003173828125, -0.057473182678222656, -0.05347633361816406, -0.04947948455810547, -0.045482635498046875, -0.04148578643798828, -0.03748893737792969, -0.033492088317871094, -0.0294952392578125, -0.025498390197753906, -0.021501541137695312, -0.01750469207763672, -0.013507843017578125, -0.009510993957519531, -0.0055141448974609375, -0.0015172958374023438, 0.00247955322265625, 0.006476402282714844, 0.010473251342773438, 0.014470100402832031, 0.018466949462890625, 0.02246379852294922, 0.026460647583007812, 0.030457496643066406, 0.034454345703125, 0.038451194763183594, 0.04244804382324219, 0.04644489288330078, 0.050441741943359375, 0.05443859100341797, 0.05843544006347656, 0.062432289123535156, 0.06642913818359375, 0.07042598724365234, 0.07442283630371094, 0.07841968536376953, 0.08241653442382812, 0.08641338348388672, 0.09041023254394531, 0.0944070816040039, 0.0984039306640625, 0.1024007797241211, 0.10639762878417969, 0.11039447784423828, 0.11439132690429688, 0.11838817596435547, 0.12238502502441406, 0.12638187408447266, 0.13037872314453125, 0.13437557220458984, 0.13837242126464844, 0.14236927032470703, 0.14636611938476562, 0.15036296844482422, 0.1543598175048828, 0.1583566665649414, 0.162353515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 15.0, 65.0, 442.0, 368.0, 82.0, 20.0, 7.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7176588773727417, -0.6260332465171814, -0.5344076156616211, -0.4427820146083832, -0.3511563837528229, -0.2595307528972626, -0.16790515184402466, -0.07627952098846436, 0.015346109867095947, 0.10697173327207565, 0.19859735667705536, 0.29022297263145447, 0.38184860348701477, 0.4734742343425751, 0.565099835395813, 0.6567254662513733, 0.7483510971069336, 0.8399767279624939, 0.9316023588180542, 1.0232279300689697, 1.1148536205291748, 1.2064791917800903, 1.2981047630310059, 1.389730453491211, 1.481356143951416, 1.5729817152023315, 1.6646074056625366, 1.7562329769134521, 1.8478586673736572, 1.9394842386245728, 2.0311098098754883, 2.1227355003356934, 2.2143609523773193, 2.3059866428375244, 2.3976120948791504, 2.4892377853393555, 2.5808634757995605, 2.6724891662597656, 2.7641146183013916, 2.8557403087615967, 2.9473659992218018, 3.038991689682007, 3.130617141723633, 3.222242832183838, 3.313868522644043, 3.405494213104248, 3.497119665145874, 3.588745355606079, 3.680370807647705, 3.77199649810791, 3.863621950149536, 3.955247640609741, 4.046873092651367, 4.138498783111572, 4.230124473571777, 4.321750164031982, 4.4133758544921875, 4.505001544952393, 4.596627235412598, 4.688252925872803, 4.77987813949585, 4.871503829956055, 4.96312952041626, 5.054755210876465, 5.14638090133667]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 6.0, 10.0, 9.0, 17.0, 18.0, 23.0, 29.0, 48.0, 42.0, 48.0, 52.0, 52.0, 63.0, 49.0, 50.0, 82.0, 58.0, 51.0, 46.0, 34.0, 28.0, 25.0, 33.0, 26.0, 11.0, 20.0, 10.0, 12.0, 10.0, 5.0, 12.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4612400531768799, -0.4440639913082123, -0.4268879294395447, -0.4097118675708771, -0.3925358057022095, -0.3753597140312195, -0.3581836521625519, -0.3410075902938843, -0.3238315284252167, -0.3066554665565491, -0.28947940468788147, -0.27230334281921387, -0.2551272511482239, -0.23795120418071747, -0.22077512741088867, -0.20359906554222107, -0.18642300367355347, -0.16924694180488586, -0.15207087993621826, -0.13489480316638947, -0.11771874129772186, -0.10054267942905426, -0.08336661010980606, -0.06619054079055786, -0.04901447892189026, -0.03183841332793236, -0.014662347733974457, 0.002513717859983444, 0.019689783453941345, 0.03686584532260895, 0.05404191464185715, 0.07121798396110535, 0.08839410543441772, 0.10557016730308533, 0.12274623662233353, 0.13992230594158173, 0.15709836781024933, 0.17427442967891693, 0.19145050644874573, 0.20862656831741333, 0.22580263018608093, 0.24297869205474854, 0.26015475392341614, 0.27733081579208374, 0.29450690746307373, 0.31168293952941895, 0.32885903120040894, 0.34603509306907654, 0.36321115493774414, 0.38038721680641174, 0.39756327867507935, 0.41473934054374695, 0.43191540241241455, 0.44909149408340454, 0.46626755595207214, 0.48344361782073975, 0.500619649887085, 0.517795741558075, 0.5349717736244202, 0.5521478652954102, 0.5693238973617554, 0.5864999890327454, 0.6036760210990906, 0.6208521127700806, 0.6380282044410706]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 14.0, 6.0, 17.0, 20.0, 24.0, 27.0, 55.0, 69.0, 107.0, 163.0, 285.0, 450.0, 683.0, 1215.0, 2017.0, 3682.0, 6870.0, 13618.0, 30778.0, 80278.0, 236168.0, 391394.0, 171931.0, 60388.0, 24102.0, 11225.0, 5600.0, 2982.0, 1723.0, 966.0, 582.0, 405.0, 223.0, 154.0, 120.0, 72.0, 42.0, 30.0, 20.0, 17.0, 12.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3679046630859375, -0.356170654296875, -0.3444366455078125, -0.33270263671875, -0.3209686279296875, -0.309234619140625, -0.2975006103515625, -0.2857666015625, -0.2740325927734375, -0.262298583984375, -0.2505645751953125, -0.23883056640625, -0.2270965576171875, -0.215362548828125, -0.2036285400390625, -0.19189453125, -0.1801605224609375, -0.168426513671875, -0.1566925048828125, -0.14495849609375, -0.1332244873046875, -0.121490478515625, -0.1097564697265625, -0.0980224609375, -0.0862884521484375, -0.074554443359375, -0.0628204345703125, -0.05108642578125, -0.0393524169921875, -0.027618408203125, -0.0158843994140625, -0.004150390625, 0.0075836181640625, 0.019317626953125, 0.0310516357421875, 0.04278564453125, 0.0545196533203125, 0.066253662109375, 0.0779876708984375, 0.0897216796875, 0.1014556884765625, 0.113189697265625, 0.1249237060546875, 0.13665771484375, 0.1483917236328125, 0.160125732421875, 0.1718597412109375, 0.18359375, 0.1953277587890625, 0.207061767578125, 0.2187957763671875, 0.23052978515625, 0.2422637939453125, 0.253997802734375, 0.2657318115234375, 0.2774658203125, 0.2891998291015625, 0.300933837890625, 0.3126678466796875, 0.32440185546875, 0.3361358642578125, 0.347869873046875, 0.3596038818359375, 0.371337890625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 4.0, 10.0, 19.0, 19.0, 28.0, 32.0, 55.0, 72.0, 92.0, 120.0, 108.0, 94.0, 78.0, 62.0, 50.0, 31.0, 29.0, 27.0, 11.0, 9.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06836414337158203, -0.06611061096191406, -0.0638570785522461, -0.061603546142578125, -0.059350013732910156, -0.05709648132324219, -0.05484294891357422, -0.05258941650390625, -0.05033588409423828, -0.04808235168457031, -0.045828819274902344, -0.043575286865234375, -0.041321754455566406, -0.03906822204589844, -0.03681468963623047, -0.0345611572265625, -0.03230762481689453, -0.030054092407226562, -0.027800559997558594, -0.025547027587890625, -0.023293495178222656, -0.021039962768554688, -0.01878643035888672, -0.01653289794921875, -0.014279365539550781, -0.012025833129882812, -0.009772300720214844, -0.007518768310546875, -0.005265235900878906, -0.0030117034912109375, -0.0007581710815429688, 0.001495361328125, 0.0037488937377929688, 0.0060024261474609375, 0.008255958557128906, 0.010509490966796875, 0.012763023376464844, 0.015016555786132812, 0.01727008819580078, 0.01952362060546875, 0.02177715301513672, 0.024030685424804688, 0.026284217834472656, 0.028537750244140625, 0.030791282653808594, 0.03304481506347656, 0.03529834747314453, 0.0375518798828125, 0.03980541229248047, 0.04205894470214844, 0.044312477111816406, 0.046566009521484375, 0.048819541931152344, 0.05107307434082031, 0.05332660675048828, 0.05558013916015625, 0.05783367156982422, 0.06008720397949219, 0.062340736389160156, 0.06459426879882812, 0.0668478012084961, 0.06910133361816406, 0.07135486602783203, 0.0736083984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 14.0, 15.0, 46.0, 71.0, 160.0, 302.0, 684.0, 1706.0, 5089.0, 19449.0, 113138.0, 608509.0, 250152.0, 36752.0, 8342.0, 2435.0, 903.0, 376.0, 190.0, 81.0, 47.0, 26.0, 14.0, 12.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3644599914550781, -0.34683990478515625, -0.3292198181152344, -0.3115997314453125, -0.2939796447753906, -0.27635955810546875, -0.2587394714355469, -0.241119384765625, -0.22349929809570312, -0.20587921142578125, -0.18825912475585938, -0.1706390380859375, -0.15301895141601562, -0.13539886474609375, -0.11777877807617188, -0.10015869140625, -0.08253860473632812, -0.06491851806640625, -0.047298431396484375, -0.0296783447265625, -0.012058258056640625, 0.00556182861328125, 0.023181915283203125, 0.040802001953125, 0.058422088623046875, 0.07604217529296875, 0.09366226196289062, 0.1112823486328125, 0.12890243530273438, 0.14652252197265625, 0.16414260864257812, 0.1817626953125, 0.19938278198242188, 0.21700286865234375, 0.23462295532226562, 0.2522430419921875, 0.2698631286621094, 0.28748321533203125, 0.3051033020019531, 0.322723388671875, 0.3403434753417969, 0.35796356201171875, 0.3755836486816406, 0.3932037353515625, 0.4108238220214844, 0.42844390869140625, 0.4460639953613281, 0.46368408203125, 0.4813041687011719, 0.49892425537109375, 0.5165443420410156, 0.5341644287109375, 0.5517845153808594, 0.5694046020507812, 0.5870246887207031, 0.604644775390625, 0.6222648620605469, 0.6398849487304688, 0.6575050354003906, 0.6751251220703125, 0.6927452087402344, 0.7103652954101562, 0.7279853820800781, 0.74560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 5.0, 2.0, 8.0, 5.0, 8.0, 9.0, 7.0, 13.0, 17.0, 22.0, 34.0, 23.0, 26.0, 31.0, 39.0, 36.0, 36.0, 54.0, 50.0, 50.0, 46.0, 42.0, 43.0, 49.0, 39.0, 48.0, 38.0, 35.0, 26.0, 24.0, 22.0, 24.0, 15.0, 20.0, 13.0, 13.0, 7.0, 8.0, 4.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.19516563415527344, -0.18818283081054688, -0.1812000274658203, -0.17421722412109375, -0.1672344207763672, -0.16025161743164062, -0.15326881408691406, -0.1462860107421875, -0.13930320739746094, -0.13232040405273438, -0.1253376007080078, -0.11835479736328125, -0.11137199401855469, -0.10438919067382812, -0.09740638732910156, -0.090423583984375, -0.08344078063964844, -0.07645797729492188, -0.06947517395019531, -0.06249237060546875, -0.05550956726074219, -0.048526763916015625, -0.04154396057128906, -0.0345611572265625, -0.027578353881835938, -0.020595550537109375, -0.013612747192382812, -0.00662994384765625, 0.0003528594970703125, 0.007335662841796875, 0.014318466186523438, 0.02130126953125, 0.028284072875976562, 0.035266876220703125, 0.04224967956542969, 0.04923248291015625, 0.05621528625488281, 0.06319808959960938, 0.07018089294433594, 0.0771636962890625, 0.08414649963378906, 0.09112930297851562, 0.09811210632324219, 0.10509490966796875, 0.11207771301269531, 0.11906051635742188, 0.12604331970214844, 0.133026123046875, 0.14000892639160156, 0.14699172973632812, 0.1539745330810547, 0.16095733642578125, 0.1679401397705078, 0.17492294311523438, 0.18190574645996094, 0.1888885498046875, 0.19587135314941406, 0.20285415649414062, 0.2098369598388672, 0.21681976318359375, 0.2238025665283203, 0.23078536987304688, 0.23776817321777344, 0.2447509765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 19.0, 20.0, 13.0, 35.0, 62.0, 71.0, 134.0, 209.0, 331.0, 559.0, 1103.0, 2315.0, 5244.0, 15278.0, 65481.0, 548006.0, 343953.0, 45360.0, 11779.0, 4348.0, 1944.0, 934.0, 500.0, 284.0, 188.0, 122.0, 70.0, 53.0, 40.0, 14.0, 18.0, 10.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4660453796386719, -0.44991302490234375, -0.4337806701660156, -0.4176483154296875, -0.4015159606933594, -0.38538360595703125, -0.3692512512207031, -0.353118896484375, -0.3369865417480469, -0.32085418701171875, -0.3047218322753906, -0.2885894775390625, -0.2724571228027344, -0.25632476806640625, -0.24019241333007812, -0.22406005859375, -0.20792770385742188, -0.19179534912109375, -0.17566299438476562, -0.1595306396484375, -0.14339828491210938, -0.12726593017578125, -0.11113357543945312, -0.095001220703125, -0.07886886596679688, -0.06273651123046875, -0.046604156494140625, -0.0304718017578125, -0.014339447021484375, 0.00179290771484375, 0.017925262451171875, 0.0340576171875, 0.050189971923828125, 0.06632232666015625, 0.08245468139648438, 0.0985870361328125, 0.11471939086914062, 0.13085174560546875, 0.14698410034179688, 0.163116455078125, 0.17924880981445312, 0.19538116455078125, 0.21151351928710938, 0.2276458740234375, 0.24377822875976562, 0.25991058349609375, 0.2760429382324219, 0.29217529296875, 0.3083076477050781, 0.32444000244140625, 0.3405723571777344, 0.3567047119140625, 0.3728370666503906, 0.38896942138671875, 0.4051017761230469, 0.421234130859375, 0.4373664855957031, 0.45349884033203125, 0.4696311950683594, 0.4857635498046875, 0.5018959045410156, 0.5180282592773438, 0.5341606140136719, 0.55029296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 4.0, 6.0, 7.0, 18.0, 9.0, 19.0, 18.0, 33.0, 46.0, 56.0, 73.0, 86.0, 113.0, 108.0, 90.0, 73.0, 43.0, 53.0, 25.0, 23.0, 13.0, 11.0, 14.0, 9.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002503395080566406, -0.00024295970797538757, -0.00023557990789413452, -0.00022820010781288147, -0.00022082030773162842, -0.00021344050765037537, -0.00020606070756912231, -0.00019868090748786926, -0.0001913011074066162, -0.00018392130732536316, -0.0001765415072441101, -0.00016916170716285706, -0.000161781907081604, -0.00015440210700035095, -0.0001470223069190979, -0.00013964250683784485, -0.0001322627067565918, -0.00012488290667533875, -0.0001175031065940857, -0.00011012330651283264, -0.00010274350643157959, -9.536370635032654e-05, -8.798390626907349e-05, -8.060410618782043e-05, -7.322430610656738e-05, -6.584450602531433e-05, -5.846470594406128e-05, -5.108490586280823e-05, -4.3705105781555176e-05, -3.6325305700302124e-05, -2.8945505619049072e-05, -2.156570553779602e-05, -1.4185905456542969e-05, -6.806105375289917e-06, 5.736947059631348e-07, 7.953494787216187e-06, 1.5333294868469238e-05, 2.271309494972229e-05, 3.0092895030975342e-05, 3.7472695112228394e-05, 4.4852495193481445e-05, 5.22322952747345e-05, 5.961209535598755e-05, 6.69918954372406e-05, 7.437169551849365e-05, 8.17514955997467e-05, 8.913129568099976e-05, 9.651109576225281e-05, 0.00010389089584350586, 0.00011127069592475891, 0.00011865049600601196, 0.00012603029608726501, 0.00013341009616851807, 0.00014078989624977112, 0.00014816969633102417, 0.00015554949641227722, 0.00016292929649353027, 0.00017030909657478333, 0.00017768889665603638, 0.00018506869673728943, 0.00019244849681854248, 0.00019982829689979553, 0.00020720809698104858, 0.00021458789706230164, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 2.0, 6.0, 3.0, 9.0, 12.0, 17.0, 25.0, 32.0, 53.0, 76.0, 113.0, 172.0, 300.0, 421.0, 729.0, 1268.0, 2309.0, 4796.0, 10850.0, 29191.0, 100950.0, 464443.0, 322596.0, 70410.0, 22097.0, 8778.0, 4032.0, 2055.0, 1047.0, 623.0, 371.0, 254.0, 147.0, 105.0, 73.0, 53.0, 32.0, 28.0, 18.0, 15.0, 15.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.33447265625, -0.3236351013183594, -0.31279754638671875, -0.3019599914550781, -0.2911224365234375, -0.2802848815917969, -0.26944732666015625, -0.2586097717285156, -0.247772216796875, -0.23693466186523438, -0.22609710693359375, -0.21525955200195312, -0.2044219970703125, -0.19358444213867188, -0.18274688720703125, -0.17190933227539062, -0.16107177734375, -0.15023422241210938, -0.13939666748046875, -0.12855911254882812, -0.1177215576171875, -0.10688400268554688, -0.09604644775390625, -0.08520889282226562, -0.074371337890625, -0.06353378295898438, -0.05269622802734375, -0.041858673095703125, -0.0310211181640625, -0.020183563232421875, -0.00934600830078125, 0.001491546630859375, 0.0123291015625, 0.023166656494140625, 0.03400421142578125, 0.044841766357421875, 0.0556793212890625, 0.06651687622070312, 0.07735443115234375, 0.08819198608398438, 0.099029541015625, 0.10986709594726562, 0.12070465087890625, 0.13154220581054688, 0.1423797607421875, 0.15321731567382812, 0.16405487060546875, 0.17489242553710938, 0.18572998046875, 0.19656753540039062, 0.20740509033203125, 0.21824264526367188, 0.2290802001953125, 0.23991775512695312, 0.25075531005859375, 0.2615928649902344, 0.272430419921875, 0.2832679748535156, 0.29410552978515625, 0.3049430847167969, 0.3157806396484375, 0.3266181945800781, 0.33745574951171875, 0.3482933044433594, 0.359130859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 10.0, 5.0, 9.0, 7.0, 8.0, 18.0, 20.0, 23.0, 24.0, 43.0, 40.0, 57.0, 60.0, 73.0, 63.0, 96.0, 81.0, 64.0, 50.0, 41.0, 34.0, 27.0, 26.0, 21.0, 21.0, 16.0, 11.0, 14.0, 7.0, 6.0, 1.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1666259765625, -0.1612262725830078, -0.15582656860351562, -0.15042686462402344, -0.14502716064453125, -0.13962745666503906, -0.13422775268554688, -0.1288280487060547, -0.1234283447265625, -0.11802864074707031, -0.11262893676757812, -0.10722923278808594, -0.10182952880859375, -0.09642982482910156, -0.09103012084960938, -0.08563041687011719, -0.080230712890625, -0.07483100891113281, -0.06943130493164062, -0.06403160095214844, -0.05863189697265625, -0.05323219299316406, -0.047832489013671875, -0.04243278503417969, -0.0370330810546875, -0.03163337707519531, -0.026233673095703125, -0.020833969116210938, -0.01543426513671875, -0.010034561157226562, -0.004634857177734375, 0.0007648468017578125, 0.00616455078125, 0.011564254760742188, 0.016963958740234375, 0.022363662719726562, 0.02776336669921875, 0.03316307067871094, 0.038562774658203125, 0.04396247863769531, 0.0493621826171875, 0.05476188659667969, 0.060161590576171875, 0.06556129455566406, 0.07096099853515625, 0.07636070251464844, 0.08176040649414062, 0.08716011047363281, 0.092559814453125, 0.09795951843261719, 0.10335922241210938, 0.10875892639160156, 0.11415863037109375, 0.11955833435058594, 0.12495803833007812, 0.1303577423095703, 0.1357574462890625, 0.1411571502685547, 0.14655685424804688, 0.15195655822753906, 0.15735626220703125, 0.16275596618652344, 0.16815567016601562, 0.1735553741455078, 0.178955078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 30.0, 170.0, 572.0, 174.0, 30.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3231120109558105, -7.036736965179443, -6.750362396240234, -6.463987350463867, -6.1776123046875, -5.891237735748291, -5.604862689971924, -5.318488121032715, -5.032113075256348, -4.7457380294799805, -4.4593634605407715, -4.172988414764404, -3.886613607406616, -3.600238800048828, -3.313863754272461, -3.027488946914673, -2.7411141395568848, -2.4547393321990967, -2.1683645248413086, -1.8819894790649414, -1.5956146717071533, -1.3092398643493652, -1.0228649377822876, -0.73649001121521, -0.4501152038574219, -0.163740336894989, 0.12263453006744385, 0.4090093970298767, 0.6953842639923096, 0.9817590713500977, 1.2681339979171753, 1.554508924484253, 1.8408832550048828, 2.127258062362671, 2.413632869720459, 2.700007915496826, 2.9863827228546143, 3.2727575302124023, 3.5591325759887695, 3.8455073833465576, 4.131882190704346, 4.418257236480713, 4.704631805419922, 4.991006851196289, 5.277381896972656, 5.563756465911865, 5.850131511688232, 6.136506080627441, 6.422881126403809, 6.709256172180176, 6.995630741119385, 7.282005786895752, 7.568380355834961, 7.854755401611328, 8.141130447387695, 8.427505493164062, 8.71388053894043, 9.000255584716797, 9.286630630493164, 9.573004722595215, 9.859379768371582, 10.14575481414795, 10.432129859924316, 10.718504905700684, 11.004878997802734]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 17.0, 18.0, 21.0, 34.0, 33.0, 50.0, 76.0, 78.0, 86.0, 77.0, 88.0, 93.0, 72.0, 38.0, 49.0, 43.0, 15.0, 15.0, 17.0, 10.0, 9.0, 5.0, 8.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.3589913845062256, -2.275189161300659, -2.1913869380950928, -2.1075844764709473, -2.023782253265381, -1.9399800300598145, -1.856177806854248, -1.7723755836486816, -1.6885732412338257, -1.6047710180282593, -1.5209686756134033, -1.437166452407837, -1.3533642292022705, -1.2695618867874146, -1.1857596635818481, -1.1019573211669922, -1.0181550979614258, -0.9343528151512146, -0.8505505323410034, -0.766748309135437, -0.6829460263252258, -0.5991437435150146, -0.5153415203094482, -0.43153923749923706, -0.3477369546890259, -0.2639346718788147, -0.1801324188709259, -0.09633016586303711, -0.012527883052825928, 0.07127439975738525, 0.15507662296295166, 0.23887890577316284, 0.322681188583374, 0.4064834713935852, 0.490285724401474, 0.5740879774093628, 0.657890260219574, 0.7416925430297852, 0.8254947662353516, 0.9092970490455627, 0.9930993318557739, 1.0769015550613403, 1.1607038974761963, 1.2445061206817627, 1.328308343887329, 1.412110686302185, 1.4959129095077515, 1.5797152519226074, 1.6635174751281738, 1.7473196983337402, 1.8311220407485962, 1.9149242639541626, 1.9987266063690186, 2.082528829574585, 2.1663310527801514, 2.2501332759857178, 2.3339357376098633, 2.4177379608154297, 2.501540184020996, 2.5853424072265625, 2.669144868850708, 2.7529470920562744, 2.836749315261841, 2.9205515384674072, 3.0043537616729736]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 29.0, 35.0, 46.0, 73.0, 114.0, 141.0, 227.0, 274.0, 400.0, 610.0, 955.0, 1740.0, 2982.0, 6028.0, 13095.0, 37422.0, 188418.0, 3716218.0, 163847.0, 34851.0, 12957.0, 5997.0, 3008.0, 1734.0, 1005.0, 673.0, 426.0, 289.0, 198.0, 146.0, 83.0, 58.0, 60.0, 39.0, 13.0, 20.0, 12.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8580703735351562, -0.8299102783203125, -0.8017501831054688, -0.773590087890625, -0.7454299926757812, -0.7172698974609375, -0.6891098022460938, -0.66094970703125, -0.6327896118164062, -0.6046295166015625, -0.5764694213867188, -0.548309326171875, -0.5201492309570312, -0.4919891357421875, -0.46382904052734375, -0.4356689453125, -0.40750885009765625, -0.3793487548828125, -0.35118865966796875, -0.323028564453125, -0.29486846923828125, -0.2667083740234375, -0.23854827880859375, -0.21038818359375, -0.18222808837890625, -0.1540679931640625, -0.12590789794921875, -0.097747802734375, -0.06958770751953125, -0.0414276123046875, -0.01326751708984375, 0.014892578125, 0.04305267333984375, 0.0712127685546875, 0.09937286376953125, 0.127532958984375, 0.15569305419921875, 0.1838531494140625, 0.21201324462890625, 0.24017333984375, 0.26833343505859375, 0.2964935302734375, 0.32465362548828125, 0.352813720703125, 0.38097381591796875, 0.4091339111328125, 0.43729400634765625, 0.4654541015625, 0.49361419677734375, 0.5217742919921875, 0.5499343872070312, 0.578094482421875, 0.6062545776367188, 0.6344146728515625, 0.6625747680664062, 0.69073486328125, 0.7188949584960938, 0.7470550537109375, 0.7752151489257812, 0.803375244140625, 0.8315353393554688, 0.8596954345703125, 0.8878555297851562, 0.916015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 12.0, 13.0, 18.0, 22.0, 34.0, 42.0, 52.0, 67.0, 73.0, 84.0, 99.0, 90.0, 77.0, 50.0, 58.0, 35.0, 29.0, 33.0, 16.0, 19.0, 9.0, 2.0, 4.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06103515625, -0.05909252166748047, -0.05714988708496094, -0.055207252502441406, -0.053264617919921875, -0.051321983337402344, -0.04937934875488281, -0.04743671417236328, -0.04549407958984375, -0.04355144500732422, -0.04160881042480469, -0.039666175842285156, -0.037723541259765625, -0.035780906677246094, -0.03383827209472656, -0.03189563751220703, -0.0299530029296875, -0.02801036834716797, -0.026067733764648438, -0.024125099182128906, -0.022182464599609375, -0.020239830017089844, -0.018297195434570312, -0.01635456085205078, -0.01441192626953125, -0.012469291687011719, -0.010526657104492188, -0.008584022521972656, -0.006641387939453125, -0.004698753356933594, -0.0027561187744140625, -0.0008134841918945312, 0.001129150390625, 0.0030717849731445312, 0.0050144195556640625, 0.006957054138183594, 0.008899688720703125, 0.010842323303222656, 0.012784957885742188, 0.014727592468261719, 0.01667022705078125, 0.01861286163330078, 0.020555496215820312, 0.022498130798339844, 0.024440765380859375, 0.026383399963378906, 0.028326034545898438, 0.03026866912841797, 0.0322113037109375, 0.03415393829345703, 0.03609657287597656, 0.038039207458496094, 0.039981842041015625, 0.041924476623535156, 0.04386711120605469, 0.04580974578857422, 0.04775238037109375, 0.04969501495361328, 0.05163764953613281, 0.053580284118652344, 0.055522918701171875, 0.057465553283691406, 0.05940818786621094, 0.06135082244873047, 0.06329345703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 6.0, 4.0, 8.0, 11.0, 26.0, 36.0, 64.0, 122.0, 272.0, 667.0, 1506.0, 4899.0, 21100.0, 176458.0, 3833678.0, 130819.0, 17704.0, 4304.0, 1413.0, 622.0, 240.0, 130.0, 71.0, 35.0, 15.0, 20.0, 10.0, 11.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3662109375, -1.327667236328125, -1.28912353515625, -1.250579833984375, -1.2120361328125, -1.173492431640625, -1.13494873046875, -1.096405029296875, -1.057861328125, -1.019317626953125, -0.98077392578125, -0.942230224609375, -0.9036865234375, -0.865142822265625, -0.82659912109375, -0.788055419921875, -0.74951171875, -0.710968017578125, -0.67242431640625, -0.633880615234375, -0.5953369140625, -0.556793212890625, -0.51824951171875, -0.479705810546875, -0.441162109375, -0.402618408203125, -0.36407470703125, -0.325531005859375, -0.2869873046875, -0.248443603515625, -0.20989990234375, -0.171356201171875, -0.1328125, -0.094268798828125, -0.05572509765625, -0.017181396484375, 0.0213623046875, 0.059906005859375, 0.09844970703125, 0.136993408203125, 0.175537109375, 0.214080810546875, 0.25262451171875, 0.291168212890625, 0.3297119140625, 0.368255615234375, 0.40679931640625, 0.445343017578125, 0.48388671875, 0.522430419921875, 0.56097412109375, 0.599517822265625, 0.6380615234375, 0.676605224609375, 0.71514892578125, 0.753692626953125, 0.792236328125, 0.830780029296875, 0.86932373046875, 0.907867431640625, 0.9464111328125, 0.984954833984375, 1.02349853515625, 1.062042236328125, 1.1005859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 14.0, 9.0, 20.0, 23.0, 27.0, 50.0, 82.0, 136.0, 243.0, 699.0, 1938.0, 347.0, 184.0, 99.0, 53.0, 44.0, 27.0, 17.0, 8.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12735748291015625, -0.1230010986328125, -0.11864471435546875, -0.114288330078125, -0.10993194580078125, -0.1055755615234375, -0.10121917724609375, -0.09686279296875, -0.09250640869140625, -0.0881500244140625, -0.08379364013671875, -0.079437255859375, -0.07508087158203125, -0.0707244873046875, -0.06636810302734375, -0.06201171875, -0.05765533447265625, -0.0532989501953125, -0.04894256591796875, -0.044586181640625, -0.04022979736328125, -0.0358734130859375, -0.03151702880859375, -0.02716064453125, -0.02280426025390625, -0.0184478759765625, -0.01409149169921875, -0.009735107421875, -0.00537872314453125, -0.0010223388671875, 0.00333404541015625, 0.0076904296875, 0.01204681396484375, 0.0164031982421875, 0.02075958251953125, 0.025115966796875, 0.02947235107421875, 0.0338287353515625, 0.03818511962890625, 0.04254150390625, 0.04689788818359375, 0.0512542724609375, 0.05561065673828125, 0.059967041015625, 0.06432342529296875, 0.0686798095703125, 0.07303619384765625, 0.077392578125, 0.08174896240234375, 0.0861053466796875, 0.09046173095703125, 0.094818115234375, 0.09917449951171875, 0.1035308837890625, 0.10788726806640625, 0.11224365234375, 0.11660003662109375, 0.1209564208984375, 0.12531280517578125, 0.129669189453125, 0.13402557373046875, 0.1383819580078125, 0.14273834228515625, 0.1470947265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 9.0, 16.0, 34.0, 39.0, 82.0, 91.0, 143.0, 173.0, 130.0, 108.0, 66.0, 41.0, 22.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7870513796806335, -0.760526180267334, -0.7340009808540344, -0.7074757814407349, -0.6809505224227905, -0.654425323009491, -0.6279001235961914, -0.6013749241828918, -0.5748497247695923, -0.5483245253562927, -0.5217993259429932, -0.4952740967273712, -0.46874886751174927, -0.4422236680984497, -0.41569846868515015, -0.3891732692718506, -0.36264801025390625, -0.3361228108406067, -0.30959758162498474, -0.2830723822116852, -0.25654715299606323, -0.23002195358276367, -0.2034967541694641, -0.17697153985500336, -0.1504463255405426, -0.12392111122608185, -0.09739590436220169, -0.07087069749832153, -0.04434548318386078, -0.017820268869400024, 0.008704930543899536, 0.03523014485836029, 0.06175529956817627, 0.08828051388263702, 0.11480572074651718, 0.14133092761039734, 0.1678561419248581, 0.19438135623931885, 0.2209065556526184, 0.24743176996707916, 0.2739569842815399, 0.3004821836948395, 0.3270074129104614, 0.353532612323761, 0.38005781173706055, 0.4065830409526825, 0.43310824036598206, 0.459633469581604, 0.48615866899490356, 0.5126838684082031, 0.5392090678215027, 0.5657342672348022, 0.5922595262527466, 0.6187847256660461, 0.6453099250793457, 0.6718351244926453, 0.6983603239059448, 0.7248855233192444, 0.751410722732544, 0.7779359817504883, 0.8044611811637878, 0.8309863805770874, 0.857511579990387, 0.8840367794036865, 0.9105620384216309]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 18.0, 22.0, 21.0, 18.0, 21.0, 29.0, 20.0, 27.0, 46.0, 42.0, 49.0, 30.0, 40.0, 57.0, 50.0, 44.0, 40.0, 43.0, 34.0, 37.0, 48.0, 41.0, 32.0, 18.0, 28.0, 17.0, 15.0, 14.0, 10.0, 15.0, 14.0, 2.0, 4.0, 11.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.4901590943336487, -0.4758659303188324, -0.4615727663040161, -0.44727960228919983, -0.43298643827438354, -0.41869327425956726, -0.404400110244751, -0.3901069164276123, -0.3758137822151184, -0.3615206182003021, -0.34722745418548584, -0.33293429017066956, -0.31864112615585327, -0.304347962141037, -0.2900547981262207, -0.27576160430908203, -0.26146844029426575, -0.24717527627944946, -0.23288211226463318, -0.2185889482498169, -0.2042957842350006, -0.19000262022018433, -0.17570944130420685, -0.16141627728939056, -0.14712311327457428, -0.132829949259758, -0.11853678524494171, -0.10424361377954483, -0.08995044976472855, -0.07565728574991226, -0.06136411428451538, -0.0470709502696991, -0.03277778625488281, -0.01848462037742138, -0.004191454499959946, 0.010101713240146637, 0.02439487725496292, 0.038688041269779205, 0.052981212735176086, 0.06727437674999237, 0.08156754076480865, 0.09586070477962494, 0.11015386879444122, 0.1244470402598381, 0.13874021172523499, 0.15303337574005127, 0.16732653975486755, 0.18161970376968384, 0.19591286778450012, 0.2102060317993164, 0.2244991958141327, 0.23879235982894897, 0.25308552384376526, 0.26737868785858154, 0.2816718816757202, 0.2959650158882141, 0.3102582097053528, 0.32455137372016907, 0.33884453773498535, 0.35313770174980164, 0.3674308657646179, 0.3817240297794342, 0.3960171937942505, 0.41031038761138916, 0.42460352182388306]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 8.0, 23.0, 20.0, 37.0, 49.0, 81.0, 104.0, 165.0, 281.0, 437.0, 783.0, 1358.0, 2427.0, 4718.0, 10092.0, 23860.0, 63419.0, 188600.0, 404284.0, 223112.0, 73950.0, 27502.0, 11561.0, 5351.0, 2738.0, 1459.0, 782.0, 474.0, 310.0, 182.0, 116.0, 77.0, 56.0, 40.0, 28.0, 14.0, 14.0, 7.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.53564453125, -0.5201530456542969, -0.5046615600585938, -0.4891700744628906, -0.4736785888671875, -0.4581871032714844, -0.44269561767578125, -0.4272041320800781, -0.411712646484375, -0.3962211608886719, -0.38072967529296875, -0.3652381896972656, -0.3497467041015625, -0.3342552185058594, -0.31876373291015625, -0.3032722473144531, -0.28778076171875, -0.2722892761230469, -0.25679779052734375, -0.24130630493164062, -0.2258148193359375, -0.21032333374023438, -0.19483184814453125, -0.17934036254882812, -0.163848876953125, -0.14835739135742188, -0.13286590576171875, -0.11737442016601562, -0.1018829345703125, -0.08639144897460938, -0.07089996337890625, -0.055408477783203125, -0.0399169921875, -0.024425506591796875, -0.00893402099609375, 0.006557464599609375, 0.0220489501953125, 0.037540435791015625, 0.05303192138671875, 0.06852340698242188, 0.084014892578125, 0.09950637817382812, 0.11499786376953125, 0.13048934936523438, 0.1459808349609375, 0.16147232055664062, 0.17696380615234375, 0.19245529174804688, 0.20794677734375, 0.22343826293945312, 0.23892974853515625, 0.2544212341308594, 0.2699127197265625, 0.2854042053222656, 0.30089569091796875, 0.3163871765136719, 0.331878662109375, 0.3473701477050781, 0.36286163330078125, 0.3783531188964844, 0.3938446044921875, 0.4093360900878906, 0.42482757568359375, 0.4403190612792969, 0.455810546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 1.0, 5.0, 4.0, 12.0, 14.0, 16.0, 16.0, 14.0, 35.0, 44.0, 40.0, 62.0, 67.0, 72.0, 82.0, 79.0, 74.0, 69.0, 56.0, 54.0, 34.0, 32.0, 25.0, 18.0, 11.0, 12.0, 9.0, 0.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.048233985900878906, -0.04651069641113281, -0.04478740692138672, -0.043064117431640625, -0.04134082794189453, -0.03961753845214844, -0.037894248962402344, -0.03617095947265625, -0.034447669982910156, -0.03272438049316406, -0.03100109100341797, -0.029277801513671875, -0.02755451202392578, -0.025831222534179688, -0.024107933044433594, -0.0223846435546875, -0.020661354064941406, -0.018938064575195312, -0.01721477508544922, -0.015491485595703125, -0.013768196105957031, -0.012044906616210938, -0.010321617126464844, -0.00859832763671875, -0.006875038146972656, -0.0051517486572265625, -0.0034284591674804688, -0.001705169677734375, 1.811981201171875e-05, 0.0017414093017578125, 0.0034646987915039062, 0.00518798828125, 0.006911277770996094, 0.008634567260742188, 0.010357856750488281, 0.012081146240234375, 0.013804435729980469, 0.015527725219726562, 0.017251014709472656, 0.01897430419921875, 0.020697593688964844, 0.022420883178710938, 0.02414417266845703, 0.025867462158203125, 0.02759075164794922, 0.029314041137695312, 0.031037330627441406, 0.0327606201171875, 0.034483909606933594, 0.03620719909667969, 0.03793048858642578, 0.039653778076171875, 0.04137706756591797, 0.04310035705566406, 0.044823646545410156, 0.04654693603515625, 0.048270225524902344, 0.04999351501464844, 0.05171680450439453, 0.053440093994140625, 0.05516338348388672, 0.05688667297363281, 0.058609962463378906, 0.060333251953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 10.0, 21.0, 16.0, 18.0, 37.0, 48.0, 69.0, 105.0, 153.0, 244.0, 334.0, 558.0, 982.0, 1791.0, 3964.0, 9995.0, 31264.0, 115707.0, 379707.0, 354773.0, 103339.0, 28200.0, 9164.0, 3698.0, 1745.0, 909.0, 546.0, 365.0, 233.0, 155.0, 115.0, 72.0, 46.0, 53.0, 33.0, 18.0, 14.0, 10.0, 1.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.53857421875, -0.5217208862304688, -0.5048675537109375, -0.48801422119140625, -0.471160888671875, -0.45430755615234375, -0.4374542236328125, -0.42060089111328125, -0.40374755859375, -0.38689422607421875, -0.3700408935546875, -0.35318756103515625, -0.336334228515625, -0.31948089599609375, -0.3026275634765625, -0.28577423095703125, -0.2689208984375, -0.25206756591796875, -0.2352142333984375, -0.21836090087890625, -0.201507568359375, -0.18465423583984375, -0.1678009033203125, -0.15094757080078125, -0.13409423828125, -0.11724090576171875, -0.1003875732421875, -0.08353424072265625, -0.066680908203125, -0.04982757568359375, -0.0329742431640625, -0.01612091064453125, 0.000732421875, 0.01758575439453125, 0.0344390869140625, 0.05129241943359375, 0.068145751953125, 0.08499908447265625, 0.1018524169921875, 0.11870574951171875, 0.13555908203125, 0.15241241455078125, 0.1692657470703125, 0.18611907958984375, 0.202972412109375, 0.21982574462890625, 0.2366790771484375, 0.25353240966796875, 0.2703857421875, 0.28723907470703125, 0.3040924072265625, 0.32094573974609375, 0.337799072265625, 0.35465240478515625, 0.3715057373046875, 0.38835906982421875, 0.40521240234375, 0.42206573486328125, 0.4389190673828125, 0.45577239990234375, 0.472625732421875, 0.48947906494140625, 0.5063323974609375, 0.5231857299804688, 0.5400390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 9.0, 8.0, 11.0, 11.0, 14.0, 15.0, 11.0, 11.0, 34.0, 38.0, 37.0, 37.0, 37.0, 37.0, 48.0, 42.0, 40.0, 40.0, 40.0, 52.0, 49.0, 46.0, 51.0, 32.0, 35.0, 39.0, 31.0, 19.0, 16.0, 22.0, 14.0, 11.0, 10.0, 11.0, 9.0, 5.0, 1.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2548789978027344, -0.24633026123046875, -0.23778152465820312, -0.2292327880859375, -0.22068405151367188, -0.21213531494140625, -0.20358657836914062, -0.195037841796875, -0.18648910522460938, -0.17794036865234375, -0.16939163208007812, -0.1608428955078125, -0.15229415893554688, -0.14374542236328125, -0.13519668579101562, -0.12664794921875, -0.11809921264648438, -0.10955047607421875, -0.10100173950195312, -0.0924530029296875, -0.08390426635742188, -0.07535552978515625, -0.06680679321289062, -0.058258056640625, -0.049709320068359375, -0.04116058349609375, -0.032611846923828125, -0.0240631103515625, -0.015514373779296875, -0.00696563720703125, 0.001583099365234375, 0.0101318359375, 0.018680572509765625, 0.02722930908203125, 0.035778045654296875, 0.0443267822265625, 0.052875518798828125, 0.06142425537109375, 0.06997299194335938, 0.078521728515625, 0.08707046508789062, 0.09561920166015625, 0.10416793823242188, 0.1127166748046875, 0.12126541137695312, 0.12981414794921875, 0.13836288452148438, 0.14691162109375, 0.15546035766601562, 0.16400909423828125, 0.17255783081054688, 0.1811065673828125, 0.18965530395507812, 0.19820404052734375, 0.20675277709960938, 0.215301513671875, 0.22385025024414062, 0.23239898681640625, 0.24094772338867188, 0.2494964599609375, 0.2580451965332031, 0.26659393310546875, 0.2751426696777344, 0.28369140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 4.0, 5.0, 14.0, 15.0, 20.0, 30.0, 49.0, 55.0, 90.0, 129.0, 245.0, 424.0, 839.0, 2044.0, 5625.0, 19492.0, 89657.0, 464980.0, 372885.0, 68237.0, 15595.0, 4652.0, 1716.0, 763.0, 358.0, 204.0, 150.0, 92.0, 44.0, 29.0, 24.0, 22.0, 20.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31005859375, -0.3014259338378906, -0.29279327392578125, -0.2841606140136719, -0.2755279541015625, -0.2668952941894531, -0.25826263427734375, -0.24962997436523438, -0.240997314453125, -0.23236465454101562, -0.22373199462890625, -0.21509933471679688, -0.2064666748046875, -0.19783401489257812, -0.18920135498046875, -0.18056869506835938, -0.17193603515625, -0.16330337524414062, -0.15467071533203125, -0.14603805541992188, -0.1374053955078125, -0.12877273559570312, -0.12014007568359375, -0.11150741577148438, -0.102874755859375, -0.09424209594726562, -0.08560943603515625, -0.07697677612304688, -0.0683441162109375, -0.059711456298828125, -0.05107879638671875, -0.042446136474609375, -0.0338134765625, -0.025180816650390625, -0.01654815673828125, -0.007915496826171875, 0.0007171630859375, 0.009349822998046875, 0.01798248291015625, 0.026615142822265625, 0.035247802734375, 0.043880462646484375, 0.05251312255859375, 0.061145782470703125, 0.0697784423828125, 0.07841110229492188, 0.08704376220703125, 0.09567642211914062, 0.10430908203125, 0.11294174194335938, 0.12157440185546875, 0.13020706176757812, 0.1388397216796875, 0.14747238159179688, 0.15610504150390625, 0.16473770141601562, 0.173370361328125, 0.18200302124023438, 0.19063568115234375, 0.19926834106445312, 0.2079010009765625, 0.21653366088867188, 0.22516632080078125, 0.23379898071289062, 0.242431640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 5.0, 2.0, 6.0, 10.0, 7.0, 13.0, 16.0, 30.0, 26.0, 30.0, 42.0, 69.0, 82.0, 82.0, 90.0, 90.0, 72.0, 78.0, 63.0, 37.0, 28.0, 14.0, 21.0, 16.0, 8.0, 16.0, 4.0, 11.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010216236114501953, -9.896047413349152e-05, -9.57585871219635e-05, -9.255670011043549e-05, -8.935481309890747e-05, -8.615292608737946e-05, -8.295103907585144e-05, -7.974915206432343e-05, -7.654726505279541e-05, -7.33453780412674e-05, -7.014349102973938e-05, -6.694160401821136e-05, -6.373971700668335e-05, -6.0537829995155334e-05, -5.733594298362732e-05, -5.4134055972099304e-05, -5.093216896057129e-05, -4.7730281949043274e-05, -4.452839493751526e-05, -4.1326507925987244e-05, -3.812462091445923e-05, -3.492273390293121e-05, -3.17208468914032e-05, -2.8518959879875183e-05, -2.5317072868347168e-05, -2.2115185856819153e-05, -1.8913298845291138e-05, -1.5711411833763123e-05, -1.2509524822235107e-05, -9.307637810707092e-06, -6.105750799179077e-06, -2.903863787651062e-06, 2.980232238769531e-07, 3.4999102354049683e-06, 6.701797246932983e-06, 9.903684258460999e-06, 1.3105571269989014e-05, 1.630745828151703e-05, 1.9509345293045044e-05, 2.271123230457306e-05, 2.5913119316101074e-05, 2.911500632762909e-05, 3.2316893339157104e-05, 3.551878035068512e-05, 3.8720667362213135e-05, 4.192255437374115e-05, 4.5124441385269165e-05, 4.832632839679718e-05, 5.1528215408325195e-05, 5.473010241985321e-05, 5.7931989431381226e-05, 6.113387644290924e-05, 6.433576345443726e-05, 6.753765046596527e-05, 7.073953747749329e-05, 7.39414244890213e-05, 7.714331150054932e-05, 8.034519851207733e-05, 8.354708552360535e-05, 8.674897253513336e-05, 8.995085954666138e-05, 9.315274655818939e-05, 9.635463356971741e-05, 9.955652058124542e-05, 0.00010275840759277344]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 4.0, 13.0, 5.0, 6.0, 16.0, 15.0, 21.0, 38.0, 53.0, 59.0, 82.0, 99.0, 186.0, 248.0, 477.0, 864.0, 1787.0, 3944.0, 10094.0, 33244.0, 171718.0, 605843.0, 168478.0, 33071.0, 10197.0, 3979.0, 1774.0, 865.0, 475.0, 293.0, 155.0, 108.0, 81.0, 65.0, 45.0, 28.0, 23.0, 26.0, 22.0, 10.0, 7.0, 11.0, 11.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.2703742980957031, -0.26120758056640625, -0.2520408630371094, -0.2428741455078125, -0.23370742797851562, -0.22454071044921875, -0.21537399291992188, -0.206207275390625, -0.19704055786132812, -0.18787384033203125, -0.17870712280273438, -0.1695404052734375, -0.16037368774414062, -0.15120697021484375, -0.14204025268554688, -0.13287353515625, -0.12370681762695312, -0.11454010009765625, -0.10537338256835938, -0.0962066650390625, -0.08703994750976562, -0.07787322998046875, -0.06870651245117188, -0.059539794921875, -0.050373077392578125, -0.04120635986328125, -0.032039642333984375, -0.0228729248046875, -0.013706207275390625, -0.00453948974609375, 0.004627227783203125, 0.0137939453125, 0.022960662841796875, 0.03212738037109375, 0.041294097900390625, 0.0504608154296875, 0.059627532958984375, 0.06879425048828125, 0.07796096801757812, 0.087127685546875, 0.09629440307617188, 0.10546112060546875, 0.11462783813476562, 0.1237945556640625, 0.13296127319335938, 0.14212799072265625, 0.15129470825195312, 0.16046142578125, 0.16962814331054688, 0.17879486083984375, 0.18796157836914062, 0.1971282958984375, 0.20629501342773438, 0.21546173095703125, 0.22462844848632812, 0.233795166015625, 0.24296188354492188, 0.25212860107421875, 0.2612953186035156, 0.2704620361328125, 0.2796287536621094, 0.28879547119140625, 0.2979621887207031, 0.30712890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 1.0, 6.0, 11.0, 17.0, 8.0, 15.0, 18.0, 31.0, 37.0, 32.0, 51.0, 52.0, 68.0, 91.0, 76.0, 68.0, 69.0, 58.0, 45.0, 39.0, 40.0, 23.0, 15.0, 25.0, 14.0, 9.0, 9.0, 6.0, 5.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.10223388671875, -0.09864330291748047, -0.09505271911621094, -0.0914621353149414, -0.08787155151367188, -0.08428096771240234, -0.08069038391113281, -0.07709980010986328, -0.07350921630859375, -0.06991863250732422, -0.06632804870605469, -0.06273746490478516, -0.059146881103515625, -0.055556297302246094, -0.05196571350097656, -0.04837512969970703, -0.0447845458984375, -0.04119396209716797, -0.03760337829589844, -0.034012794494628906, -0.030422210693359375, -0.026831626892089844, -0.023241043090820312, -0.01965045928955078, -0.01605987548828125, -0.012469291687011719, -0.008878707885742188, -0.005288124084472656, -0.001697540283203125, 0.0018930435180664062, 0.0054836273193359375, 0.009074211120605469, 0.012664794921875, 0.01625537872314453, 0.019845962524414062, 0.023436546325683594, 0.027027130126953125, 0.030617713928222656, 0.03420829772949219, 0.03779888153076172, 0.04138946533203125, 0.04498004913330078, 0.04857063293457031, 0.052161216735839844, 0.055751800537109375, 0.059342384338378906, 0.06293296813964844, 0.06652355194091797, 0.0701141357421875, 0.07370471954345703, 0.07729530334472656, 0.0808858871459961, 0.08447647094726562, 0.08806705474853516, 0.09165763854980469, 0.09524822235107422, 0.09883880615234375, 0.10242938995361328, 0.10601997375488281, 0.10961055755615234, 0.11320114135742188, 0.1167917251586914, 0.12038230895996094, 0.12397289276123047, 0.1275634765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 19.0, 60.0, 286.0, 454.0, 151.0, 24.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.147607803344727, -5.791110515594482, -5.4346137046813965, -5.078116416931152, -4.721619129180908, -4.365121841430664, -4.008625030517578, -3.652127742767334, -3.295630693435669, -2.939133644104004, -2.5826363563537598, -2.2261393070220947, -1.8696421384811401, -1.5131449699401855, -1.1566479206085205, -0.8001506328582764, -0.44365358352661133, -0.08715644478797913, 0.2693406939506531, 0.6258378028869629, 0.9823349714279175, 1.338832139968872, 1.695329189300537, 2.0518264770507812, 2.4083235263824463, 2.7648205757141113, 3.1213178634643555, 3.4778149127960205, 3.8343119621276855, 4.19080924987793, 4.547306060791016, 4.903803825378418, 5.260300636291504, 5.616797924041748, 5.973294734954834, 6.329792022705078, 6.686289310455322, 7.042786598205566, 7.399283409118652, 7.7557806968688965, 8.11227798461914, 8.468774795532227, 8.825272560119629, 9.181769371032715, 9.5382661819458, 9.894763946533203, 10.251260757446289, 10.607757568359375, 10.964254379272461, 11.320751190185547, 11.67724895477295, 12.033745765686035, 12.390242576599121, 12.746740341186523, 13.10323715209961, 13.459733963012695, 13.816231727600098, 14.172728538513184, 14.529226303100586, 14.885723114013672, 15.242219924926758, 15.59871768951416, 15.955214500427246, 16.31171226501465, 16.668209075927734]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 5.0, 6.0, 8.0, 11.0, 7.0, 12.0, 21.0, 17.0, 21.0, 22.0, 31.0, 44.0, 31.0, 32.0, 31.0, 42.0, 41.0, 40.0, 53.0, 49.0, 51.0, 41.0, 57.0, 36.0, 34.0, 45.0, 33.0, 21.0, 20.0, 19.0, 11.0, 22.0, 15.0, 11.0, 10.0, 9.0, 10.0, 5.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0748305320739746, -2.0089237689971924, -1.9430170059204102, -1.877110242843628, -1.8112034797668457, -1.7452967166900635, -1.6793900728225708, -1.6134833097457886, -1.5475765466690063, -1.4816697835922241, -1.415763020515442, -1.3498562574386597, -1.283949613571167, -1.2180428504943848, -1.1521360874176025, -1.0862293243408203, -1.020322561264038, -0.9544157981872559, -0.8885090351104736, -0.8226023316383362, -0.756695568561554, -0.6907888054847717, -0.6248821020126343, -0.558975338935852, -0.4930685758590698, -0.4271618127822876, -0.36125507950782776, -0.2953483462333679, -0.2294415831565857, -0.16353482007980347, -0.09762808680534363, -0.03172135353088379, 0.03418540954589844, 0.10009215772151947, 0.1659989058971405, 0.23190565407276154, 0.29781240224838257, 0.3637191653251648, 0.42962589859962463, 0.4955326318740845, 0.5614393949508667, 0.6273461580276489, 0.6932529211044312, 0.7591596245765686, 0.8250663876533508, 0.8909731507301331, 0.9568798542022705, 1.0227866172790527, 1.088693380355835, 1.1546001434326172, 1.2205069065093994, 1.2864136695861816, 1.3523204326629639, 1.418227195739746, 1.4841338396072388, 1.550040602684021, 1.6159473657608032, 1.6818541288375854, 1.7477608919143677, 1.81366765499115, 1.8795742988586426, 1.9454810619354248, 2.011387825012207, 2.0772945880889893, 2.1432013511657715]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 7.0, 13.0, 10.0, 24.0, 31.0, 32.0, 47.0, 62.0, 107.0, 341.0, 2187.0, 53371.0, 4124981.0, 11521.0, 987.0, 214.0, 108.0, 57.0, 42.0, 21.0, 16.0, 21.0, 13.0, 11.0, 11.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.98602294921875, -2.8841552734375, -2.78228759765625, -2.680419921875, -2.57855224609375, -2.4766845703125, -2.37481689453125, -2.27294921875, -2.17108154296875, -2.0692138671875, -1.96734619140625, -1.865478515625, -1.76361083984375, -1.6617431640625, -1.55987548828125, -1.4580078125, -1.35614013671875, -1.2542724609375, -1.15240478515625, -1.050537109375, -0.94866943359375, -0.8468017578125, -0.74493408203125, -0.64306640625, -0.54119873046875, -0.4393310546875, -0.33746337890625, -0.235595703125, -0.13372802734375, -0.0318603515625, 0.07000732421875, 0.171875, 0.27374267578125, 0.3756103515625, 0.47747802734375, 0.579345703125, 0.68121337890625, 0.7830810546875, 0.88494873046875, 0.98681640625, 1.08868408203125, 1.1905517578125, 1.29241943359375, 1.394287109375, 1.49615478515625, 1.5980224609375, 1.69989013671875, 1.8017578125, 1.90362548828125, 2.0054931640625, 2.10736083984375, 2.209228515625, 2.31109619140625, 2.4129638671875, 2.51483154296875, 2.61669921875, 2.71856689453125, 2.8204345703125, 2.92230224609375, 3.024169921875, 3.12603759765625, 3.2279052734375, 3.32977294921875, 3.431640625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 14.0, 19.0, 31.0, 36.0, 34.0, 50.0, 56.0, 53.0, 66.0, 74.0, 69.0, 64.0, 76.0, 63.0, 63.0, 39.0, 46.0, 22.0, 17.0, 14.0, 15.0, 12.0, 8.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0665283203125, -0.06426525115966797, -0.06200218200683594, -0.059739112854003906, -0.057476043701171875, -0.055212974548339844, -0.05294990539550781, -0.05068683624267578, -0.04842376708984375, -0.04616069793701172, -0.04389762878417969, -0.041634559631347656, -0.039371490478515625, -0.037108421325683594, -0.03484535217285156, -0.03258228302001953, -0.0303192138671875, -0.02805614471435547, -0.025793075561523438, -0.023530006408691406, -0.021266937255859375, -0.019003868103027344, -0.016740798950195312, -0.014477729797363281, -0.01221466064453125, -0.009951591491699219, -0.0076885223388671875, -0.005425453186035156, -0.003162384033203125, -0.0008993148803710938, 0.0013637542724609375, 0.0036268234252929688, 0.005889892578125, 0.008152961730957031, 0.010416030883789062, 0.012679100036621094, 0.014942169189453125, 0.017205238342285156, 0.019468307495117188, 0.02173137664794922, 0.02399444580078125, 0.02625751495361328, 0.028520584106445312, 0.030783653259277344, 0.033046722412109375, 0.035309791564941406, 0.03757286071777344, 0.03983592987060547, 0.0420989990234375, 0.04436206817626953, 0.04662513732910156, 0.048888206481933594, 0.051151275634765625, 0.053414344787597656, 0.05567741394042969, 0.05794048309326172, 0.06020355224609375, 0.06246662139892578, 0.06472969055175781, 0.06699275970458984, 0.06925582885742188, 0.0715188980102539, 0.07378196716308594, 0.07604503631591797, 0.07830810546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 17.0, 28.0, 42.0, 78.0, 136.0, 237.0, 451.0, 1032.0, 2808.0, 10599.0, 52067.0, 820350.0, 3219062.0, 68693.0, 12930.0, 3382.0, 1192.0, 495.0, 264.0, 161.0, 90.0, 58.0, 39.0, 16.0, 15.0, 7.0, 12.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.89013671875, -0.8623809814453125, -0.834625244140625, -0.8068695068359375, -0.77911376953125, -0.7513580322265625, -0.723602294921875, -0.6958465576171875, -0.6680908203125, -0.6403350830078125, -0.612579345703125, -0.5848236083984375, -0.55706787109375, -0.5293121337890625, -0.501556396484375, -0.4738006591796875, -0.446044921875, -0.4182891845703125, -0.390533447265625, -0.3627777099609375, -0.33502197265625, -0.3072662353515625, -0.279510498046875, -0.2517547607421875, -0.2239990234375, -0.1962432861328125, -0.168487548828125, -0.1407318115234375, -0.11297607421875, -0.0852203369140625, -0.057464599609375, -0.0297088623046875, -0.001953125, 0.0258026123046875, 0.053558349609375, 0.0813140869140625, 0.10906982421875, 0.1368255615234375, 0.164581298828125, 0.1923370361328125, 0.2200927734375, 0.2478485107421875, 0.275604248046875, 0.3033599853515625, 0.33111572265625, 0.3588714599609375, 0.386627197265625, 0.4143829345703125, 0.442138671875, 0.4698944091796875, 0.497650146484375, 0.5254058837890625, 0.55316162109375, 0.5809173583984375, 0.608673095703125, 0.6364288330078125, 0.6641845703125, 0.6919403076171875, 0.719696044921875, 0.7474517822265625, 0.77520751953125, 0.8029632568359375, 0.830718994140625, 0.8584747314453125, 0.88623046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 12.0, 14.0, 25.0, 42.0, 50.0, 117.0, 248.0, 1955.0, 1086.0, 227.0, 133.0, 57.0, 41.0, 20.0, 14.0, 15.0, 6.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11480712890625, -0.1087484359741211, -0.10268974304199219, -0.09663105010986328, -0.09057235717773438, -0.08451366424560547, -0.07845497131347656, -0.07239627838134766, -0.06633758544921875, -0.060278892517089844, -0.05422019958496094, -0.04816150665283203, -0.042102813720703125, -0.03604412078857422, -0.029985427856445312, -0.023926734924316406, -0.0178680419921875, -0.011809349060058594, -0.0057506561279296875, 0.00030803680419921875, 0.006366729736328125, 0.012425422668457031, 0.018484115600585938, 0.024542808532714844, 0.03060150146484375, 0.036660194396972656, 0.04271888732910156, 0.04877758026123047, 0.054836273193359375, 0.06089496612548828, 0.06695365905761719, 0.0730123519897461, 0.079071044921875, 0.0851297378540039, 0.09118843078613281, 0.09724712371826172, 0.10330581665039062, 0.10936450958251953, 0.11542320251464844, 0.12148189544677734, 0.12754058837890625, 0.13359928131103516, 0.13965797424316406, 0.14571666717529297, 0.15177536010742188, 0.15783405303955078, 0.1638927459716797, 0.1699514389038086, 0.1760101318359375, 0.1820688247680664, 0.1881275177001953, 0.19418621063232422, 0.20024490356445312, 0.20630359649658203, 0.21236228942871094, 0.21842098236083984, 0.22447967529296875, 0.23053836822509766, 0.23659706115722656, 0.24265575408935547, 0.24871444702148438, 0.2547731399536133, 0.2608318328857422, 0.2668905258178711, 0.27294921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 3.0, 22.0, 25.0, 45.0, 63.0, 65.0, 79.0, 114.0, 112.0, 130.0, 88.0, 65.0, 54.0, 43.0, 31.0, 23.0, 4.0, 14.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.699678897857666, -0.680961549282074, -0.6622442007064819, -0.6435269117355347, -0.6248095631599426, -0.6060922145843506, -0.5873748660087585, -0.5686575174331665, -0.5499401688575745, -0.5312228202819824, -0.5125054717063904, -0.4937881529331207, -0.4750708043575287, -0.45635348558425903, -0.437636137008667, -0.41891878843307495, -0.4002014696598053, -0.38148412108421326, -0.3627668023109436, -0.34404945373535156, -0.3253321051597595, -0.3066147565841675, -0.2878974378108978, -0.2691800892353058, -0.25046277046203613, -0.23174543678760529, -0.21302808821201324, -0.1943107545375824, -0.17559340596199036, -0.1568760722875595, -0.13815873861312866, -0.11944139003753662, -0.10072401165962219, -0.08200667053461075, -0.0632893294095993, -0.04457199573516846, -0.025854654610157013, -0.007137313485145569, 0.011580020189285278, 0.03029736876487732, 0.049014702439308167, 0.06773204356431961, 0.08644938468933105, 0.1051667183637619, 0.12388405948877335, 0.1426014006137848, 0.16131873428821564, 0.18003608286380768, 0.19875341653823853, 0.21747075021266937, 0.2361880987882614, 0.25490543246269226, 0.2736227810382843, 0.29234009981155396, 0.311057448387146, 0.32977479696273804, 0.3484921455383301, 0.3672094941139221, 0.3859268128871918, 0.4046441614627838, 0.42336151003837585, 0.4420788288116455, 0.46079617738723755, 0.4795135259628296, 0.49823084473609924]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 4.0, 4.0, 5.0, 15.0, 11.0, 19.0, 22.0, 24.0, 22.0, 25.0, 23.0, 27.0, 36.0, 36.0, 27.0, 42.0, 49.0, 35.0, 58.0, 47.0, 47.0, 38.0, 40.0, 30.0, 28.0, 30.0, 38.0, 19.0, 24.0, 28.0, 20.0, 14.0, 9.0, 14.0, 24.0, 13.0, 5.0, 6.0, 7.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3550928831100464, -0.34443509578704834, -0.3337773084640503, -0.32311952114105225, -0.3124617636203766, -0.30180397629737854, -0.2911461889743805, -0.28048840165138245, -0.2698306143283844, -0.25917282700538635, -0.2485150545835495, -0.23785726726055145, -0.2271994799375534, -0.21654170751571655, -0.2058839201927185, -0.19522613286972046, -0.1845683604478836, -0.17391057312488556, -0.1632528007030487, -0.15259501338005066, -0.1419372260570526, -0.13127943873405457, -0.12062166631221771, -0.10996387898921967, -0.09930609911680222, -0.08864831924438477, -0.07799053192138672, -0.06733275204896927, -0.05667496845126152, -0.04601718485355377, -0.03535940498113632, -0.024701617658138275, -0.014043837785720825, -0.0033860551193356514, 0.007271727547049522, 0.01792950928211212, 0.02858729287981987, 0.03924507647752762, 0.04990285634994507, 0.060560643672943115, 0.07121842354536057, 0.08187620341777802, 0.09253399074077606, 0.10319177061319351, 0.11384955048561096, 0.12450733780860901, 0.13516512513160706, 0.1458229124546051, 0.15648068487644196, 0.16713847219944, 0.17779624462127686, 0.1884540319442749, 0.19911181926727295, 0.209769606590271, 0.22042737901210785, 0.2310851663351059, 0.24174293875694275, 0.2524007260799408, 0.26305851340293884, 0.2737162709236145, 0.28437405824661255, 0.2950318455696106, 0.30568963289260864, 0.3163474202156067, 0.32700520753860474]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 23.0, 19.0, 36.0, 61.0, 106.0, 138.0, 229.0, 388.0, 661.0, 1178.0, 2245.0, 4659.0, 11477.0, 33327.0, 108855.0, 322481.0, 363655.0, 133956.0, 40281.0, 13906.0, 5295.0, 2439.0, 1247.0, 723.0, 428.0, 246.0, 152.0, 110.0, 60.0, 41.0, 30.0, 19.0, 14.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5546875, -0.5384140014648438, -0.5221405029296875, -0.5058670043945312, -0.489593505859375, -0.47332000732421875, -0.4570465087890625, -0.44077301025390625, -0.42449951171875, -0.40822601318359375, -0.3919525146484375, -0.37567901611328125, -0.359405517578125, -0.34313201904296875, -0.3268585205078125, -0.31058502197265625, -0.2943115234375, -0.27803802490234375, -0.2617645263671875, -0.24549102783203125, -0.229217529296875, -0.21294403076171875, -0.1966705322265625, -0.18039703369140625, -0.16412353515625, -0.14785003662109375, -0.1315765380859375, -0.11530303955078125, -0.099029541015625, -0.08275604248046875, -0.0664825439453125, -0.05020904541015625, -0.033935546875, -0.01766204833984375, -0.0013885498046875, 0.01488494873046875, 0.031158447265625, 0.04743194580078125, 0.0637054443359375, 0.07997894287109375, 0.09625244140625, 0.11252593994140625, 0.1287994384765625, 0.14507293701171875, 0.161346435546875, 0.17761993408203125, 0.1938934326171875, 0.21016693115234375, 0.2264404296875, 0.24271392822265625, 0.2589874267578125, 0.27526092529296875, 0.291534423828125, 0.30780792236328125, 0.3240814208984375, 0.34035491943359375, 0.35662841796875, 0.37290191650390625, 0.3891754150390625, 0.40544891357421875, 0.421722412109375, 0.43799591064453125, 0.4542694091796875, 0.47054290771484375, 0.48681640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 6.0, 4.0, 12.0, 22.0, 27.0, 24.0, 27.0, 43.0, 53.0, 56.0, 56.0, 55.0, 65.0, 70.0, 81.0, 76.0, 59.0, 41.0, 48.0, 47.0, 24.0, 21.0, 14.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06536865234375, -0.06313037872314453, -0.06089210510253906, -0.058653831481933594, -0.056415557861328125, -0.054177284240722656, -0.05193901062011719, -0.04970073699951172, -0.04746246337890625, -0.04522418975830078, -0.04298591613769531, -0.040747642517089844, -0.038509368896484375, -0.036271095275878906, -0.03403282165527344, -0.03179454803466797, -0.0295562744140625, -0.02731800079345703, -0.025079727172851562, -0.022841453552246094, -0.020603179931640625, -0.018364906311035156, -0.016126632690429688, -0.013888359069824219, -0.01165008544921875, -0.009411811828613281, -0.0071735382080078125, -0.004935264587402344, -0.002696990966796875, -0.00045871734619140625, 0.0017795562744140625, 0.004017829895019531, 0.006256103515625, 0.008494377136230469, 0.010732650756835938, 0.012970924377441406, 0.015209197998046875, 0.017447471618652344, 0.019685745239257812, 0.02192401885986328, 0.02416229248046875, 0.02640056610107422, 0.028638839721679688, 0.030877113342285156, 0.033115386962890625, 0.035353660583496094, 0.03759193420410156, 0.03983020782470703, 0.0420684814453125, 0.04430675506591797, 0.04654502868652344, 0.048783302307128906, 0.051021575927734375, 0.053259849548339844, 0.05549812316894531, 0.05773639678955078, 0.05997467041015625, 0.06221294403076172, 0.06445121765136719, 0.06668949127197266, 0.06892776489257812, 0.0711660385131836, 0.07340431213378906, 0.07564258575439453, 0.077880859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 14.0, 7.0, 17.0, 15.0, 21.0, 33.0, 52.0, 75.0, 116.0, 133.0, 215.0, 263.0, 481.0, 707.0, 1196.0, 2347.0, 5047.0, 13113.0, 38992.0, 125153.0, 333463.0, 335717.0, 127844.0, 39484.0, 13219.0, 4991.0, 2344.0, 1238.0, 718.0, 463.0, 314.0, 227.0, 170.0, 99.0, 85.0, 60.0, 34.0, 33.0, 15.0, 4.0, 15.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423828125, -0.40921783447265625, -0.3946075439453125, -0.37999725341796875, -0.365386962890625, -0.35077667236328125, -0.3361663818359375, -0.32155609130859375, -0.30694580078125, -0.29233551025390625, -0.2777252197265625, -0.26311492919921875, -0.248504638671875, -0.23389434814453125, -0.2192840576171875, -0.20467376708984375, -0.1900634765625, -0.17545318603515625, -0.1608428955078125, -0.14623260498046875, -0.131622314453125, -0.11701202392578125, -0.1024017333984375, -0.08779144287109375, -0.07318115234375, -0.05857086181640625, -0.0439605712890625, -0.02935028076171875, -0.014739990234375, -0.00012969970703125, 0.0144805908203125, 0.02909088134765625, 0.043701171875, 0.05831146240234375, 0.0729217529296875, 0.08753204345703125, 0.102142333984375, 0.11675262451171875, 0.1313629150390625, 0.14597320556640625, 0.16058349609375, 0.17519378662109375, 0.1898040771484375, 0.20441436767578125, 0.219024658203125, 0.23363494873046875, 0.2482452392578125, 0.26285552978515625, 0.2774658203125, 0.29207611083984375, 0.3066864013671875, 0.32129669189453125, 0.335906982421875, 0.35051727294921875, 0.3651275634765625, 0.37973785400390625, 0.39434814453125, 0.40895843505859375, 0.4235687255859375, 0.43817901611328125, 0.452789306640625, 0.46739959716796875, 0.4820098876953125, 0.49662017822265625, 0.51123046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 9.0, 6.0, 6.0, 11.0, 11.0, 8.0, 6.0, 19.0, 12.0, 14.0, 29.0, 34.0, 32.0, 31.0, 43.0, 39.0, 40.0, 34.0, 44.0, 43.0, 47.0, 44.0, 45.0, 42.0, 36.0, 32.0, 26.0, 37.0, 22.0, 28.0, 23.0, 22.0, 20.0, 15.0, 20.0, 16.0, 7.0, 10.0, 12.0, 8.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.278564453125, -0.2698211669921875, -0.261077880859375, -0.2523345947265625, -0.24359130859375, -0.2348480224609375, -0.226104736328125, -0.2173614501953125, -0.2086181640625, -0.1998748779296875, -0.191131591796875, -0.1823883056640625, -0.17364501953125, -0.1649017333984375, -0.156158447265625, -0.1474151611328125, -0.138671875, -0.1299285888671875, -0.121185302734375, -0.1124420166015625, -0.10369873046875, -0.0949554443359375, -0.086212158203125, -0.0774688720703125, -0.0687255859375, -0.0599822998046875, -0.051239013671875, -0.0424957275390625, -0.03375244140625, -0.0250091552734375, -0.016265869140625, -0.0075225830078125, 0.001220703125, 0.0099639892578125, 0.018707275390625, 0.0274505615234375, 0.03619384765625, 0.0449371337890625, 0.053680419921875, 0.0624237060546875, 0.0711669921875, 0.0799102783203125, 0.088653564453125, 0.0973968505859375, 0.10614013671875, 0.1148834228515625, 0.123626708984375, 0.1323699951171875, 0.14111328125, 0.1498565673828125, 0.158599853515625, 0.1673431396484375, 0.17608642578125, 0.1848297119140625, 0.193572998046875, 0.2023162841796875, 0.2110595703125, 0.2198028564453125, 0.228546142578125, 0.2372894287109375, 0.24603271484375, 0.2547760009765625, 0.263519287109375, 0.2722625732421875, 0.281005859375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 6.0, 6.0, 14.0, 22.0, 23.0, 42.0, 57.0, 95.0, 168.0, 256.0, 503.0, 1096.0, 2437.0, 6614.0, 21961.0, 98998.0, 520296.0, 316460.0, 56981.0, 14130.0, 4636.0, 1853.0, 859.0, 421.0, 242.0, 132.0, 91.0, 50.0, 27.0, 16.0, 12.0, 13.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2640953063964844, -0.25524139404296875, -0.24638748168945312, -0.2375335693359375, -0.22867965698242188, -0.21982574462890625, -0.21097183227539062, -0.202117919921875, -0.19326400756835938, -0.18441009521484375, -0.17555618286132812, -0.1667022705078125, -0.15784835815429688, -0.14899444580078125, -0.14014053344726562, -0.13128662109375, -0.12243270874023438, -0.11357879638671875, -0.10472488403320312, -0.0958709716796875, -0.08701705932617188, -0.07816314697265625, -0.06930923461914062, -0.060455322265625, -0.051601409912109375, -0.04274749755859375, -0.033893585205078125, -0.0250396728515625, -0.016185760498046875, -0.00733184814453125, 0.001522064208984375, 0.0103759765625, 0.019229888916015625, 0.02808380126953125, 0.036937713623046875, 0.0457916259765625, 0.054645538330078125, 0.06349945068359375, 0.07235336303710938, 0.081207275390625, 0.09006118774414062, 0.09891510009765625, 0.10776901245117188, 0.1166229248046875, 0.12547683715820312, 0.13433074951171875, 0.14318466186523438, 0.15203857421875, 0.16089248657226562, 0.16974639892578125, 0.17860031127929688, 0.1874542236328125, 0.19630813598632812, 0.20516204833984375, 0.21401596069335938, 0.222869873046875, 0.23172378540039062, 0.24057769775390625, 0.24943161010742188, 0.2582855224609375, 0.2671394348144531, 0.27599334716796875, 0.2848472595214844, 0.293701171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 5.0, 15.0, 27.0, 32.0, 42.0, 53.0, 76.0, 84.0, 103.0, 100.0, 105.0, 77.0, 53.0, 51.0, 33.0, 29.0, 20.0, 12.0, 22.0, 4.0, 4.0, 4.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011941418051719666, -0.00011604279279708862, -0.00011267140507698059, -0.00010930001735687256, -0.00010592862963676453, -0.0001025572419166565, -9.918585419654846e-05, -9.581446647644043e-05, -9.24430787563324e-05, -8.907169103622437e-05, -8.570030331611633e-05, -8.23289155960083e-05, -7.895752787590027e-05, -7.558614015579224e-05, -7.22147524356842e-05, -6.884336471557617e-05, -6.547197699546814e-05, -6.210058927536011e-05, -5.8729201555252075e-05, -5.535781383514404e-05, -5.198642611503601e-05, -4.861503839492798e-05, -4.5243650674819946e-05, -4.1872262954711914e-05, -3.850087523460388e-05, -3.512948751449585e-05, -3.175809979438782e-05, -2.8386712074279785e-05, -2.5015324354171753e-05, -2.164393663406372e-05, -1.827254891395569e-05, -1.4901161193847656e-05, -1.1529773473739624e-05, -8.158385753631592e-06, -4.7869980335235596e-06, -1.4156103134155273e-06, 1.955777406692505e-06, 5.327165126800537e-06, 8.69855284690857e-06, 1.2069940567016602e-05, 1.5441328287124634e-05, 1.8812716007232666e-05, 2.2184103727340698e-05, 2.555549144744873e-05, 2.8926879167556763e-05, 3.2298266887664795e-05, 3.566965460777283e-05, 3.904104232788086e-05, 4.241243004798889e-05, 4.5783817768096924e-05, 4.9155205488204956e-05, 5.252659320831299e-05, 5.589798092842102e-05, 5.926936864852905e-05, 6.264075636863708e-05, 6.601214408874512e-05, 6.938353180885315e-05, 7.275491952896118e-05, 7.612630724906921e-05, 7.949769496917725e-05, 8.286908268928528e-05, 8.624047040939331e-05, 8.961185812950134e-05, 9.298324584960938e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 16.0, 20.0, 30.0, 53.0, 64.0, 79.0, 141.0, 183.0, 334.0, 560.0, 1051.0, 2167.0, 4977.0, 13812.0, 51358.0, 309076.0, 543961.0, 87033.0, 20769.0, 6975.0, 2777.0, 1298.0, 660.0, 420.0, 223.0, 134.0, 112.0, 64.0, 41.0, 39.0, 26.0, 28.0, 19.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3154296875, -0.3049736022949219, -0.29451751708984375, -0.2840614318847656, -0.2736053466796875, -0.2631492614746094, -0.25269317626953125, -0.24223709106445312, -0.231781005859375, -0.22132492065429688, -0.21086883544921875, -0.20041275024414062, -0.1899566650390625, -0.17950057983398438, -0.16904449462890625, -0.15858840942382812, -0.14813232421875, -0.13767623901367188, -0.12722015380859375, -0.11676406860351562, -0.1063079833984375, -0.09585189819335938, -0.08539581298828125, -0.07493972778320312, -0.064483642578125, -0.054027557373046875, -0.04357147216796875, -0.033115386962890625, -0.0226593017578125, -0.012203216552734375, -0.00174713134765625, 0.008708953857421875, 0.0191650390625, 0.029621124267578125, 0.04007720947265625, 0.050533294677734375, 0.0609893798828125, 0.07144546508789062, 0.08190155029296875, 0.09235763549804688, 0.102813720703125, 0.11326980590820312, 0.12372589111328125, 0.13418197631835938, 0.1446380615234375, 0.15509414672851562, 0.16555023193359375, 0.17600631713867188, 0.18646240234375, 0.19691848754882812, 0.20737457275390625, 0.21783065795898438, 0.2282867431640625, 0.23874282836914062, 0.24919891357421875, 0.2596549987792969, 0.270111083984375, 0.2805671691894531, 0.29102325439453125, 0.3014793395996094, 0.3119354248046875, 0.3223915100097656, 0.33284759521484375, 0.3433036804199219, 0.353759765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 9.0, 5.0, 8.0, 11.0, 16.0, 16.0, 23.0, 30.0, 27.0, 36.0, 36.0, 66.0, 73.0, 90.0, 98.0, 87.0, 55.0, 52.0, 58.0, 30.0, 26.0, 29.0, 15.0, 16.0, 13.0, 10.0, 6.0, 8.0, 12.0, 7.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.160400390625, -0.1557598114013672, -0.15111923217773438, -0.14647865295410156, -0.14183807373046875, -0.13719749450683594, -0.13255691528320312, -0.1279163360595703, -0.1232757568359375, -0.11863517761230469, -0.11399459838867188, -0.10935401916503906, -0.10471343994140625, -0.10007286071777344, -0.09543228149414062, -0.09079170227050781, -0.086151123046875, -0.08151054382324219, -0.07686996459960938, -0.07222938537597656, -0.06758880615234375, -0.06294822692871094, -0.058307647705078125, -0.05366706848144531, -0.0490264892578125, -0.04438591003417969, -0.039745330810546875, -0.03510475158691406, -0.03046417236328125, -0.025823593139648438, -0.021183013916015625, -0.016542434692382812, -0.01190185546875, -0.0072612762451171875, -0.002620697021484375, 0.0020198822021484375, 0.00666046142578125, 0.011301040649414062, 0.015941619873046875, 0.020582199096679688, 0.0252227783203125, 0.029863357543945312, 0.034503936767578125, 0.03914451599121094, 0.04378509521484375, 0.04842567443847656, 0.053066253662109375, 0.05770683288574219, 0.062347412109375, 0.06698799133300781, 0.07162857055664062, 0.07626914978027344, 0.08090972900390625, 0.08555030822753906, 0.09019088745117188, 0.09483146667480469, 0.0994720458984375, 0.10411262512207031, 0.10875320434570312, 0.11339378356933594, 0.11803436279296875, 0.12267494201660156, 0.12731552124023438, 0.1319561004638672, 0.1365966796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 30.0, 72.0, 197.0, 301.0, 251.0, 93.0, 35.0, 9.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.564261436462402, -4.319271087646484, -4.074280738830566, -3.8292901515960693, -3.5842998027801514, -3.3393092155456543, -3.0943188667297363, -2.8493285179138184, -2.6043381690979004, -2.3593478202819824, -2.1143572330474854, -1.8693668842315674, -1.6243765354156494, -1.379386067390442, -1.1343955993652344, -0.8894052505493164, -0.6444146633148193, -0.3994242548942566, -0.15443381667137146, 0.09055662155151367, 0.3355470299720764, 0.5805374383926392, 0.8255279064178467, 1.0705182552337646, 1.3155087232589722, 1.5604991912841797, 1.8054895401000977, 2.0504798889160156, 2.2954704761505127, 2.5404608249664307, 2.7854514122009277, 3.0304417610168457, 3.2754321098327637, 3.5204224586486816, 3.7654130458831787, 4.010403633117676, 4.255393981933594, 4.500384330749512, 4.74537467956543, 4.990365028381348, 5.235355377197266, 5.480345726013184, 5.725336074829102, 5.9703264236450195, 6.215317249298096, 6.460307598114014, 6.705297946929932, 6.95028829574585, 7.195279121398926, 7.440269470214844, 7.685259819030762, 7.93025016784668, 8.175240516662598, 8.420230865478516, 8.66522216796875, 8.910211563110352, 9.15520191192627, 9.400192260742188, 9.645182609558105, 9.890172958374023, 10.135163307189941, 10.38015365600586, 10.625144958496094, 10.870134353637695, 11.11512565612793]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 2.0, 8.0, 12.0, 10.0, 13.0, 27.0, 14.0, 29.0, 24.0, 26.0, 26.0, 29.0, 39.0, 36.0, 22.0, 38.0, 36.0, 66.0, 45.0, 43.0, 37.0, 44.0, 41.0, 39.0, 44.0, 26.0, 27.0, 30.0, 24.0, 26.0, 22.0, 14.0, 10.0, 13.0, 9.0, 13.0, 10.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.2242393493652344, -2.1596336364746094, -2.0950279235839844, -2.0304222106933594, -1.965816617012024, -1.901210904121399, -1.836605191230774, -1.771999478340149, -1.7073938846588135, -1.6427881717681885, -1.5781824588775635, -1.5135767459869385, -1.448971152305603, -1.384365439414978, -1.319759726524353, -1.255154013633728, -1.190548300743103, -1.125942587852478, -1.061336874961853, -0.9967312216758728, -0.9321255683898926, -0.8675198554992676, -0.8029141426086426, -0.7383084297180176, -0.6737027764320374, -0.6090970635414124, -0.5444914102554321, -0.47988569736480713, -0.4152800142765045, -0.3506743311882019, -0.2860686182975769, -0.2214629352092743, -0.15685737133026123, -0.09225168079137802, -0.027645990252494812, 0.036959707736968994, 0.1015653908252716, 0.16617107391357422, 0.23077678680419922, 0.29538246989250183, 0.35998815298080444, 0.42459383606910706, 0.48919951915740967, 0.5538052320480347, 0.6184109449386597, 0.6830165982246399, 0.7476223111152649, 0.8122279644012451, 0.8768336772918701, 0.9414393901824951, 1.0060451030731201, 1.0706508159637451, 1.1352564096450806, 1.1998621225357056, 1.2644678354263306, 1.3290735483169556, 1.393679141998291, 1.458284854888916, 1.522890567779541, 1.587496280670166, 1.6521018743515015, 1.7167075872421265, 1.7813133001327515, 1.8459190130233765, 1.9105247259140015]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 12.0, 16.0, 11.0, 14.0, 28.0, 40.0, 47.0, 66.0, 118.0, 156.0, 276.0, 442.0, 847.0, 1684.0, 4523.0, 16287.0, 121820.0, 3917365.0, 108080.0, 15033.0, 4035.0, 1576.0, 724.0, 388.0, 231.0, 147.0, 93.0, 68.0, 34.0, 35.0, 17.0, 13.0, 10.0, 11.0, 7.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.048828125, -1.0200729370117188, -0.9913177490234375, -0.9625625610351562, -0.933807373046875, -0.9050521850585938, -0.8762969970703125, -0.8475418090820312, -0.81878662109375, -0.7900314331054688, -0.7612762451171875, -0.7325210571289062, -0.703765869140625, -0.6750106811523438, -0.6462554931640625, -0.6175003051757812, -0.5887451171875, -0.5599899291992188, -0.5312347412109375, -0.5024795532226562, -0.473724365234375, -0.44496917724609375, -0.4162139892578125, -0.38745880126953125, -0.35870361328125, -0.32994842529296875, -0.3011932373046875, -0.27243804931640625, -0.243682861328125, -0.21492767333984375, -0.1861724853515625, -0.15741729736328125, -0.128662109375, -0.09990692138671875, -0.0711517333984375, -0.04239654541015625, -0.013641357421875, 0.01511383056640625, 0.0438690185546875, 0.07262420654296875, 0.10137939453125, 0.13013458251953125, 0.1588897705078125, 0.18764495849609375, 0.216400146484375, 0.24515533447265625, 0.2739105224609375, 0.30266571044921875, 0.3314208984375, 0.36017608642578125, 0.3889312744140625, 0.41768646240234375, 0.446441650390625, 0.47519683837890625, 0.5039520263671875, 0.5327072143554688, 0.56146240234375, 0.5902175903320312, 0.6189727783203125, 0.6477279663085938, 0.676483154296875, 0.7052383422851562, 0.7339935302734375, 0.7627487182617188, 0.79150390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 7.0, 16.0, 16.0, 18.0, 28.0, 31.0, 47.0, 53.0, 49.0, 63.0, 62.0, 76.0, 63.0, 62.0, 75.0, 57.0, 61.0, 42.0, 49.0, 32.0, 18.0, 14.0, 10.0, 6.0, 5.0, 9.0, 2.0, 1.0, 5.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1002197265625, -0.09743976593017578, -0.09465980529785156, -0.09187984466552734, -0.08909988403320312, -0.0863199234008789, -0.08353996276855469, -0.08076000213623047, -0.07798004150390625, -0.07520008087158203, -0.07242012023925781, -0.0696401596069336, -0.06686019897460938, -0.06408023834228516, -0.06130027770996094, -0.05852031707763672, -0.0557403564453125, -0.05296039581298828, -0.05018043518066406, -0.047400474548339844, -0.044620513916015625, -0.041840553283691406, -0.03906059265136719, -0.03628063201904297, -0.03350067138671875, -0.03072071075439453, -0.027940750122070312, -0.025160789489746094, -0.022380828857421875, -0.019600868225097656, -0.016820907592773438, -0.014040946960449219, -0.011260986328125, -0.008481025695800781, -0.0057010650634765625, -0.0029211044311523438, -0.000141143798828125, 0.0026388168334960938, 0.0054187774658203125, 0.008198738098144531, 0.01097869873046875, 0.013758659362792969, 0.016538619995117188, 0.019318580627441406, 0.022098541259765625, 0.024878501892089844, 0.027658462524414062, 0.03043842315673828, 0.0332183837890625, 0.03599834442138672, 0.03877830505371094, 0.041558265686035156, 0.044338226318359375, 0.047118186950683594, 0.04989814758300781, 0.05267810821533203, 0.05545806884765625, 0.05823802947998047, 0.06101799011230469, 0.0637979507446289, 0.06657791137695312, 0.06935787200927734, 0.07213783264160156, 0.07491779327392578, 0.07769775390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 9.0, 5.0, 12.0, 16.0, 25.0, 38.0, 55.0, 94.0, 113.0, 188.0, 323.0, 557.0, 832.0, 1406.0, 2568.0, 4951.0, 10460.0, 25503.0, 77577.0, 500972.0, 3325185.0, 167997.0, 42858.0, 16328.0, 7160.0, 3822.0, 2084.0, 1167.0, 672.0, 445.0, 301.0, 184.0, 106.0, 76.0, 63.0, 42.0, 25.0, 19.0, 6.0, 11.0, 11.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.483642578125, -0.4691009521484375, -0.454559326171875, -0.4400177001953125, -0.42547607421875, -0.4109344482421875, -0.396392822265625, -0.3818511962890625, -0.3673095703125, -0.3527679443359375, -0.338226318359375, -0.3236846923828125, -0.30914306640625, -0.2946014404296875, -0.280059814453125, -0.2655181884765625, -0.2509765625, -0.2364349365234375, -0.221893310546875, -0.2073516845703125, -0.19281005859375, -0.1782684326171875, -0.163726806640625, -0.1491851806640625, -0.1346435546875, -0.1201019287109375, -0.105560302734375, -0.0910186767578125, -0.07647705078125, -0.0619354248046875, -0.047393798828125, -0.0328521728515625, -0.018310546875, -0.0037689208984375, 0.010772705078125, 0.0253143310546875, 0.03985595703125, 0.0543975830078125, 0.068939208984375, 0.0834808349609375, 0.0980224609375, 0.1125640869140625, 0.127105712890625, 0.1416473388671875, 0.15618896484375, 0.1707305908203125, 0.185272216796875, 0.1998138427734375, 0.21435546875, 0.2288970947265625, 0.243438720703125, 0.2579803466796875, 0.27252197265625, 0.2870635986328125, 0.301605224609375, 0.3161468505859375, 0.3306884765625, 0.3452301025390625, 0.359771728515625, 0.3743133544921875, 0.38885498046875, 0.4033966064453125, 0.417938232421875, 0.4324798583984375, 0.447021484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 7.0, 11.0, 18.0, 24.0, 22.0, 29.0, 48.0, 89.0, 132.0, 312.0, 930.0, 1661.0, 324.0, 157.0, 80.0, 54.0, 31.0, 30.0, 18.0, 11.0, 9.0, 11.0, 9.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12447547912597656, -0.12004470825195312, -0.11561393737792969, -0.11118316650390625, -0.10675239562988281, -0.10232162475585938, -0.09789085388183594, -0.0934600830078125, -0.08902931213378906, -0.08459854125976562, -0.08016777038574219, -0.07573699951171875, -0.07130622863769531, -0.06687545776367188, -0.06244468688964844, -0.058013916015625, -0.05358314514160156, -0.049152374267578125, -0.04472160339355469, -0.04029083251953125, -0.03586006164550781, -0.031429290771484375, -0.026998519897460938, -0.0225677490234375, -0.018136978149414062, -0.013706207275390625, -0.009275436401367188, -0.00484466552734375, -0.0004138946533203125, 0.004016876220703125, 0.008447647094726562, 0.01287841796875, 0.017309188842773438, 0.021739959716796875, 0.026170730590820312, 0.03060150146484375, 0.03503227233886719, 0.039463043212890625, 0.04389381408691406, 0.0483245849609375, 0.05275535583496094, 0.057186126708984375, 0.06161689758300781, 0.06604766845703125, 0.07047843933105469, 0.07490921020507812, 0.07933998107910156, 0.083770751953125, 0.08820152282714844, 0.09263229370117188, 0.09706306457519531, 0.10149383544921875, 0.10592460632324219, 0.11035537719726562, 0.11478614807128906, 0.1192169189453125, 0.12364768981933594, 0.12807846069335938, 0.1325092315673828, 0.13694000244140625, 0.1413707733154297, 0.14580154418945312, 0.15023231506347656, 0.1546630859375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 4.0, 15.0, 32.0, 81.0, 181.0, 254.0, 219.0, 122.0, 51.0, 23.0, 12.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1639890670776367, -2.110975742340088, -2.05796217918396, -2.004948854446411, -1.9519352912902832, -1.8989219665527344, -1.8459084033966064, -1.7928950786590576, -1.7398816347122192, -1.6868681907653809, -1.6338547468185425, -1.580841302871704, -1.5278278589248657, -1.4748144149780273, -1.4218010902404785, -1.3687876462936401, -1.3157742023468018, -1.2627607583999634, -1.209747314453125, -1.1567338705062866, -1.1037204265594482, -1.0507071018218994, -0.9976935982704163, -0.9446802139282227, -0.8916666507720947, -0.8386532068252563, -0.785639762878418, -0.7326263189315796, -0.679612934589386, -0.6265994906425476, -0.5735860466957092, -0.5205726623535156, -0.46755921840667725, -0.41454577445983887, -0.3615323603153229, -0.3085189163684845, -0.2555055022239685, -0.20249205827713013, -0.14947861433029175, -0.09646520018577576, -0.04345175623893738, 0.009561676532030106, 0.06257510930299759, 0.11558854579925537, 0.16860197484493256, 0.22161540389060974, 0.2746288478374481, 0.3276422619819641, 0.3806557059288025, 0.43366914987564087, 0.48668256402015686, 0.5396959781646729, 0.5927094221115112, 0.6457228660583496, 0.698736310005188, 0.7517497539520264, 0.8047631978988647, 0.8577766418457031, 0.9107900857925415, 0.9638035297393799, 1.0168169736862183, 1.0698304176330566, 1.1228437423706055, 1.1758571863174438, 1.2288706302642822]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 11.0, 10.0, 21.0, 17.0, 24.0, 19.0, 28.0, 27.0, 32.0, 30.0, 32.0, 40.0, 46.0, 47.0, 61.0, 50.0, 41.0, 41.0, 42.0, 45.0, 45.0, 33.0, 37.0, 37.0, 26.0, 15.0, 24.0, 22.0, 10.0, 6.0, 12.0, 14.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4659237265586853, -0.4504512846469879, -0.4349788427352905, -0.41950640082359314, -0.40403395891189575, -0.38856151700019836, -0.373089075088501, -0.3576166331768036, -0.3421441912651062, -0.3266717493534088, -0.3111993074417114, -0.29572686553001404, -0.28025442361831665, -0.26478198170661926, -0.24930953979492188, -0.2338370978832245, -0.2183646559715271, -0.2028922140598297, -0.18741977214813232, -0.17194733023643494, -0.15647488832473755, -0.14100244641304016, -0.12553000450134277, -0.11005756258964539, -0.094585120677948, -0.07911267876625061, -0.06364023685455322, -0.048167794942855835, -0.03269535303115845, -0.01722291111946106, -0.0017504692077636719, 0.013721972703933716, 0.029194414615631104, 0.04466685652732849, 0.06013929843902588, 0.07561174035072327, 0.09108418226242065, 0.10655662417411804, 0.12202906608581543, 0.13750150799751282, 0.1529739499092102, 0.1684463918209076, 0.18391883373260498, 0.19939127564430237, 0.21486371755599976, 0.23033615946769714, 0.24580860137939453, 0.2612810432910919, 0.2767534852027893, 0.2922259271144867, 0.3076983690261841, 0.32317081093788147, 0.33864325284957886, 0.35411569476127625, 0.36958813667297363, 0.385060578584671, 0.4005330204963684, 0.4160054624080658, 0.4314779043197632, 0.44695034623146057, 0.46242278814315796, 0.47789523005485535, 0.49336767196655273, 0.5088400840759277, 0.5243125557899475]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 16.0, 23.0, 30.0, 37.0, 60.0, 96.0, 124.0, 213.0, 326.0, 542.0, 962.0, 1801.0, 3744.0, 8212.0, 20049.0, 51053.0, 133210.0, 303048.0, 303533.0, 133457.0, 51562.0, 19896.0, 8373.0, 3791.0, 1868.0, 980.0, 555.0, 328.0, 204.0, 145.0, 95.0, 54.0, 50.0, 33.0, 25.0, 10.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3414039611816406, -0.33002471923828125, -0.3186454772949219, -0.3072662353515625, -0.2958869934082031, -0.28450775146484375, -0.2731285095214844, -0.261749267578125, -0.2503700256347656, -0.23899078369140625, -0.22761154174804688, -0.2162322998046875, -0.20485305786132812, -0.19347381591796875, -0.18209457397460938, -0.17071533203125, -0.15933609008789062, -0.14795684814453125, -0.13657760620117188, -0.1251983642578125, -0.11381912231445312, -0.10243988037109375, -0.09106063842773438, -0.079681396484375, -0.06830215454101562, -0.05692291259765625, -0.045543670654296875, -0.0341644287109375, -0.022785186767578125, -0.01140594482421875, -2.6702880859375e-05, 0.0113525390625, 0.022731781005859375, 0.03411102294921875, 0.045490264892578125, 0.0568695068359375, 0.06824874877929688, 0.07962799072265625, 0.09100723266601562, 0.102386474609375, 0.11376571655273438, 0.12514495849609375, 0.13652420043945312, 0.1479034423828125, 0.15928268432617188, 0.17066192626953125, 0.18204116821289062, 0.19342041015625, 0.20479965209960938, 0.21617889404296875, 0.22755813598632812, 0.2389373779296875, 0.2503166198730469, 0.26169586181640625, 0.2730751037597656, 0.284454345703125, 0.2958335876464844, 0.30721282958984375, 0.3185920715332031, 0.3299713134765625, 0.3413505554199219, 0.35272979736328125, 0.3641090393066406, 0.37548828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 9.0, 12.0, 9.0, 24.0, 23.0, 28.0, 46.0, 50.0, 42.0, 63.0, 69.0, 57.0, 66.0, 73.0, 63.0, 62.0, 61.0, 70.0, 39.0, 32.0, 37.0, 13.0, 7.0, 10.0, 3.0, 0.0, 9.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10474109649658203, -0.10187721252441406, -0.0990133285522461, -0.09614944458007812, -0.09328556060791016, -0.09042167663574219, -0.08755779266357422, -0.08469390869140625, -0.08183002471923828, -0.07896614074707031, -0.07610225677490234, -0.07323837280273438, -0.0703744888305664, -0.06751060485839844, -0.06464672088623047, -0.0617828369140625, -0.05891895294189453, -0.05605506896972656, -0.053191184997558594, -0.050327301025390625, -0.047463417053222656, -0.04459953308105469, -0.04173564910888672, -0.03887176513671875, -0.03600788116455078, -0.03314399719238281, -0.030280113220214844, -0.027416229248046875, -0.024552345275878906, -0.021688461303710938, -0.01882457733154297, -0.015960693359375, -0.013096809387207031, -0.010232925415039062, -0.007369041442871094, -0.004505157470703125, -0.0016412734985351562, 0.0012226104736328125, 0.004086494445800781, 0.00695037841796875, 0.009814262390136719, 0.012678146362304688, 0.015542030334472656, 0.018405914306640625, 0.021269798278808594, 0.024133682250976562, 0.02699756622314453, 0.0298614501953125, 0.03272533416748047, 0.03558921813964844, 0.038453102111816406, 0.041316986083984375, 0.044180870056152344, 0.04704475402832031, 0.04990863800048828, 0.05277252197265625, 0.05563640594482422, 0.05850028991699219, 0.061364173889160156, 0.06422805786132812, 0.0670919418334961, 0.06995582580566406, 0.07281970977783203, 0.07568359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 5.0, 3.0, 3.0, 10.0, 13.0, 11.0, 30.0, 37.0, 44.0, 51.0, 70.0, 117.0, 142.0, 217.0, 312.0, 469.0, 662.0, 1144.0, 2018.0, 4012.0, 9793.0, 27213.0, 80277.0, 217183.0, 358567.0, 218325.0, 80952.0, 27461.0, 9909.0, 4185.0, 1977.0, 1118.0, 685.0, 445.0, 318.0, 243.0, 157.0, 119.0, 68.0, 57.0, 28.0, 29.0, 26.0, 17.0, 16.0, 12.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.30322265625, -0.29219818115234375, -0.2811737060546875, -0.27014923095703125, -0.259124755859375, -0.24810028076171875, -0.2370758056640625, -0.22605133056640625, -0.21502685546875, -0.20400238037109375, -0.1929779052734375, -0.18195343017578125, -0.170928955078125, -0.15990447998046875, -0.1488800048828125, -0.13785552978515625, -0.1268310546875, -0.11580657958984375, -0.1047821044921875, -0.09375762939453125, -0.082733154296875, -0.07170867919921875, -0.0606842041015625, -0.04965972900390625, -0.03863525390625, -0.02761077880859375, -0.0165863037109375, -0.00556182861328125, 0.005462646484375, 0.01648712158203125, 0.0275115966796875, 0.03853607177734375, 0.049560546875, 0.06058502197265625, 0.0716094970703125, 0.08263397216796875, 0.093658447265625, 0.10468292236328125, 0.1157073974609375, 0.12673187255859375, 0.13775634765625, 0.14878082275390625, 0.1598052978515625, 0.17082977294921875, 0.181854248046875, 0.19287872314453125, 0.2039031982421875, 0.21492767333984375, 0.2259521484375, 0.23697662353515625, 0.2480010986328125, 0.25902557373046875, 0.270050048828125, 0.28107452392578125, 0.2920989990234375, 0.30312347412109375, 0.31414794921875, 0.32517242431640625, 0.3361968994140625, 0.34722137451171875, 0.358245849609375, 0.36927032470703125, 0.3802947998046875, 0.39131927490234375, 0.40234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 4.0, 10.0, 7.0, 13.0, 10.0, 14.0, 18.0, 21.0, 23.0, 40.0, 32.0, 31.0, 27.0, 40.0, 42.0, 52.0, 47.0, 31.0, 30.0, 37.0, 44.0, 42.0, 44.0, 33.0, 30.0, 39.0, 31.0, 25.0, 23.0, 22.0, 25.0, 23.0, 18.0, 15.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.27337646484375, -0.2633056640625, -0.25323486328125, -0.2431640625, -0.23309326171875, -0.2230224609375, -0.21295166015625, -0.202880859375, -0.19281005859375, -0.1827392578125, -0.17266845703125, -0.16259765625, -0.15252685546875, -0.1424560546875, -0.13238525390625, -0.122314453125, -0.11224365234375, -0.1021728515625, -0.09210205078125, -0.08203125, -0.07196044921875, -0.0618896484375, -0.05181884765625, -0.041748046875, -0.03167724609375, -0.0216064453125, -0.01153564453125, -0.00146484375, 0.00860595703125, 0.0186767578125, 0.02874755859375, 0.038818359375, 0.04888916015625, 0.0589599609375, 0.06903076171875, 0.0791015625, 0.08917236328125, 0.0992431640625, 0.10931396484375, 0.119384765625, 0.12945556640625, 0.1395263671875, 0.14959716796875, 0.15966796875, 0.16973876953125, 0.1798095703125, 0.18988037109375, 0.199951171875, 0.21002197265625, 0.2200927734375, 0.23016357421875, 0.240234375, 0.25030517578125, 0.2603759765625, 0.27044677734375, 0.280517578125, 0.29058837890625, 0.3006591796875, 0.31072998046875, 0.32080078125, 0.33087158203125, 0.3409423828125, 0.35101318359375, 0.361083984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 11.0, 14.0, 22.0, 21.0, 41.0, 61.0, 103.0, 144.0, 259.0, 504.0, 1070.0, 2655.0, 7740.0, 31459.0, 206795.0, 650630.0, 116846.0, 20483.0, 5640.0, 2101.0, 924.0, 420.0, 213.0, 132.0, 81.0, 45.0, 38.0, 25.0, 10.0, 11.0, 10.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.293212890625, -0.284423828125, -0.275634765625, -0.266845703125, -0.258056640625, -0.249267578125, -0.240478515625, -0.231689453125, -0.222900390625, -0.214111328125, -0.205322265625, -0.196533203125, -0.187744140625, -0.178955078125, -0.170166015625, -0.161376953125, -0.152587890625, -0.143798828125, -0.135009765625, -0.126220703125, -0.117431640625, -0.108642578125, -0.099853515625, -0.091064453125, -0.082275390625, -0.073486328125, -0.064697265625, -0.055908203125, -0.047119140625, -0.038330078125, -0.029541015625, -0.020751953125, -0.011962890625, -0.003173828125, 0.005615234375, 0.014404296875, 0.023193359375, 0.031982421875, 0.040771484375, 0.049560546875, 0.058349609375, 0.067138671875, 0.075927734375, 0.084716796875, 0.093505859375, 0.102294921875, 0.111083984375, 0.119873046875, 0.128662109375, 0.137451171875, 0.146240234375, 0.155029296875, 0.163818359375, 0.172607421875, 0.181396484375, 0.190185546875, 0.198974609375, 0.207763671875, 0.216552734375, 0.225341796875, 0.234130859375, 0.242919921875, 0.251708984375, 0.260498046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 18.0, 29.0, 43.0, 44.0, 62.0, 74.0, 93.0, 116.0, 121.0, 93.0, 91.0, 62.0, 37.0, 28.0, 23.0, 11.0, 15.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.505582809448242e-05, -8.189398795366287e-05, -7.873214781284332e-05, -7.557030767202377e-05, -7.240846753120422e-05, -6.924662739038467e-05, -6.608478724956512e-05, -6.292294710874557e-05, -5.9761106967926025e-05, -5.6599266827106476e-05, -5.3437426686286926e-05, -5.027558654546738e-05, -4.711374640464783e-05, -4.395190626382828e-05, -4.079006612300873e-05, -3.762822598218918e-05, -3.446638584136963e-05, -3.130454570055008e-05, -2.814270555973053e-05, -2.498086541891098e-05, -2.181902527809143e-05, -1.865718513727188e-05, -1.549534499645233e-05, -1.2333504855632782e-05, -9.171664714813232e-06, -6.009824573993683e-06, -2.8479844331741333e-06, 3.1385570764541626e-07, 3.475695848464966e-06, 6.637535989284515e-06, 9.799376130104065e-06, 1.2961216270923615e-05, 1.6123056411743164e-05, 1.9284896552562714e-05, 2.2446736693382263e-05, 2.5608576834201813e-05, 2.8770416975021362e-05, 3.193225711584091e-05, 3.509409725666046e-05, 3.825593739748001e-05, 4.141777753829956e-05, 4.457961767911911e-05, 4.774145781993866e-05, 5.090329796075821e-05, 5.406513810157776e-05, 5.722697824239731e-05, 6.038881838321686e-05, 6.355065852403641e-05, 6.671249866485596e-05, 6.98743388056755e-05, 7.303617894649506e-05, 7.61980190873146e-05, 7.935985922813416e-05, 8.25216993689537e-05, 8.568353950977325e-05, 8.88453796505928e-05, 9.200721979141235e-05, 9.51690599322319e-05, 9.833090007305145e-05, 0.000101492740213871, 0.00010465458035469055, 0.0001078164204955101, 0.00011097826063632965, 0.0001141401007771492, 0.00011730194091796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 16.0, 20.0, 22.0, 30.0, 39.0, 58.0, 71.0, 127.0, 175.0, 257.0, 454.0, 781.0, 1529.0, 3170.0, 7095.0, 20701.0, 76007.0, 377016.0, 435044.0, 88068.0, 22637.0, 8009.0, 3385.0, 1666.0, 823.0, 493.0, 293.0, 175.0, 107.0, 72.0, 57.0, 43.0, 38.0, 23.0, 14.0, 12.0, 4.0, 3.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20248985290527344, -0.19575119018554688, -0.1890125274658203, -0.18227386474609375, -0.1755352020263672, -0.16879653930664062, -0.16205787658691406, -0.1553192138671875, -0.14858055114746094, -0.14184188842773438, -0.1351032257080078, -0.12836456298828125, -0.12162590026855469, -0.11488723754882812, -0.10814857482910156, -0.101409912109375, -0.09467124938964844, -0.08793258666992188, -0.08119392395019531, -0.07445526123046875, -0.06771659851074219, -0.060977935791015625, -0.05423927307128906, -0.0475006103515625, -0.04076194763183594, -0.034023284912109375, -0.027284622192382812, -0.02054595947265625, -0.013807296752929688, -0.007068634033203125, -0.0003299713134765625, 0.00640869140625, 0.013147354125976562, 0.019886016845703125, 0.026624679565429688, 0.03336334228515625, 0.04010200500488281, 0.046840667724609375, 0.05357933044433594, 0.0603179931640625, 0.06705665588378906, 0.07379531860351562, 0.08053398132324219, 0.08727264404296875, 0.09401130676269531, 0.10074996948242188, 0.10748863220214844, 0.114227294921875, 0.12096595764160156, 0.12770462036132812, 0.1344432830810547, 0.14118194580078125, 0.1479206085205078, 0.15465927124023438, 0.16139793395996094, 0.1681365966796875, 0.17487525939941406, 0.18161392211914062, 0.1883525848388672, 0.19509124755859375, 0.2018299102783203, 0.20856857299804688, 0.21530723571777344, 0.2220458984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 4.0, 22.0, 14.0, 25.0, 22.0, 43.0, 46.0, 61.0, 74.0, 112.0, 130.0, 104.0, 67.0, 61.0, 52.0, 32.0, 26.0, 20.0, 11.0, 14.0, 9.0, 3.0, 9.0, 2.0, 5.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.192626953125, -0.1870098114013672, -0.18139266967773438, -0.17577552795410156, -0.17015838623046875, -0.16454124450683594, -0.15892410278320312, -0.1533069610595703, -0.1476898193359375, -0.1420726776123047, -0.13645553588867188, -0.13083839416503906, -0.12522125244140625, -0.11960411071777344, -0.11398696899414062, -0.10836982727050781, -0.102752685546875, -0.09713554382324219, -0.09151840209960938, -0.08590126037597656, -0.08028411865234375, -0.07466697692871094, -0.06904983520507812, -0.06343269348144531, -0.0578155517578125, -0.05219841003417969, -0.046581268310546875, -0.04096412658691406, -0.03534698486328125, -0.029729843139648438, -0.024112701416015625, -0.018495559692382812, -0.01287841796875, -0.0072612762451171875, -0.001644134521484375, 0.0039730072021484375, 0.00959014892578125, 0.015207290649414062, 0.020824432373046875, 0.026441574096679688, 0.0320587158203125, 0.03767585754394531, 0.043292999267578125, 0.04891014099121094, 0.05452728271484375, 0.06014442443847656, 0.06576156616210938, 0.07137870788574219, 0.076995849609375, 0.08261299133300781, 0.08823013305664062, 0.09384727478027344, 0.09946441650390625, 0.10508155822753906, 0.11069869995117188, 0.11631584167480469, 0.1219329833984375, 0.1275501251220703, 0.13316726684570312, 0.13878440856933594, 0.14440155029296875, 0.15001869201660156, 0.15563583374023438, 0.1612529754638672, 0.1668701171875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 11.0, 20.0, 71.0, 148.0, 239.0, 263.0, 151.0, 58.0, 24.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.918479919433594, -8.747364044189453, -8.576248168945312, -8.405131340026855, -8.234015464782715, -8.062899589538574, -7.891783714294434, -7.720667839050293, -7.549551486968994, -7.3784356117248535, -7.207319259643555, -7.036203384399414, -6.865087509155273, -6.693971157073975, -6.522855281829834, -6.351738929748535, -6.1806230545043945, -6.009507179260254, -5.838390827178955, -5.6672749519348145, -5.496158599853516, -5.325042724609375, -5.153926849365234, -4.982810974121094, -4.811694622039795, -4.640578746795654, -4.4694623947143555, -4.298346519470215, -4.127230644226074, -3.9561142921447754, -3.7849984169006348, -3.613882303237915, -3.4427666664123535, -3.271650552749634, -3.100534439086914, -2.9294185638427734, -2.7583024501800537, -2.587186336517334, -2.4160704612731934, -2.2449543476104736, -2.073838233947754, -1.9027221202850342, -1.731606125831604, -1.5604901313781738, -1.389374017715454, -1.2182579040527344, -1.0471419095993042, -0.876025915145874, -0.7049098014831543, -0.5337937474250793, -0.3626776933670044, -0.19156163930892944, -0.020445585250854492, 0.15067046880722046, 0.3217865228652954, 0.4929025173187256, 0.6640186309814453, 0.8351346850395203, 1.0062507390975952, 1.1773667335510254, 1.3484828472137451, 1.5195989608764648, 1.690714955329895, 1.8618309497833252, 2.032947063446045]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 9.0, 15.0, 11.0, 23.0, 21.0, 25.0, 30.0, 25.0, 32.0, 49.0, 46.0, 59.0, 39.0, 55.0, 49.0, 55.0, 42.0, 38.0, 44.0, 32.0, 52.0, 35.0, 34.0, 27.0, 23.0, 23.0, 13.0, 12.0, 15.0, 11.0, 9.0, 7.0, 4.0, 2.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.199100971221924, -2.133584499359131, -2.068068265914917, -2.002551794052124, -1.9370354413986206, -1.8715190887451172, -1.8060026168823242, -1.7404862642288208, -1.6749699115753174, -1.609453558921814, -1.543937087059021, -1.4784207344055176, -1.4129043817520142, -1.3473880290985107, -1.2818715572357178, -1.2163552045822144, -1.1508387327194214, -1.085322380065918, -1.019805908203125, -0.9542895555496216, -0.8887732028961182, -0.82325679063797, -0.7577403783798218, -0.6922240257263184, -0.6267076134681702, -0.561191201210022, -0.49567484855651855, -0.43015843629837036, -0.36464205384254456, -0.29912567138671875, -0.23360925912857056, -0.16809287667274475, -0.1025766134262085, -0.037060223519802094, 0.02845616638660431, 0.09397256374359131, 0.15948894619941711, 0.22500532865524292, 0.2905217409133911, 0.3560381233692169, 0.4215545058250427, 0.48707088828086853, 0.5525872707366943, 0.6181036829948425, 0.6836200952529907, 0.7491364479064941, 0.8146528601646423, 0.8801692724227905, 0.945685625076294, 1.0112019777297974, 1.0767184495925903, 1.1422348022460938, 1.2077511548995972, 1.2732675075531006, 1.3387839794158936, 1.404300332069397, 1.4698166847229004, 1.5353330373764038, 1.6008495092391968, 1.6663658618927002, 1.7318822145462036, 1.797398567199707, 1.8629150390625, 1.9284313917160034, 1.9939478635787964]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 6.0, 11.0, 15.0, 30.0, 31.0, 35.0, 70.0, 82.0, 155.0, 228.0, 403.0, 772.0, 1598.0, 4012.0, 11607.0, 48651.0, 3351037.0, 718728.0, 40119.0, 10260.0, 3420.0, 1387.0, 675.0, 370.0, 180.0, 132.0, 84.0, 60.0, 46.0, 17.0, 11.0, 13.0, 8.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.5559844970703125, -0.536773681640625, -0.5175628662109375, -0.49835205078125, -0.4791412353515625, -0.459930419921875, -0.4407196044921875, -0.4215087890625, -0.4022979736328125, -0.383087158203125, -0.3638763427734375, -0.34466552734375, -0.3254547119140625, -0.306243896484375, -0.2870330810546875, -0.267822265625, -0.2486114501953125, -0.229400634765625, -0.2101898193359375, -0.19097900390625, -0.1717681884765625, -0.152557373046875, -0.1333465576171875, -0.1141357421875, -0.0949249267578125, -0.075714111328125, -0.0565032958984375, -0.03729248046875, -0.0180816650390625, 0.001129150390625, 0.0203399658203125, 0.03955078125, 0.0587615966796875, 0.077972412109375, 0.0971832275390625, 0.11639404296875, 0.1356048583984375, 0.154815673828125, 0.1740264892578125, 0.1932373046875, 0.2124481201171875, 0.231658935546875, 0.2508697509765625, 0.27008056640625, 0.2892913818359375, 0.308502197265625, 0.3277130126953125, 0.346923828125, 0.3661346435546875, 0.385345458984375, 0.4045562744140625, 0.42376708984375, 0.4429779052734375, 0.462188720703125, 0.4813995361328125, 0.5006103515625, 0.5198211669921875, 0.539031982421875, 0.5582427978515625, 0.57745361328125, 0.5966644287109375, 0.615875244140625, 0.6350860595703125, 0.654296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 9.0, 4.0, 10.0, 8.0, 19.0, 20.0, 26.0, 29.0, 31.0, 35.0, 42.0, 52.0, 57.0, 52.0, 65.0, 59.0, 37.0, 59.0, 58.0, 47.0, 49.0, 55.0, 36.0, 25.0, 27.0, 22.0, 16.0, 13.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.0848073959350586, -0.08227348327636719, -0.07973957061767578, -0.07720565795898438, -0.07467174530029297, -0.07213783264160156, -0.06960391998291016, -0.06707000732421875, -0.06453609466552734, -0.06200218200683594, -0.05946826934814453, -0.056934356689453125, -0.05440044403076172, -0.05186653137207031, -0.049332618713378906, -0.0467987060546875, -0.044264793395996094, -0.04173088073730469, -0.03919696807861328, -0.036663055419921875, -0.03412914276123047, -0.03159523010253906, -0.029061317443847656, -0.02652740478515625, -0.023993492126464844, -0.021459579467773438, -0.01892566680908203, -0.016391754150390625, -0.013857841491699219, -0.011323928833007812, -0.008790016174316406, -0.006256103515625, -0.0037221908569335938, -0.0011882781982421875, 0.0013456344604492188, 0.003879547119140625, 0.006413459777832031, 0.008947372436523438, 0.011481285095214844, 0.01401519775390625, 0.016549110412597656, 0.019083023071289062, 0.02161693572998047, 0.024150848388671875, 0.02668476104736328, 0.029218673706054688, 0.031752586364746094, 0.0342864990234375, 0.036820411682128906, 0.03935432434082031, 0.04188823699951172, 0.044422149658203125, 0.04695606231689453, 0.04948997497558594, 0.052023887634277344, 0.05455780029296875, 0.057091712951660156, 0.05962562561035156, 0.06215953826904297, 0.06469345092773438, 0.06722736358642578, 0.06976127624511719, 0.0722951889038086, 0.0748291015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 9.0, 9.0, 10.0, 17.0, 17.0, 25.0, 30.0, 64.0, 91.0, 135.0, 170.0, 303.0, 478.0, 813.0, 1433.0, 2642.0, 5118.0, 11704.0, 29429.0, 92305.0, 621007.0, 3189995.0, 163804.0, 43990.0, 16164.0, 6935.0, 3295.0, 1721.0, 912.0, 529.0, 351.0, 229.0, 167.0, 98.0, 59.0, 57.0, 40.0, 37.0, 26.0, 14.0, 24.0, 2.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.34521484375, -0.33481597900390625, -0.3244171142578125, -0.31401824951171875, -0.303619384765625, -0.29322052001953125, -0.2828216552734375, -0.27242279052734375, -0.26202392578125, -0.25162506103515625, -0.2412261962890625, -0.23082733154296875, -0.220428466796875, -0.21002960205078125, -0.1996307373046875, -0.18923187255859375, -0.1788330078125, -0.16843414306640625, -0.1580352783203125, -0.14763641357421875, -0.137237548828125, -0.12683868408203125, -0.1164398193359375, -0.10604095458984375, -0.09564208984375, -0.08524322509765625, -0.0748443603515625, -0.06444549560546875, -0.054046630859375, -0.04364776611328125, -0.0332489013671875, -0.02285003662109375, -0.012451171875, -0.00205230712890625, 0.0083465576171875, 0.01874542236328125, 0.029144287109375, 0.03954315185546875, 0.0499420166015625, 0.06034088134765625, 0.07073974609375, 0.08113861083984375, 0.0915374755859375, 0.10193634033203125, 0.112335205078125, 0.12273406982421875, 0.1331329345703125, 0.14353179931640625, 0.1539306640625, 0.16432952880859375, 0.1747283935546875, 0.18512725830078125, 0.195526123046875, 0.20592498779296875, 0.2163238525390625, 0.22672271728515625, 0.23712158203125, 0.24752044677734375, 0.2579193115234375, 0.26831817626953125, 0.278717041015625, 0.28911590576171875, 0.2995147705078125, 0.30991363525390625, 0.3203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 10.0, 10.0, 17.0, 21.0, 14.0, 39.0, 43.0, 83.0, 114.0, 248.0, 599.0, 2024.0, 379.0, 153.0, 99.0, 63.0, 39.0, 37.0, 15.0, 20.0, 10.0, 7.0, 2.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10089111328125, -0.0971994400024414, -0.09350776672363281, -0.08981609344482422, -0.08612442016601562, -0.08243274688720703, -0.07874107360839844, -0.07504940032958984, -0.07135772705078125, -0.06766605377197266, -0.06397438049316406, -0.06028270721435547, -0.056591033935546875, -0.05289936065673828, -0.04920768737792969, -0.045516014099121094, -0.0418243408203125, -0.038132667541503906, -0.03444099426269531, -0.03074932098388672, -0.027057647705078125, -0.02336597442626953, -0.019674301147460938, -0.015982627868652344, -0.01229095458984375, -0.008599281311035156, -0.0049076080322265625, -0.0012159347534179688, 0.002475738525390625, 0.006167411804199219, 0.009859085083007812, 0.013550758361816406, 0.017242431640625, 0.020934104919433594, 0.024625778198242188, 0.02831745147705078, 0.032009124755859375, 0.03570079803466797, 0.03939247131347656, 0.043084144592285156, 0.04677581787109375, 0.050467491149902344, 0.05415916442871094, 0.05785083770751953, 0.061542510986328125, 0.06523418426513672, 0.06892585754394531, 0.0726175308227539, 0.0763092041015625, 0.0800008773803711, 0.08369255065917969, 0.08738422393798828, 0.09107589721679688, 0.09476757049560547, 0.09845924377441406, 0.10215091705322266, 0.10584259033203125, 0.10953426361083984, 0.11322593688964844, 0.11691761016845703, 0.12060928344726562, 0.12430095672607422, 0.1279926300048828, 0.1316843032836914, 0.1353759765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 13.0, 20.0, 38.0, 40.0, 36.0, 73.0, 83.0, 104.0, 113.0, 97.0, 84.0, 80.0, 58.0, 42.0, 30.0, 26.0, 27.0, 12.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.7230468988418579, -0.7055160999298096, -0.6879853010177612, -0.6704544425010681, -0.6529236435890198, -0.6353928446769714, -0.6178620457649231, -0.60033118724823, -0.5828003883361816, -0.5652695894241333, -0.547738790512085, -0.5302079319953918, -0.5126771330833435, -0.49514633417129517, -0.4776155352592468, -0.4600847065448761, -0.44255390763282776, -0.4250231087207794, -0.4074922800064087, -0.38996148109436035, -0.3724306523799896, -0.3548998534679413, -0.33736902475357056, -0.3198382258415222, -0.3023074269294739, -0.28477662801742554, -0.2672457993030548, -0.24971500039100647, -0.23218417167663574, -0.2146533727645874, -0.19712255895137787, -0.17959174513816833, -0.1620609164237976, -0.14453010261058807, -0.12699928879737854, -0.1094684824347496, -0.09193766862154007, -0.07440685480833054, -0.0568760484457016, -0.039345234632492065, -0.021814420819282532, -0.004283608868718147, 0.013247203081846237, 0.030778013169765472, 0.048308826982975006, 0.06583964079618454, 0.08337044715881348, 0.10090126097202301, 0.11843207478523254, 0.13596288859844208, 0.1534937024116516, 0.17102450132369995, 0.18855533003807068, 0.20608612895011902, 0.22361694276332855, 0.24114775657653809, 0.2586785554885864, 0.27620935440063477, 0.2937401831150055, 0.31127098202705383, 0.32880181074142456, 0.3463326096534729, 0.36386340856552124, 0.38139423727989197, 0.3989250659942627]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 3.0, 6.0, 5.0, 12.0, 10.0, 11.0, 15.0, 13.0, 12.0, 19.0, 30.0, 25.0, 31.0, 30.0, 37.0, 45.0, 40.0, 35.0, 38.0, 38.0, 58.0, 43.0, 49.0, 43.0, 40.0, 39.0, 47.0, 26.0, 26.0, 26.0, 20.0, 22.0, 20.0, 17.0, 16.0, 7.0, 9.0, 10.0, 6.0, 9.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28450214862823486, -0.2738912105560303, -0.2632802724838257, -0.2526693344116211, -0.2420584112405777, -0.2314474731683731, -0.22083653509616852, -0.21022561192512512, -0.19961467385292053, -0.18900373578071594, -0.17839279770851135, -0.16778185963630676, -0.15717093646526337, -0.14655999839305878, -0.1359490603208542, -0.1253381371498108, -0.11472718417644501, -0.10411624610424042, -0.09350531548261642, -0.08289437741041183, -0.07228344678878784, -0.06167250871658325, -0.05106157064437866, -0.04045064002275467, -0.02983970195055008, -0.019228767603635788, -0.008617831394076347, 0.0019931048154830933, 0.012604039162397385, 0.023214973509311676, 0.033825911581516266, 0.04443684220314026, 0.05504778027534485, 0.06565871834754944, 0.07626964896917343, 0.08688058704137802, 0.09749151766300201, 0.1081024557352066, 0.1187133938074112, 0.1293243169784546, 0.13993525505065918, 0.15054619312286377, 0.16115713119506836, 0.17176806926727295, 0.18237899243831635, 0.19298993051052094, 0.20360086858272552, 0.21421179175376892, 0.2248227447271347, 0.2354336827993393, 0.24604462087154388, 0.2566555440425873, 0.26726648211479187, 0.27787742018699646, 0.28848835825920105, 0.29909929633140564, 0.30971023440361023, 0.3203211724758148, 0.3309321105480194, 0.341543048620224, 0.3521539866924286, 0.3627648949623108, 0.3733758330345154, 0.38398677110671997, 0.39459770917892456]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 12.0, 7.0, 22.0, 37.0, 28.0, 65.0, 93.0, 151.0, 262.0, 425.0, 706.0, 1214.0, 2218.0, 4553.0, 9587.0, 23532.0, 65384.0, 184196.0, 358974.0, 247653.0, 92218.0, 32490.0, 12739.0, 5576.0, 2797.0, 1529.0, 805.0, 470.0, 291.0, 183.0, 100.0, 75.0, 49.0, 35.0, 26.0, 13.0, 13.0, 8.0, 9.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.42138671875, -0.4098930358886719, -0.39839935302734375, -0.3869056701660156, -0.3754119873046875, -0.3639183044433594, -0.35242462158203125, -0.3409309387207031, -0.329437255859375, -0.3179435729980469, -0.30644989013671875, -0.2949562072753906, -0.2834625244140625, -0.2719688415527344, -0.26047515869140625, -0.24898147583007812, -0.23748779296875, -0.22599411010742188, -0.21450042724609375, -0.20300674438476562, -0.1915130615234375, -0.18001937866210938, -0.16852569580078125, -0.15703201293945312, -0.145538330078125, -0.13404464721679688, -0.12255096435546875, -0.11105728149414062, -0.0995635986328125, -0.08806991577148438, -0.07657623291015625, -0.06508255004882812, -0.0535888671875, -0.042095184326171875, -0.03060150146484375, -0.019107818603515625, -0.0076141357421875, 0.003879547119140625, 0.01537322998046875, 0.026866912841796875, 0.038360595703125, 0.049854278564453125, 0.06134796142578125, 0.07284164428710938, 0.0843353271484375, 0.09582901000976562, 0.10732269287109375, 0.11881637573242188, 0.13031005859375, 0.14180374145507812, 0.15329742431640625, 0.16479110717773438, 0.1762847900390625, 0.18777847290039062, 0.19927215576171875, 0.21076583862304688, 0.222259521484375, 0.23375320434570312, 0.24524688720703125, 0.2567405700683594, 0.2682342529296875, 0.2797279357910156, 0.29122161865234375, 0.3027153015136719, 0.314208984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 7.0, 14.0, 11.0, 11.0, 15.0, 18.0, 31.0, 32.0, 34.0, 30.0, 49.0, 47.0, 45.0, 58.0, 49.0, 56.0, 48.0, 65.0, 56.0, 40.0, 44.0, 50.0, 47.0, 27.0, 23.0, 16.0, 9.0, 18.0, 14.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0870361328125, -0.08456993103027344, -0.08210372924804688, -0.07963752746582031, -0.07717132568359375, -0.07470512390136719, -0.07223892211914062, -0.06977272033691406, -0.0673065185546875, -0.06484031677246094, -0.062374114990234375, -0.05990791320800781, -0.05744171142578125, -0.05497550964355469, -0.052509307861328125, -0.05004310607910156, -0.047576904296875, -0.04511070251464844, -0.042644500732421875, -0.04017829895019531, -0.03771209716796875, -0.03524589538574219, -0.032779693603515625, -0.030313491821289062, -0.0278472900390625, -0.025381088256835938, -0.022914886474609375, -0.020448684692382812, -0.01798248291015625, -0.015516281127929688, -0.013050079345703125, -0.010583877563476562, -0.00811767578125, -0.0056514739990234375, -0.003185272216796875, -0.0007190704345703125, 0.00174713134765625, 0.0042133331298828125, 0.006679534912109375, 0.009145736694335938, 0.0116119384765625, 0.014078140258789062, 0.016544342041015625, 0.019010543823242188, 0.02147674560546875, 0.023942947387695312, 0.026409149169921875, 0.028875350952148438, 0.031341552734375, 0.03380775451660156, 0.036273956298828125, 0.03874015808105469, 0.04120635986328125, 0.04367256164550781, 0.046138763427734375, 0.04860496520996094, 0.0510711669921875, 0.05353736877441406, 0.056003570556640625, 0.05846977233886719, 0.06093597412109375, 0.06340217590332031, 0.06586837768554688, 0.06833457946777344, 0.07080078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 5.0, 15.0, 13.0, 29.0, 43.0, 54.0, 68.0, 98.0, 168.0, 251.0, 384.0, 575.0, 1076.0, 2255.0, 5169.0, 16326.0, 65479.0, 275770.0, 462367.0, 163437.0, 36939.0, 10279.0, 3731.0, 1672.0, 890.0, 486.0, 290.0, 191.0, 174.0, 84.0, 62.0, 51.0, 34.0, 21.0, 17.0, 11.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.417236328125, -0.4034690856933594, -0.38970184326171875, -0.3759346008300781, -0.3621673583984375, -0.3484001159667969, -0.33463287353515625, -0.3208656311035156, -0.307098388671875, -0.2933311462402344, -0.27956390380859375, -0.2657966613769531, -0.2520294189453125, -0.23826217651367188, -0.22449493408203125, -0.21072769165039062, -0.19696044921875, -0.18319320678710938, -0.16942596435546875, -0.15565872192382812, -0.1418914794921875, -0.12812423706054688, -0.11435699462890625, -0.10058975219726562, -0.086822509765625, -0.07305526733398438, -0.05928802490234375, -0.045520782470703125, -0.0317535400390625, -0.017986297607421875, -0.00421905517578125, 0.009548187255859375, 0.0233154296875, 0.037082672119140625, 0.05084991455078125, 0.06461715698242188, 0.0783843994140625, 0.09215164184570312, 0.10591888427734375, 0.11968612670898438, 0.133453369140625, 0.14722061157226562, 0.16098785400390625, 0.17475509643554688, 0.1885223388671875, 0.20228958129882812, 0.21605682373046875, 0.22982406616210938, 0.24359130859375, 0.2573585510253906, 0.27112579345703125, 0.2848930358886719, 0.2986602783203125, 0.3124275207519531, 0.32619476318359375, 0.3399620056152344, 0.353729248046875, 0.3674964904785156, 0.38126373291015625, 0.3950309753417969, 0.4087982177734375, 0.4225654602050781, 0.43633270263671875, 0.4500999450683594, 0.4638671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 19.0, 12.0, 16.0, 16.0, 24.0, 39.0, 37.0, 49.0, 47.0, 49.0, 66.0, 54.0, 51.0, 63.0, 57.0, 61.0, 53.0, 38.0, 37.0, 33.0, 39.0, 27.0, 19.0, 13.0, 8.0, 14.0, 13.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.428070068359375, -0.41571044921875, -0.403350830078125, -0.3909912109375, -0.378631591796875, -0.36627197265625, -0.353912353515625, -0.341552734375, -0.329193115234375, -0.31683349609375, -0.304473876953125, -0.2921142578125, -0.279754638671875, -0.26739501953125, -0.255035400390625, -0.24267578125, -0.230316162109375, -0.21795654296875, -0.205596923828125, -0.1932373046875, -0.180877685546875, -0.16851806640625, -0.156158447265625, -0.143798828125, -0.131439208984375, -0.11907958984375, -0.106719970703125, -0.0943603515625, -0.082000732421875, -0.06964111328125, -0.057281494140625, -0.044921875, -0.032562255859375, -0.02020263671875, -0.007843017578125, 0.0045166015625, 0.016876220703125, 0.02923583984375, 0.041595458984375, 0.053955078125, 0.066314697265625, 0.07867431640625, 0.091033935546875, 0.1033935546875, 0.115753173828125, 0.12811279296875, 0.140472412109375, 0.15283203125, 0.165191650390625, 0.17755126953125, 0.189910888671875, 0.2022705078125, 0.214630126953125, 0.22698974609375, 0.239349365234375, 0.251708984375, 0.264068603515625, 0.27642822265625, 0.288787841796875, 0.3011474609375, 0.313507080078125, 0.32586669921875, 0.338226318359375, 0.3505859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 11.0, 9.0, 17.0, 30.0, 64.0, 150.0, 425.0, 1684.0, 18677.0, 951589.0, 71732.0, 3093.0, 671.0, 225.0, 88.0, 38.0, 15.0, 18.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8903274536132812, -0.8646392822265625, -0.8389511108398438, -0.813262939453125, -0.7875747680664062, -0.7618865966796875, -0.7361984252929688, -0.71051025390625, -0.6848220825195312, -0.6591339111328125, -0.6334457397460938, -0.607757568359375, -0.5820693969726562, -0.5563812255859375, -0.5306930541992188, -0.5050048828125, -0.47931671142578125, -0.4536285400390625, -0.42794036865234375, -0.402252197265625, -0.37656402587890625, -0.3508758544921875, -0.32518768310546875, -0.29949951171875, -0.27381134033203125, -0.2481231689453125, -0.22243499755859375, -0.196746826171875, -0.17105865478515625, -0.1453704833984375, -0.11968231201171875, -0.093994140625, -0.06830596923828125, -0.0426177978515625, -0.01692962646484375, 0.008758544921875, 0.03444671630859375, 0.0601348876953125, 0.08582305908203125, 0.11151123046875, 0.13719940185546875, 0.1628875732421875, 0.18857574462890625, 0.214263916015625, 0.23995208740234375, 0.2656402587890625, 0.29132843017578125, 0.3170166015625, 0.34270477294921875, 0.3683929443359375, 0.39408111572265625, 0.419769287109375, 0.44545745849609375, 0.4711456298828125, 0.49683380126953125, 0.52252197265625, 0.5482101440429688, 0.5738983154296875, 0.5995864868164062, 0.625274658203125, 0.6509628295898438, 0.6766510009765625, 0.7023391723632812, 0.72802734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 8.0, 11.0, 11.0, 11.0, 9.0, 22.0, 27.0, 34.0, 39.0, 48.0, 57.0, 59.0, 64.0, 92.0, 74.0, 75.0, 77.0, 62.0, 48.0, 30.0, 25.0, 19.0, 11.0, 13.0, 8.0, 10.0, 10.0, 9.0, 1.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.500980377197266e-05, -9.24253836274147e-05, -8.984096348285675e-05, -8.72565433382988e-05, -8.467212319374084e-05, -8.208770304918289e-05, -7.950328290462494e-05, -7.691886276006699e-05, -7.433444261550903e-05, -7.175002247095108e-05, -6.916560232639313e-05, -6.658118218183517e-05, -6.399676203727722e-05, -6.141234189271927e-05, -5.8827921748161316e-05, -5.624350160360336e-05, -5.365908145904541e-05, -5.107466131448746e-05, -4.8490241169929504e-05, -4.590582102537155e-05, -4.33214008808136e-05, -4.0736980736255646e-05, -3.815256059169769e-05, -3.556814044713974e-05, -3.298372030258179e-05, -3.0399300158023834e-05, -2.781488001346588e-05, -2.523045986890793e-05, -2.2646039724349976e-05, -2.0061619579792023e-05, -1.747719943523407e-05, -1.4892779290676117e-05, -1.2308359146118164e-05, -9.723939001560211e-06, -7.139518857002258e-06, -4.555098712444305e-06, -1.9706785678863525e-06, 6.137415766716003e-07, 3.1981617212295532e-06, 5.782581865787506e-06, 8.367002010345459e-06, 1.0951422154903412e-05, 1.3535842299461365e-05, 1.6120262444019318e-05, 1.870468258857727e-05, 2.1289102733135223e-05, 2.3873522877693176e-05, 2.645794302225113e-05, 2.9042363166809082e-05, 3.1626783311367035e-05, 3.421120345592499e-05, 3.679562360048294e-05, 3.9380043745040894e-05, 4.1964463889598846e-05, 4.45488840341568e-05, 4.713330417871475e-05, 4.9717724323272705e-05, 5.230214446783066e-05, 5.488656461238861e-05, 5.7470984756946564e-05, 6.0055404901504517e-05, 6.263982504606247e-05, 6.522424519062042e-05, 6.780866533517838e-05, 7.039308547973633e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 4.0, 14.0, 9.0, 9.0, 28.0, 41.0, 42.0, 82.0, 143.0, 300.0, 605.0, 1506.0, 3948.0, 19899.0, 867736.0, 141413.0, 8269.0, 2464.0, 1009.0, 469.0, 232.0, 110.0, 56.0, 35.0, 43.0, 20.0, 18.0, 7.0, 8.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6968154907226562, -0.6734161376953125, -0.6500167846679688, -0.626617431640625, -0.6032180786132812, -0.5798187255859375, -0.5564193725585938, -0.53302001953125, -0.5096206665039062, -0.4862213134765625, -0.46282196044921875, -0.439422607421875, -0.41602325439453125, -0.3926239013671875, -0.36922454833984375, -0.3458251953125, -0.32242584228515625, -0.2990264892578125, -0.27562713623046875, -0.252227783203125, -0.22882843017578125, -0.2054290771484375, -0.18202972412109375, -0.15863037109375, -0.13523101806640625, -0.1118316650390625, -0.08843231201171875, -0.065032958984375, -0.04163360595703125, -0.0182342529296875, 0.00516510009765625, 0.028564453125, 0.05196380615234375, 0.0753631591796875, 0.09876251220703125, 0.122161865234375, 0.14556121826171875, 0.1689605712890625, 0.19235992431640625, 0.21575927734375, 0.23915863037109375, 0.2625579833984375, 0.28595733642578125, 0.309356689453125, 0.33275604248046875, 0.3561553955078125, 0.37955474853515625, 0.4029541015625, 0.42635345458984375, 0.4497528076171875, 0.47315216064453125, 0.496551513671875, 0.5199508666992188, 0.5433502197265625, 0.5667495727539062, 0.59014892578125, 0.6135482788085938, 0.6369476318359375, 0.6603469848632812, 0.683746337890625, 0.7071456909179688, 0.7305450439453125, 0.7539443969726562, 0.77734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 7.0, 9.0, 33.0, 51.0, 80.0, 196.0, 268.0, 159.0, 80.0, 34.0, 30.0, 16.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3517646789550781, -0.33975982666015625, -0.3277549743652344, -0.3157501220703125, -0.3037452697753906, -0.29174041748046875, -0.2797355651855469, -0.267730712890625, -0.2557258605957031, -0.24372100830078125, -0.23171615600585938, -0.2197113037109375, -0.20770645141601562, -0.19570159912109375, -0.18369674682617188, -0.17169189453125, -0.15968704223632812, -0.14768218994140625, -0.13567733764648438, -0.1236724853515625, -0.11166763305664062, -0.09966278076171875, -0.08765792846679688, -0.075653076171875, -0.06364822387695312, -0.05164337158203125, -0.039638519287109375, -0.0276336669921875, -0.015628814697265625, -0.00362396240234375, 0.008380889892578125, 0.0203857421875, 0.032390594482421875, 0.04439544677734375, 0.056400299072265625, 0.0684051513671875, 0.08041000366210938, 0.09241485595703125, 0.10441970825195312, 0.116424560546875, 0.12842941284179688, 0.14043426513671875, 0.15243911743164062, 0.1644439697265625, 0.17644882202148438, 0.18845367431640625, 0.20045852661132812, 0.21246337890625, 0.22446823120117188, 0.23647308349609375, 0.24847793579101562, 0.2604827880859375, 0.2724876403808594, 0.28449249267578125, 0.2964973449707031, 0.308502197265625, 0.3205070495605469, 0.33251190185546875, 0.3445167541503906, 0.3565216064453125, 0.3685264587402344, 0.38053131103515625, 0.3925361633300781, 0.404541015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 22.0, 26.0, 56.0, 104.0, 174.0, 196.0, 174.0, 120.0, 68.0, 28.0, 14.0, 9.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1920552253723145, -3.057668447494507, -2.923281669616699, -2.7888948917388916, -2.654508113861084, -2.5201210975646973, -2.3857343196868896, -2.251347541809082, -2.1169607639312744, -1.9825739860534668, -1.8481872081756592, -1.713800311088562, -1.5794135332107544, -1.4450267553329468, -1.3106398582458496, -1.176253080368042, -1.0418663024902344, -0.9074795246124268, -0.7730926871299744, -0.638705849647522, -0.5043190717697144, -0.36993229389190674, -0.23554545640945435, -0.10115861892700195, 0.033228158950805664, 0.16761496663093567, 0.3020017743110657, 0.4363885819911957, 0.5707753896713257, 0.7051621675491333, 0.8395490050315857, 0.9739358425140381, 1.1083226203918457, 1.2427093982696533, 1.377096176147461, 1.511483073234558, 1.6458698511123657, 1.7802566289901733, 1.9146435260772705, 2.049030303955078, 2.1834170818328857, 2.3178038597106934, 2.452190637588501, 2.5865774154663086, 2.7209644317626953, 2.855350971221924, 2.9897379875183105, 3.124124765396118, 3.258511543273926, 3.3928983211517334, 3.527285099029541, 3.6616718769073486, 3.7960586547851562, 3.930445671081543, 4.0648322105407715, 4.199219226837158, 4.333605766296387, 4.467992782592773, 4.602379322052002, 4.736766338348389, 4.871152877807617, 5.005539894104004, 5.139926433563232, 5.274313449859619, 5.408700466156006]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 13.0, 6.0, 15.0, 17.0, 21.0, 34.0, 37.0, 33.0, 41.0, 48.0, 75.0, 59.0, 60.0, 69.0, 61.0, 60.0, 67.0, 53.0, 56.0, 35.0, 29.0, 24.0, 17.0, 16.0, 17.0, 10.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2340612411499023, -2.1520631313323975, -2.0700647830963135, -1.9880666732788086, -1.9060685634613037, -1.8240703344345093, -1.7420721054077148, -1.66007399559021, -1.5780757665634155, -1.496077537536621, -1.4140794277191162, -1.3320811986923218, -1.2500829696655273, -1.1680848598480225, -1.086086630821228, -1.0040884017944336, -0.9220902919769287, -0.840092122554779, -0.7580939531326294, -0.676095724105835, -0.5940975546836853, -0.5120993852615356, -0.4301011860370636, -0.34810298681259155, -0.2661048173904419, -0.18410663306713104, -0.10210844874382019, -0.02011026442050934, 0.061887919902801514, 0.14388608932495117, 0.22588428854942322, 0.30788248777389526, 0.3898806571960449, 0.4718788266181946, 0.5538769960403442, 0.6358752250671387, 0.7178733944892883, 0.799871563911438, 0.8818697929382324, 0.9638679623603821, 1.0458661317825317, 1.1278643608093262, 1.209862470626831, 1.2918606996536255, 1.37385892868042, 1.4558570384979248, 1.5378552675247192, 1.6198534965515137, 1.7018516063690186, 1.783849835395813, 1.8658479452133179, 1.9478461742401123, 2.029844284057617, 2.111842632293701, 2.193840742111206, 2.275838851928711, 2.357837200164795, 2.4398353099823, 2.521833658218384, 2.6038317680358887, 2.6858298778533936, 2.7678279876708984, 2.8498263359069824, 2.9318244457244873, 3.013822555541992]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 8.0, 9.0, 13.0, 14.0, 19.0, 42.0, 46.0, 106.0, 166.0, 251.0, 501.0, 1161.0, 2675.0, 8189.0, 33100.0, 245261.0, 3725134.0, 143959.0, 23636.0, 5953.0, 2113.0, 945.0, 416.0, 214.0, 146.0, 70.0, 45.0, 28.0, 21.0, 16.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58203125, -0.5655860900878906, -0.5491409301757812, -0.5326957702636719, -0.5162506103515625, -0.4998054504394531, -0.48336029052734375, -0.4669151306152344, -0.450469970703125, -0.4340248107910156, -0.41757965087890625, -0.4011344909667969, -0.3846893310546875, -0.3682441711425781, -0.35179901123046875, -0.3353538513183594, -0.31890869140625, -0.3024635314941406, -0.28601837158203125, -0.2695732116699219, -0.2531280517578125, -0.23668289184570312, -0.22023773193359375, -0.20379257202148438, -0.187347412109375, -0.17090225219726562, -0.15445709228515625, -0.13801193237304688, -0.1215667724609375, -0.10512161254882812, -0.08867645263671875, -0.07223129272460938, -0.0557861328125, -0.039340972900390625, -0.02289581298828125, -0.006450653076171875, 0.0099945068359375, 0.026439666748046875, 0.04288482666015625, 0.059329986572265625, 0.075775146484375, 0.09222030639648438, 0.10866546630859375, 0.12511062622070312, 0.1415557861328125, 0.15800094604492188, 0.17444610595703125, 0.19089126586914062, 0.20733642578125, 0.22378158569335938, 0.24022674560546875, 0.2566719055175781, 0.2731170654296875, 0.2895622253417969, 0.30600738525390625, 0.3224525451660156, 0.338897705078125, 0.3553428649902344, 0.37178802490234375, 0.3882331848144531, 0.4046783447265625, 0.4211235046386719, 0.43756866455078125, 0.4540138244628906, 0.470458984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 10.0, 6.0, 9.0, 16.0, 16.0, 21.0, 17.0, 35.0, 39.0, 42.0, 39.0, 47.0, 55.0, 56.0, 58.0, 49.0, 69.0, 49.0, 56.0, 51.0, 43.0, 33.0, 35.0, 34.0, 27.0, 18.0, 15.0, 19.0, 9.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09295654296875, -0.0903329849243164, -0.08770942687988281, -0.08508586883544922, -0.08246231079101562, -0.07983875274658203, -0.07721519470214844, -0.07459163665771484, -0.07196807861328125, -0.06934452056884766, -0.06672096252441406, -0.06409740447998047, -0.061473846435546875, -0.05885028839111328, -0.05622673034667969, -0.053603172302246094, -0.0509796142578125, -0.048356056213378906, -0.04573249816894531, -0.04310894012451172, -0.040485382080078125, -0.03786182403564453, -0.03523826599121094, -0.032614707946777344, -0.02999114990234375, -0.027367591857910156, -0.024744033813476562, -0.02212047576904297, -0.019496917724609375, -0.01687335968017578, -0.014249801635742188, -0.011626243591308594, -0.009002685546875, -0.006379127502441406, -0.0037555694580078125, -0.0011320114135742188, 0.001491546630859375, 0.004115104675292969, 0.0067386627197265625, 0.009362220764160156, 0.01198577880859375, 0.014609336853027344, 0.017232894897460938, 0.01985645294189453, 0.022480010986328125, 0.02510356903076172, 0.027727127075195312, 0.030350685119628906, 0.0329742431640625, 0.035597801208496094, 0.03822135925292969, 0.04084491729736328, 0.043468475341796875, 0.04609203338623047, 0.04871559143066406, 0.051339149475097656, 0.05396270751953125, 0.056586265563964844, 0.05920982360839844, 0.06183338165283203, 0.06445693969726562, 0.06708049774169922, 0.06970405578613281, 0.0723276138305664, 0.074951171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 11.0, 22.0, 25.0, 39.0, 66.0, 96.0, 149.0, 199.0, 336.0, 560.0, 1026.0, 1811.0, 3666.0, 8166.0, 20392.0, 64351.0, 305988.0, 3284775.0, 387265.0, 74603.0, 23519.0, 8890.0, 3956.0, 1908.0, 998.0, 596.0, 326.0, 187.0, 128.0, 66.0, 41.0, 30.0, 27.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2676048278808594, -0.25713348388671875, -0.24666213989257812, -0.2361907958984375, -0.22571945190429688, -0.21524810791015625, -0.20477676391601562, -0.194305419921875, -0.18383407592773438, -0.17336273193359375, -0.16289138793945312, -0.1524200439453125, -0.14194869995117188, -0.13147735595703125, -0.12100601196289062, -0.11053466796875, -0.10006332397460938, -0.08959197998046875, -0.07912063598632812, -0.0686492919921875, -0.058177947998046875, -0.04770660400390625, -0.037235260009765625, -0.026763916015625, -0.016292572021484375, -0.00582122802734375, 0.004650115966796875, 0.0151214599609375, 0.025592803955078125, 0.03606414794921875, 0.046535491943359375, 0.0570068359375, 0.06747817993164062, 0.07794952392578125, 0.08842086791992188, 0.0988922119140625, 0.10936355590820312, 0.11983489990234375, 0.13030624389648438, 0.140777587890625, 0.15124893188476562, 0.16172027587890625, 0.17219161987304688, 0.1826629638671875, 0.19313430786132812, 0.20360565185546875, 0.21407699584960938, 0.22454833984375, 0.23501968383789062, 0.24549102783203125, 0.2559623718261719, 0.2664337158203125, 0.2769050598144531, 0.28737640380859375, 0.2978477478027344, 0.308319091796875, 0.3187904357910156, 0.32926177978515625, 0.3397331237792969, 0.3502044677734375, 0.3606758117675781, 0.37114715576171875, 0.3816184997558594, 0.39208984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 11.0, 8.0, 17.0, 15.0, 22.0, 34.0, 61.0, 71.0, 132.0, 226.0, 441.0, 1589.0, 690.0, 285.0, 148.0, 101.0, 54.0, 40.0, 28.0, 26.0, 16.0, 10.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.188232421875, -0.1832408905029297, -0.17824935913085938, -0.17325782775878906, -0.16826629638671875, -0.16327476501464844, -0.15828323364257812, -0.1532917022705078, -0.1483001708984375, -0.1433086395263672, -0.13831710815429688, -0.13332557678222656, -0.12833404541015625, -0.12334251403808594, -0.11835098266601562, -0.11335945129394531, -0.108367919921875, -0.10337638854980469, -0.09838485717773438, -0.09339332580566406, -0.08840179443359375, -0.08341026306152344, -0.07841873168945312, -0.07342720031738281, -0.0684356689453125, -0.06344413757324219, -0.058452606201171875, -0.05346107482910156, -0.04846954345703125, -0.04347801208496094, -0.038486480712890625, -0.03349494934082031, -0.02850341796875, -0.023511886596679688, -0.018520355224609375, -0.013528823852539062, -0.00853729248046875, -0.0035457611083984375, 0.001445770263671875, 0.0064373016357421875, 0.0114288330078125, 0.016420364379882812, 0.021411895751953125, 0.026403427124023438, 0.03139495849609375, 0.03638648986816406, 0.041378021240234375, 0.04636955261230469, 0.051361083984375, 0.05635261535644531, 0.061344146728515625, 0.06633567810058594, 0.07132720947265625, 0.07631874084472656, 0.08131027221679688, 0.08630180358886719, 0.0912933349609375, 0.09628486633300781, 0.10127639770507812, 0.10626792907714844, 0.11125946044921875, 0.11625099182128906, 0.12124252319335938, 0.1262340545654297, 0.1312255859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 2.0, 8.0, 10.0, 18.0, 18.0, 41.0, 46.0, 58.0, 71.0, 81.0, 103.0, 118.0, 82.0, 89.0, 65.0, 57.0, 33.0, 34.0, 16.0, 13.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8403926491737366, -0.8158271908760071, -0.7912617921829224, -0.7666963338851929, -0.7421308755874634, -0.7175654172897339, -0.6929999589920044, -0.6684345602989197, -0.6438691020011902, -0.6193036437034607, -0.594738245010376, -0.5701727867126465, -0.545607328414917, -0.5210418701171875, -0.4964764416217804, -0.4719110131263733, -0.4473455548286438, -0.4227800965309143, -0.3982146680355072, -0.3736492395401001, -0.3490837812423706, -0.3245183229446411, -0.299952894449234, -0.2753874659538269, -0.2508220076560974, -0.2262565642595291, -0.20169112086296082, -0.17712567746639252, -0.15256023406982422, -0.12799479067325592, -0.10342934727668762, -0.07886390388011932, -0.05429840087890625, -0.02973295748233795, -0.005167514085769653, 0.019397929310798645, 0.04396337270736694, 0.06852881610393524, 0.09309425950050354, 0.11765970289707184, 0.14222514629364014, 0.16679058969020844, 0.19135603308677673, 0.21592147648334503, 0.24048691987991333, 0.2650523781776428, 0.2896178066730499, 0.31418323516845703, 0.3387486934661865, 0.363314151763916, 0.3878795802593231, 0.4124450087547302, 0.4370104670524597, 0.4615759253501892, 0.4861413538455963, 0.5107067823410034, 0.5352722406387329, 0.5598376989364624, 0.5844031572341919, 0.6089685559272766, 0.6335340142250061, 0.6580994725227356, 0.6826648712158203, 0.7072303295135498, 0.7317957878112793]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 4.0, 4.0, 10.0, 11.0, 20.0, 18.0, 25.0, 34.0, 32.0, 44.0, 46.0, 62.0, 51.0, 57.0, 61.0, 75.0, 56.0, 65.0, 55.0, 56.0, 42.0, 38.0, 27.0, 26.0, 19.0, 15.0, 16.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6737127900123596, -0.6516905426979065, -0.6296682953834534, -0.607646107673645, -0.5856238603591919, -0.5636016130447388, -0.5415793657302856, -0.5195571184158325, -0.4975348711013794, -0.47551262378692627, -0.45349040627479553, -0.4314681589603424, -0.4094459116458893, -0.38742369413375854, -0.3654014468193054, -0.3433791995048523, -0.32135698199272156, -0.29933473467826843, -0.2773125171661377, -0.25529026985168457, -0.23326802253723145, -0.21124579012393951, -0.18922355771064758, -0.16720131039619446, -0.14517907798290253, -0.12315683811903, -0.10113459825515747, -0.07911236584186554, -0.05709012597799301, -0.03506788611412048, -0.013045653700828552, 0.008976593613624573, 0.030998826026916504, 0.05302106589078903, 0.07504330575466156, 0.09706553816795349, 0.11908777803182602, 0.14111001789569855, 0.16313225030899048, 0.1851544976234436, 0.20717673003673553, 0.22919896245002747, 0.2512212097644806, 0.27324342727661133, 0.29526567459106445, 0.3172879219055176, 0.3393101692199707, 0.36133241653442383, 0.38335463404655457, 0.4053768813610077, 0.4273990988731384, 0.44942134618759155, 0.4714435935020447, 0.4934658408164978, 0.5154880285263062, 0.5375102758407593, 0.5595325231552124, 0.5815547704696655, 0.6035770177841187, 0.6255992650985718, 0.6476214528083801, 0.6696437001228333, 0.6916659474372864, 0.7136881947517395, 0.7357104420661926]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 7.0, 27.0, 28.0, 45.0, 54.0, 96.0, 138.0, 211.0, 386.0, 642.0, 1162.0, 2211.0, 4800.0, 11090.0, 28469.0, 77075.0, 215689.0, 413197.0, 183565.0, 66543.0, 24373.0, 9833.0, 4333.0, 1983.0, 1063.0, 562.0, 348.0, 210.0, 134.0, 81.0, 48.0, 37.0, 28.0, 24.0, 8.0, 12.0, 11.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3940315246582031, -0.38108062744140625, -0.3681297302246094, -0.3551788330078125, -0.3422279357910156, -0.32927703857421875, -0.3163261413574219, -0.303375244140625, -0.2904243469238281, -0.27747344970703125, -0.2645225524902344, -0.2515716552734375, -0.23862075805664062, -0.22566986083984375, -0.21271896362304688, -0.19976806640625, -0.18681716918945312, -0.17386627197265625, -0.16091537475585938, -0.1479644775390625, -0.13501358032226562, -0.12206268310546875, -0.10911178588867188, -0.096160888671875, -0.08320999145507812, -0.07025909423828125, -0.057308197021484375, -0.0443572998046875, -0.031406402587890625, -0.01845550537109375, -0.005504608154296875, 0.0074462890625, 0.020397186279296875, 0.03334808349609375, 0.046298980712890625, 0.0592498779296875, 0.07220077514648438, 0.08515167236328125, 0.09810256958007812, 0.111053466796875, 0.12400436401367188, 0.13695526123046875, 0.14990615844726562, 0.1628570556640625, 0.17580795288085938, 0.18875885009765625, 0.20170974731445312, 0.21466064453125, 0.22761154174804688, 0.24056243896484375, 0.2535133361816406, 0.2664642333984375, 0.2794151306152344, 0.29236602783203125, 0.3053169250488281, 0.318267822265625, 0.3312187194824219, 0.34416961669921875, 0.3571205139160156, 0.3700714111328125, 0.3830223083496094, 0.39597320556640625, 0.4089241027832031, 0.421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 19.0, 12.0, 23.0, 11.0, 26.0, 25.0, 39.0, 49.0, 48.0, 50.0, 56.0, 54.0, 54.0, 65.0, 57.0, 68.0, 48.0, 48.0, 44.0, 57.0, 26.0, 23.0, 24.0, 19.0, 11.0, 14.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09410953521728516, -0.09135627746582031, -0.08860301971435547, -0.08584976196289062, -0.08309650421142578, -0.08034324645996094, -0.0775899887084961, -0.07483673095703125, -0.0720834732055664, -0.06933021545410156, -0.06657695770263672, -0.06382369995117188, -0.06107044219970703, -0.05831718444824219, -0.055563926696777344, -0.0528106689453125, -0.050057411193847656, -0.04730415344238281, -0.04455089569091797, -0.041797637939453125, -0.03904438018798828, -0.03629112243652344, -0.033537864685058594, -0.03078460693359375, -0.028031349182128906, -0.025278091430664062, -0.02252483367919922, -0.019771575927734375, -0.01701831817626953, -0.014265060424804688, -0.011511802673339844, -0.008758544921875, -0.006005287170410156, -0.0032520294189453125, -0.0004987716674804688, 0.002254486083984375, 0.005007743835449219, 0.0077610015869140625, 0.010514259338378906, 0.01326751708984375, 0.016020774841308594, 0.018774032592773438, 0.02152729034423828, 0.024280548095703125, 0.02703380584716797, 0.029787063598632812, 0.032540321350097656, 0.0352935791015625, 0.038046836853027344, 0.04080009460449219, 0.04355335235595703, 0.046306610107421875, 0.04905986785888672, 0.05181312561035156, 0.054566383361816406, 0.05731964111328125, 0.060072898864746094, 0.06282615661621094, 0.06557941436767578, 0.06833267211914062, 0.07108592987060547, 0.07383918762207031, 0.07659244537353516, 0.079345703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 12.0, 11.0, 12.0, 17.0, 26.0, 56.0, 64.0, 98.0, 117.0, 189.0, 306.0, 435.0, 713.0, 1249.0, 2403.0, 5105.0, 12386.0, 33092.0, 94130.0, 269507.0, 392466.0, 150165.0, 52100.0, 18757.0, 7605.0, 3242.0, 1733.0, 895.0, 551.0, 387.0, 220.0, 155.0, 110.0, 71.0, 37.0, 33.0, 25.0, 23.0, 11.0, 14.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.3818359375, -0.3706779479980469, -0.35951995849609375, -0.3483619689941406, -0.3372039794921875, -0.3260459899902344, -0.31488800048828125, -0.3037300109863281, -0.292572021484375, -0.2814140319824219, -0.27025604248046875, -0.2590980529785156, -0.2479400634765625, -0.23678207397460938, -0.22562408447265625, -0.21446609497070312, -0.20330810546875, -0.19215011596679688, -0.18099212646484375, -0.16983413696289062, -0.1586761474609375, -0.14751815795898438, -0.13636016845703125, -0.12520217895507812, -0.114044189453125, -0.10288619995117188, -0.09172821044921875, -0.08057022094726562, -0.0694122314453125, -0.058254241943359375, -0.04709625244140625, -0.035938262939453125, -0.0247802734375, -0.013622283935546875, -0.00246429443359375, 0.008693695068359375, 0.0198516845703125, 0.031009674072265625, 0.04216766357421875, 0.053325653076171875, 0.064483642578125, 0.07564163208007812, 0.08679962158203125, 0.09795761108398438, 0.1091156005859375, 0.12027359008789062, 0.13143157958984375, 0.14258956909179688, 0.15374755859375, 0.16490554809570312, 0.17606353759765625, 0.18722152709960938, 0.1983795166015625, 0.20953750610351562, 0.22069549560546875, 0.23185348510742188, 0.243011474609375, 0.2541694641113281, 0.26532745361328125, 0.2764854431152344, 0.2876434326171875, 0.2988014221191406, 0.30995941162109375, 0.3211174011230469, 0.332275390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 7.0, 9.0, 13.0, 17.0, 12.0, 16.0, 16.0, 19.0, 22.0, 39.0, 29.0, 40.0, 51.0, 36.0, 48.0, 47.0, 52.0, 57.0, 44.0, 36.0, 47.0, 40.0, 42.0, 36.0, 46.0, 22.0, 24.0, 23.0, 18.0, 19.0, 12.0, 10.0, 8.0, 9.0, 6.0, 2.0, 10.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.2962837219238281, -0.28519439697265625, -0.2741050720214844, -0.2630157470703125, -0.2519264221191406, -0.24083709716796875, -0.22974777221679688, -0.218658447265625, -0.20756912231445312, -0.19647979736328125, -0.18539047241210938, -0.1743011474609375, -0.16321182250976562, -0.15212249755859375, -0.14103317260742188, -0.12994384765625, -0.11885452270507812, -0.10776519775390625, -0.09667587280273438, -0.0855865478515625, -0.07449722290039062, -0.06340789794921875, -0.052318572998046875, -0.041229248046875, -0.030139923095703125, -0.01905059814453125, -0.007961273193359375, 0.0031280517578125, 0.014217376708984375, 0.02530670166015625, 0.036396026611328125, 0.0474853515625, 0.058574676513671875, 0.06966400146484375, 0.08075332641601562, 0.0918426513671875, 0.10293197631835938, 0.11402130126953125, 0.12511062622070312, 0.136199951171875, 0.14728927612304688, 0.15837860107421875, 0.16946792602539062, 0.1805572509765625, 0.19164657592773438, 0.20273590087890625, 0.21382522583007812, 0.22491455078125, 0.23600387573242188, 0.24709320068359375, 0.2581825256347656, 0.2692718505859375, 0.2803611755371094, 0.29145050048828125, 0.3025398254394531, 0.313629150390625, 0.3247184753417969, 0.33580780029296875, 0.3468971252441406, 0.3579864501953125, 0.3690757751464844, 0.38016510009765625, 0.3912544250488281, 0.40234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 3.0, 17.0, 10.0, 22.0, 25.0, 27.0, 44.0, 57.0, 99.0, 159.0, 267.0, 528.0, 988.0, 2075.0, 4703.0, 12394.0, 44770.0, 253012.0, 561008.0, 127038.0, 26320.0, 8321.0, 3323.0, 1455.0, 812.0, 403.0, 225.0, 137.0, 86.0, 57.0, 41.0, 38.0, 17.0, 18.0, 16.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2464599609375, -0.23927688598632812, -0.23209381103515625, -0.22491073608398438, -0.2177276611328125, -0.21054458618164062, -0.20336151123046875, -0.19617843627929688, -0.188995361328125, -0.18181228637695312, -0.17462921142578125, -0.16744613647460938, -0.1602630615234375, -0.15307998657226562, -0.14589691162109375, -0.13871383666992188, -0.13153076171875, -0.12434768676757812, -0.11716461181640625, -0.10998153686523438, -0.1027984619140625, -0.09561538696289062, -0.08843231201171875, -0.08124923706054688, -0.074066162109375, -0.06688308715820312, -0.05970001220703125, -0.052516937255859375, -0.0453338623046875, -0.038150787353515625, -0.03096771240234375, -0.023784637451171875, -0.0166015625, -0.009418487548828125, -0.00223541259765625, 0.004947662353515625, 0.0121307373046875, 0.019313812255859375, 0.02649688720703125, 0.033679962158203125, 0.040863037109375, 0.048046112060546875, 0.05522918701171875, 0.062412261962890625, 0.0695953369140625, 0.07677841186523438, 0.08396148681640625, 0.09114456176757812, 0.09832763671875, 0.10551071166992188, 0.11269378662109375, 0.11987686157226562, 0.1270599365234375, 0.13424301147460938, 0.14142608642578125, 0.14860916137695312, 0.155792236328125, 0.16297531127929688, 0.17015838623046875, 0.17734146118164062, 0.1845245361328125, 0.19170761108398438, 0.19889068603515625, 0.20607376098632812, 0.2132568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 3.0, 7.0, 3.0, 16.0, 12.0, 19.0, 26.0, 22.0, 35.0, 25.0, 48.0, 57.0, 65.0, 87.0, 91.0, 73.0, 82.0, 70.0, 50.0, 38.0, 33.0, 36.0, 24.0, 18.0, 6.0, 11.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.851289749145508e-05, -8.572917431592941e-05, -8.294545114040375e-05, -8.016172796487808e-05, -7.737800478935242e-05, -7.459428161382675e-05, -7.181055843830109e-05, -6.902683526277542e-05, -6.624311208724976e-05, -6.345938891172409e-05, -6.0675665736198425e-05, -5.789194256067276e-05, -5.5108219385147095e-05, -5.232449620962143e-05, -4.9540773034095764e-05, -4.67570498585701e-05, -4.3973326683044434e-05, -4.118960350751877e-05, -3.84058803319931e-05, -3.562215715646744e-05, -3.283843398094177e-05, -3.0054710805416107e-05, -2.7270987629890442e-05, -2.4487264454364777e-05, -2.170354127883911e-05, -1.8919818103313446e-05, -1.613609492778778e-05, -1.3352371752262115e-05, -1.056864857673645e-05, -7.784925401210785e-06, -5.00120222568512e-06, -2.2174790501594543e-06, 5.662441253662109e-07, 3.3499673008918762e-06, 6.1336904764175415e-06, 8.917413651943207e-06, 1.1701136827468872e-05, 1.4484860002994537e-05, 1.7268583178520203e-05, 2.0052306354045868e-05, 2.2836029529571533e-05, 2.56197527050972e-05, 2.8403475880622864e-05, 3.118719905614853e-05, 3.3970922231674194e-05, 3.675464540719986e-05, 3.9538368582725525e-05, 4.232209175825119e-05, 4.5105814933776855e-05, 4.788953810930252e-05, 5.0673261284828186e-05, 5.345698446035385e-05, 5.6240707635879517e-05, 5.902443081140518e-05, 6.180815398693085e-05, 6.459187716245651e-05, 6.737560033798218e-05, 7.015932351350784e-05, 7.294304668903351e-05, 7.572676986455917e-05, 7.851049304008484e-05, 8.12942162156105e-05, 8.407793939113617e-05, 8.686166256666183e-05, 8.96453857421875e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 8.0, 18.0, 12.0, 21.0, 16.0, 47.0, 64.0, 82.0, 131.0, 187.0, 303.0, 542.0, 911.0, 1755.0, 3373.0, 7466.0, 18502.0, 65114.0, 361303.0, 460041.0, 88996.0, 22726.0, 8759.0, 3844.0, 1889.0, 959.0, 521.0, 325.0, 185.0, 115.0, 96.0, 72.0, 58.0, 26.0, 25.0, 14.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1746826171875, -0.16846466064453125, -0.1622467041015625, -0.15602874755859375, -0.149810791015625, -0.14359283447265625, -0.1373748779296875, -0.13115692138671875, -0.12493896484375, -0.11872100830078125, -0.1125030517578125, -0.10628509521484375, -0.100067138671875, -0.09384918212890625, -0.0876312255859375, -0.08141326904296875, -0.0751953125, -0.06897735595703125, -0.0627593994140625, -0.05654144287109375, -0.050323486328125, -0.04410552978515625, -0.0378875732421875, -0.03166961669921875, -0.02545166015625, -0.01923370361328125, -0.0130157470703125, -0.00679779052734375, -0.000579833984375, 0.00563812255859375, 0.0118560791015625, 0.01807403564453125, 0.0242919921875, 0.03050994873046875, 0.0367279052734375, 0.04294586181640625, 0.049163818359375, 0.05538177490234375, 0.0615997314453125, 0.06781768798828125, 0.07403564453125, 0.08025360107421875, 0.0864715576171875, 0.09268951416015625, 0.098907470703125, 0.10512542724609375, 0.1113433837890625, 0.11756134033203125, 0.123779296875, 0.12999725341796875, 0.1362152099609375, 0.14243316650390625, 0.148651123046875, 0.15486907958984375, 0.1610870361328125, 0.16730499267578125, 0.17352294921875, 0.17974090576171875, 0.1859588623046875, 0.19217681884765625, 0.198394775390625, 0.20461273193359375, 0.2108306884765625, 0.21704864501953125, 0.2232666015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 2.0, 6.0, 10.0, 6.0, 11.0, 16.0, 36.0, 39.0, 58.0, 72.0, 105.0, 112.0, 120.0, 114.0, 83.0, 50.0, 36.0, 31.0, 21.0, 20.0, 9.0, 8.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1266613006591797, -0.12160873413085938, -0.11655616760253906, -0.11150360107421875, -0.10645103454589844, -0.10139846801757812, -0.09634590148925781, -0.0912933349609375, -0.08624076843261719, -0.08118820190429688, -0.07613563537597656, -0.07108306884765625, -0.06603050231933594, -0.060977935791015625, -0.05592536926269531, -0.050872802734375, -0.04582023620605469, -0.040767669677734375, -0.03571510314941406, -0.03066253662109375, -0.025609970092773438, -0.020557403564453125, -0.015504837036132812, -0.0104522705078125, -0.0053997039794921875, -0.000347137451171875, 0.0047054290771484375, 0.00975799560546875, 0.014810562133789062, 0.019863128662109375, 0.024915695190429688, 0.02996826171875, 0.03502082824707031, 0.040073394775390625, 0.04512596130371094, 0.05017852783203125, 0.05523109436035156, 0.060283660888671875, 0.06533622741699219, 0.0703887939453125, 0.07544136047363281, 0.08049392700195312, 0.08554649353027344, 0.09059906005859375, 0.09565162658691406, 0.10070419311523438, 0.10575675964355469, 0.110809326171875, 0.11586189270019531, 0.12091445922851562, 0.12596702575683594, 0.13101959228515625, 0.13607215881347656, 0.14112472534179688, 0.1461772918701172, 0.1512298583984375, 0.1562824249267578, 0.16133499145507812, 0.16638755798339844, 0.17144012451171875, 0.17649269104003906, 0.18154525756835938, 0.1865978240966797, 0.191650390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 24.0, 78.0, 161.0, 279.0, 265.0, 120.0, 51.0, 21.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.543674945831299, -7.349928379058838, -7.156182289123535, -6.962435722351074, -6.7686896324157715, -6.5749430656433105, -6.381196975708008, -6.187450408935547, -5.993703842163086, -5.799957275390625, -5.606211185455322, -5.412464618682861, -5.218718528747559, -5.024971961975098, -4.831225395202637, -4.637479305267334, -4.443733215332031, -4.24998664855957, -4.056240558624268, -3.8624939918518066, -3.668747901916504, -3.475001335144043, -3.281255006790161, -3.0875086784362793, -2.8937623500823975, -2.7000160217285156, -2.506269693374634, -2.312523365020752, -2.118776798248291, -1.9250305891036987, -1.7312841415405273, -1.5375378131866455, -1.3437910079956055, -1.1500446796417236, -0.956298291683197, -0.7625519037246704, -0.5688055753707886, -0.37505924701690674, -0.18131279945373535, 0.012433528900146484, 0.20617985725402832, 0.39992621541023254, 0.5936725735664368, 0.7874189615249634, 0.9811652898788452, 1.174911618232727, 1.3686580657958984, 1.5624043941497803, 1.756150722503662, 1.949897050857544, 2.143643379211426, 2.3373899459838867, 2.5311360359191895, 2.7248826026916504, 2.9186289310455322, 3.112375259399414, 3.306121587753296, 3.4998679161071777, 3.6936142444610596, 3.8873605728149414, 4.081107139587402, 4.274853229522705, 4.468599796295166, 4.662345886230469, 4.85609245300293]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 8.0, 6.0, 7.0, 5.0, 7.0, 3.0, 8.0, 17.0, 15.0, 12.0, 15.0, 20.0, 23.0, 12.0, 35.0, 31.0, 26.0, 29.0, 41.0, 41.0, 29.0, 43.0, 44.0, 44.0, 56.0, 25.0, 42.0, 41.0, 41.0, 28.0, 29.0, 22.0, 21.0, 20.0, 21.0, 23.0, 17.0, 20.0, 8.0, 11.0, 15.0, 7.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.6317119598388672, -1.5812482833862305, -1.5307846069335938, -1.4803208112716675, -1.4298571348190308, -1.379393458366394, -1.3289297819137573, -1.278465986251831, -1.2280023097991943, -1.1775386333465576, -1.127074956893921, -1.0766111612319946, -1.026147484779358, -0.9756838083267212, -0.9252201318740845, -0.874756395816803, -0.8242927193641663, -0.7738290429115295, -0.723365306854248, -0.6729016304016113, -0.6224378943443298, -0.5719742178916931, -0.5215104818344116, -0.4710468053817749, -0.4205830991268158, -0.3701193928718567, -0.3196556866168976, -0.2691919803619385, -0.21872828900814056, -0.16826459765434265, -0.11780089139938354, -0.06733718514442444, -0.016873478889465332, 0.033590223640203476, 0.08405392616987228, 0.1345176249742508, 0.1849813312292099, 0.2354450225830078, 0.2859087288379669, 0.336372435092926, 0.38683614134788513, 0.43729984760284424, 0.48776355385780334, 0.5382272601127625, 0.5886909365653992, 0.6391546726226807, 0.6896183490753174, 0.7400820255279541, 0.7905457615852356, 0.8410094380378723, 0.8914731740951538, 0.9419368505477905, 0.992400586605072, 1.0428643226623535, 1.0933279991149902, 1.143791675567627, 1.1942553520202637, 1.2447190284729004, 1.295182704925537, 1.3456465005874634, 1.3961101770401, 1.4465738534927368, 1.4970375299453735, 1.5475013256072998, 1.5979650020599365]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 8.0, 5.0, 12.0, 13.0, 13.0, 23.0, 22.0, 43.0, 51.0, 80.0, 125.0, 175.0, 262.0, 380.0, 601.0, 1062.0, 1775.0, 3299.0, 6829.0, 15284.0, 42081.0, 181016.0, 3594070.0, 260992.0, 51674.0, 17752.0, 7748.0, 3826.0, 2006.0, 1137.0, 642.0, 408.0, 274.0, 165.0, 136.0, 85.0, 48.0, 48.0, 32.0, 17.0, 11.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.33349609375, -0.3232612609863281, -0.31302642822265625, -0.3027915954589844, -0.2925567626953125, -0.2823219299316406, -0.27208709716796875, -0.2618522644042969, -0.251617431640625, -0.24138259887695312, -0.23114776611328125, -0.22091293334960938, -0.2106781005859375, -0.20044326782226562, -0.19020843505859375, -0.17997360229492188, -0.16973876953125, -0.15950393676757812, -0.14926910400390625, -0.13903427124023438, -0.1287994384765625, -0.11856460571289062, -0.10832977294921875, -0.09809494018554688, -0.087860107421875, -0.07762527465820312, -0.06739044189453125, -0.057155609130859375, -0.0469207763671875, -0.036685943603515625, -0.02645111083984375, -0.016216278076171875, -0.0059814453125, 0.004253387451171875, 0.01448822021484375, 0.024723052978515625, 0.0349578857421875, 0.045192718505859375, 0.05542755126953125, 0.06566238403320312, 0.075897216796875, 0.08613204956054688, 0.09636688232421875, 0.10660171508789062, 0.1168365478515625, 0.12707138061523438, 0.13730621337890625, 0.14754104614257812, 0.15777587890625, 0.16801071166992188, 0.17824554443359375, 0.18848037719726562, 0.1987152099609375, 0.20895004272460938, 0.21918487548828125, 0.22941970825195312, 0.239654541015625, 0.24988937377929688, 0.26012420654296875, 0.2703590393066406, 0.2805938720703125, 0.2908287048339844, 0.30106353759765625, 0.3112983703613281, 0.321533203125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 11.0, 12.0, 14.0, 22.0, 23.0, 37.0, 16.0, 37.0, 55.0, 33.0, 59.0, 66.0, 62.0, 49.0, 51.0, 57.0, 62.0, 51.0, 38.0, 36.0, 43.0, 29.0, 33.0, 17.0, 17.0, 17.0, 11.0, 9.0, 8.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09954833984375, -0.09669303894042969, -0.09383773803710938, -0.09098243713378906, -0.08812713623046875, -0.08527183532714844, -0.08241653442382812, -0.07956123352050781, -0.0767059326171875, -0.07385063171386719, -0.07099533081054688, -0.06814002990722656, -0.06528472900390625, -0.06242942810058594, -0.059574127197265625, -0.05671882629394531, -0.053863525390625, -0.05100822448730469, -0.048152923583984375, -0.04529762268066406, -0.04244232177734375, -0.03958702087402344, -0.036731719970703125, -0.03387641906738281, -0.0310211181640625, -0.028165817260742188, -0.025310516357421875, -0.022455215454101562, -0.01959991455078125, -0.016744613647460938, -0.013889312744140625, -0.011034011840820312, -0.0081787109375, -0.0053234100341796875, -0.002468109130859375, 0.0003871917724609375, 0.00324249267578125, 0.0060977935791015625, 0.008953094482421875, 0.011808395385742188, 0.0146636962890625, 0.017518997192382812, 0.020374298095703125, 0.023229598999023438, 0.02608489990234375, 0.028940200805664062, 0.031795501708984375, 0.03465080261230469, 0.037506103515625, 0.04036140441894531, 0.043216705322265625, 0.04607200622558594, 0.04892730712890625, 0.05178260803222656, 0.054637908935546875, 0.05749320983886719, 0.0603485107421875, 0.06320381164550781, 0.06605911254882812, 0.06891441345214844, 0.07176971435546875, 0.07462501525878906, 0.07748031616210938, 0.08033561706542969, 0.08319091796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 14.0, 18.0, 30.0, 30.0, 42.0, 79.0, 100.0, 176.0, 254.0, 464.0, 667.0, 1259.0, 2158.0, 4120.0, 8424.0, 17619.0, 42692.0, 126008.0, 943593.0, 2782044.0, 170252.0, 52563.0, 21235.0, 9785.0, 4737.0, 2454.0, 1382.0, 782.0, 505.0, 271.0, 179.0, 124.0, 68.0, 52.0, 31.0, 27.0, 11.0, 6.0, 9.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.289794921875, -0.2812995910644531, -0.27280426025390625, -0.2643089294433594, -0.2558135986328125, -0.24731826782226562, -0.23882293701171875, -0.23032760620117188, -0.221832275390625, -0.21333694458007812, -0.20484161376953125, -0.19634628295898438, -0.1878509521484375, -0.17935562133789062, -0.17086029052734375, -0.16236495971679688, -0.15386962890625, -0.14537429809570312, -0.13687896728515625, -0.12838363647460938, -0.1198883056640625, -0.11139297485351562, -0.10289764404296875, -0.09440231323242188, -0.085906982421875, -0.07741165161132812, -0.06891632080078125, -0.060420989990234375, -0.0519256591796875, -0.043430328369140625, -0.03493499755859375, -0.026439666748046875, -0.0179443359375, -0.009449005126953125, -0.00095367431640625, 0.007541656494140625, 0.0160369873046875, 0.024532318115234375, 0.03302764892578125, 0.041522979736328125, 0.050018310546875, 0.058513641357421875, 0.06700897216796875, 0.07550430297851562, 0.0839996337890625, 0.09249496459960938, 0.10099029541015625, 0.10948562622070312, 0.11798095703125, 0.12647628784179688, 0.13497161865234375, 0.14346694946289062, 0.1519622802734375, 0.16045761108398438, 0.16895294189453125, 0.17744827270507812, 0.185943603515625, 0.19443893432617188, 0.20293426513671875, 0.21142959594726562, 0.2199249267578125, 0.22842025756835938, 0.23691558837890625, 0.24541091918945312, 0.25390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 10.0, 8.0, 18.0, 23.0, 34.0, 38.0, 48.0, 70.0, 105.0, 250.0, 565.0, 1859.0, 464.0, 205.0, 93.0, 66.0, 53.0, 39.0, 20.0, 24.0, 15.0, 11.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.1294078826904297, -0.12514877319335938, -0.12088966369628906, -0.11663055419921875, -0.11237144470214844, -0.10811233520507812, -0.10385322570800781, -0.0995941162109375, -0.09533500671386719, -0.09107589721679688, -0.08681678771972656, -0.08255767822265625, -0.07829856872558594, -0.07403945922851562, -0.06978034973144531, -0.065521240234375, -0.06126213073730469, -0.057003021240234375, -0.05274391174316406, -0.04848480224609375, -0.04422569274902344, -0.039966583251953125, -0.03570747375488281, -0.0314483642578125, -0.027189254760742188, -0.022930145263671875, -0.018671035766601562, -0.01441192626953125, -0.010152816772460938, -0.005893707275390625, -0.0016345977783203125, 0.00262451171875, 0.0068836212158203125, 0.011142730712890625, 0.015401840209960938, 0.01966094970703125, 0.023920059204101562, 0.028179168701171875, 0.03243827819824219, 0.0366973876953125, 0.04095649719238281, 0.045215606689453125, 0.04947471618652344, 0.05373382568359375, 0.05799293518066406, 0.062252044677734375, 0.06651115417480469, 0.070770263671875, 0.07502937316894531, 0.07928848266601562, 0.08354759216308594, 0.08780670166015625, 0.09206581115722656, 0.09632492065429688, 0.10058403015136719, 0.1048431396484375, 0.10910224914550781, 0.11336135864257812, 0.11762046813964844, 0.12187957763671875, 0.12613868713378906, 0.13039779663085938, 0.1346569061279297, 0.138916015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 8.0, 14.0, 18.0, 33.0, 45.0, 81.0, 103.0, 115.0, 144.0, 135.0, 95.0, 77.0, 58.0, 32.0, 16.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9768815636634827, -0.9480293989181519, -0.9191772937774658, -0.8903251886367798, -0.861473023891449, -0.8326208591461182, -0.8037687540054321, -0.7749166488647461, -0.7460644841194153, -0.7172123193740845, -0.6883602142333984, -0.6595081090927124, -0.6306559443473816, -0.6018037796020508, -0.5729516744613647, -0.5440995693206787, -0.5152474045753479, -0.4863952696323395, -0.45754313468933105, -0.42869099974632263, -0.3998388648033142, -0.3709867298603058, -0.34213459491729736, -0.31328245997428894, -0.2844303250312805, -0.2555781900882721, -0.22672605514526367, -0.19787392020225525, -0.16902178525924683, -0.1401696503162384, -0.11131751537322998, -0.08246538043022156, -0.053613245487213135, -0.024761110544204712, 0.004091024398803711, 0.032943159341812134, 0.06179529428482056, 0.09064742922782898, 0.1194995641708374, 0.14835169911384583, 0.17720383405685425, 0.20605596899986267, 0.2349081039428711, 0.2637602388858795, 0.29261237382888794, 0.32146450877189636, 0.3503166437149048, 0.3791687786579132, 0.40802091360092163, 0.43687304854393005, 0.4657251834869385, 0.4945773184299469, 0.5234294533729553, 0.5522816181182861, 0.5811337232589722, 0.6099858283996582, 0.638837993144989, 0.6676901578903198, 0.6965422630310059, 0.7253943681716919, 0.7542465329170227, 0.7830986976623535, 0.8119508028030396, 0.8408029079437256, 0.8696550726890564]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 10.0, 10.0, 16.0, 17.0, 17.0, 16.0, 27.0, 30.0, 37.0, 38.0, 32.0, 46.0, 41.0, 51.0, 54.0, 59.0, 56.0, 56.0, 60.0, 50.0, 49.0, 27.0, 36.0, 32.0, 25.0, 28.0, 15.0, 10.0, 10.0, 14.0, 4.0, 7.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6143176555633545, -0.59740149974823, -0.5804852843284607, -0.5635691285133362, -0.5466529726982117, -0.5297367572784424, -0.5128206014633179, -0.49590444564819336, -0.47898826003074646, -0.46207207441329956, -0.44515591859817505, -0.42823973298072815, -0.41132354736328125, -0.39440739154815674, -0.37749120593070984, -0.36057502031326294, -0.3436588644981384, -0.32674267888069153, -0.309826523065567, -0.2929103374481201, -0.2759941816329956, -0.2590779960155487, -0.2421618103981018, -0.2252456396818161, -0.2083294689655304, -0.1914132982492447, -0.17449712753295898, -0.15758094191551208, -0.14066477119922638, -0.12374860048294067, -0.10683242231607437, -0.08991624414920807, -0.07300001382827759, -0.056083839386701584, -0.03916766494512558, -0.022251490503549576, -0.005335316061973572, 0.011580854654312134, 0.028497032821178436, 0.04541321098804474, 0.062329381704330444, 0.07924555242061615, 0.09616173058748245, 0.11307790875434875, 0.12999407947063446, 0.14691025018692017, 0.16382643580436707, 0.18074260652065277, 0.19765877723693848, 0.21457494795322418, 0.2314911186695099, 0.2484073042869568, 0.2653234601020813, 0.2822396457195282, 0.2991558313369751, 0.3160719871520996, 0.3329881727695465, 0.3499043583869934, 0.3668205142021179, 0.3837366998195648, 0.4006528854370117, 0.41756904125213623, 0.43448522686958313, 0.45140141248703003, 0.46831756830215454]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 9.0, 12.0, 17.0, 22.0, 30.0, 42.0, 70.0, 106.0, 149.0, 225.0, 395.0, 653.0, 1104.0, 1965.0, 3811.0, 7660.0, 16502.0, 37485.0, 90838.0, 218776.0, 355663.0, 179963.0, 74039.0, 31197.0, 13824.0, 6408.0, 3349.0, 1782.0, 975.0, 538.0, 308.0, 175.0, 153.0, 91.0, 70.0, 40.0, 23.0, 22.0, 17.0, 13.0, 6.0, 7.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357421875, -0.3463859558105469, -0.33535003662109375, -0.3243141174316406, -0.3132781982421875, -0.3022422790527344, -0.29120635986328125, -0.2801704406738281, -0.269134521484375, -0.2580986022949219, -0.24706268310546875, -0.23602676391601562, -0.2249908447265625, -0.21395492553710938, -0.20291900634765625, -0.19188308715820312, -0.18084716796875, -0.16981124877929688, -0.15877532958984375, -0.14773941040039062, -0.1367034912109375, -0.12566757202148438, -0.11463165283203125, -0.10359573364257812, -0.092559814453125, -0.08152389526367188, -0.07048797607421875, -0.059452056884765625, -0.0484161376953125, -0.037380218505859375, -0.02634429931640625, -0.015308380126953125, -0.0042724609375, 0.006763458251953125, 0.01779937744140625, 0.028835296630859375, 0.0398712158203125, 0.050907135009765625, 0.06194305419921875, 0.07297897338867188, 0.084014892578125, 0.09505081176757812, 0.10608673095703125, 0.11712265014648438, 0.1281585693359375, 0.13919448852539062, 0.15023040771484375, 0.16126632690429688, 0.17230224609375, 0.18333816528320312, 0.19437408447265625, 0.20541000366210938, 0.2164459228515625, 0.22748184204101562, 0.23851776123046875, 0.24955368041992188, 0.260589599609375, 0.2716255187988281, 0.28266143798828125, 0.2936973571777344, 0.3047332763671875, 0.3157691955566406, 0.32680511474609375, 0.3378410339355469, 0.348876953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 6.0, 9.0, 7.0, 23.0, 16.0, 25.0, 30.0, 25.0, 40.0, 45.0, 43.0, 63.0, 46.0, 58.0, 49.0, 56.0, 58.0, 55.0, 47.0, 60.0, 40.0, 38.0, 25.0, 16.0, 37.0, 14.0, 15.0, 14.0, 11.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09770965576171875, -0.0948333740234375, -0.09195709228515625, -0.089080810546875, -0.08620452880859375, -0.0833282470703125, -0.08045196533203125, -0.07757568359375, -0.07469940185546875, -0.0718231201171875, -0.06894683837890625, -0.066070556640625, -0.06319427490234375, -0.0603179931640625, -0.05744171142578125, -0.0545654296875, -0.05168914794921875, -0.0488128662109375, -0.04593658447265625, -0.043060302734375, -0.04018402099609375, -0.0373077392578125, -0.03443145751953125, -0.03155517578125, -0.02867889404296875, -0.0258026123046875, -0.02292633056640625, -0.020050048828125, -0.01717376708984375, -0.0142974853515625, -0.01142120361328125, -0.008544921875, -0.00566864013671875, -0.0027923583984375, 8.392333984375e-05, 0.002960205078125, 0.00583648681640625, 0.0087127685546875, 0.01158905029296875, 0.01446533203125, 0.01734161376953125, 0.0202178955078125, 0.02309417724609375, 0.025970458984375, 0.02884674072265625, 0.0317230224609375, 0.03459930419921875, 0.0374755859375, 0.04035186767578125, 0.0432281494140625, 0.04610443115234375, 0.048980712890625, 0.05185699462890625, 0.0547332763671875, 0.05760955810546875, 0.06048583984375, 0.06336212158203125, 0.0662384033203125, 0.06911468505859375, 0.071990966796875, 0.07486724853515625, 0.0777435302734375, 0.08061981201171875, 0.08349609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 15.0, 13.0, 12.0, 14.0, 22.0, 37.0, 36.0, 57.0, 69.0, 91.0, 95.0, 159.0, 191.0, 268.0, 430.0, 626.0, 1038.0, 2026.0, 4747.0, 14116.0, 48729.0, 175023.0, 457098.0, 242639.0, 69256.0, 19251.0, 6339.0, 2481.0, 1229.0, 736.0, 488.0, 294.0, 192.0, 170.0, 137.0, 100.0, 70.0, 47.0, 45.0, 35.0, 21.0, 22.0, 26.0, 9.0, 7.0, 10.0, 5.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.38916015625, -0.37723541259765625, -0.3653106689453125, -0.35338592529296875, -0.341461181640625, -0.32953643798828125, -0.3176116943359375, -0.30568695068359375, -0.29376220703125, -0.28183746337890625, -0.2699127197265625, -0.25798797607421875, -0.246063232421875, -0.23413848876953125, -0.2222137451171875, -0.21028900146484375, -0.1983642578125, -0.18643951416015625, -0.1745147705078125, -0.16259002685546875, -0.150665283203125, -0.13874053955078125, -0.1268157958984375, -0.11489105224609375, -0.10296630859375, -0.09104156494140625, -0.0791168212890625, -0.06719207763671875, -0.055267333984375, -0.04334259033203125, -0.0314178466796875, -0.01949310302734375, -0.007568359375, 0.00435638427734375, 0.0162811279296875, 0.02820587158203125, 0.040130615234375, 0.05205535888671875, 0.0639801025390625, 0.07590484619140625, 0.08782958984375, 0.09975433349609375, 0.1116790771484375, 0.12360382080078125, 0.135528564453125, 0.14745330810546875, 0.1593780517578125, 0.17130279541015625, 0.1832275390625, 0.19515228271484375, 0.2070770263671875, 0.21900177001953125, 0.230926513671875, 0.24285125732421875, 0.2547760009765625, 0.26670074462890625, 0.27862548828125, 0.29055023193359375, 0.3024749755859375, 0.31439971923828125, 0.326324462890625, 0.33824920654296875, 0.3501739501953125, 0.36209869384765625, 0.3740234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 7.0, 4.0, 5.0, 7.0, 11.0, 11.0, 20.0, 26.0, 27.0, 29.0, 21.0, 29.0, 28.0, 43.0, 44.0, 49.0, 41.0, 44.0, 49.0, 42.0, 49.0, 45.0, 56.0, 41.0, 47.0, 33.0, 31.0, 26.0, 23.0, 10.0, 17.0, 24.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.375732421875, -0.3642005920410156, -0.35266876220703125, -0.3411369323730469, -0.3296051025390625, -0.3180732727050781, -0.30654144287109375, -0.2950096130371094, -0.283477783203125, -0.2719459533691406, -0.26041412353515625, -0.24888229370117188, -0.2373504638671875, -0.22581863403320312, -0.21428680419921875, -0.20275497436523438, -0.19122314453125, -0.17969131469726562, -0.16815948486328125, -0.15662765502929688, -0.1450958251953125, -0.13356399536132812, -0.12203216552734375, -0.11050033569335938, -0.098968505859375, -0.08743667602539062, -0.07590484619140625, -0.06437301635742188, -0.0528411865234375, -0.041309356689453125, -0.02977752685546875, -0.018245697021484375, -0.0067138671875, 0.004817962646484375, 0.01634979248046875, 0.027881622314453125, 0.0394134521484375, 0.050945281982421875, 0.06247711181640625, 0.07400894165039062, 0.085540771484375, 0.09707260131835938, 0.10860443115234375, 0.12013626098632812, 0.1316680908203125, 0.14319992065429688, 0.15473175048828125, 0.16626358032226562, 0.17779541015625, 0.18932723999023438, 0.20085906982421875, 0.21239089965820312, 0.2239227294921875, 0.23545455932617188, 0.24698638916015625, 0.2585182189941406, 0.270050048828125, 0.2815818786621094, 0.29311370849609375, 0.3046455383300781, 0.3161773681640625, 0.3277091979980469, 0.33924102783203125, 0.3507728576660156, 0.3623046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 12.0, 14.0, 26.0, 35.0, 50.0, 112.0, 176.0, 397.0, 705.0, 1667.0, 4826.0, 16776.0, 95970.0, 750650.0, 146071.0, 21411.0, 5851.0, 2012.0, 836.0, 408.0, 237.0, 106.0, 77.0, 38.0, 29.0, 21.0, 9.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.294403076171875, -0.28192138671875, -0.269439697265625, -0.2569580078125, -0.244476318359375, -0.23199462890625, -0.219512939453125, -0.20703125, -0.194549560546875, -0.18206787109375, -0.169586181640625, -0.1571044921875, -0.144622802734375, -0.13214111328125, -0.119659423828125, -0.107177734375, -0.094696044921875, -0.08221435546875, -0.069732666015625, -0.0572509765625, -0.044769287109375, -0.03228759765625, -0.019805908203125, -0.00732421875, 0.005157470703125, 0.01763916015625, 0.030120849609375, 0.0426025390625, 0.055084228515625, 0.06756591796875, 0.080047607421875, 0.092529296875, 0.105010986328125, 0.11749267578125, 0.129974365234375, 0.1424560546875, 0.154937744140625, 0.16741943359375, 0.179901123046875, 0.1923828125, 0.204864501953125, 0.21734619140625, 0.229827880859375, 0.2423095703125, 0.254791259765625, 0.26727294921875, 0.279754638671875, 0.292236328125, 0.304718017578125, 0.31719970703125, 0.329681396484375, 0.3421630859375, 0.354644775390625, 0.36712646484375, 0.379608154296875, 0.39208984375, 0.404571533203125, 0.41705322265625, 0.429534912109375, 0.4420166015625, 0.454498291015625, 0.46697998046875, 0.479461669921875, 0.491943359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 12.0, 26.0, 31.0, 27.0, 52.0, 69.0, 80.0, 95.0, 109.0, 101.0, 95.0, 76.0, 55.0, 58.0, 30.0, 20.0, 15.0, 16.0, 4.0, 1.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010794401168823242, -0.00010433513671159744, -0.00010072626173496246, -9.711738675832748e-05, -9.35085117816925e-05, -8.989963680505753e-05, -8.629076182842255e-05, -8.268188685178757e-05, -7.907301187515259e-05, -7.546413689851761e-05, -7.185526192188263e-05, -6.824638694524765e-05, -6.463751196861267e-05, -6.102863699197769e-05, -5.741976201534271e-05, -5.381088703870773e-05, -5.0202012062072754e-05, -4.6593137085437775e-05, -4.2984262108802795e-05, -3.9375387132167816e-05, -3.576651215553284e-05, -3.215763717889786e-05, -2.854876220226288e-05, -2.49398872256279e-05, -2.133101224899292e-05, -1.772213727235794e-05, -1.4113262295722961e-05, -1.0504387319087982e-05, -6.895512342453003e-06, -3.2866373658180237e-06, 3.2223761081695557e-07, 3.931112587451935e-06, 7.539987564086914e-06, 1.1148862540721893e-05, 1.4757737517356873e-05, 1.8366612493991852e-05, 2.197548747062683e-05, 2.558436244726181e-05, 2.919323742389679e-05, 3.280211240053177e-05, 3.641098737716675e-05, 4.001986235380173e-05, 4.3628737330436707e-05, 4.7237612307071686e-05, 5.0846487283706665e-05, 5.4455362260341644e-05, 5.8064237236976624e-05, 6.16731122136116e-05, 6.528198719024658e-05, 6.889086216688156e-05, 7.249973714351654e-05, 7.610861212015152e-05, 7.97174870967865e-05, 8.332636207342148e-05, 8.693523705005646e-05, 9.054411202669144e-05, 9.415298700332642e-05, 9.77618619799614e-05, 0.00010137073695659637, 0.00010497961193323135, 0.00010858848690986633, 0.00011219736188650131, 0.00011580623686313629, 0.00011941511183977127, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 11.0, 8.0, 13.0, 22.0, 34.0, 37.0, 51.0, 47.0, 116.0, 203.0, 318.0, 568.0, 1203.0, 2461.0, 5890.0, 18347.0, 77814.0, 653983.0, 234940.0, 34990.0, 10160.0, 3685.0, 1635.0, 852.0, 444.0, 231.0, 146.0, 101.0, 52.0, 45.0, 30.0, 18.0, 23.0, 11.0, 15.0, 10.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.322998046875, -0.3128242492675781, -0.30265045166015625, -0.2924766540527344, -0.2823028564453125, -0.2721290588378906, -0.26195526123046875, -0.2517814636230469, -0.241607666015625, -0.23143386840820312, -0.22126007080078125, -0.21108627319335938, -0.2009124755859375, -0.19073867797851562, -0.18056488037109375, -0.17039108276367188, -0.16021728515625, -0.15004348754882812, -0.13986968994140625, -0.12969589233398438, -0.1195220947265625, -0.10934829711914062, -0.09917449951171875, -0.08900070190429688, -0.078826904296875, -0.06865310668945312, -0.05847930908203125, -0.048305511474609375, -0.0381317138671875, -0.027957916259765625, -0.01778411865234375, -0.007610321044921875, 0.0025634765625, 0.012737274169921875, 0.02291107177734375, 0.033084869384765625, 0.0432586669921875, 0.053432464599609375, 0.06360626220703125, 0.07378005981445312, 0.083953857421875, 0.09412765502929688, 0.10430145263671875, 0.11447525024414062, 0.1246490478515625, 0.13482284545898438, 0.14499664306640625, 0.15517044067382812, 0.16534423828125, 0.17551803588867188, 0.18569183349609375, 0.19586563110351562, 0.2060394287109375, 0.21621322631835938, 0.22638702392578125, 0.23656082153320312, 0.246734619140625, 0.2569084167480469, 0.26708221435546875, 0.2772560119628906, 0.2874298095703125, 0.2976036071777344, 0.30777740478515625, 0.3179512023925781, 0.328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 12.0, 4.0, 10.0, 13.0, 17.0, 13.0, 27.0, 42.0, 57.0, 104.0, 115.0, 135.0, 124.0, 82.0, 58.0, 43.0, 33.0, 18.0, 15.0, 13.0, 8.0, 11.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2060546875, -0.1990814208984375, -0.192108154296875, -0.1851348876953125, -0.17816162109375, -0.1711883544921875, -0.164215087890625, -0.1572418212890625, -0.1502685546875, -0.1432952880859375, -0.136322021484375, -0.1293487548828125, -0.12237548828125, -0.1154022216796875, -0.108428955078125, -0.1014556884765625, -0.094482421875, -0.0875091552734375, -0.080535888671875, -0.0735626220703125, -0.06658935546875, -0.0596160888671875, -0.052642822265625, -0.0456695556640625, -0.0386962890625, -0.0317230224609375, -0.024749755859375, -0.0177764892578125, -0.01080322265625, -0.0038299560546875, 0.003143310546875, 0.0101165771484375, 0.01708984375, 0.0240631103515625, 0.031036376953125, 0.0380096435546875, 0.04498291015625, 0.0519561767578125, 0.058929443359375, 0.0659027099609375, 0.0728759765625, 0.0798492431640625, 0.086822509765625, 0.0937957763671875, 0.10076904296875, 0.1077423095703125, 0.114715576171875, 0.1216888427734375, 0.128662109375, 0.1356353759765625, 0.142608642578125, 0.1495819091796875, 0.15655517578125, 0.1635284423828125, 0.170501708984375, 0.1774749755859375, 0.1844482421875, 0.1914215087890625, 0.198394775390625, 0.2053680419921875, 0.21234130859375, 0.2193145751953125, 0.226287841796875, 0.2332611083984375, 0.240234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 25.0, 56.0, 175.0, 258.0, 268.0, 124.0, 58.0, 19.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.959728240966797, -6.760721683502197, -6.561715602874756, -6.362709045410156, -6.163702487945557, -5.964695930480957, -5.765689849853516, -5.566683292388916, -5.367676734924316, -5.168670177459717, -4.969664096832275, -4.770657539367676, -4.571650981903076, -4.372644424438477, -4.173638343811035, -3.9746317863464355, -3.775625467300415, -3.5766191482543945, -3.377612590789795, -3.1786062717437744, -2.979599714279175, -2.7805933952331543, -2.5815868377685547, -2.382580518722534, -2.1835741996765137, -1.9845677614212036, -1.7855613231658936, -1.586555004119873, -1.3875484466552734, -1.188542127609253, -0.9895356893539429, -0.7905292510986328, -0.5915226936340332, -0.39251625537872314, -0.19350984692573547, 0.005496561527252197, 0.20450299978256226, 0.4035094380378723, 0.6025158166885376, 0.8015222549438477, 1.0005286931991577, 1.1995351314544678, 1.3985415697097778, 1.597548007965088, 1.7965543270111084, 1.995560884475708, 2.1945672035217285, 2.393573760986328, 2.5925800800323486, 2.791586399078369, 2.9905929565429688, 3.1895992755889893, 3.388605833053589, 3.5876121520996094, 3.786618709564209, 3.9856250286102295, 4.18463134765625, 4.38363790512085, 4.582643985748291, 4.781650543212891, 4.98065710067749, 5.17966365814209, 5.378669738769531, 5.577676296234131, 5.7766828536987305]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 3.0, 2.0, 6.0, 5.0, 14.0, 15.0, 20.0, 12.0, 17.0, 17.0, 27.0, 29.0, 34.0, 41.0, 38.0, 43.0, 50.0, 40.0, 63.0, 50.0, 44.0, 57.0, 46.0, 33.0, 39.0, 41.0, 23.0, 25.0, 16.0, 30.0, 29.0, 17.0, 16.0, 12.0, 15.0, 9.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.408890724182129, -2.3427348136901855, -2.2765791416168213, -2.210423231124878, -2.1442675590515137, -2.0781116485595703, -2.011955976486206, -1.9458000659942627, -1.8796442747116089, -1.813488483428955, -1.7473326921463013, -1.6811769008636475, -1.615020990371704, -1.5488653182983398, -1.4827094078063965, -1.4165536165237427, -1.3503978252410889, -1.284242033958435, -1.2180862426757812, -1.1519304513931274, -1.0857746601104736, -1.0196187496185303, -0.9534629583358765, -0.8873071670532227, -0.8211513757705688, -0.754995584487915, -0.6888397932052612, -0.6226839423179626, -0.5565281510353088, -0.49037235975265503, -0.42421653866767883, -0.35806071758270264, -0.2919048070907593, -0.22574900090694427, -0.15959319472312927, -0.09343738853931427, -0.027281582355499268, 0.03887420892715454, 0.10503003001213074, 0.17118585109710693, 0.23734164237976074, 0.30349743366241455, 0.36965325474739075, 0.43580907583236694, 0.5019648671150208, 0.5681206583976746, 0.6342765092849731, 0.700432300567627, 0.7665880918502808, 0.8327438831329346, 0.8988996744155884, 0.965055525302887, 1.0312113761901855, 1.0973670482635498, 1.1635229587554932, 1.229678750038147, 1.2958345413208008, 1.3619903326034546, 1.4281461238861084, 1.4943019151687622, 1.560457706451416, 1.6266136169433594, 1.6927694082260132, 1.758925199508667, 1.8250809907913208]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 13.0, 6.0, 28.0, 37.0, 42.0, 71.0, 82.0, 110.0, 135.0, 236.0, 358.0, 579.0, 978.0, 1544.0, 2767.0, 5283.0, 10358.0, 21986.0, 55126.0, 196142.0, 3297933.0, 451735.0, 87922.0, 31758.0, 13668.0, 6909.0, 3656.0, 1919.0, 1096.0, 632.0, 376.0, 261.0, 157.0, 127.0, 73.0, 50.0, 41.0, 24.0, 16.0, 14.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.337890625, -0.3278656005859375, -0.317840576171875, -0.3078155517578125, -0.29779052734375, -0.2877655029296875, -0.277740478515625, -0.2677154541015625, -0.2576904296875, -0.2476654052734375, -0.237640380859375, -0.2276153564453125, -0.21759033203125, -0.2075653076171875, -0.197540283203125, -0.1875152587890625, -0.177490234375, -0.1674652099609375, -0.157440185546875, -0.1474151611328125, -0.13739013671875, -0.1273651123046875, -0.117340087890625, -0.1073150634765625, -0.0972900390625, -0.0872650146484375, -0.077239990234375, -0.0672149658203125, -0.05718994140625, -0.0471649169921875, -0.037139892578125, -0.0271148681640625, -0.01708984375, -0.0070648193359375, 0.002960205078125, 0.0129852294921875, 0.02301025390625, 0.0330352783203125, 0.043060302734375, 0.0530853271484375, 0.0631103515625, 0.0731353759765625, 0.083160400390625, 0.0931854248046875, 0.10321044921875, 0.1132354736328125, 0.123260498046875, 0.1332855224609375, 0.143310546875, 0.1533355712890625, 0.163360595703125, 0.1733856201171875, 0.18341064453125, 0.1934356689453125, 0.203460693359375, 0.2134857177734375, 0.2235107421875, 0.2335357666015625, 0.243560791015625, 0.2535858154296875, 0.26361083984375, 0.2736358642578125, 0.283660888671875, 0.2936859130859375, 0.3037109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 3.0, 9.0, 9.0, 13.0, 15.0, 22.0, 17.0, 30.0, 38.0, 28.0, 22.0, 44.0, 39.0, 36.0, 47.0, 49.0, 44.0, 38.0, 56.0, 44.0, 44.0, 45.0, 37.0, 38.0, 33.0, 24.0, 31.0, 25.0, 24.0, 21.0, 12.0, 10.0, 8.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0919189453125, -0.0893096923828125, -0.086700439453125, -0.0840911865234375, -0.08148193359375, -0.0788726806640625, -0.076263427734375, -0.0736541748046875, -0.071044921875, -0.0684356689453125, -0.065826416015625, -0.0632171630859375, -0.06060791015625, -0.0579986572265625, -0.055389404296875, -0.0527801513671875, -0.0501708984375, -0.0475616455078125, -0.044952392578125, -0.0423431396484375, -0.03973388671875, -0.0371246337890625, -0.034515380859375, -0.0319061279296875, -0.029296875, -0.0266876220703125, -0.024078369140625, -0.0214691162109375, -0.01885986328125, -0.0162506103515625, -0.013641357421875, -0.0110321044921875, -0.0084228515625, -0.0058135986328125, -0.003204345703125, -0.0005950927734375, 0.00201416015625, 0.0046234130859375, 0.007232666015625, 0.0098419189453125, 0.012451171875, 0.0150604248046875, 0.017669677734375, 0.0202789306640625, 0.02288818359375, 0.0254974365234375, 0.028106689453125, 0.0307159423828125, 0.0333251953125, 0.0359344482421875, 0.038543701171875, 0.0411529541015625, 0.04376220703125, 0.0463714599609375, 0.048980712890625, 0.0515899658203125, 0.05419921875, 0.0568084716796875, 0.059417724609375, 0.0620269775390625, 0.06463623046875, 0.0672454833984375, 0.069854736328125, 0.0724639892578125, 0.0750732421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 12.0, 8.0, 14.0, 29.0, 42.0, 71.0, 125.0, 180.0, 265.0, 436.0, 694.0, 1254.0, 2120.0, 4281.0, 8749.0, 19859.0, 54918.0, 209763.0, 2977486.0, 735644.0, 115217.0, 35767.0, 14031.0, 6192.0, 3007.0, 1707.0, 943.0, 534.0, 334.0, 219.0, 137.0, 73.0, 68.0, 48.0, 20.0, 14.0, 5.0, 4.0, 2.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.365478515625, -0.3555450439453125, -0.345611572265625, -0.3356781005859375, -0.32574462890625, -0.3158111572265625, -0.305877685546875, -0.2959442138671875, -0.2860107421875, -0.2760772705078125, -0.266143798828125, -0.2562103271484375, -0.24627685546875, -0.2363433837890625, -0.226409912109375, -0.2164764404296875, -0.20654296875, -0.1966094970703125, -0.186676025390625, -0.1767425537109375, -0.16680908203125, -0.1568756103515625, -0.146942138671875, -0.1370086669921875, -0.1270751953125, -0.1171417236328125, -0.107208251953125, -0.0972747802734375, -0.08734130859375, -0.0774078369140625, -0.067474365234375, -0.0575408935546875, -0.047607421875, -0.0376739501953125, -0.027740478515625, -0.0178070068359375, -0.00787353515625, 0.0020599365234375, 0.011993408203125, 0.0219268798828125, 0.0318603515625, 0.0417938232421875, 0.051727294921875, 0.0616607666015625, 0.07159423828125, 0.0815277099609375, 0.091461181640625, 0.1013946533203125, 0.111328125, 0.1212615966796875, 0.131195068359375, 0.1411285400390625, 0.15106201171875, 0.1609954833984375, 0.170928955078125, 0.1808624267578125, 0.1907958984375, 0.2007293701171875, 0.210662841796875, 0.2205963134765625, 0.23052978515625, 0.2404632568359375, 0.250396728515625, 0.2603302001953125, 0.270263671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 10.0, 16.0, 18.0, 31.0, 42.0, 63.0, 135.0, 230.0, 749.0, 1780.0, 450.0, 197.0, 129.0, 68.0, 45.0, 23.0, 19.0, 11.0, 9.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2392578125, -0.23227882385253906, -0.22529983520507812, -0.2183208465576172, -0.21134185791015625, -0.2043628692626953, -0.19738388061523438, -0.19040489196777344, -0.1834259033203125, -0.17644691467285156, -0.16946792602539062, -0.1624889373779297, -0.15550994873046875, -0.1485309600830078, -0.14155197143554688, -0.13457298278808594, -0.127593994140625, -0.12061500549316406, -0.11363601684570312, -0.10665702819824219, -0.09967803955078125, -0.09269905090332031, -0.08572006225585938, -0.07874107360839844, -0.0717620849609375, -0.06478309631347656, -0.057804107666015625, -0.05082511901855469, -0.04384613037109375, -0.03686714172363281, -0.029888153076171875, -0.022909164428710938, -0.01593017578125, -0.008951187133789062, -0.001972198486328125, 0.0050067901611328125, 0.01198577880859375, 0.018964767456054688, 0.025943756103515625, 0.03292274475097656, 0.0399017333984375, 0.04688072204589844, 0.053859710693359375, 0.06083869934082031, 0.06781768798828125, 0.07479667663574219, 0.08177566528320312, 0.08875465393066406, 0.095733642578125, 0.10271263122558594, 0.10969161987304688, 0.11667060852050781, 0.12364959716796875, 0.1306285858154297, 0.13760757446289062, 0.14458656311035156, 0.1515655517578125, 0.15854454040527344, 0.16552352905273438, 0.1725025177001953, 0.17948150634765625, 0.1864604949951172, 0.19343948364257812, 0.20041847229003906, 0.2073974609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 15.0, 27.0, 42.0, 61.0, 140.0, 165.0, 181.0, 151.0, 108.0, 69.0, 22.0, 12.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0860226154327393, -1.0345354080200195, -0.9830483198165894, -0.9315611720085144, -0.8800740242004395, -0.8285868167877197, -0.7770997285842896, -0.7256125211715698, -0.6741254329681396, -0.6226382851600647, -0.5711511373519897, -0.5196639895439148, -0.46817684173583984, -0.4166896641254425, -0.36520251631736755, -0.3137153685092926, -0.26222819089889526, -0.2107410430908203, -0.15925389528274536, -0.10776673257350922, -0.056279584765434265, -0.00479242205619812, 0.04669472575187683, 0.09818187355995178, 0.14966902136802673, 0.20115616917610168, 0.25264331698417664, 0.304130494594574, 0.3556176424026489, 0.4071047902107239, 0.45859193801879883, 0.5100790858268738, 0.5615662336349487, 0.6130533814430237, 0.6645405292510986, 0.7160276770591736, 0.7675148248672485, 0.8190020322799683, 0.8704891204833984, 0.9219763278961182, 0.9734634160995483, 1.024950623512268, 1.0764377117156982, 1.127924919128418, 1.1794120073318481, 1.2308992147445679, 1.282386302947998, 1.3338735103607178, 1.3853607177734375, 1.4368479251861572, 1.4883350133895874, 1.5398222208023071, 1.5913093090057373, 1.642796516418457, 1.6942836046218872, 1.745770812034607, 1.797257900238037, 1.8487451076507568, 1.900232195854187, 1.9517194032669067, 2.003206491470337, 2.0546936988830566, 2.1061809062957764, 2.157667875289917, 2.2091550827026367]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 11.0, 9.0, 14.0, 19.0, 21.0, 15.0, 25.0, 29.0, 22.0, 32.0, 29.0, 40.0, 34.0, 33.0, 35.0, 33.0, 50.0, 45.0, 36.0, 35.0, 36.0, 36.0, 47.0, 37.0, 31.0, 34.0, 26.0, 19.0, 21.0, 27.0, 20.0, 20.0, 12.0, 15.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5539281964302063, -0.5358335971832275, -0.517738938331604, -0.49964430928230286, -0.4815496802330017, -0.46345505118370056, -0.4453604221343994, -0.42726579308509827, -0.4091711640357971, -0.39107653498649597, -0.3729819059371948, -0.3548872768878937, -0.33679264783859253, -0.3186980187892914, -0.30060338973999023, -0.2825087606906891, -0.26441413164138794, -0.2463195025920868, -0.22822487354278564, -0.2101302444934845, -0.19203561544418335, -0.1739409863948822, -0.15584635734558105, -0.1377517282962799, -0.11965709924697876, -0.10156247019767761, -0.08346784114837646, -0.06537321209907532, -0.04727858304977417, -0.029183954000473022, -0.011089324951171875, 0.0070053040981292725, 0.02509993314743042, 0.04319456219673157, 0.061289191246032715, 0.07938382029533386, 0.09747844934463501, 0.11557307839393616, 0.1336677074432373, 0.15176233649253845, 0.1698569655418396, 0.18795159459114075, 0.2060462236404419, 0.22414085268974304, 0.2422354817390442, 0.26033011078834534, 0.2784247398376465, 0.29651936888694763, 0.3146139979362488, 0.3327086269855499, 0.3508032560348511, 0.3688978850841522, 0.38699251413345337, 0.4050871431827545, 0.42318177223205566, 0.4412764012813568, 0.45937103033065796, 0.4774656593799591, 0.49556028842926025, 0.5136549472808838, 0.5317495465278625, 0.5498441457748413, 0.5679388046264648, 0.5860334634780884, 0.6041280627250671]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 5.0, 7.0, 20.0, 24.0, 27.0, 42.0, 61.0, 60.0, 113.0, 193.0, 255.0, 396.0, 662.0, 1052.0, 1743.0, 3130.0, 5587.0, 10550.0, 21009.0, 44021.0, 106517.0, 473797.0, 243234.0, 70249.0, 31624.0, 15788.0, 7924.0, 4299.0, 2405.0, 1364.0, 847.0, 546.0, 327.0, 209.0, 156.0, 92.0, 60.0, 54.0, 34.0, 16.0, 19.0, 15.0, 9.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.3315010070800781, -0.31998443603515625, -0.3084678649902344, -0.2969512939453125, -0.2854347229003906, -0.27391815185546875, -0.2624015808105469, -0.250885009765625, -0.23936843872070312, -0.22785186767578125, -0.21633529663085938, -0.2048187255859375, -0.19330215454101562, -0.18178558349609375, -0.17026901245117188, -0.15875244140625, -0.14723587036132812, -0.13571929931640625, -0.12420272827148438, -0.1126861572265625, -0.10116958618164062, -0.08965301513671875, -0.07813644409179688, -0.066619873046875, -0.055103302001953125, -0.04358673095703125, -0.032070159912109375, -0.0205535888671875, -0.009037017822265625, 0.00247955322265625, 0.013996124267578125, 0.0255126953125, 0.037029266357421875, 0.04854583740234375, 0.060062408447265625, 0.0715789794921875, 0.08309555053710938, 0.09461212158203125, 0.10612869262695312, 0.117645263671875, 0.12916183471679688, 0.14067840576171875, 0.15219497680664062, 0.1637115478515625, 0.17522811889648438, 0.18674468994140625, 0.19826126098632812, 0.20977783203125, 0.22129440307617188, 0.23281097412109375, 0.24432754516601562, 0.2558441162109375, 0.2673606872558594, 0.27887725830078125, 0.2903938293457031, 0.301910400390625, 0.3134269714355469, 0.32494354248046875, 0.3364601135253906, 0.3479766845703125, 0.3594932556152344, 0.37100982666015625, 0.3825263977050781, 0.39404296875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 2.0, 5.0, 10.0, 10.0, 14.0, 15.0, 13.0, 24.0, 21.0, 29.0, 27.0, 34.0, 31.0, 29.0, 52.0, 40.0, 51.0, 55.0, 54.0, 43.0, 45.0, 55.0, 35.0, 39.0, 45.0, 39.0, 31.0, 23.0, 20.0, 22.0, 20.0, 14.0, 10.0, 9.0, 8.0, 10.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09454345703125, -0.09180355072021484, -0.08906364440917969, -0.08632373809814453, -0.08358383178710938, -0.08084392547607422, -0.07810401916503906, -0.0753641128540039, -0.07262420654296875, -0.0698843002319336, -0.06714439392089844, -0.06440448760986328, -0.061664581298828125, -0.05892467498779297, -0.05618476867675781, -0.053444862365722656, -0.0507049560546875, -0.047965049743652344, -0.04522514343261719, -0.04248523712158203, -0.039745330810546875, -0.03700542449951172, -0.03426551818847656, -0.031525611877441406, -0.02878570556640625, -0.026045799255371094, -0.023305892944335938, -0.02056598663330078, -0.017826080322265625, -0.015086174011230469, -0.012346267700195312, -0.009606361389160156, -0.006866455078125, -0.004126548767089844, -0.0013866424560546875, 0.0013532638549804688, 0.004093170166015625, 0.006833076477050781, 0.009572982788085938, 0.012312889099121094, 0.01505279541015625, 0.017792701721191406, 0.020532608032226562, 0.02327251434326172, 0.026012420654296875, 0.02875232696533203, 0.03149223327636719, 0.034232139587402344, 0.0369720458984375, 0.039711952209472656, 0.04245185852050781, 0.04519176483154297, 0.047931671142578125, 0.05067157745361328, 0.05341148376464844, 0.056151390075683594, 0.05889129638671875, 0.061631202697753906, 0.06437110900878906, 0.06711101531982422, 0.06985092163085938, 0.07259082794189453, 0.07533073425292969, 0.07807064056396484, 0.080810546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 10.0, 13.0, 28.0, 40.0, 50.0, 59.0, 89.0, 125.0, 185.0, 293.0, 477.0, 827.0, 1684.0, 5262.0, 23685.0, 158650.0, 749165.0, 86337.0, 14537.0, 3775.0, 1352.0, 656.0, 428.0, 252.0, 178.0, 91.0, 76.0, 55.0, 49.0, 33.0, 21.0, 16.0, 10.0, 11.0, 7.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.703125, -0.6820449829101562, -0.6609649658203125, -0.6398849487304688, -0.618804931640625, -0.5977249145507812, -0.5766448974609375, -0.5555648803710938, -0.53448486328125, -0.5134048461914062, -0.4923248291015625, -0.47124481201171875, -0.450164794921875, -0.42908477783203125, -0.4080047607421875, -0.38692474365234375, -0.3658447265625, -0.34476470947265625, -0.3236846923828125, -0.30260467529296875, -0.281524658203125, -0.26044464111328125, -0.2393646240234375, -0.21828460693359375, -0.19720458984375, -0.17612457275390625, -0.1550445556640625, -0.13396453857421875, -0.112884521484375, -0.09180450439453125, -0.0707244873046875, -0.04964447021484375, -0.028564453125, -0.00748443603515625, 0.0135955810546875, 0.03467559814453125, 0.055755615234375, 0.07683563232421875, 0.0979156494140625, 0.11899566650390625, 0.14007568359375, 0.16115570068359375, 0.1822357177734375, 0.20331573486328125, 0.224395751953125, 0.24547576904296875, 0.2665557861328125, 0.28763580322265625, 0.3087158203125, 0.32979583740234375, 0.3508758544921875, 0.37195587158203125, 0.393035888671875, 0.41411590576171875, 0.4351959228515625, 0.45627593994140625, 0.47735595703125, 0.49843597412109375, 0.5195159912109375, 0.5405960083007812, 0.561676025390625, 0.5827560424804688, 0.6038360595703125, 0.6249160766601562, 0.64599609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 8.0, 10.0, 10.0, 27.0, 32.0, 37.0, 49.0, 60.0, 59.0, 79.0, 92.0, 74.0, 97.0, 55.0, 77.0, 44.0, 39.0, 46.0, 29.0, 19.0, 19.0, 10.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48291015625, -0.46380615234375, -0.4447021484375, -0.42559814453125, -0.406494140625, -0.38739013671875, -0.3682861328125, -0.34918212890625, -0.330078125, -0.31097412109375, -0.2918701171875, -0.27276611328125, -0.253662109375, -0.23455810546875, -0.2154541015625, -0.19635009765625, -0.17724609375, -0.15814208984375, -0.1390380859375, -0.11993408203125, -0.100830078125, -0.08172607421875, -0.0626220703125, -0.04351806640625, -0.0244140625, -0.00531005859375, 0.0137939453125, 0.03289794921875, 0.052001953125, 0.07110595703125, 0.0902099609375, 0.10931396484375, 0.12841796875, 0.14752197265625, 0.1666259765625, 0.18572998046875, 0.204833984375, 0.22393798828125, 0.2430419921875, 0.26214599609375, 0.28125, 0.30035400390625, 0.3194580078125, 0.33856201171875, 0.357666015625, 0.37677001953125, 0.3958740234375, 0.41497802734375, 0.43408203125, 0.45318603515625, 0.4722900390625, 0.49139404296875, 0.510498046875, 0.52960205078125, 0.5487060546875, 0.56781005859375, 0.5869140625, 0.60601806640625, 0.6251220703125, 0.64422607421875, 0.663330078125, 0.68243408203125, 0.7015380859375, 0.72064208984375, 0.73974609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 16.0, 10.0, 20.0, 21.0, 34.0, 73.0, 134.0, 263.0, 592.0, 1568.0, 4463.0, 15223.0, 81682.0, 776384.0, 138229.0, 20805.0, 5731.0, 1915.0, 701.0, 307.0, 140.0, 70.0, 47.0, 40.0, 17.0, 19.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2757682800292969, -0.26540374755859375, -0.2550392150878906, -0.2446746826171875, -0.23431015014648438, -0.22394561767578125, -0.21358108520507812, -0.203216552734375, -0.19285202026367188, -0.18248748779296875, -0.17212295532226562, -0.1617584228515625, -0.15139389038085938, -0.14102935791015625, -0.13066482543945312, -0.12030029296875, -0.10993576049804688, -0.09957122802734375, -0.08920669555664062, -0.0788421630859375, -0.06847763061523438, -0.05811309814453125, -0.047748565673828125, -0.037384033203125, -0.027019500732421875, -0.01665496826171875, -0.006290435791015625, 0.0040740966796875, 0.014438629150390625, 0.02480316162109375, 0.035167694091796875, 0.0455322265625, 0.055896759033203125, 0.06626129150390625, 0.07662582397460938, 0.0869903564453125, 0.09735488891601562, 0.10771942138671875, 0.11808395385742188, 0.128448486328125, 0.13881301879882812, 0.14917755126953125, 0.15954208374023438, 0.1699066162109375, 0.18027114868164062, 0.19063568115234375, 0.20100021362304688, 0.21136474609375, 0.22172927856445312, 0.23209381103515625, 0.24245834350585938, 0.2528228759765625, 0.2631874084472656, 0.27355194091796875, 0.2839164733886719, 0.294281005859375, 0.3046455383300781, 0.31501007080078125, 0.3253746032714844, 0.3357391357421875, 0.3461036682128906, 0.35646820068359375, 0.3668327331542969, 0.377197265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 16.0, 25.0, 35.0, 51.0, 66.0, 81.0, 102.0, 93.0, 116.0, 89.0, 81.0, 53.0, 38.0, 32.0, 19.0, 21.0, 16.0, 9.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.90493392944336e-05, -8.562393486499786e-05, -8.219853043556213e-05, -7.87731260061264e-05, -7.534772157669067e-05, -7.192231714725494e-05, -6.849691271781921e-05, -6.507150828838348e-05, -6.164610385894775e-05, -5.8220699429512024e-05, -5.4795295000076294e-05, -5.1369890570640564e-05, -4.7944486141204834e-05, -4.4519081711769104e-05, -4.1093677282333374e-05, -3.7668272852897644e-05, -3.4242868423461914e-05, -3.0817463994026184e-05, -2.7392059564590454e-05, -2.3966655135154724e-05, -2.0541250705718994e-05, -1.7115846276283264e-05, -1.3690441846847534e-05, -1.0265037417411804e-05, -6.839632987976074e-06, -3.4142285585403442e-06, 1.1175870895385742e-08, 3.4365803003311157e-06, 6.861984729766846e-06, 1.0287389159202576e-05, 1.3712793588638306e-05, 1.7138198018074036e-05, 2.0563602447509766e-05, 2.3989006876945496e-05, 2.7414411306381226e-05, 3.0839815735816956e-05, 3.4265220165252686e-05, 3.7690624594688416e-05, 4.1116029024124146e-05, 4.4541433453559875e-05, 4.7966837882995605e-05, 5.1392242312431335e-05, 5.4817646741867065e-05, 5.8243051171302795e-05, 6.166845560073853e-05, 6.509386003017426e-05, 6.851926445960999e-05, 7.194466888904572e-05, 7.537007331848145e-05, 7.879547774791718e-05, 8.22208821773529e-05, 8.564628660678864e-05, 8.907169103622437e-05, 9.24970954656601e-05, 9.592249989509583e-05, 9.934790432453156e-05, 0.00010277330875396729, 0.00010619871318340302, 0.00010962411761283875, 0.00011304952204227448, 0.0001164749264717102, 0.00011990033090114594, 0.00012332573533058167, 0.0001267511397600174, 0.00013017654418945312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 2.0, 5.0, 6.0, 11.0, 18.0, 15.0, 20.0, 62.0, 74.0, 121.0, 224.0, 377.0, 798.0, 2189.0, 7520.0, 45395.0, 830141.0, 142060.0, 13699.0, 3440.0, 1201.0, 531.0, 242.0, 158.0, 83.0, 49.0, 30.0, 23.0, 19.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.4022483825683594, -0.38994598388671875, -0.3776435852050781, -0.3653411865234375, -0.3530387878417969, -0.34073638916015625, -0.3284339904785156, -0.316131591796875, -0.3038291931152344, -0.29152679443359375, -0.2792243957519531, -0.2669219970703125, -0.2546195983886719, -0.24231719970703125, -0.23001480102539062, -0.21771240234375, -0.20541000366210938, -0.19310760498046875, -0.18080520629882812, -0.1685028076171875, -0.15620040893554688, -0.14389801025390625, -0.13159561157226562, -0.119293212890625, -0.10699081420898438, -0.09468841552734375, -0.08238601684570312, -0.0700836181640625, -0.057781219482421875, -0.04547882080078125, -0.033176422119140625, -0.0208740234375, -0.008571624755859375, 0.00373077392578125, 0.016033172607421875, 0.0283355712890625, 0.040637969970703125, 0.05294036865234375, 0.06524276733398438, 0.077545166015625, 0.08984756469726562, 0.10214996337890625, 0.11445236206054688, 0.1267547607421875, 0.13905715942382812, 0.15135955810546875, 0.16366195678710938, 0.17596435546875, 0.18826675415039062, 0.20056915283203125, 0.21287155151367188, 0.2251739501953125, 0.23747634887695312, 0.24977874755859375, 0.2620811462402344, 0.274383544921875, 0.2866859436035156, 0.29898834228515625, 0.3112907409667969, 0.3235931396484375, 0.3358955383300781, 0.34819793701171875, 0.3605003356933594, 0.372802734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 3.0, 9.0, 5.0, 10.0, 20.0, 26.0, 60.0, 77.0, 137.0, 173.0, 147.0, 115.0, 69.0, 35.0, 26.0, 20.0, 9.0, 8.0, 8.0, 4.0, 2.0, 4.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2000732421875, -0.19359397888183594, -0.18711471557617188, -0.1806354522705078, -0.17415618896484375, -0.1676769256591797, -0.16119766235351562, -0.15471839904785156, -0.1482391357421875, -0.14175987243652344, -0.13528060913085938, -0.1288013458251953, -0.12232208251953125, -0.11584281921386719, -0.10936355590820312, -0.10288429260253906, -0.096405029296875, -0.08992576599121094, -0.08344650268554688, -0.07696723937988281, -0.07048797607421875, -0.06400871276855469, -0.057529449462890625, -0.05105018615722656, -0.0445709228515625, -0.03809165954589844, -0.031612396240234375, -0.025133132934570312, -0.01865386962890625, -0.012174606323242188, -0.005695343017578125, 0.0007839202880859375, 0.00726318359375, 0.013742446899414062, 0.020221710205078125, 0.026700973510742188, 0.03318023681640625, 0.03965950012207031, 0.046138763427734375, 0.05261802673339844, 0.0590972900390625, 0.06557655334472656, 0.07205581665039062, 0.07853507995605469, 0.08501434326171875, 0.09149360656738281, 0.09797286987304688, 0.10445213317871094, 0.110931396484375, 0.11741065979003906, 0.12388992309570312, 0.1303691864013672, 0.13684844970703125, 0.1433277130126953, 0.14980697631835938, 0.15628623962402344, 0.1627655029296875, 0.16924476623535156, 0.17572402954101562, 0.1822032928466797, 0.18868255615234375, 0.1951618194580078, 0.20164108276367188, 0.20812034606933594, 0.214599609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 25.0, 44.0, 62.0, 106.0, 152.0, 173.0, 184.0, 117.0, 54.0, 42.0, 16.0, 6.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.174990653991699, -5.056013584136963, -4.937036514282227, -4.818059921264648, -4.699082851409912, -4.580105781555176, -4.4611287117004395, -4.342152118682861, -4.223175048828125, -4.104197978973389, -3.9852211475372314, -3.866244077682495, -3.747267246246338, -3.6282901763916016, -3.5093133449554443, -3.390336275100708, -3.271359443664551, -3.1523823738098145, -3.0334055423736572, -2.914428472518921, -2.7954516410827637, -2.6764745712280273, -2.55749773979187, -2.438520669937134, -2.3195436000823975, -2.200566530227661, -2.081589698791504, -1.9626127481460571, -1.8436357975006104, -1.724658727645874, -1.6056818962097168, -1.4867048263549805, -1.3677279949188232, -1.2487510442733765, -1.1297740936279297, -1.010797142982483, -0.8918201923370361, -0.7728431820869446, -0.6538662314414978, -0.534889280796051, -0.41591233015060425, -0.29693537950515747, -0.1779584139585495, -0.05898144841194153, 0.05999550223350525, 0.17897248268127441, 0.2979494333267212, 0.41692638397216797, 0.5359033346176147, 0.6548802852630615, 0.7738572359085083, 0.8928341865539551, 1.0118111371994019, 1.1307880878448486, 1.249765157699585, 1.3687419891357422, 1.4877190589904785, 1.6066960096359253, 1.725672960281372, 1.8446499109268188, 1.9636268615722656, 2.082603931427002, 2.201580762863159, 2.3205578327178955, 2.4395346641540527]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 8.0, 13.0, 17.0, 15.0, 22.0, 14.0, 31.0, 33.0, 33.0, 29.0, 41.0, 33.0, 42.0, 46.0, 50.0, 48.0, 55.0, 40.0, 42.0, 40.0, 38.0, 40.0, 46.0, 32.0, 35.0, 25.0, 20.0, 19.0, 19.0, 6.0, 12.0, 3.0, 7.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.117844581604004, -2.0538840293884277, -1.9899237155914307, -1.9259631633758545, -1.8620027303695679, -1.7980422973632812, -1.734081745147705, -1.6701213121414185, -1.6061608791351318, -1.5422004461288452, -1.4782400131225586, -1.4142794609069824, -1.3503190279006958, -1.2863585948944092, -1.222398042678833, -1.1584376096725464, -1.0944771766662598, -1.0305167436599731, -0.9665562510490417, -0.9025957584381104, -0.8386353254318237, -0.7746748924255371, -0.7107143998146057, -0.6467539072036743, -0.5827934741973877, -0.5188330411911011, -0.4548725485801697, -0.39091208577156067, -0.32695162296295166, -0.26299116015434265, -0.19903069734573364, -0.13507023453712463, -0.07110965251922607, -0.007149189710617065, 0.05681127309799194, 0.12077173590660095, 0.18473219871520996, 0.24869266152381897, 0.312653124332428, 0.376613587141037, 0.440574049949646, 0.5045344829559326, 0.568494975566864, 0.6324554681777954, 0.696415901184082, 0.7603763341903687, 0.8243368268013, 0.8882973194122314, 0.9522577524185181, 1.0162181854248047, 1.0801787376403809, 1.1441391706466675, 1.208099603652954, 1.2720600366592407, 1.3360204696655273, 1.3999810218811035, 1.4639414548873901, 1.5279018878936768, 1.591862440109253, 1.6558228731155396, 1.7197833061218262, 1.7837437391281128, 1.8477041721343994, 1.9116647243499756, 1.9756251573562622]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 7.0, 3.0, 8.0, 6.0, 8.0, 28.0, 27.0, 36.0, 57.0, 101.0, 137.0, 232.0, 376.0, 642.0, 1162.0, 2161.0, 4893.0, 11863.0, 35312.0, 164787.0, 3613065.0, 283796.0, 48619.0, 15221.0, 5947.0, 2780.0, 1354.0, 709.0, 356.0, 231.0, 142.0, 79.0, 56.0, 21.0, 21.0, 15.0, 7.0, 6.0, 11.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37841796875, -0.3636474609375, -0.348876953125, -0.3341064453125, -0.3193359375, -0.3045654296875, -0.289794921875, -0.2750244140625, -0.26025390625, -0.2454833984375, -0.230712890625, -0.2159423828125, -0.201171875, -0.1864013671875, -0.171630859375, -0.1568603515625, -0.14208984375, -0.1273193359375, -0.112548828125, -0.0977783203125, -0.0830078125, -0.0682373046875, -0.053466796875, -0.0386962890625, -0.02392578125, -0.0091552734375, 0.005615234375, 0.0203857421875, 0.03515625, 0.0499267578125, 0.064697265625, 0.0794677734375, 0.09423828125, 0.1090087890625, 0.123779296875, 0.1385498046875, 0.1533203125, 0.1680908203125, 0.182861328125, 0.1976318359375, 0.21240234375, 0.2271728515625, 0.241943359375, 0.2567138671875, 0.271484375, 0.2862548828125, 0.301025390625, 0.3157958984375, 0.33056640625, 0.3453369140625, 0.360107421875, 0.3748779296875, 0.3896484375, 0.4044189453125, 0.419189453125, 0.4339599609375, 0.44873046875, 0.4635009765625, 0.478271484375, 0.4930419921875, 0.5078125, 0.5225830078125, 0.537353515625, 0.5521240234375, 0.56689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 8.0, 10.0, 21.0, 19.0, 16.0, 21.0, 34.0, 29.0, 54.0, 45.0, 51.0, 48.0, 56.0, 52.0, 57.0, 59.0, 59.0, 60.0, 37.0, 34.0, 27.0, 42.0, 34.0, 29.0, 21.0, 9.0, 14.0, 11.0, 8.0, 3.0, 2.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11590576171875, -0.11249542236328125, -0.1090850830078125, -0.10567474365234375, -0.102264404296875, -0.09885406494140625, -0.0954437255859375, -0.09203338623046875, -0.088623046875, -0.08521270751953125, -0.0818023681640625, -0.07839202880859375, -0.074981689453125, -0.07157135009765625, -0.0681610107421875, -0.06475067138671875, -0.06134033203125, -0.05792999267578125, -0.0545196533203125, -0.05110931396484375, -0.047698974609375, -0.04428863525390625, -0.0408782958984375, -0.03746795654296875, -0.0340576171875, -0.03064727783203125, -0.0272369384765625, -0.02382659912109375, -0.020416259765625, -0.01700592041015625, -0.0135955810546875, -0.01018524169921875, -0.00677490234375, -0.00336456298828125, 4.57763671875e-05, 0.00345611572265625, 0.006866455078125, 0.01027679443359375, 0.0136871337890625, 0.01709747314453125, 0.0205078125, 0.02391815185546875, 0.0273284912109375, 0.03073883056640625, 0.034149169921875, 0.03755950927734375, 0.0409698486328125, 0.04438018798828125, 0.04779052734375, 0.05120086669921875, 0.0546112060546875, 0.05802154541015625, 0.061431884765625, 0.06484222412109375, 0.0682525634765625, 0.07166290283203125, 0.0750732421875, 0.07848358154296875, 0.0818939208984375, 0.08530426025390625, 0.088714599609375, 0.09212493896484375, 0.0955352783203125, 0.09894561767578125, 0.10235595703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 7.0, 7.0, 12.0, 17.0, 32.0, 47.0, 65.0, 102.0, 155.0, 265.0, 493.0, 1047.0, 2190.0, 5869.0, 17292.0, 69574.0, 842248.0, 3119235.0, 100540.0, 22849.0, 7121.0, 2647.0, 1203.0, 555.0, 254.0, 165.0, 85.0, 74.0, 53.0, 26.0, 18.0, 20.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.591796875, -0.5762672424316406, -0.5607376098632812, -0.5452079772949219, -0.5296783447265625, -0.5141487121582031, -0.49861907958984375, -0.4830894470214844, -0.467559814453125, -0.4520301818847656, -0.43650054931640625, -0.4209709167480469, -0.4054412841796875, -0.3899116516113281, -0.37438201904296875, -0.3588523864746094, -0.34332275390625, -0.3277931213378906, -0.31226348876953125, -0.2967338562011719, -0.2812042236328125, -0.2656745910644531, -0.25014495849609375, -0.23461532592773438, -0.219085693359375, -0.20355606079101562, -0.18802642822265625, -0.17249679565429688, -0.1569671630859375, -0.14143753051757812, -0.12590789794921875, -0.11037826538085938, -0.0948486328125, -0.07931900024414062, -0.06378936767578125, -0.048259735107421875, -0.0327301025390625, -0.017200469970703125, -0.00167083740234375, 0.013858795166015625, 0.029388427734375, 0.044918060302734375, 0.06044769287109375, 0.07597732543945312, 0.0915069580078125, 0.10703659057617188, 0.12256622314453125, 0.13809585571289062, 0.15362548828125, 0.16915512084960938, 0.18468475341796875, 0.20021438598632812, 0.2157440185546875, 0.23127365112304688, 0.24680328369140625, 0.2623329162597656, 0.277862548828125, 0.2933921813964844, 0.30892181396484375, 0.3244514465332031, 0.3399810791015625, 0.3555107116699219, 0.37104034423828125, 0.3865699768066406, 0.402099609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 4.0, 14.0, 13.0, 42.0, 67.0, 120.0, 246.0, 1086.0, 1815.0, 312.0, 140.0, 73.0, 48.0, 24.0, 17.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3203125, -0.3127002716064453, -0.3050880432128906, -0.29747581481933594, -0.28986358642578125, -0.28225135803222656, -0.2746391296386719, -0.2670269012451172, -0.2594146728515625, -0.2518024444580078, -0.24419021606445312, -0.23657798767089844, -0.22896575927734375, -0.22135353088378906, -0.21374130249023438, -0.2061290740966797, -0.198516845703125, -0.1909046173095703, -0.18329238891601562, -0.17568016052246094, -0.16806793212890625, -0.16045570373535156, -0.15284347534179688, -0.1452312469482422, -0.1376190185546875, -0.1300067901611328, -0.12239456176757812, -0.11478233337402344, -0.10717010498046875, -0.09955787658691406, -0.09194564819335938, -0.08433341979980469, -0.07672119140625, -0.06910896301269531, -0.061496734619140625, -0.05388450622558594, -0.04627227783203125, -0.03866004943847656, -0.031047821044921875, -0.023435592651367188, -0.0158233642578125, -0.008211135864257812, -0.000598907470703125, 0.0070133209228515625, 0.01462554931640625, 0.022237777709960938, 0.029850006103515625, 0.03746223449707031, 0.045074462890625, 0.05268669128417969, 0.060298919677734375, 0.06791114807128906, 0.07552337646484375, 0.08313560485839844, 0.09074783325195312, 0.09836006164550781, 0.1059722900390625, 0.11358451843261719, 0.12119674682617188, 0.12880897521972656, 0.13642120361328125, 0.14403343200683594, 0.15164566040039062, 0.1592578887939453, 0.1668701171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 14.0, 34.0, 77.0, 127.0, 149.0, 163.0, 154.0, 122.0, 75.0, 32.0, 15.0, 8.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.333051085472107, -1.2877261638641357, -1.242401361465454, -1.197076439857483, -1.1517516374588013, -1.10642671585083, -1.0611019134521484, -1.0157769918441772, -0.970452070236206, -0.9251272082328796, -0.8798023462295532, -0.834477424621582, -0.7891525626182556, -0.7438277006149292, -0.6985028386116028, -0.6531779766082764, -0.60785311460495, -0.5625282526016235, -0.5172033905982971, -0.4718784987926483, -0.4265536069869995, -0.3812287449836731, -0.3359038829803467, -0.2905789911746979, -0.24525412917137146, -0.19992925226688385, -0.15460437536239624, -0.10927951335906982, -0.06395463645458221, -0.018629759550094604, 0.02669510245323181, 0.07201999425888062, 0.11734485626220703, 0.16266973316669464, 0.20799461007118225, 0.25331947207450867, 0.29864436388015747, 0.3439692258834839, 0.3892940878868103, 0.4346189796924591, 0.4799438416957855, 0.5252687335014343, 0.5705935955047607, 0.6159184575080872, 0.6612433195114136, 0.7065682411193848, 0.7518930435180664, 0.7972179651260376, 0.842542827129364, 0.8878676891326904, 0.9331925511360168, 0.9785174131393433, 1.0238423347473145, 1.069167137145996, 1.1144920587539673, 1.1598169803619385, 1.2051417827606201, 1.2504667043685913, 1.295791506767273, 1.3411164283752441, 1.3864412307739258, 1.431766152381897, 1.4770910739898682, 1.5224158763885498, 1.567740797996521]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 13.0, 6.0, 14.0, 10.0, 19.0, 10.0, 24.0, 21.0, 18.0, 30.0, 22.0, 45.0, 27.0, 38.0, 33.0, 34.0, 44.0, 34.0, 57.0, 35.0, 38.0, 39.0, 44.0, 32.0, 42.0, 34.0, 32.0, 31.0, 18.0, 22.0, 23.0, 20.0, 14.0, 12.0, 10.0, 12.0, 8.0, 6.0, 10.0, 1.0, 0.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5121451616287231, -0.4962048828601837, -0.4802646040916443, -0.46432432532310486, -0.44838404655456543, -0.4324437379837036, -0.4165034592151642, -0.40056318044662476, -0.3846229016780853, -0.3686826229095459, -0.35274234414100647, -0.33680206537246704, -0.3208617568016052, -0.3049215078353882, -0.28898119926452637, -0.27304092049598694, -0.2571006417274475, -0.24116036295890808, -0.22522008419036865, -0.20927979052066803, -0.1933395117521286, -0.17739923298358917, -0.16145893931388855, -0.14551866054534912, -0.1295783817768097, -0.11363810300827026, -0.09769781678915024, -0.08175753057003021, -0.06581725180149078, -0.049876973032951355, -0.03393668681383133, -0.017996400594711304, -0.002056121826171875, 0.013884160667657852, 0.02982444316148758, 0.045764725655317307, 0.061705008149147034, 0.07764528691768646, 0.09358557313680649, 0.10952585935592651, 0.12546613812446594, 0.14140641689300537, 0.1573466956615448, 0.17328698933124542, 0.18922726809978485, 0.20516754686832428, 0.2211078405380249, 0.23704811930656433, 0.25298839807510376, 0.2689286768436432, 0.2848689556121826, 0.30080923438072205, 0.3167495131492615, 0.3326898217201233, 0.3486301004886627, 0.36457037925720215, 0.3805106580257416, 0.396450936794281, 0.41239121556282043, 0.42833149433135986, 0.4442718029022217, 0.4602120518684387, 0.47615236043930054, 0.49209263920783997, 0.5080329179763794]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 5.0, 12.0, 12.0, 14.0, 19.0, 16.0, 37.0, 55.0, 72.0, 117.0, 186.0, 326.0, 510.0, 960.0, 1821.0, 3827.0, 8228.0, 18628.0, 42113.0, 117213.0, 495981.0, 242218.0, 65523.0, 27105.0, 12215.0, 5668.0, 2591.0, 1274.0, 733.0, 379.0, 217.0, 148.0, 94.0, 63.0, 38.0, 38.0, 26.0, 26.0, 10.0, 11.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.410888671875, -0.40000152587890625, -0.3891143798828125, -0.37822723388671875, -0.367340087890625, -0.35645294189453125, -0.3455657958984375, -0.33467864990234375, -0.32379150390625, -0.31290435791015625, -0.3020172119140625, -0.29113006591796875, -0.280242919921875, -0.26935577392578125, -0.2584686279296875, -0.24758148193359375, -0.2366943359375, -0.22580718994140625, -0.2149200439453125, -0.20403289794921875, -0.193145751953125, -0.18225860595703125, -0.1713714599609375, -0.16048431396484375, -0.14959716796875, -0.13871002197265625, -0.1278228759765625, -0.11693572998046875, -0.106048583984375, -0.09516143798828125, -0.0842742919921875, -0.07338714599609375, -0.0625, -0.05161285400390625, -0.0407257080078125, -0.02983856201171875, -0.018951416015625, -0.00806427001953125, 0.0028228759765625, 0.01371002197265625, 0.02459716796875, 0.03548431396484375, 0.0463714599609375, 0.05725860595703125, 0.068145751953125, 0.07903289794921875, 0.0899200439453125, 0.10080718994140625, 0.1116943359375, 0.12258148193359375, 0.1334686279296875, 0.14435577392578125, 0.155242919921875, 0.16613006591796875, 0.1770172119140625, 0.18790435791015625, 0.19879150390625, 0.20967864990234375, 0.2205657958984375, 0.23145294189453125, 0.242340087890625, 0.25322723388671875, 0.2641143798828125, 0.27500152587890625, 0.285888671875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 5.0, 9.0, 3.0, 15.0, 8.0, 13.0, 22.0, 20.0, 12.0, 17.0, 35.0, 31.0, 38.0, 49.0, 44.0, 48.0, 53.0, 47.0, 47.0, 45.0, 46.0, 42.0, 47.0, 46.0, 32.0, 35.0, 28.0, 29.0, 40.0, 13.0, 12.0, 15.0, 11.0, 11.0, 3.0, 5.0, 3.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.10744094848632812, -0.10440826416015625, -0.10137557983398438, -0.0983428955078125, -0.09531021118164062, -0.09227752685546875, -0.08924484252929688, -0.086212158203125, -0.08317947387695312, -0.08014678955078125, -0.07711410522460938, -0.0740814208984375, -0.07104873657226562, -0.06801605224609375, -0.06498336791992188, -0.06195068359375, -0.058917999267578125, -0.05588531494140625, -0.052852630615234375, -0.0498199462890625, -0.046787261962890625, -0.04375457763671875, -0.040721893310546875, -0.037689208984375, -0.034656524658203125, -0.03162384033203125, -0.028591156005859375, -0.0255584716796875, -0.022525787353515625, -0.01949310302734375, -0.016460418701171875, -0.013427734375, -0.010395050048828125, -0.00736236572265625, -0.004329681396484375, -0.0012969970703125, 0.001735687255859375, 0.00476837158203125, 0.007801055908203125, 0.010833740234375, 0.013866424560546875, 0.01689910888671875, 0.019931793212890625, 0.0229644775390625, 0.025997161865234375, 0.02902984619140625, 0.032062530517578125, 0.03509521484375, 0.038127899169921875, 0.04116058349609375, 0.044193267822265625, 0.0472259521484375, 0.050258636474609375, 0.05329132080078125, 0.056324005126953125, 0.059356689453125, 0.062389373779296875, 0.06542205810546875, 0.06845474243164062, 0.0714874267578125, 0.07452011108398438, 0.07755279541015625, 0.08058547973632812, 0.0836181640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 16.0, 8.0, 26.0, 21.0, 33.0, 43.0, 77.0, 96.0, 122.0, 217.0, 378.0, 700.0, 1375.0, 3287.0, 8711.0, 23850.0, 71573.0, 555055.0, 299907.0, 52503.0, 18488.0, 6740.0, 2640.0, 1195.0, 568.0, 328.0, 190.0, 128.0, 82.0, 47.0, 33.0, 26.0, 14.0, 16.0, 8.0, 7.0, 12.0, 4.0, 6.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.50390625, -0.4894561767578125, -0.475006103515625, -0.4605560302734375, -0.44610595703125, -0.4316558837890625, -0.417205810546875, -0.4027557373046875, -0.3883056640625, -0.3738555908203125, -0.359405517578125, -0.3449554443359375, -0.33050537109375, -0.3160552978515625, -0.301605224609375, -0.2871551513671875, -0.272705078125, -0.2582550048828125, -0.243804931640625, -0.2293548583984375, -0.21490478515625, -0.2004547119140625, -0.186004638671875, -0.1715545654296875, -0.1571044921875, -0.1426544189453125, -0.128204345703125, -0.1137542724609375, -0.09930419921875, -0.0848541259765625, -0.070404052734375, -0.0559539794921875, -0.04150390625, -0.0270538330078125, -0.012603759765625, 0.0018463134765625, 0.01629638671875, 0.0307464599609375, 0.045196533203125, 0.0596466064453125, 0.0740966796875, 0.0885467529296875, 0.102996826171875, 0.1174468994140625, 0.13189697265625, 0.1463470458984375, 0.160797119140625, 0.1752471923828125, 0.189697265625, 0.2041473388671875, 0.218597412109375, 0.2330474853515625, 0.24749755859375, 0.2619476318359375, 0.276397705078125, 0.2908477783203125, 0.3052978515625, 0.3197479248046875, 0.334197998046875, 0.3486480712890625, 0.36309814453125, 0.3775482177734375, 0.391998291015625, 0.4064483642578125, 0.4208984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 8.0, 5.0, 12.0, 7.0, 21.0, 23.0, 13.0, 29.0, 36.0, 38.0, 45.0, 42.0, 52.0, 62.0, 58.0, 67.0, 43.0, 51.0, 63.0, 57.0, 37.0, 43.0, 24.0, 39.0, 25.0, 17.0, 17.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 6.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51220703125, -0.49631500244140625, -0.4804229736328125, -0.46453094482421875, -0.448638916015625, -0.43274688720703125, -0.4168548583984375, -0.40096282958984375, -0.38507080078125, -0.36917877197265625, -0.3532867431640625, -0.33739471435546875, -0.321502685546875, -0.30561065673828125, -0.2897186279296875, -0.27382659912109375, -0.2579345703125, -0.24204254150390625, -0.2261505126953125, -0.21025848388671875, -0.194366455078125, -0.17847442626953125, -0.1625823974609375, -0.14669036865234375, -0.13079833984375, -0.11490631103515625, -0.0990142822265625, -0.08312225341796875, -0.067230224609375, -0.05133819580078125, -0.0354461669921875, -0.01955413818359375, -0.003662109375, 0.01222991943359375, 0.0281219482421875, 0.04401397705078125, 0.059906005859375, 0.07579803466796875, 0.0916900634765625, 0.10758209228515625, 0.12347412109375, 0.13936614990234375, 0.1552581787109375, 0.17115020751953125, 0.187042236328125, 0.20293426513671875, 0.2188262939453125, 0.23471832275390625, 0.2506103515625, 0.26650238037109375, 0.2823944091796875, 0.29828643798828125, 0.314178466796875, 0.33007049560546875, 0.3459625244140625, 0.36185455322265625, 0.37774658203125, 0.39363861083984375, 0.4095306396484375, 0.42542266845703125, 0.441314697265625, 0.45720672607421875, 0.4730987548828125, 0.48899078369140625, 0.5048828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 13.0, 26.0, 44.0, 56.0, 117.0, 227.0, 417.0, 998.0, 2785.0, 11527.0, 95868.0, 805375.0, 113222.0, 12775.0, 3071.0, 1049.0, 433.0, 223.0, 122.0, 82.0, 37.0, 18.0, 17.0, 9.0, 7.0, 1.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21498489379882812, -0.20584869384765625, -0.19671249389648438, -0.1875762939453125, -0.17844009399414062, -0.16930389404296875, -0.16016769409179688, -0.151031494140625, -0.14189529418945312, -0.13275909423828125, -0.12362289428710938, -0.1144866943359375, -0.10535049438476562, -0.09621429443359375, -0.08707809448242188, -0.07794189453125, -0.06880569458007812, -0.05966949462890625, -0.050533294677734375, -0.0413970947265625, -0.032260894775390625, -0.02312469482421875, -0.013988494873046875, -0.004852294921875, 0.004283905029296875, 0.01342010498046875, 0.022556304931640625, 0.0316925048828125, 0.040828704833984375, 0.04996490478515625, 0.059101104736328125, 0.0682373046875, 0.07737350463867188, 0.08650970458984375, 0.09564590454101562, 0.1047821044921875, 0.11391830444335938, 0.12305450439453125, 0.13219070434570312, 0.141326904296875, 0.15046310424804688, 0.15959930419921875, 0.16873550415039062, 0.1778717041015625, 0.18700790405273438, 0.19614410400390625, 0.20528030395507812, 0.21441650390625, 0.22355270385742188, 0.23268890380859375, 0.24182510375976562, 0.2509613037109375, 0.2600975036621094, 0.26923370361328125, 0.2783699035644531, 0.287506103515625, 0.2966423034667969, 0.30577850341796875, 0.3149147033691406, 0.3240509033203125, 0.3331871032714844, 0.34232330322265625, 0.3514595031738281, 0.360595703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 11.0, 8.0, 13.0, 20.0, 32.0, 67.0, 71.0, 123.0, 128.0, 151.0, 117.0, 93.0, 48.0, 35.0, 30.0, 17.0, 12.0, 10.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019311904907226562, -0.00018816813826560974, -0.00018321722745895386, -0.00017826631665229797, -0.0001733154058456421, -0.0001683644950389862, -0.00016341358423233032, -0.00015846267342567444, -0.00015351176261901855, -0.00014856085181236267, -0.0001436099410057068, -0.0001386590301990509, -0.00013370811939239502, -0.00012875720858573914, -0.00012380629777908325, -0.00011885538697242737, -0.00011390447616577148, -0.0001089535653591156, -0.00010400265455245972, -9.905174374580383e-05, -9.410083293914795e-05, -8.914992213249207e-05, -8.419901132583618e-05, -7.92481005191803e-05, -7.429718971252441e-05, -6.934627890586853e-05, -6.439536809921265e-05, -5.944445729255676e-05, -5.449354648590088e-05, -4.9542635679244995e-05, -4.459172487258911e-05, -3.964081406593323e-05, -3.4689903259277344e-05, -2.973899245262146e-05, -2.4788081645965576e-05, -1.9837170839309692e-05, -1.4886260032653809e-05, -9.935349225997925e-06, -4.984438419342041e-06, -3.3527612686157227e-08, 4.9173831939697266e-06, 9.86829400062561e-06, 1.4819204807281494e-05, 1.9770115613937378e-05, 2.4721026420593262e-05, 2.9671937227249146e-05, 3.462284803390503e-05, 3.957375884056091e-05, 4.45246696472168e-05, 4.947558045387268e-05, 5.4426491260528564e-05, 5.937740206718445e-05, 6.432831287384033e-05, 6.927922368049622e-05, 7.42301344871521e-05, 7.918104529380798e-05, 8.413195610046387e-05, 8.908286690711975e-05, 9.403377771377563e-05, 9.898468852043152e-05, 0.0001039355993270874, 0.00010888651013374329, 0.00011383742094039917, 0.00011878833174705505, 0.00012373924255371094]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 13.0, 23.0, 26.0, 34.0, 46.0, 87.0, 110.0, 196.0, 299.0, 467.0, 867.0, 1537.0, 3254.0, 8587.0, 31554.0, 202050.0, 648713.0, 116819.0, 21517.0, 6357.0, 2753.0, 1352.0, 742.0, 410.0, 252.0, 162.0, 98.0, 67.0, 45.0, 20.0, 22.0, 18.0, 8.0, 7.0, 8.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1787109375, -0.17301368713378906, -0.16731643676757812, -0.1616191864013672, -0.15592193603515625, -0.1502246856689453, -0.14452743530273438, -0.13883018493652344, -0.1331329345703125, -0.12743568420410156, -0.12173843383789062, -0.11604118347167969, -0.11034393310546875, -0.10464668273925781, -0.09894943237304688, -0.09325218200683594, -0.087554931640625, -0.08185768127441406, -0.07616043090820312, -0.07046318054199219, -0.06476593017578125, -0.05906867980957031, -0.053371429443359375, -0.04767417907714844, -0.0419769287109375, -0.03627967834472656, -0.030582427978515625, -0.024885177612304688, -0.01918792724609375, -0.013490676879882812, -0.007793426513671875, -0.0020961761474609375, 0.00360107421875, 0.009298324584960938, 0.014995574951171875, 0.020692825317382812, 0.02639007568359375, 0.03208732604980469, 0.037784576416015625, 0.04348182678222656, 0.0491790771484375, 0.05487632751464844, 0.060573577880859375, 0.06627082824707031, 0.07196807861328125, 0.07766532897949219, 0.08336257934570312, 0.08905982971191406, 0.094757080078125, 0.10045433044433594, 0.10615158081054688, 0.11184883117675781, 0.11754608154296875, 0.12324333190917969, 0.12894058227539062, 0.13463783264160156, 0.1403350830078125, 0.14603233337402344, 0.15172958374023438, 0.1574268341064453, 0.16312408447265625, 0.1688213348388672, 0.17451858520507812, 0.18021583557128906, 0.1859130859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 10.0, 14.0, 22.0, 25.0, 39.0, 92.0, 91.0, 101.0, 118.0, 142.0, 102.0, 72.0, 49.0, 37.0, 25.0, 14.0, 14.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12697792053222656, -0.12163162231445312, -0.11628532409667969, -0.11093902587890625, -0.10559272766113281, -0.10024642944335938, -0.09490013122558594, -0.0895538330078125, -0.08420753479003906, -0.07886123657226562, -0.07351493835449219, -0.06816864013671875, -0.06282234191894531, -0.057476043701171875, -0.05212974548339844, -0.046783447265625, -0.04143714904785156, -0.036090850830078125, -0.030744552612304688, -0.02539825439453125, -0.020051956176757812, -0.014705657958984375, -0.009359359741210938, -0.0040130615234375, 0.0013332366943359375, 0.006679534912109375, 0.012025833129882812, 0.01737213134765625, 0.022718429565429688, 0.028064727783203125, 0.03341102600097656, 0.03875732421875, 0.04410362243652344, 0.049449920654296875, 0.05479621887207031, 0.06014251708984375, 0.06548881530761719, 0.07083511352539062, 0.07618141174316406, 0.0815277099609375, 0.08687400817871094, 0.09222030639648438, 0.09756660461425781, 0.10291290283203125, 0.10825920104980469, 0.11360549926757812, 0.11895179748535156, 0.124298095703125, 0.12964439392089844, 0.13499069213867188, 0.1403369903564453, 0.14568328857421875, 0.1510295867919922, 0.15637588500976562, 0.16172218322753906, 0.1670684814453125, 0.17241477966308594, 0.17776107788085938, 0.1831073760986328, 0.18845367431640625, 0.1937999725341797, 0.19914627075195312, 0.20449256896972656, 0.2098388671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 17.0, 21.0, 42.0, 118.0, 167.0, 227.0, 186.0, 120.0, 61.0, 27.0, 11.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578588485717773, -5.4339165687561035, -5.289245128631592, -5.144573211669922, -4.999901294708252, -4.855229377746582, -4.71055793762207, -4.5658860206604, -4.4212141036987305, -4.2765421867370605, -4.131870746612549, -3.987198829650879, -3.842526912689209, -3.697855234146118, -3.5531835556030273, -3.4085116386413574, -3.2638401985168457, -3.119168519973755, -2.974496603012085, -2.829824924468994, -2.685153007507324, -2.5404813289642334, -2.3958096504211426, -2.2511377334594727, -2.106466054916382, -1.9617942571640015, -1.817122459411621, -1.6724507808685303, -1.52777898311615, -1.3831071853637695, -1.2384355068206787, -1.0937637090682983, -0.949091911315918, -0.8044201135635376, -0.659748375415802, -0.5150766372680664, -0.37040483951568604, -0.22573304176330566, -0.08106130361557007, 0.06361043453216553, 0.2082822322845459, 0.3529540002346039, 0.49762576818466187, 0.6422975063323975, 0.7869693040847778, 0.9316411018371582, 1.076312780380249, 1.2209845781326294, 1.3656563758850098, 1.5103281736373901, 1.6549999713897705, 1.7996716499328613, 1.9443434476852417, 2.089015245437622, 2.233686923980713, 2.378358840942383, 2.5230305194854736, 2.6677021980285645, 2.8123741149902344, 2.957045793533325, 3.101717472076416, 3.246389389038086, 3.3910610675811768, 3.5357327461242676, 3.6804046630859375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 17.0, 11.0, 12.0, 30.0, 24.0, 20.0, 20.0, 39.0, 33.0, 48.0, 38.0, 44.0, 50.0, 56.0, 60.0, 53.0, 56.0, 42.0, 44.0, 39.0, 41.0, 28.0, 43.0, 18.0, 16.0, 17.0, 24.0, 17.0, 10.0, 8.0, 7.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8105566501617432, -1.7394604682922363, -1.6683642864227295, -1.5972681045532227, -1.5261719226837158, -1.455075740814209, -1.3839796781539917, -1.3128834962844849, -1.241787314414978, -1.1706911325454712, -1.0995949506759644, -1.0284987688064575, -0.9574026465415955, -0.8863064646720886, -0.8152103424072266, -0.7441141605377197, -0.6730179786682129, -0.601921796798706, -0.5308256149291992, -0.45972949266433716, -0.3886333107948303, -0.3175371289253235, -0.24644097685813904, -0.1753448247909546, -0.10424864292144775, -0.03315247595310211, 0.03794369101524353, 0.10903985798358917, 0.18013602495193481, 0.25123220682144165, 0.3223283588886261, 0.39342451095581055, 0.4645209312438965, 0.5356171131134033, 0.6067132949829102, 0.6778094172477722, 0.748905599117279, 0.8200017809867859, 0.891097903251648, 0.9621940851211548, 1.0332902669906616, 1.1043864488601685, 1.1754826307296753, 1.2465788125991821, 1.3176748752593994, 1.3887710571289062, 1.459867238998413, 1.53096342086792, 1.6020596027374268, 1.6731557846069336, 1.7442519664764404, 1.8153481483459473, 1.886444330215454, 1.957540512084961, 2.0286366939544678, 2.0997328758239746, 2.1708288192749023, 2.241925001144409, 2.313021183013916, 2.384117364883423, 2.4552135467529297, 2.5263097286224365, 2.5974059104919434, 2.668501853942871, 2.739598274230957]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 1.0, 7.0, 7.0, 16.0, 18.0, 21.0, 33.0, 43.0, 76.0, 129.0, 215.0, 369.0, 715.0, 1403.0, 2990.0, 7243.0, 20670.0, 78737.0, 950472.0, 3000242.0, 92867.0, 23752.0, 8022.0, 3218.0, 1459.0, 667.0, 343.0, 181.0, 114.0, 70.0, 50.0, 45.0, 23.0, 19.0, 19.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5348129272460938, -0.5164031982421875, -0.49799346923828125, -0.479583740234375, -0.46117401123046875, -0.4427642822265625, -0.42435455322265625, -0.40594482421875, -0.38753509521484375, -0.3691253662109375, -0.35071563720703125, -0.332305908203125, -0.31389617919921875, -0.2954864501953125, -0.27707672119140625, -0.2586669921875, -0.24025726318359375, -0.2218475341796875, -0.20343780517578125, -0.185028076171875, -0.16661834716796875, -0.1482086181640625, -0.12979888916015625, -0.11138916015625, -0.09297943115234375, -0.0745697021484375, -0.05615997314453125, -0.037750244140625, -0.01934051513671875, -0.0009307861328125, 0.01747894287109375, 0.035888671875, 0.05429840087890625, 0.0727081298828125, 0.09111785888671875, 0.109527587890625, 0.12793731689453125, 0.1463470458984375, 0.16475677490234375, 0.18316650390625, 0.20157623291015625, 0.2199859619140625, 0.23839569091796875, 0.256805419921875, 0.27521514892578125, 0.2936248779296875, 0.31203460693359375, 0.3304443359375, 0.34885406494140625, 0.3672637939453125, 0.38567352294921875, 0.404083251953125, 0.42249298095703125, 0.4409027099609375, 0.45931243896484375, 0.47772216796875, 0.49613189697265625, 0.5145416259765625, 0.5329513549804688, 0.551361083984375, 0.5697708129882812, 0.5881805419921875, 0.6065902709960938, 0.625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 15.0, 10.0, 17.0, 14.0, 21.0, 20.0, 34.0, 36.0, 38.0, 50.0, 57.0, 71.0, 53.0, 73.0, 78.0, 49.0, 50.0, 50.0, 47.0, 40.0, 43.0, 32.0, 18.0, 24.0, 11.0, 15.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10906982421875, -0.10496807098388672, -0.10086631774902344, -0.09676456451416016, -0.09266281127929688, -0.0885610580444336, -0.08445930480957031, -0.08035755157470703, -0.07625579833984375, -0.07215404510498047, -0.06805229187011719, -0.0639505386352539, -0.059848785400390625, -0.055747032165527344, -0.05164527893066406, -0.04754352569580078, -0.0434417724609375, -0.03934001922607422, -0.03523826599121094, -0.031136512756347656, -0.027034759521484375, -0.022933006286621094, -0.018831253051757812, -0.014729499816894531, -0.01062774658203125, -0.006525993347167969, -0.0024242401123046875, 0.0016775131225585938, 0.005779266357421875, 0.009881019592285156, 0.013982772827148438, 0.01808452606201172, 0.022186279296875, 0.02628803253173828, 0.030389785766601562, 0.034491539001464844, 0.038593292236328125, 0.042695045471191406, 0.04679679870605469, 0.05089855194091797, 0.05500030517578125, 0.05910205841064453, 0.06320381164550781, 0.0673055648803711, 0.07140731811523438, 0.07550907135009766, 0.07961082458496094, 0.08371257781982422, 0.0878143310546875, 0.09191608428955078, 0.09601783752441406, 0.10011959075927734, 0.10422134399414062, 0.1083230972290039, 0.11242485046386719, 0.11652660369873047, 0.12062835693359375, 0.12473011016845703, 0.1288318634033203, 0.1329336166381836, 0.13703536987304688, 0.14113712310791016, 0.14523887634277344, 0.14934062957763672, 0.1534423828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 3.0, 12.0, 9.0, 23.0, 22.0, 33.0, 53.0, 66.0, 97.0, 126.0, 187.0, 237.0, 422.0, 579.0, 834.0, 1393.0, 2264.0, 4007.0, 7570.0, 16065.0, 38816.0, 113913.0, 680108.0, 3045051.0, 184003.0, 54648.0, 21516.0, 9812.0, 4937.0, 2713.0, 1636.0, 980.0, 679.0, 421.0, 280.0, 204.0, 150.0, 106.0, 81.0, 65.0, 43.0, 32.0, 22.0, 6.0, 11.0, 19.0, 10.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.367919921875, -0.3557281494140625, -0.343536376953125, -0.3313446044921875, -0.31915283203125, -0.3069610595703125, -0.294769287109375, -0.2825775146484375, -0.2703857421875, -0.2581939697265625, -0.246002197265625, -0.2338104248046875, -0.22161865234375, -0.2094268798828125, -0.197235107421875, -0.1850433349609375, -0.1728515625, -0.1606597900390625, -0.148468017578125, -0.1362762451171875, -0.12408447265625, -0.1118927001953125, -0.099700927734375, -0.0875091552734375, -0.0753173828125, -0.0631256103515625, -0.050933837890625, -0.0387420654296875, -0.02655029296875, -0.0143585205078125, -0.002166748046875, 0.0100250244140625, 0.022216796875, 0.0344085693359375, 0.046600341796875, 0.0587921142578125, 0.07098388671875, 0.0831756591796875, 0.095367431640625, 0.1075592041015625, 0.1197509765625, 0.1319427490234375, 0.144134521484375, 0.1563262939453125, 0.16851806640625, 0.1807098388671875, 0.192901611328125, 0.2050933837890625, 0.21728515625, 0.2294769287109375, 0.241668701171875, 0.2538604736328125, 0.26605224609375, 0.2782440185546875, 0.290435791015625, 0.3026275634765625, 0.3148193359375, 0.3270111083984375, 0.339202880859375, 0.3513946533203125, 0.36358642578125, 0.3757781982421875, 0.387969970703125, 0.4001617431640625, 0.412353515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 11.0, 6.0, 9.0, 18.0, 21.0, 21.0, 44.0, 63.0, 94.0, 114.0, 236.0, 680.0, 1934.0, 357.0, 142.0, 98.0, 56.0, 44.0, 27.0, 19.0, 21.0, 9.0, 6.0, 6.0, 5.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1885986328125, -0.18214035034179688, -0.17568206787109375, -0.16922378540039062, -0.1627655029296875, -0.15630722045898438, -0.14984893798828125, -0.14339065551757812, -0.136932373046875, -0.13047409057617188, -0.12401580810546875, -0.11755752563476562, -0.1110992431640625, -0.10464096069335938, -0.09818267822265625, -0.09172439575195312, -0.08526611328125, -0.07880783081054688, -0.07234954833984375, -0.06589126586914062, -0.0594329833984375, -0.052974700927734375, -0.04651641845703125, -0.040058135986328125, -0.033599853515625, -0.027141571044921875, -0.02068328857421875, -0.014225006103515625, -0.0077667236328125, -0.001308441162109375, 0.00514984130859375, 0.011608123779296875, 0.01806640625, 0.024524688720703125, 0.03098297119140625, 0.037441253662109375, 0.0438995361328125, 0.050357818603515625, 0.05681610107421875, 0.06327438354492188, 0.069732666015625, 0.07619094848632812, 0.08264923095703125, 0.08910751342773438, 0.0955657958984375, 0.10202407836914062, 0.10848236083984375, 0.11494064331054688, 0.12139892578125, 0.12785720825195312, 0.13431549072265625, 0.14077377319335938, 0.1472320556640625, 0.15369033813476562, 0.16014862060546875, 0.16660690307617188, 0.173065185546875, 0.17952346801757812, 0.18598175048828125, 0.19244003295898438, 0.1988983154296875, 0.20535659790039062, 0.21181488037109375, 0.21827316284179688, 0.2247314453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 10.0, 19.0, 57.0, 113.0, 228.0, 260.0, 169.0, 81.0, 42.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6335906982421875, -2.5561323165893555, -2.4786739349365234, -2.4012155532836914, -2.3237571716308594, -2.2462987899780273, -2.1688404083251953, -2.0913820266723633, -2.0139236450195312, -1.9364652633666992, -1.8590068817138672, -1.7815485000610352, -1.7040901184082031, -1.626631736755371, -1.549173355102539, -1.471714973449707, -1.3942567110061646, -1.3167983293533325, -1.2393399477005005, -1.1618815660476685, -1.0844231843948364, -1.0069648027420044, -0.9295064806938171, -0.8520480990409851, -0.7745897173881531, -0.697131335735321, -0.619672954082489, -0.5422146320343018, -0.46475622057914734, -0.3872978389263153, -0.30983948707580566, -0.23238110542297363, -0.1549227237701416, -0.07746434956789017, -5.97536563873291e-06, 0.0774523913860321, 0.15491077303886414, 0.23236915469169617, 0.3098275065422058, 0.38728588819503784, 0.4647442698478699, 0.5422026515007019, 0.6196610331535339, 0.6971193552017212, 0.7745777368545532, 0.8520361185073853, 0.9294945001602173, 1.0069528818130493, 1.0844112634658813, 1.1618696451187134, 1.2393280267715454, 1.3167864084243774, 1.3942447900772095, 1.4717031717300415, 1.549161434173584, 1.626619815826416, 1.704078197479248, 1.78153657913208, 1.858994960784912, 1.9364533424377441, 2.013911724090576, 2.091370105743408, 2.1688284873962402, 2.2462868690490723, 2.3237452507019043]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 15.0, 18.0, 18.0, 20.0, 18.0, 23.0, 19.0, 38.0, 37.0, 32.0, 48.0, 44.0, 49.0, 44.0, 57.0, 61.0, 53.0, 47.0, 41.0, 47.0, 34.0, 35.0, 30.0, 25.0, 26.0, 18.0, 17.0, 12.0, 13.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8055421113967896, -0.7815641760826111, -0.7575863003730774, -0.7336083650588989, -0.7096304893493652, -0.6856525540351868, -0.6616746187210083, -0.6376967430114746, -0.6137188673019409, -0.5897409319877625, -0.5657630562782288, -0.5417851209640503, -0.5178072452545166, -0.49382930994033813, -0.46985140442848206, -0.445873498916626, -0.4218955636024475, -0.39791765809059143, -0.37393975257873535, -0.3499618172645569, -0.3259839415550232, -0.3020060062408447, -0.27802810072898865, -0.25405019521713257, -0.2300722897052765, -0.2060943841934204, -0.18211647868156433, -0.15813855826854706, -0.13416065275669098, -0.1101827472448349, -0.08620482683181763, -0.06222692131996155, -0.03824895620346069, -0.014271046966314316, 0.009706862270832062, 0.03368477523326874, 0.05766268074512482, 0.0816405862569809, 0.10561850666999817, 0.12959641218185425, 0.15357431769371033, 0.1775522232055664, 0.20153012871742249, 0.22550804913043976, 0.24948595464229584, 0.2734638452529907, 0.2974417805671692, 0.32141968607902527, 0.34539759159088135, 0.3693754971027374, 0.3933534026145935, 0.417331337928772, 0.44130921363830566, 0.46528714895248413, 0.4892650544643402, 0.5132429599761963, 0.53722083568573, 0.5611987709999084, 0.5851766467094421, 0.6091545820236206, 0.6331324577331543, 0.6571103930473328, 0.6810883283615112, 0.7050662040710449, 0.7290441393852234]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 13.0, 9.0, 27.0, 30.0, 53.0, 94.0, 125.0, 248.0, 415.0, 707.0, 1324.0, 2493.0, 4800.0, 9497.0, 19990.0, 40600.0, 79600.0, 157342.0, 329229.0, 203331.0, 98442.0, 50311.0, 25025.0, 12198.0, 6083.0, 2941.0, 1537.0, 875.0, 475.0, 267.0, 154.0, 91.0, 72.0, 44.0, 32.0, 24.0, 8.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2509613037109375, -0.241180419921875, -0.2313995361328125, -0.22161865234375, -0.2118377685546875, -0.202056884765625, -0.1922760009765625, -0.1824951171875, -0.1727142333984375, -0.162933349609375, -0.1531524658203125, -0.14337158203125, -0.1335906982421875, -0.123809814453125, -0.1140289306640625, -0.104248046875, -0.0944671630859375, -0.084686279296875, -0.0749053955078125, -0.06512451171875, -0.0553436279296875, -0.045562744140625, -0.0357818603515625, -0.0260009765625, -0.0162200927734375, -0.006439208984375, 0.0033416748046875, 0.01312255859375, 0.0229034423828125, 0.032684326171875, 0.0424652099609375, 0.05224609375, 0.0620269775390625, 0.071807861328125, 0.0815887451171875, 0.09136962890625, 0.1011505126953125, 0.110931396484375, 0.1207122802734375, 0.1304931640625, 0.1402740478515625, 0.150054931640625, 0.1598358154296875, 0.16961669921875, 0.1793975830078125, 0.189178466796875, 0.1989593505859375, 0.208740234375, 0.2185211181640625, 0.228302001953125, 0.2380828857421875, 0.24786376953125, 0.2576446533203125, 0.267425537109375, 0.2772064208984375, 0.2869873046875, 0.2967681884765625, 0.306549072265625, 0.3163299560546875, 0.32611083984375, 0.3358917236328125, 0.345672607421875, 0.3554534912109375, 0.365234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 7.0, 14.0, 11.0, 5.0, 8.0, 21.0, 21.0, 16.0, 16.0, 22.0, 22.0, 28.0, 37.0, 41.0, 44.0, 52.0, 48.0, 55.0, 40.0, 54.0, 36.0, 47.0, 47.0, 35.0, 27.0, 24.0, 36.0, 33.0, 26.0, 22.0, 15.0, 13.0, 13.0, 11.0, 10.0, 8.0, 5.0, 9.0, 1.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1033935546875, -0.10030269622802734, -0.09721183776855469, -0.09412097930908203, -0.09103012084960938, -0.08793926239013672, -0.08484840393066406, -0.0817575454711914, -0.07866668701171875, -0.0755758285522461, -0.07248497009277344, -0.06939411163330078, -0.06630325317382812, -0.06321239471435547, -0.06012153625488281, -0.057030677795410156, -0.0539398193359375, -0.050848960876464844, -0.04775810241699219, -0.04466724395751953, -0.041576385498046875, -0.03848552703857422, -0.03539466857910156, -0.032303810119628906, -0.02921295166015625, -0.026122093200683594, -0.023031234741210938, -0.01994037628173828, -0.016849517822265625, -0.013758659362792969, -0.010667800903320312, -0.007576942443847656, -0.004486083984375, -0.0013952255249023438, 0.0016956329345703125, 0.004786491394042969, 0.007877349853515625, 0.010968208312988281, 0.014059066772460938, 0.017149925231933594, 0.02024078369140625, 0.023331642150878906, 0.026422500610351562, 0.02951335906982422, 0.032604217529296875, 0.03569507598876953, 0.03878593444824219, 0.041876792907714844, 0.0449676513671875, 0.048058509826660156, 0.05114936828613281, 0.05424022674560547, 0.057331085205078125, 0.06042194366455078, 0.06351280212402344, 0.0666036605834961, 0.06969451904296875, 0.0727853775024414, 0.07587623596191406, 0.07896709442138672, 0.08205795288085938, 0.08514881134033203, 0.08823966979980469, 0.09133052825927734, 0.09442138671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 8.0, 24.0, 28.0, 27.0, 43.0, 66.0, 91.0, 113.0, 174.0, 247.0, 385.0, 683.0, 1229.0, 3382.0, 15507.0, 105175.0, 663638.0, 218269.0, 29863.0, 5536.0, 1809.0, 784.0, 469.0, 264.0, 221.0, 125.0, 85.0, 62.0, 66.0, 45.0, 31.0, 19.0, 18.0, 10.0, 3.0, 9.0, 7.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75, -0.725555419921875, -0.70111083984375, -0.676666259765625, -0.6522216796875, -0.627777099609375, -0.60333251953125, -0.578887939453125, -0.554443359375, -0.529998779296875, -0.50555419921875, -0.481109619140625, -0.4566650390625, -0.432220458984375, -0.40777587890625, -0.383331298828125, -0.35888671875, -0.334442138671875, -0.30999755859375, -0.285552978515625, -0.2611083984375, -0.236663818359375, -0.21221923828125, -0.187774658203125, -0.163330078125, -0.138885498046875, -0.11444091796875, -0.089996337890625, -0.0655517578125, -0.041107177734375, -0.01666259765625, 0.007781982421875, 0.0322265625, 0.056671142578125, 0.08111572265625, 0.105560302734375, 0.1300048828125, 0.154449462890625, 0.17889404296875, 0.203338623046875, 0.227783203125, 0.252227783203125, 0.27667236328125, 0.301116943359375, 0.3255615234375, 0.350006103515625, 0.37445068359375, 0.398895263671875, 0.42333984375, 0.447784423828125, 0.47222900390625, 0.496673583984375, 0.5211181640625, 0.545562744140625, 0.57000732421875, 0.594451904296875, 0.618896484375, 0.643341064453125, 0.66778564453125, 0.692230224609375, 0.7166748046875, 0.741119384765625, 0.76556396484375, 0.790008544921875, 0.814453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 8.0, 9.0, 8.0, 14.0, 21.0, 19.0, 29.0, 31.0, 35.0, 40.0, 37.0, 55.0, 43.0, 43.0, 49.0, 55.0, 59.0, 51.0, 55.0, 48.0, 50.0, 37.0, 38.0, 26.0, 18.0, 24.0, 19.0, 15.0, 18.0, 4.0, 8.0, 6.0, 5.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5070266723632812, -0.4886627197265625, -0.47029876708984375, -0.451934814453125, -0.43357086181640625, -0.4152069091796875, -0.39684295654296875, -0.37847900390625, -0.36011505126953125, -0.3417510986328125, -0.32338714599609375, -0.305023193359375, -0.28665924072265625, -0.2682952880859375, -0.24993133544921875, -0.2315673828125, -0.21320343017578125, -0.1948394775390625, -0.17647552490234375, -0.158111572265625, -0.13974761962890625, -0.1213836669921875, -0.10301971435546875, -0.08465576171875, -0.06629180908203125, -0.0479278564453125, -0.02956390380859375, -0.011199951171875, 0.00716400146484375, 0.0255279541015625, 0.04389190673828125, 0.062255859375, 0.08061981201171875, 0.0989837646484375, 0.11734771728515625, 0.135711669921875, 0.15407562255859375, 0.1724395751953125, 0.19080352783203125, 0.20916748046875, 0.22753143310546875, 0.2458953857421875, 0.26425933837890625, 0.282623291015625, 0.30098724365234375, 0.3193511962890625, 0.33771514892578125, 0.3560791015625, 0.37444305419921875, 0.3928070068359375, 0.41117095947265625, 0.429534912109375, 0.44789886474609375, 0.4662628173828125, 0.48462677001953125, 0.50299072265625, 0.5213546752929688, 0.5397186279296875, 0.5580825805664062, 0.576446533203125, 0.5948104858398438, 0.6131744384765625, 0.6315383911132812, 0.64990234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 7.0, 10.0, 12.0, 20.0, 40.0, 54.0, 121.0, 205.0, 495.0, 1149.0, 3132.0, 14443.0, 141881.0, 813672.0, 60985.0, 8534.0, 2240.0, 795.0, 357.0, 183.0, 80.0, 53.0, 27.0, 21.0, 10.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63037109375, -0.6120147705078125, -0.593658447265625, -0.5753021240234375, -0.55694580078125, -0.5385894775390625, -0.520233154296875, -0.5018768310546875, -0.4835205078125, -0.4651641845703125, -0.446807861328125, -0.4284515380859375, -0.41009521484375, -0.3917388916015625, -0.373382568359375, -0.3550262451171875, -0.336669921875, -0.3183135986328125, -0.299957275390625, -0.2816009521484375, -0.26324462890625, -0.2448883056640625, -0.226531982421875, -0.2081756591796875, -0.1898193359375, -0.1714630126953125, -0.153106689453125, -0.1347503662109375, -0.11639404296875, -0.0980377197265625, -0.079681396484375, -0.0613250732421875, -0.04296875, -0.0246124267578125, -0.006256103515625, 0.0121002197265625, 0.03045654296875, 0.0488128662109375, 0.067169189453125, 0.0855255126953125, 0.1038818359375, 0.1222381591796875, 0.140594482421875, 0.1589508056640625, 0.17730712890625, 0.1956634521484375, 0.214019775390625, 0.2323760986328125, 0.250732421875, 0.2690887451171875, 0.287445068359375, 0.3058013916015625, 0.32415771484375, 0.3425140380859375, 0.360870361328125, 0.3792266845703125, 0.3975830078125, 0.4159393310546875, 0.434295654296875, 0.4526519775390625, 0.47100830078125, 0.4893646240234375, 0.507720947265625, 0.5260772705078125, 0.54443359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 21.0, 20.0, 43.0, 47.0, 75.0, 98.0, 112.0, 139.0, 122.0, 71.0, 85.0, 42.0, 32.0, 31.0, 17.0, 18.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.279085159301758e-05, -7.890816777944565e-05, -7.502548396587372e-05, -7.114280015230179e-05, -6.726011633872986e-05, -6.337743252515793e-05, -5.9494748711586e-05, -5.561206489801407e-05, -5.172938108444214e-05, -4.784669727087021e-05, -4.396401345729828e-05, -4.008132964372635e-05, -3.619864583015442e-05, -3.231596201658249e-05, -2.843327820301056e-05, -2.455059438943863e-05, -2.06679105758667e-05, -1.678522676229477e-05, -1.290254294872284e-05, -9.01985913515091e-06, -5.1371753215789795e-06, -1.2544915080070496e-06, 2.6281923055648804e-06, 6.51087611913681e-06, 1.039355993270874e-05, 1.427624374628067e-05, 1.81589275598526e-05, 2.204161137342453e-05, 2.592429518699646e-05, 2.980697900056839e-05, 3.368966281414032e-05, 3.757234662771225e-05, 4.145503044128418e-05, 4.533771425485611e-05, 4.922039806842804e-05, 5.310308188199997e-05, 5.69857656955719e-05, 6.086844950914383e-05, 6.475113332271576e-05, 6.863381713628769e-05, 7.251650094985962e-05, 7.639918476343155e-05, 8.028186857700348e-05, 8.416455239057541e-05, 8.804723620414734e-05, 9.192992001771927e-05, 9.58126038312912e-05, 9.969528764486313e-05, 0.00010357797145843506, 0.00010746065527200699, 0.00011134333908557892, 0.00011522602289915085, 0.00011910870671272278, 0.0001229913905262947, 0.00012687407433986664, 0.00013075675815343857, 0.0001346394419670105, 0.00013852212578058243, 0.00014240480959415436, 0.0001462874934077263, 0.00015017017722129822, 0.00015405286103487015, 0.00015793554484844208, 0.000161818228662014, 0.00016570091247558594]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 15.0, 27.0, 18.0, 46.0, 38.0, 79.0, 116.0, 227.0, 377.0, 732.0, 1630.0, 3959.0, 12517.0, 67374.0, 660942.0, 258411.0, 29781.0, 7133.0, 2615.0, 1118.0, 601.0, 267.0, 170.0, 100.0, 56.0, 49.0, 33.0, 31.0, 11.0, 14.0, 10.0, 8.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.494384765625, -0.48130035400390625, -0.4682159423828125, -0.45513153076171875, -0.442047119140625, -0.42896270751953125, -0.4158782958984375, -0.40279388427734375, -0.38970947265625, -0.37662506103515625, -0.3635406494140625, -0.35045623779296875, -0.337371826171875, -0.32428741455078125, -0.3112030029296875, -0.29811859130859375, -0.2850341796875, -0.27194976806640625, -0.2588653564453125, -0.24578094482421875, -0.232696533203125, -0.21961212158203125, -0.2065277099609375, -0.19344329833984375, -0.18035888671875, -0.16727447509765625, -0.1541900634765625, -0.14110565185546875, -0.128021240234375, -0.11493682861328125, -0.1018524169921875, -0.08876800537109375, -0.07568359375, -0.06259918212890625, -0.0495147705078125, -0.03643035888671875, -0.023345947265625, -0.01026153564453125, 0.0028228759765625, 0.01590728759765625, 0.02899169921875, 0.04207611083984375, 0.0551605224609375, 0.06824493408203125, 0.081329345703125, 0.09441375732421875, 0.1074981689453125, 0.12058258056640625, 0.1336669921875, 0.14675140380859375, 0.1598358154296875, 0.17292022705078125, 0.186004638671875, 0.19908905029296875, 0.2121734619140625, 0.22525787353515625, 0.23834228515625, 0.25142669677734375, 0.2645111083984375, 0.27759552001953125, 0.290679931640625, 0.30376434326171875, 0.3168487548828125, 0.32993316650390625, 0.343017578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 3.0, 9.0, 9.0, 6.0, 8.0, 23.0, 10.0, 18.0, 41.0, 50.0, 58.0, 94.0, 105.0, 112.0, 97.0, 91.0, 65.0, 51.0, 32.0, 28.0, 18.0, 10.0, 12.0, 3.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.261474609375, -0.253173828125, -0.244873046875, -0.236572265625, -0.228271484375, -0.219970703125, -0.211669921875, -0.203369140625, -0.195068359375, -0.186767578125, -0.178466796875, -0.170166015625, -0.161865234375, -0.153564453125, -0.145263671875, -0.136962890625, -0.128662109375, -0.120361328125, -0.112060546875, -0.103759765625, -0.095458984375, -0.087158203125, -0.078857421875, -0.070556640625, -0.062255859375, -0.053955078125, -0.045654296875, -0.037353515625, -0.029052734375, -0.020751953125, -0.012451171875, -0.004150390625, 0.004150390625, 0.012451171875, 0.020751953125, 0.029052734375, 0.037353515625, 0.045654296875, 0.053955078125, 0.062255859375, 0.070556640625, 0.078857421875, 0.087158203125, 0.095458984375, 0.103759765625, 0.112060546875, 0.120361328125, 0.128662109375, 0.136962890625, 0.145263671875, 0.153564453125, 0.161865234375, 0.170166015625, 0.178466796875, 0.186767578125, 0.195068359375, 0.203369140625, 0.211669921875, 0.219970703125, 0.228271484375, 0.236572265625, 0.244873046875, 0.253173828125, 0.261474609375, 0.269775390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 25.0, 52.0, 92.0, 162.0, 206.0, 187.0, 141.0, 69.0, 24.0, 20.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888030529022217, -3.6912710666656494, -3.494511604309082, -3.2977523803710938, -3.1009926795959473, -2.904233455657959, -2.7074739933013916, -2.510714530944824, -2.313955068588257, -2.1171956062316895, -1.920436143875122, -1.7236768007278442, -1.5269173383712769, -1.3301578760147095, -1.1333985328674316, -0.9366390705108643, -0.7398796081542969, -0.5431201457977295, -0.3463607430458069, -0.14960134029388428, 0.047158122062683105, 0.2439175844192505, 0.4406769275665283, 0.6374363899230957, 0.8341958522796631, 1.0309553146362305, 1.2277147769927979, 1.4244741201400757, 1.621233582496643, 1.8179930448532104, 2.0147523880004883, 2.2115118503570557, 2.408270835876465, 2.6050302982330322, 2.8017897605895996, 2.998548984527588, 3.1953086853027344, 3.3920679092407227, 3.58882737159729, 3.7855868339538574, 3.982346296310425, 4.179105758666992, 4.3758649826049805, 4.572624683380127, 4.769383907318115, 4.966143608093262, 5.16290283203125, 5.359662055969238, 5.556421756744385, 5.753180980682373, 5.9499406814575195, 6.146699905395508, 6.343459606170654, 6.540218830108643, 6.736978530883789, 6.933737754821777, 7.130496978759766, 7.327256202697754, 7.5240159034729, 7.720775127410889, 7.917534828186035, 8.114294052124023, 8.311053276062012, 8.5078125, 8.704572677612305]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 7.0, 11.0, 12.0, 16.0, 11.0, 21.0, 24.0, 18.0, 35.0, 35.0, 26.0, 28.0, 30.0, 27.0, 46.0, 45.0, 44.0, 44.0, 49.0, 45.0, 36.0, 39.0, 39.0, 35.0, 36.0, 28.0, 25.0, 22.0, 22.0, 20.0, 10.0, 14.0, 11.0, 15.0, 12.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.72670316696167, -2.643937587738037, -2.5611722469329834, -2.4784066677093506, -2.3956410884857178, -2.312875747680664, -2.2301101684570312, -2.1473445892333984, -2.0645790100097656, -1.9818135499954224, -1.8990479707717896, -1.8162825107574463, -1.7335169315338135, -1.6507514715194702, -1.567986011505127, -1.4852204322814941, -1.4024550914764404, -1.3196896314620972, -1.2369240522384644, -1.154158592224121, -1.0713930130004883, -0.988627552986145, -0.9058620929718018, -0.8230965733528137, -0.7403310537338257, -0.6575655341148376, -0.5748000144958496, -0.49203455448150635, -0.4092690348625183, -0.3265035152435303, -0.24373802542686462, -0.16097253561019897, -0.07820701599121094, 0.004558488726615906, 0.08732399344444275, 0.1700894981622696, 0.25285500288009644, 0.3356205224990845, 0.4183860123157501, 0.5011515021324158, 0.5839170217514038, 0.6666825413703918, 0.7494480609893799, 0.8322135210037231, 0.9149790406227112, 0.9977445602416992, 1.0805100202560425, 1.1632754802703857, 1.2460410594940186, 1.3288065195083618, 1.4115720987319946, 1.494337558746338, 1.5771031379699707, 1.659868597984314, 1.7426340579986572, 1.82539963722229, 1.9081650972366333, 1.9909305572509766, 2.0736961364746094, 2.156461715698242, 2.239227056503296, 2.3219926357269287, 2.4047582149505615, 2.4875235557556152, 2.570289134979248]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 13.0, 12.0, 19.0, 27.0, 35.0, 53.0, 85.0, 125.0, 171.0, 288.0, 397.0, 589.0, 933.0, 1479.0, 2483.0, 3968.0, 6713.0, 12776.0, 26128.0, 61341.0, 199088.0, 2955625.0, 708090.0, 125347.0, 44842.0, 19573.0, 10169.0, 5610.0, 3108.0, 1835.0, 1178.0, 748.0, 483.0, 300.0, 224.0, 132.0, 110.0, 48.0, 37.0, 28.0, 22.0, 21.0, 17.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.354248046875, -0.34236907958984375, -0.3304901123046875, -0.31861114501953125, -0.306732177734375, -0.29485321044921875, -0.2829742431640625, -0.27109527587890625, -0.25921630859375, -0.24733734130859375, -0.2354583740234375, -0.22357940673828125, -0.211700439453125, -0.19982147216796875, -0.1879425048828125, -0.17606353759765625, -0.1641845703125, -0.15230560302734375, -0.1404266357421875, -0.12854766845703125, -0.116668701171875, -0.10478973388671875, -0.0929107666015625, -0.08103179931640625, -0.06915283203125, -0.05727386474609375, -0.0453948974609375, -0.03351593017578125, -0.021636962890625, -0.00975799560546875, 0.0021209716796875, 0.01399993896484375, 0.02587890625, 0.03775787353515625, 0.0496368408203125, 0.06151580810546875, 0.073394775390625, 0.08527374267578125, 0.0971527099609375, 0.10903167724609375, 0.12091064453125, 0.13278961181640625, 0.1446685791015625, 0.15654754638671875, 0.168426513671875, 0.18030548095703125, 0.1921844482421875, 0.20406341552734375, 0.2159423828125, 0.22782135009765625, 0.2397003173828125, 0.25157928466796875, 0.263458251953125, 0.27533721923828125, 0.2872161865234375, 0.29909515380859375, 0.31097412109375, 0.32285308837890625, 0.3347320556640625, 0.34661102294921875, 0.358489990234375, 0.37036895751953125, 0.3822479248046875, 0.39412689208984375, 0.406005859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 8.0, 9.0, 8.0, 14.0, 10.0, 15.0, 8.0, 26.0, 21.0, 31.0, 26.0, 40.0, 26.0, 38.0, 41.0, 46.0, 42.0, 58.0, 49.0, 23.0, 53.0, 49.0, 35.0, 39.0, 44.0, 39.0, 32.0, 21.0, 21.0, 22.0, 17.0, 12.0, 12.0, 10.0, 12.0, 15.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1058349609375, -0.10247993469238281, -0.09912490844726562, -0.09576988220214844, -0.09241485595703125, -0.08905982971191406, -0.08570480346679688, -0.08234977722167969, -0.0789947509765625, -0.07563972473144531, -0.07228469848632812, -0.06892967224121094, -0.06557464599609375, -0.06221961975097656, -0.058864593505859375, -0.05550956726074219, -0.052154541015625, -0.04879951477050781, -0.045444488525390625, -0.04208946228027344, -0.03873443603515625, -0.03537940979003906, -0.032024383544921875, -0.028669357299804688, -0.0253143310546875, -0.021959304809570312, -0.018604278564453125, -0.015249252319335938, -0.01189422607421875, -0.008539199829101562, -0.005184173583984375, -0.0018291473388671875, 0.00152587890625, 0.0048809051513671875, 0.008235931396484375, 0.011590957641601562, 0.01494598388671875, 0.018301010131835938, 0.021656036376953125, 0.025011062622070312, 0.0283660888671875, 0.03172111511230469, 0.035076141357421875, 0.03843116760253906, 0.04178619384765625, 0.04514122009277344, 0.048496246337890625, 0.05185127258300781, 0.055206298828125, 0.05856132507324219, 0.061916351318359375, 0.06527137756347656, 0.06862640380859375, 0.07198143005371094, 0.07533645629882812, 0.07869148254394531, 0.0820465087890625, 0.08540153503417969, 0.08875656127929688, 0.09211158752441406, 0.09546661376953125, 0.09882164001464844, 0.10217666625976562, 0.10553169250488281, 0.10888671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 12.0, 17.0, 16.0, 15.0, 27.0, 49.0, 57.0, 88.0, 148.0, 274.0, 401.0, 650.0, 1247.0, 2220.0, 4596.0, 9543.0, 23360.0, 68074.0, 293350.0, 3211796.0, 439836.0, 87396.0, 28459.0, 11538.0, 5195.0, 2596.0, 1328.0, 770.0, 470.0, 253.0, 155.0, 104.0, 70.0, 41.0, 31.0, 29.0, 15.0, 10.0, 8.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48797607421875, -0.4725341796875, -0.45709228515625, -0.441650390625, -0.42620849609375, -0.4107666015625, -0.39532470703125, -0.3798828125, -0.36444091796875, -0.3489990234375, -0.33355712890625, -0.318115234375, -0.30267333984375, -0.2872314453125, -0.27178955078125, -0.25634765625, -0.24090576171875, -0.2254638671875, -0.21002197265625, -0.194580078125, -0.17913818359375, -0.1636962890625, -0.14825439453125, -0.1328125, -0.11737060546875, -0.1019287109375, -0.08648681640625, -0.071044921875, -0.05560302734375, -0.0401611328125, -0.02471923828125, -0.00927734375, 0.00616455078125, 0.0216064453125, 0.03704833984375, 0.052490234375, 0.06793212890625, 0.0833740234375, 0.09881591796875, 0.1142578125, 0.12969970703125, 0.1451416015625, 0.16058349609375, 0.176025390625, 0.19146728515625, 0.2069091796875, 0.22235107421875, 0.23779296875, 0.25323486328125, 0.2686767578125, 0.28411865234375, 0.299560546875, 0.31500244140625, 0.3304443359375, 0.34588623046875, 0.361328125, 0.37677001953125, 0.3922119140625, 0.40765380859375, 0.423095703125, 0.43853759765625, 0.4539794921875, 0.46942138671875, 0.48486328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 20.0, 19.0, 32.0, 34.0, 43.0, 73.0, 96.0, 138.0, 210.0, 463.0, 1566.0, 634.0, 255.0, 163.0, 92.0, 52.0, 34.0, 17.0, 25.0, 18.0, 10.0, 14.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2293701171875, -0.2216510772705078, -0.21393203735351562, -0.20621299743652344, -0.19849395751953125, -0.19077491760253906, -0.18305587768554688, -0.1753368377685547, -0.1676177978515625, -0.1598987579345703, -0.15217971801757812, -0.14446067810058594, -0.13674163818359375, -0.12902259826660156, -0.12130355834960938, -0.11358451843261719, -0.105865478515625, -0.09814643859863281, -0.09042739868164062, -0.08270835876464844, -0.07498931884765625, -0.06727027893066406, -0.059551239013671875, -0.05183219909667969, -0.0441131591796875, -0.03639411926269531, -0.028675079345703125, -0.020956039428710938, -0.01323699951171875, -0.0055179595947265625, 0.002201080322265625, 0.009920120239257812, 0.01763916015625, 0.025358200073242188, 0.033077239990234375, 0.04079627990722656, 0.04851531982421875, 0.05623435974121094, 0.06395339965820312, 0.07167243957519531, 0.0793914794921875, 0.08711051940917969, 0.09482955932617188, 0.10254859924316406, 0.11026763916015625, 0.11798667907714844, 0.12570571899414062, 0.1334247589111328, 0.141143798828125, 0.1488628387451172, 0.15658187866210938, 0.16430091857910156, 0.17201995849609375, 0.17973899841308594, 0.18745803833007812, 0.1951770782470703, 0.2028961181640625, 0.2106151580810547, 0.21833419799804688, 0.22605323791503906, 0.23377227783203125, 0.24149131774902344, 0.24921035766601562, 0.2569293975830078, 0.2646484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 7.0, 12.0, 10.0, 16.0, 36.0, 40.0, 65.0, 98.0, 113.0, 116.0, 148.0, 105.0, 77.0, 60.0, 36.0, 19.0, 18.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.112381935119629, -3.0518460273742676, -2.9913101196289062, -2.930774450302124, -2.8702385425567627, -2.8097026348114014, -2.74916672706604, -2.688631057739258, -2.6280951499938965, -2.567559242248535, -2.507023334503174, -2.4464876651763916, -2.3859517574310303, -2.325415849685669, -2.2648799419403076, -2.2043442726135254, -2.143808364868164, -2.0832724571228027, -2.0227365493774414, -1.9622007608413696, -1.9016649723052979, -1.8411290645599365, -1.7805932760238647, -1.7200573682785034, -1.659521460533142, -1.5989855527877808, -1.538449764251709, -1.4779138565063477, -1.4173780679702759, -1.3568421602249146, -1.2963063716888428, -1.2357704639434814, -1.1752345561981201, -1.1146986484527588, -1.054162859916687, -0.9936270117759705, -0.9330911636352539, -0.8725552558898926, -0.8120194673538208, -0.7514835596084595, -0.6909477710723877, -0.6304119229316711, -0.5698760747909546, -0.509340226650238, -0.4488043785095215, -0.38826850056648254, -0.327732652425766, -0.26719680428504944, -0.20666098594665527, -0.14612513780593872, -0.08558928221464157, -0.02505342662334442, 0.03548242151737213, 0.09601828455924988, 0.15655413269996643, 0.21708998084068298, 0.27762582898139954, 0.3381616771221161, 0.39869752526283264, 0.4592334032058716, 0.5197692513465881, 0.5803050994873047, 0.6408409476280212, 0.7013767957687378, 0.7619126439094543]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 7.0, 13.0, 17.0, 9.0, 25.0, 27.0, 21.0, 29.0, 21.0, 37.0, 30.0, 38.0, 55.0, 45.0, 44.0, 44.0, 40.0, 55.0, 39.0, 35.0, 44.0, 40.0, 37.0, 31.0, 26.0, 30.0, 25.0, 22.0, 13.0, 11.0, 14.0, 17.0, 8.0, 5.0, 15.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0752302408218384, -1.043684720993042, -1.0121392011642456, -0.9805936217308044, -0.9490481019020081, -0.9175025820732117, -0.8859570026397705, -0.8544114828109741, -0.8228659629821777, -0.7913204431533813, -0.759774923324585, -0.7282293438911438, -0.6966838240623474, -0.665138304233551, -0.6335927248001099, -0.6020472049713135, -0.5705016851425171, -0.5389561653137207, -0.5074106454849243, -0.47586506605148315, -0.44431954622268677, -0.4127740263938904, -0.3812284767627716, -0.34968292713165283, -0.31813740730285645, -0.28659188747406006, -0.2550463378429413, -0.2235008031129837, -0.19195526838302612, -0.16040973365306854, -0.12886419892311096, -0.09731866419315338, -0.06577318906784058, -0.034227654337882996, -0.002682119607925415, 0.028863415122032166, 0.060408949851989746, 0.09195448458194733, 0.12350001931190491, 0.1550455540418625, 0.18659108877182007, 0.21813662350177765, 0.24968215823173523, 0.281227707862854, 0.3127732276916504, 0.3443187475204468, 0.37586429715156555, 0.4074098467826843, 0.4389553666114807, 0.4705008864402771, 0.5020464658737183, 0.5335919857025146, 0.565137505531311, 0.5966830253601074, 0.6282285451889038, 0.659774124622345, 0.6913196444511414, 0.7228651642799377, 0.7544107437133789, 0.7859562635421753, 0.8175017833709717, 0.8490473031997681, 0.8805928230285645, 0.9121384024620056, 0.943683922290802]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 3.0, 7.0, 9.0, 22.0, 18.0, 36.0, 42.0, 89.0, 158.0, 258.0, 514.0, 999.0, 2178.0, 5024.0, 12486.0, 34518.0, 100354.0, 258254.0, 346223.0, 183767.0, 65543.0, 22790.0, 8473.0, 3481.0, 1569.0, 800.0, 408.0, 194.0, 122.0, 85.0, 31.0, 42.0, 15.0, 8.0, 10.0, 5.0, 12.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4599609375, -0.4461479187011719, -0.43233489990234375, -0.4185218811035156, -0.4047088623046875, -0.3908958435058594, -0.37708282470703125, -0.3632698059082031, -0.349456787109375, -0.3356437683105469, -0.32183074951171875, -0.3080177307128906, -0.2942047119140625, -0.2803916931152344, -0.26657867431640625, -0.2527656555175781, -0.23895263671875, -0.22513961791992188, -0.21132659912109375, -0.19751358032226562, -0.1837005615234375, -0.16988754272460938, -0.15607452392578125, -0.14226150512695312, -0.128448486328125, -0.11463546752929688, -0.10082244873046875, -0.08700942993164062, -0.0731964111328125, -0.059383392333984375, -0.04557037353515625, -0.031757354736328125, -0.0179443359375, -0.004131317138671875, 0.00968170166015625, 0.023494720458984375, 0.0373077392578125, 0.051120758056640625, 0.06493377685546875, 0.07874679565429688, 0.092559814453125, 0.10637283325195312, 0.12018585205078125, 0.13399887084960938, 0.1478118896484375, 0.16162490844726562, 0.17543792724609375, 0.18925094604492188, 0.20306396484375, 0.21687698364257812, 0.23069000244140625, 0.24450302124023438, 0.2583160400390625, 0.2721290588378906, 0.28594207763671875, 0.2997550964355469, 0.313568115234375, 0.3273811340332031, 0.34119415283203125, 0.3550071716308594, 0.3688201904296875, 0.3826332092285156, 0.39644622802734375, 0.4102592468261719, 0.424072265625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 12.0, 12.0, 10.0, 14.0, 18.0, 22.0, 32.0, 30.0, 25.0, 35.0, 35.0, 43.0, 49.0, 42.0, 53.0, 45.0, 48.0, 48.0, 39.0, 45.0, 40.0, 51.0, 29.0, 26.0, 28.0, 37.0, 20.0, 11.0, 10.0, 14.0, 12.0, 5.0, 6.0, 5.0, 12.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.12066650390625, -0.11718940734863281, -0.11371231079101562, -0.11023521423339844, -0.10675811767578125, -0.10328102111816406, -0.09980392456054688, -0.09632682800292969, -0.0928497314453125, -0.08937263488769531, -0.08589553833007812, -0.08241844177246094, -0.07894134521484375, -0.07546424865722656, -0.07198715209960938, -0.06851005554199219, -0.065032958984375, -0.06155586242675781, -0.058078765869140625, -0.05460166931152344, -0.05112457275390625, -0.04764747619628906, -0.044170379638671875, -0.04069328308105469, -0.0372161865234375, -0.03373908996582031, -0.030261993408203125, -0.026784896850585938, -0.02330780029296875, -0.019830703735351562, -0.016353607177734375, -0.012876510620117188, -0.0093994140625, -0.0059223175048828125, -0.002445220947265625, 0.0010318756103515625, 0.00450897216796875, 0.007986068725585938, 0.011463165283203125, 0.014940261840820312, 0.0184173583984375, 0.021894454956054688, 0.025371551513671875, 0.028848648071289062, 0.03232574462890625, 0.03580284118652344, 0.039279937744140625, 0.04275703430175781, 0.046234130859375, 0.04971122741699219, 0.053188323974609375, 0.05666542053222656, 0.06014251708984375, 0.06361961364746094, 0.06709671020507812, 0.07057380676269531, 0.0740509033203125, 0.07752799987792969, 0.08100509643554688, 0.08448219299316406, 0.08795928955078125, 0.09143638610839844, 0.09491348266601562, 0.09839057922363281, 0.10186767578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 19.0, 12.0, 25.0, 33.0, 51.0, 67.0, 77.0, 113.0, 132.0, 182.0, 255.0, 368.0, 500.0, 839.0, 1511.0, 3381.0, 9915.0, 39917.0, 191085.0, 518010.0, 217412.0, 45263.0, 11096.0, 3747.0, 1616.0, 870.0, 594.0, 400.0, 269.0, 176.0, 153.0, 103.0, 78.0, 65.0, 49.0, 39.0, 22.0, 23.0, 14.0, 11.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.57177734375, -0.55364990234375, -0.5355224609375, -0.51739501953125, -0.499267578125, -0.48114013671875, -0.4630126953125, -0.44488525390625, -0.4267578125, -0.40863037109375, -0.3905029296875, -0.37237548828125, -0.354248046875, -0.33612060546875, -0.3179931640625, -0.29986572265625, -0.28173828125, -0.26361083984375, -0.2454833984375, -0.22735595703125, -0.209228515625, -0.19110107421875, -0.1729736328125, -0.15484619140625, -0.13671875, -0.11859130859375, -0.1004638671875, -0.08233642578125, -0.064208984375, -0.04608154296875, -0.0279541015625, -0.00982666015625, 0.00830078125, 0.02642822265625, 0.0445556640625, 0.06268310546875, 0.080810546875, 0.09893798828125, 0.1170654296875, 0.13519287109375, 0.1533203125, 0.17144775390625, 0.1895751953125, 0.20770263671875, 0.225830078125, 0.24395751953125, 0.2620849609375, 0.28021240234375, 0.29833984375, 0.31646728515625, 0.3345947265625, 0.35272216796875, 0.370849609375, 0.38897705078125, 0.4071044921875, 0.42523193359375, 0.443359375, 0.46148681640625, 0.4796142578125, 0.49774169921875, 0.515869140625, 0.53399658203125, 0.5521240234375, 0.57025146484375, 0.58837890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 6.0, 5.0, 6.0, 6.0, 5.0, 7.0, 17.0, 18.0, 18.0, 28.0, 36.0, 35.0, 26.0, 30.0, 48.0, 41.0, 40.0, 46.0, 41.0, 53.0, 48.0, 46.0, 52.0, 36.0, 34.0, 42.0, 38.0, 28.0, 30.0, 22.0, 20.0, 19.0, 19.0, 13.0, 9.0, 6.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5623016357421875, -0.543060302734375, -0.5238189697265625, -0.50457763671875, -0.4853363037109375, -0.466094970703125, -0.4468536376953125, -0.4276123046875, -0.4083709716796875, -0.389129638671875, -0.3698883056640625, -0.35064697265625, -0.3314056396484375, -0.312164306640625, -0.2929229736328125, -0.273681640625, -0.2544403076171875, -0.235198974609375, -0.2159576416015625, -0.19671630859375, -0.1774749755859375, -0.158233642578125, -0.1389923095703125, -0.1197509765625, -0.1005096435546875, -0.081268310546875, -0.0620269775390625, -0.04278564453125, -0.0235443115234375, -0.004302978515625, 0.0149383544921875, 0.0341796875, 0.0534210205078125, 0.072662353515625, 0.0919036865234375, 0.11114501953125, 0.1303863525390625, 0.149627685546875, 0.1688690185546875, 0.1881103515625, 0.2073516845703125, 0.226593017578125, 0.2458343505859375, 0.26507568359375, 0.2843170166015625, 0.303558349609375, 0.3227996826171875, 0.342041015625, 0.3612823486328125, 0.380523681640625, 0.3997650146484375, 0.41900634765625, 0.4382476806640625, 0.457489013671875, 0.4767303466796875, 0.4959716796875, 0.5152130126953125, 0.534454345703125, 0.5536956787109375, 0.57293701171875, 0.5921783447265625, 0.611419677734375, 0.6306610107421875, 0.64990234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 8.0, 13.0, 28.0, 40.0, 53.0, 87.0, 164.0, 279.0, 463.0, 883.0, 1698.0, 3816.0, 9718.0, 28350.0, 103650.0, 405063.0, 361507.0, 91411.0, 25450.0, 8600.0, 3614.0, 1659.0, 821.0, 497.0, 256.0, 164.0, 97.0, 55.0, 29.0, 20.0, 14.0, 17.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.25893402099609375, -0.2502899169921875, -0.24164581298828125, -0.233001708984375, -0.22435760498046875, -0.2157135009765625, -0.20706939697265625, -0.19842529296875, -0.18978118896484375, -0.1811370849609375, -0.17249298095703125, -0.163848876953125, -0.15520477294921875, -0.1465606689453125, -0.13791656494140625, -0.1292724609375, -0.12062835693359375, -0.1119842529296875, -0.10334014892578125, -0.094696044921875, -0.08605194091796875, -0.0774078369140625, -0.06876373291015625, -0.06011962890625, -0.05147552490234375, -0.0428314208984375, -0.03418731689453125, -0.025543212890625, -0.01689910888671875, -0.0082550048828125, 0.00038909912109375, 0.009033203125, 0.01767730712890625, 0.0263214111328125, 0.03496551513671875, 0.043609619140625, 0.05225372314453125, 0.0608978271484375, 0.06954193115234375, 0.07818603515625, 0.08683013916015625, 0.0954742431640625, 0.10411834716796875, 0.112762451171875, 0.12140655517578125, 0.1300506591796875, 0.13869476318359375, 0.1473388671875, 0.15598297119140625, 0.1646270751953125, 0.17327117919921875, 0.181915283203125, 0.19055938720703125, 0.1992034912109375, 0.20784759521484375, 0.21649169921875, 0.22513580322265625, 0.2337799072265625, 0.24242401123046875, 0.251068115234375, 0.25971221923828125, 0.2683563232421875, 0.27700042724609375, 0.28564453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 7.0, 13.0, 18.0, 30.0, 41.0, 26.0, 43.0, 46.0, 52.0, 69.0, 70.0, 68.0, 85.0, 80.0, 54.0, 53.0, 59.0, 39.0, 33.0, 21.0, 23.0, 13.0, 15.0, 5.0, 10.0, 4.0, 4.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.863210678100586e-05, -8.586607873439789e-05, -8.310005068778992e-05, -8.033402264118195e-05, -7.756799459457397e-05, -7.4801966547966e-05, -7.203593850135803e-05, -6.926991045475006e-05, -6.650388240814209e-05, -6.373785436153412e-05, -6.097182631492615e-05, -5.8205798268318176e-05, -5.5439770221710205e-05, -5.2673742175102234e-05, -4.990771412849426e-05, -4.714168608188629e-05, -4.437565803527832e-05, -4.160962998867035e-05, -3.884360194206238e-05, -3.607757389545441e-05, -3.3311545848846436e-05, -3.0545517802238464e-05, -2.7779489755630493e-05, -2.5013461709022522e-05, -2.224743366241455e-05, -1.948140561580658e-05, -1.671537756919861e-05, -1.3949349522590637e-05, -1.1183321475982666e-05, -8.417293429374695e-06, -5.651265382766724e-06, -2.8852373361587524e-06, -1.1920928955078125e-07, 2.64681875705719e-06, 5.412846803665161e-06, 8.178874850273132e-06, 1.0944902896881104e-05, 1.3710930943489075e-05, 1.6476958990097046e-05, 1.9242987036705017e-05, 2.2009015083312988e-05, 2.477504312992096e-05, 2.754107117652893e-05, 3.0307099223136902e-05, 3.307312726974487e-05, 3.5839155316352844e-05, 3.8605183362960815e-05, 4.137121140956879e-05, 4.413723945617676e-05, 4.690326750278473e-05, 4.96692955493927e-05, 5.243532359600067e-05, 5.520135164260864e-05, 5.7967379689216614e-05, 6.0733407735824585e-05, 6.349943578243256e-05, 6.626546382904053e-05, 6.90314918756485e-05, 7.179751992225647e-05, 7.456354796886444e-05, 7.732957601547241e-05, 8.009560406208038e-05, 8.286163210868835e-05, 8.562766015529633e-05, 8.83936882019043e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 6.0, 6.0, 13.0, 17.0, 22.0, 24.0, 40.0, 57.0, 107.0, 151.0, 242.0, 413.0, 597.0, 1077.0, 2055.0, 4175.0, 10195.0, 30771.0, 119759.0, 453819.0, 311269.0, 77320.0, 21662.0, 7516.0, 3349.0, 1628.0, 915.0, 443.0, 303.0, 181.0, 125.0, 85.0, 61.0, 38.0, 27.0, 24.0, 15.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24369049072265625, -0.2349395751953125, -0.22618865966796875, -0.217437744140625, -0.20868682861328125, -0.1999359130859375, -0.19118499755859375, -0.18243408203125, -0.17368316650390625, -0.1649322509765625, -0.15618133544921875, -0.147430419921875, -0.13867950439453125, -0.1299285888671875, -0.12117767333984375, -0.1124267578125, -0.10367584228515625, -0.0949249267578125, -0.08617401123046875, -0.077423095703125, -0.06867218017578125, -0.0599212646484375, -0.05117034912109375, -0.04241943359375, -0.03366851806640625, -0.0249176025390625, -0.01616668701171875, -0.007415771484375, 0.00133514404296875, 0.0100860595703125, 0.01883697509765625, 0.027587890625, 0.03633880615234375, 0.0450897216796875, 0.05384063720703125, 0.062591552734375, 0.07134246826171875, 0.0800933837890625, 0.08884429931640625, 0.09759521484375, 0.10634613037109375, 0.1150970458984375, 0.12384796142578125, 0.132598876953125, 0.14134979248046875, 0.1501007080078125, 0.15885162353515625, 0.1676025390625, 0.17635345458984375, 0.1851043701171875, 0.19385528564453125, 0.202606201171875, 0.21135711669921875, 0.2201080322265625, 0.22885894775390625, 0.23760986328125, 0.24636077880859375, 0.2551116943359375, 0.26386260986328125, 0.272613525390625, 0.28136444091796875, 0.2901153564453125, 0.29886627197265625, 0.3076171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 12.0, 6.0, 12.0, 19.0, 19.0, 28.0, 25.0, 37.0, 55.0, 72.0, 66.0, 86.0, 123.0, 85.0, 67.0, 61.0, 56.0, 38.0, 37.0, 22.0, 29.0, 8.0, 15.0, 10.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26708984375, -0.2577629089355469, -0.24843597412109375, -0.23910903930664062, -0.2297821044921875, -0.22045516967773438, -0.21112823486328125, -0.20180130004882812, -0.192474365234375, -0.18314743041992188, -0.17382049560546875, -0.16449356079101562, -0.1551666259765625, -0.14583969116210938, -0.13651275634765625, -0.12718582153320312, -0.11785888671875, -0.10853195190429688, -0.09920501708984375, -0.08987808227539062, -0.0805511474609375, -0.07122421264648438, -0.06189727783203125, -0.052570343017578125, -0.043243408203125, -0.033916473388671875, -0.02458953857421875, -0.015262603759765625, -0.0059356689453125, 0.003391265869140625, 0.01271820068359375, 0.022045135498046875, 0.0313720703125, 0.040699005126953125, 0.05002593994140625, 0.059352874755859375, 0.0686798095703125, 0.07800674438476562, 0.08733367919921875, 0.09666061401367188, 0.105987548828125, 0.11531448364257812, 0.12464141845703125, 0.13396835327148438, 0.1432952880859375, 0.15262222290039062, 0.16194915771484375, 0.17127609252929688, 0.18060302734375, 0.18992996215820312, 0.19925689697265625, 0.20858383178710938, 0.2179107666015625, 0.22723770141601562, 0.23656463623046875, 0.24589157104492188, 0.255218505859375, 0.2645454406738281, 0.27387237548828125, 0.2831993103027344, 0.2925262451171875, 0.3018531799316406, 0.31118011474609375, 0.3205070495605469, 0.329833984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 14.0, 50.0, 112.0, 222.0, 270.0, 189.0, 88.0, 28.0, 16.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.355056762695312, -13.09546184539795, -12.83586597442627, -12.576271057128906, -12.316675186157227, -12.057080268859863, -11.7974853515625, -11.53788948059082, -11.278294563293457, -11.018699645996094, -10.759103775024414, -10.49950885772705, -10.239912986755371, -9.980318069458008, -9.720722198486328, -9.461127281188965, -9.201532363891602, -8.941937446594238, -8.682341575622559, -8.422746658325195, -8.163150787353516, -7.903555870056152, -7.643960475921631, -7.384365081787109, -7.12476921081543, -6.865173816680908, -6.605578422546387, -6.345983505249023, -6.086388111114502, -5.8267927169799805, -5.567197322845459, -5.3076019287109375, -5.048007011413574, -4.788411617279053, -4.528816223144531, -4.269221305847168, -4.0096259117126465, -3.750030517578125, -3.4904351234436035, -3.230839729309082, -2.9712445735931396, -2.711649179458618, -2.452054023742676, -2.1924586296081543, -1.9328633546829224, -1.6732680797576904, -1.413672685623169, -1.154077410697937, -0.8944821357727051, -0.6348868608474731, -0.37529152631759644, -0.11569619178771973, 0.1438990831375122, 0.40349435806274414, 0.6630897521972656, 0.9226850271224976, 1.1822803020477295, 1.4418755769729614, 1.7014708518981934, 1.9610662460327148, 2.2206616401672363, 2.4802567958831787, 2.7398521900177, 2.9994473457336426, 3.259042739868164]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 10.0, 14.0, 14.0, 19.0, 18.0, 23.0, 26.0, 31.0, 34.0, 35.0, 39.0, 45.0, 56.0, 63.0, 50.0, 56.0, 44.0, 52.0, 49.0, 31.0, 36.0, 47.0, 34.0, 26.0, 33.0, 24.0, 15.0, 17.0, 16.0, 14.0, 4.0, 6.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06724214553833, -2.9632089138031006, -2.859175682067871, -2.7551424503326416, -2.651109218597412, -2.5470759868621826, -2.443042755126953, -2.3390095233917236, -2.234976291656494, -2.1309430599212646, -2.026909828186035, -1.9228765964508057, -1.8188433647155762, -1.7148101329803467, -1.6107769012451172, -1.5067436695098877, -1.4027105569839478, -1.2986773252487183, -1.1946440935134888, -1.0906108617782593, -0.9865776300430298, -0.8825444579124451, -0.7785112261772156, -0.6744779944419861, -0.5704447627067566, -0.4664115309715271, -0.3623782992362976, -0.2583450973033905, -0.154311865568161, -0.050278663635253906, 0.053754568099975586, 0.15778779983520508, 0.26182103157043457, 0.36585426330566406, 0.46988749504089355, 0.573920726776123, 0.6779539585113525, 0.7819871306419373, 0.8860203623771667, 0.9900535941123962, 1.0940868854522705, 1.1981201171875, 1.3021533489227295, 1.406186580657959, 1.5102198123931885, 1.614253044128418, 1.7182862758636475, 1.822319507598877, 1.926352620124817, 2.030385732650757, 2.1344189643859863, 2.238452196121216, 2.3424854278564453, 2.446518659591675, 2.5505518913269043, 2.654585123062134, 2.7586183547973633, 2.8626515865325928, 2.9666848182678223, 3.0707180500030518, 3.1747512817382812, 3.2787845134735107, 3.3828177452087402, 3.4868509769439697, 3.590884208679199]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 13.0, 10.0, 17.0, 22.0, 33.0, 50.0, 59.0, 64.0, 128.0, 178.0, 293.0, 486.0, 881.0, 1849.0, 4235.0, 15321.0, 292452.0, 3849497.0, 19367.0, 4902.0, 2008.0, 965.0, 550.0, 292.0, 186.0, 121.0, 83.0, 56.0, 45.0, 19.0, 24.0, 13.0, 19.0, 12.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.376953125, -1.3407821655273438, -1.3046112060546875, -1.2684402465820312, -1.232269287109375, -1.1960983276367188, -1.1599273681640625, -1.1237564086914062, -1.08758544921875, -1.0514144897460938, -1.0152435302734375, -0.9790725708007812, -0.942901611328125, -0.9067306518554688, -0.8705596923828125, -0.8343887329101562, -0.7982177734375, -0.7620468139648438, -0.7258758544921875, -0.6897048950195312, -0.653533935546875, -0.6173629760742188, -0.5811920166015625, -0.5450210571289062, -0.50885009765625, -0.47267913818359375, -0.4365081787109375, -0.40033721923828125, -0.364166259765625, -0.32799530029296875, -0.2918243408203125, -0.25565338134765625, -0.219482421875, -0.18331146240234375, -0.1471405029296875, -0.11096954345703125, -0.074798583984375, -0.03862762451171875, -0.0024566650390625, 0.03371429443359375, 0.06988525390625, 0.10605621337890625, 0.1422271728515625, 0.17839813232421875, 0.214569091796875, 0.25074005126953125, 0.2869110107421875, 0.32308197021484375, 0.3592529296875, 0.39542388916015625, 0.4315948486328125, 0.46776580810546875, 0.503936767578125, 0.5401077270507812, 0.5762786865234375, 0.6124496459960938, 0.64862060546875, 0.6847915649414062, 0.7209625244140625, 0.7571334838867188, 0.793304443359375, 0.8294754028320312, 0.8656463623046875, 0.9018173217773438, 0.93798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 11.0, 15.0, 12.0, 15.0, 20.0, 29.0, 29.0, 33.0, 34.0, 36.0, 46.0, 50.0, 51.0, 45.0, 59.0, 39.0, 42.0, 49.0, 41.0, 47.0, 46.0, 35.0, 27.0, 25.0, 25.0, 14.0, 12.0, 14.0, 13.0, 10.0, 8.0, 10.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12378120422363281, -0.11975479125976562, -0.11572837829589844, -0.11170196533203125, -0.10767555236816406, -0.10364913940429688, -0.09962272644042969, -0.0955963134765625, -0.09156990051269531, -0.08754348754882812, -0.08351707458496094, -0.07949066162109375, -0.07546424865722656, -0.07143783569335938, -0.06741142272949219, -0.063385009765625, -0.05935859680175781, -0.055332183837890625, -0.05130577087402344, -0.04727935791015625, -0.04325294494628906, -0.039226531982421875, -0.03520011901855469, -0.0311737060546875, -0.027147293090820312, -0.023120880126953125, -0.019094467163085938, -0.01506805419921875, -0.011041641235351562, -0.007015228271484375, -0.0029888153076171875, 0.00103759765625, 0.0050640106201171875, 0.009090423583984375, 0.013116836547851562, 0.01714324951171875, 0.021169662475585938, 0.025196075439453125, 0.029222488403320312, 0.0332489013671875, 0.03727531433105469, 0.041301727294921875, 0.04532814025878906, 0.04935455322265625, 0.05338096618652344, 0.057407379150390625, 0.06143379211425781, 0.065460205078125, 0.06948661804199219, 0.07351303100585938, 0.07753944396972656, 0.08156585693359375, 0.08559226989746094, 0.08961868286132812, 0.09364509582519531, 0.0976715087890625, 0.10169792175292969, 0.10572433471679688, 0.10975074768066406, 0.11377716064453125, 0.11780357360839844, 0.12182998657226562, 0.1258563995361328, 0.1298828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 16.0, 23.0, 45.0, 71.0, 107.0, 163.0, 285.0, 485.0, 824.0, 1648.0, 3307.0, 8188.0, 34347.0, 3898512.0, 215603.0, 19352.0, 5789.0, 2492.0, 1297.0, 702.0, 405.0, 230.0, 139.0, 85.0, 61.0, 27.0, 22.0, 21.0, 9.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9429244995117188, -0.9166107177734375, -0.8902969360351562, -0.863983154296875, -0.8376693725585938, -0.8113555908203125, -0.7850418090820312, -0.75872802734375, -0.7324142456054688, -0.7061004638671875, -0.6797866821289062, -0.653472900390625, -0.6271591186523438, -0.6008453369140625, -0.5745315551757812, -0.5482177734375, -0.5219039916992188, -0.4955902099609375, -0.46927642822265625, -0.442962646484375, -0.41664886474609375, -0.3903350830078125, -0.36402130126953125, -0.33770751953125, -0.31139373779296875, -0.2850799560546875, -0.25876617431640625, -0.232452392578125, -0.20613861083984375, -0.1798248291015625, -0.15351104736328125, -0.127197265625, -0.10088348388671875, -0.0745697021484375, -0.04825592041015625, -0.021942138671875, 0.00437164306640625, 0.0306854248046875, 0.05699920654296875, 0.08331298828125, 0.10962677001953125, 0.1359405517578125, 0.16225433349609375, 0.188568115234375, 0.21488189697265625, 0.2411956787109375, 0.26750946044921875, 0.2938232421875, 0.32013702392578125, 0.3464508056640625, 0.37276458740234375, 0.399078369140625, 0.42539215087890625, 0.4517059326171875, 0.47801971435546875, 0.50433349609375, 0.5306472778320312, 0.5569610595703125, 0.5832748413085938, 0.609588623046875, 0.6359024047851562, 0.6622161865234375, 0.6885299682617188, 0.71484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 8.0, 14.0, 26.0, 41.0, 70.0, 161.0, 3036.0, 429.0, 104.0, 49.0, 30.0, 14.0, 11.0, 8.0, 10.0, 5.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11838817596435547, -0.11488914489746094, -0.1113901138305664, -0.10789108276367188, -0.10439205169677734, -0.10089302062988281, -0.09739398956298828, -0.09389495849609375, -0.09039592742919922, -0.08689689636230469, -0.08339786529541016, -0.07989883422851562, -0.0763998031616211, -0.07290077209472656, -0.06940174102783203, -0.0659027099609375, -0.06240367889404297, -0.05890464782714844, -0.055405616760253906, -0.051906585693359375, -0.048407554626464844, -0.04490852355957031, -0.04140949249267578, -0.03791046142578125, -0.03441143035888672, -0.030912399291992188, -0.027413368225097656, -0.023914337158203125, -0.020415306091308594, -0.016916275024414062, -0.013417243957519531, -0.009918212890625, -0.006419181823730469, -0.0029201507568359375, 0.0005788803100585938, 0.004077911376953125, 0.007576942443847656, 0.011075973510742188, 0.014575004577636719, 0.01807403564453125, 0.02157306671142578, 0.025072097778320312, 0.028571128845214844, 0.032070159912109375, 0.035569190979003906, 0.03906822204589844, 0.04256725311279297, 0.0460662841796875, 0.04956531524658203, 0.05306434631347656, 0.056563377380371094, 0.060062408447265625, 0.06356143951416016, 0.06706047058105469, 0.07055950164794922, 0.07405853271484375, 0.07755756378173828, 0.08105659484863281, 0.08455562591552734, 0.08805465698242188, 0.0915536880493164, 0.09505271911621094, 0.09855175018310547, 0.10205078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 22.0, 52.0, 81.0, 126.0, 140.0, 180.0, 145.0, 123.0, 57.0, 33.0, 18.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.234216332435608, -1.2094447612762451, -1.1846730709075928, -1.1599013805389404, -1.1351298093795776, -1.1103582382202148, -1.0855865478515625, -1.0608148574829102, -1.0360432863235474, -1.0112717151641846, -0.9865000247955322, -0.9617283940315247, -0.9369567632675171, -0.9121851325035095, -0.887413501739502, -0.8626418709754944, -0.8378702402114868, -0.8130986094474792, -0.7883269786834717, -0.7635553479194641, -0.7387837171554565, -0.714012086391449, -0.6892404556274414, -0.6644688248634338, -0.6396971940994263, -0.6149255633354187, -0.5901539325714111, -0.5653823018074036, -0.540610671043396, -0.5158390402793884, -0.49106740951538086, -0.4662957787513733, -0.44152408838272095, -0.4167524576187134, -0.3919808268547058, -0.36720919609069824, -0.3424375653266907, -0.3176659345626831, -0.29289430379867554, -0.26812267303466797, -0.2433510422706604, -0.21857941150665283, -0.19380778074264526, -0.1690361499786377, -0.14426451921463013, -0.11949288845062256, -0.09472125768661499, -0.06994962692260742, -0.045177996158599854, -0.020406365394592285, 0.004365265369415283, 0.02913689613342285, 0.05390852689743042, 0.07868015766143799, 0.10345178842544556, 0.12822341918945312, 0.1529950499534607, 0.17776668071746826, 0.20253831148147583, 0.2273099422454834, 0.25208157300949097, 0.27685320377349854, 0.3016248345375061, 0.32639646530151367, 0.35116809606552124]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 12.0, 8.0, 18.0, 17.0, 22.0, 21.0, 24.0, 38.0, 27.0, 33.0, 40.0, 45.0, 37.0, 43.0, 34.0, 36.0, 55.0, 35.0, 40.0, 44.0, 46.0, 29.0, 37.0, 41.0, 26.0, 28.0, 28.0, 18.0, 21.0, 13.0, 8.0, 13.0, 6.0, 9.0, 4.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.33159470558166504, -0.32265856862068176, -0.3137224018573761, -0.3047862648963928, -0.29585009813308716, -0.2869139611721039, -0.2779777944087982, -0.26904165744781494, -0.2601054906845093, -0.251169353723526, -0.24223318696022034, -0.23329703509807587, -0.2243608832359314, -0.21542474627494812, -0.20648859441280365, -0.19755244255065918, -0.1886163055896759, -0.17968015372753143, -0.17074400186538696, -0.1618078500032425, -0.15287169814109802, -0.14393556118011475, -0.13499940931797028, -0.1260632574558258, -0.11712710559368134, -0.10819095373153687, -0.0992548018693924, -0.09031865745782852, -0.08138250559568405, -0.07244635373353958, -0.06351020932197571, -0.05457405745983124, -0.04563790559768677, -0.0367017537355423, -0.027765605598688126, -0.018829455599188805, -0.009893305599689484, -0.0009571537375450134, 0.007978994399309158, 0.01691514253616333, 0.0258512943983078, 0.03478744626045227, 0.04372359439730644, 0.052659742534160614, 0.061595894396305084, 0.07053204625844955, 0.07946819067001343, 0.0884043425321579, 0.09734049439430237, 0.10627664625644684, 0.11521279811859131, 0.12414894253015518, 0.13308510184288025, 0.14202123880386353, 0.150957390666008, 0.15989354252815247, 0.16882969439029694, 0.1777658462524414, 0.18670199811458588, 0.19563814997673035, 0.20457428693771362, 0.2135104537010193, 0.22244659066200256, 0.23138274252414703, 0.2403188943862915]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 13.0, 23.0, 21.0, 35.0, 71.0, 133.0, 205.0, 364.0, 581.0, 1178.0, 2250.0, 4726.0, 10236.0, 22755.0, 51968.0, 113127.0, 209167.0, 261475.0, 190244.0, 98124.0, 44705.0, 19669.0, 8921.0, 4021.0, 2096.0, 1088.0, 544.0, 286.0, 193.0, 111.0, 58.0, 41.0, 27.0, 13.0, 17.0, 13.0, 8.0, 5.0, 7.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.342041015625, -0.3318023681640625, -0.321563720703125, -0.3113250732421875, -0.30108642578125, -0.2908477783203125, -0.280609130859375, -0.2703704833984375, -0.2601318359375, -0.2498931884765625, -0.239654541015625, -0.2294158935546875, -0.21917724609375, -0.2089385986328125, -0.198699951171875, -0.1884613037109375, -0.17822265625, -0.1679840087890625, -0.157745361328125, -0.1475067138671875, -0.13726806640625, -0.1270294189453125, -0.116790771484375, -0.1065521240234375, -0.0963134765625, -0.0860748291015625, -0.075836181640625, -0.0655975341796875, -0.05535888671875, -0.0451202392578125, -0.034881591796875, -0.0246429443359375, -0.014404296875, -0.0041656494140625, 0.006072998046875, 0.0163116455078125, 0.02655029296875, 0.0367889404296875, 0.047027587890625, 0.0572662353515625, 0.0675048828125, 0.0777435302734375, 0.087982177734375, 0.0982208251953125, 0.10845947265625, 0.1186981201171875, 0.128936767578125, 0.1391754150390625, 0.1494140625, 0.1596527099609375, 0.169891357421875, 0.1801300048828125, 0.19036865234375, 0.2006072998046875, 0.210845947265625, 0.2210845947265625, 0.2313232421875, 0.2415618896484375, 0.251800537109375, 0.2620391845703125, 0.27227783203125, 0.2825164794921875, 0.292755126953125, 0.3029937744140625, 0.313232421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 5.0, 8.0, 6.0, 9.0, 12.0, 16.0, 14.0, 31.0, 28.0, 28.0, 19.0, 29.0, 36.0, 39.0, 52.0, 49.0, 54.0, 42.0, 39.0, 44.0, 39.0, 35.0, 41.0, 47.0, 30.0, 37.0, 33.0, 20.0, 22.0, 18.0, 13.0, 12.0, 13.0, 10.0, 9.0, 4.0, 13.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.1419677734375, -0.1379375457763672, -0.13390731811523438, -0.12987709045410156, -0.12584686279296875, -0.12181663513183594, -0.11778640747070312, -0.11375617980957031, -0.1097259521484375, -0.10569572448730469, -0.10166549682617188, -0.09763526916503906, -0.09360504150390625, -0.08957481384277344, -0.08554458618164062, -0.08151435852050781, -0.077484130859375, -0.07345390319824219, -0.06942367553710938, -0.06539344787597656, -0.06136322021484375, -0.05733299255371094, -0.053302764892578125, -0.04927253723144531, -0.0452423095703125, -0.04121208190917969, -0.037181854248046875, -0.03315162658691406, -0.02912139892578125, -0.025091171264648438, -0.021060943603515625, -0.017030715942382812, -0.01300048828125, -0.008970260620117188, -0.004940032958984375, -0.0009098052978515625, 0.00312042236328125, 0.0071506500244140625, 0.011180877685546875, 0.015211105346679688, 0.0192413330078125, 0.023271560668945312, 0.027301788330078125, 0.03133201599121094, 0.03536224365234375, 0.03939247131347656, 0.043422698974609375, 0.04745292663574219, 0.051483154296875, 0.05551338195800781, 0.059543609619140625, 0.06357383728027344, 0.06760406494140625, 0.07163429260253906, 0.07566452026367188, 0.07969474792480469, 0.0837249755859375, 0.08775520324707031, 0.09178543090820312, 0.09581565856933594, 0.09984588623046875, 0.10387611389160156, 0.10790634155273438, 0.11193656921386719, 0.115966796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 4.0, 16.0, 24.0, 27.0, 36.0, 50.0, 61.0, 92.0, 119.0, 138.0, 208.0, 291.0, 415.0, 628.0, 1119.0, 2169.0, 5885.0, 21507.0, 109566.0, 505323.0, 319906.0, 59508.0, 12948.0, 4077.0, 1665.0, 886.0, 529.0, 376.0, 248.0, 198.0, 140.0, 102.0, 69.0, 57.0, 40.0, 36.0, 19.0, 9.0, 13.0, 14.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6025390625, -0.5836029052734375, -0.564666748046875, -0.5457305908203125, -0.52679443359375, -0.5078582763671875, -0.488922119140625, -0.4699859619140625, -0.4510498046875, -0.4321136474609375, -0.413177490234375, -0.3942413330078125, -0.37530517578125, -0.3563690185546875, -0.337432861328125, -0.3184967041015625, -0.299560546875, -0.2806243896484375, -0.261688232421875, -0.2427520751953125, -0.22381591796875, -0.2048797607421875, -0.185943603515625, -0.1670074462890625, -0.1480712890625, -0.1291351318359375, -0.110198974609375, -0.0912628173828125, -0.07232666015625, -0.0533905029296875, -0.034454345703125, -0.0155181884765625, 0.00341796875, 0.0223541259765625, 0.041290283203125, 0.0602264404296875, 0.07916259765625, 0.0980987548828125, 0.117034912109375, 0.1359710693359375, 0.1549072265625, 0.1738433837890625, 0.192779541015625, 0.2117156982421875, 0.23065185546875, 0.2495880126953125, 0.268524169921875, 0.2874603271484375, 0.306396484375, 0.3253326416015625, 0.344268798828125, 0.3632049560546875, 0.38214111328125, 0.4010772705078125, 0.420013427734375, 0.4389495849609375, 0.4578857421875, 0.4768218994140625, 0.495758056640625, 0.5146942138671875, 0.53363037109375, 0.5525665283203125, 0.571502685546875, 0.5904388427734375, 0.609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 9.0, 8.0, 12.0, 20.0, 16.0, 20.0, 27.0, 42.0, 52.0, 47.0, 52.0, 72.0, 66.0, 64.0, 69.0, 70.0, 49.0, 69.0, 41.0, 43.0, 36.0, 27.0, 22.0, 20.0, 9.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1328125, -1.1024246215820312, -1.0720367431640625, -1.0416488647460938, -1.011260986328125, -0.9808731079101562, -0.9504852294921875, -0.9200973510742188, -0.88970947265625, -0.8593215942382812, -0.8289337158203125, -0.7985458374023438, -0.768157958984375, -0.7377700805664062, -0.7073822021484375, -0.6769943237304688, -0.6466064453125, -0.6162185668945312, -0.5858306884765625, -0.5554428100585938, -0.525054931640625, -0.49466705322265625, -0.4642791748046875, -0.43389129638671875, -0.40350341796875, -0.37311553955078125, -0.3427276611328125, -0.31233978271484375, -0.281951904296875, -0.25156402587890625, -0.2211761474609375, -0.19078826904296875, -0.160400390625, -0.13001251220703125, -0.0996246337890625, -0.06923675537109375, -0.038848876953125, -0.00846099853515625, 0.0219268798828125, 0.05231475830078125, 0.08270263671875, 0.11309051513671875, 0.1434783935546875, 0.17386627197265625, 0.204254150390625, 0.23464202880859375, 0.2650299072265625, 0.29541778564453125, 0.3258056640625, 0.35619354248046875, 0.3865814208984375, 0.41696929931640625, 0.447357177734375, 0.47774505615234375, 0.5081329345703125, 0.5385208129882812, 0.56890869140625, 0.5992965698242188, 0.6296844482421875, 0.6600723266601562, 0.690460205078125, 0.7208480834960938, 0.7512359619140625, 0.7816238403320312, 0.81201171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 9.0, 18.0, 7.0, 10.0, 20.0, 28.0, 46.0, 55.0, 106.0, 163.0, 229.0, 425.0, 715.0, 1387.0, 2663.0, 6022.0, 15446.0, 49568.0, 207012.0, 531417.0, 167764.0, 41437.0, 13410.0, 5323.0, 2362.0, 1190.0, 643.0, 384.0, 237.0, 154.0, 110.0, 67.0, 36.0, 21.0, 24.0, 13.0, 11.0, 7.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.34326171875, -0.33432960510253906, -0.3253974914550781, -0.3164653778076172, -0.30753326416015625, -0.2986011505126953, -0.2896690368652344, -0.28073692321777344, -0.2718048095703125, -0.26287269592285156, -0.2539405822753906, -0.2450084686279297, -0.23607635498046875, -0.2271442413330078, -0.21821212768554688, -0.20928001403808594, -0.200347900390625, -0.19141578674316406, -0.18248367309570312, -0.1735515594482422, -0.16461944580078125, -0.1556873321533203, -0.14675521850585938, -0.13782310485839844, -0.1288909912109375, -0.11995887756347656, -0.11102676391601562, -0.10209465026855469, -0.09316253662109375, -0.08423042297363281, -0.07529830932617188, -0.06636619567871094, -0.05743408203125, -0.04850196838378906, -0.039569854736328125, -0.030637741088867188, -0.02170562744140625, -0.012773513793945312, -0.003841400146484375, 0.0050907135009765625, 0.0140228271484375, 0.022954940795898438, 0.031887054443359375, 0.04081916809082031, 0.04975128173828125, 0.05868339538574219, 0.06761550903320312, 0.07654762268066406, 0.085479736328125, 0.09441184997558594, 0.10334396362304688, 0.11227607727050781, 0.12120819091796875, 0.1301403045654297, 0.13907241821289062, 0.14800453186035156, 0.1569366455078125, 0.16586875915527344, 0.17480087280273438, 0.1837329864501953, 0.19266510009765625, 0.2015972137451172, 0.21052932739257812, 0.21946144104003906, 0.2283935546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 4.0, 16.0, 14.0, 17.0, 25.0, 29.0, 49.0, 63.0, 76.0, 71.0, 90.0, 93.0, 76.0, 75.0, 70.0, 52.0, 37.0, 32.0, 22.0, 23.0, 20.0, 11.0, 7.0, 11.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012159347534179688, -0.00011834874749183655, -0.00011510401964187622, -0.0001118592917919159, -0.00010861456394195557, -0.00010536983609199524, -0.00010212510824203491, -9.888038039207458e-05, -9.563565254211426e-05, -9.239092469215393e-05, -8.91461968421936e-05, -8.590146899223328e-05, -8.265674114227295e-05, -7.941201329231262e-05, -7.61672854423523e-05, -7.292255759239197e-05, -6.967782974243164e-05, -6.643310189247131e-05, -6.318837404251099e-05, -5.994364619255066e-05, -5.669891834259033e-05, -5.3454190492630005e-05, -5.020946264266968e-05, -4.696473479270935e-05, -4.3720006942749023e-05, -4.0475279092788696e-05, -3.723055124282837e-05, -3.398582339286804e-05, -3.0741095542907715e-05, -2.7496367692947388e-05, -2.425163984298706e-05, -2.1006911993026733e-05, -1.7762184143066406e-05, -1.4517456293106079e-05, -1.1272728443145752e-05, -8.028000593185425e-06, -4.783272743225098e-06, -1.5385448932647705e-06, 1.7061829566955566e-06, 4.950910806655884e-06, 8.195638656616211e-06, 1.1440366506576538e-05, 1.4685094356536865e-05, 1.7929822206497192e-05, 2.117455005645752e-05, 2.4419277906417847e-05, 2.7664005756378174e-05, 3.09087336063385e-05, 3.415346145629883e-05, 3.7398189306259155e-05, 4.064291715621948e-05, 4.388764500617981e-05, 4.713237285614014e-05, 5.0377100706100464e-05, 5.362182855606079e-05, 5.686655640602112e-05, 6.0111284255981445e-05, 6.335601210594177e-05, 6.66007399559021e-05, 6.984546780586243e-05, 7.309019565582275e-05, 7.633492350578308e-05, 7.957965135574341e-05, 8.282437920570374e-05, 8.606910705566406e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 16.0, 12.0, 21.0, 36.0, 55.0, 94.0, 170.0, 342.0, 719.0, 1810.0, 5678.0, 29109.0, 360616.0, 592427.0, 45931.0, 7519.0, 2297.0, 845.0, 383.0, 207.0, 100.0, 48.0, 38.0, 23.0, 14.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.55322265625, -0.5374641418457031, -0.5217056274414062, -0.5059471130371094, -0.4901885986328125, -0.4744300842285156, -0.45867156982421875, -0.4429130554199219, -0.427154541015625, -0.4113960266113281, -0.39563751220703125, -0.3798789978027344, -0.3641204833984375, -0.3483619689941406, -0.33260345458984375, -0.3168449401855469, -0.30108642578125, -0.2853279113769531, -0.26956939697265625, -0.2538108825683594, -0.2380523681640625, -0.22229385375976562, -0.20653533935546875, -0.19077682495117188, -0.175018310546875, -0.15925979614257812, -0.14350128173828125, -0.12774276733398438, -0.1119842529296875, -0.09622573852539062, -0.08046722412109375, -0.06470870971679688, -0.0489501953125, -0.033191680908203125, -0.01743316650390625, -0.001674652099609375, 0.0140838623046875, 0.029842376708984375, 0.04560089111328125, 0.061359405517578125, 0.077117919921875, 0.09287643432617188, 0.10863494873046875, 0.12439346313476562, 0.1401519775390625, 0.15591049194335938, 0.17166900634765625, 0.18742752075195312, 0.20318603515625, 0.21894454956054688, 0.23470306396484375, 0.2504615783691406, 0.2662200927734375, 0.2819786071777344, 0.29773712158203125, 0.3134956359863281, 0.329254150390625, 0.3450126647949219, 0.36077117919921875, 0.3765296936035156, 0.3922882080078125, 0.4080467224121094, 0.42380523681640625, 0.4395637512207031, 0.455322265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 4.0, 20.0, 20.0, 36.0, 52.0, 64.0, 89.0, 105.0, 133.0, 118.0, 101.0, 68.0, 52.0, 38.0, 26.0, 25.0, 16.0, 11.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451416015625, -0.43810272216796875, -0.4247894287109375, -0.41147613525390625, -0.398162841796875, -0.38484954833984375, -0.3715362548828125, -0.35822296142578125, -0.34490966796875, -0.33159637451171875, -0.3182830810546875, -0.30496978759765625, -0.291656494140625, -0.27834320068359375, -0.2650299072265625, -0.25171661376953125, -0.2384033203125, -0.22509002685546875, -0.2117767333984375, -0.19846343994140625, -0.185150146484375, -0.17183685302734375, -0.1585235595703125, -0.14521026611328125, -0.13189697265625, -0.11858367919921875, -0.1052703857421875, -0.09195709228515625, -0.078643798828125, -0.06533050537109375, -0.0520172119140625, -0.03870391845703125, -0.025390625, -0.01207733154296875, 0.0012359619140625, 0.01454925537109375, 0.027862548828125, 0.04117584228515625, 0.0544891357421875, 0.06780242919921875, 0.08111572265625, 0.09442901611328125, 0.1077423095703125, 0.12105560302734375, 0.134368896484375, 0.14768218994140625, 0.1609954833984375, 0.17430877685546875, 0.1876220703125, 0.20093536376953125, 0.2142486572265625, 0.22756195068359375, 0.240875244140625, 0.25418853759765625, 0.2675018310546875, 0.28081512451171875, 0.29412841796875, 0.30744171142578125, 0.3207550048828125, 0.33406829833984375, 0.347381591796875, 0.36069488525390625, 0.3740081787109375, 0.38732147216796875, 0.400634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 7.0, 22.0, 22.0, 36.0, 62.0, 72.0, 98.0, 120.0, 130.0, 127.0, 90.0, 77.0, 42.0, 30.0, 25.0, 12.0, 12.0, 5.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.974682807922363, -6.823716640472412, -6.672749996185303, -6.521783828735352, -6.3708176612854, -6.219851493835449, -6.06888484954834, -5.917918682098389, -5.7669525146484375, -5.615986347198486, -5.465019702911377, -5.314053535461426, -5.163087368011475, -5.012121200561523, -4.861154556274414, -4.710188388824463, -4.5592217445373535, -4.408255577087402, -4.257288932800293, -4.106322765350342, -3.9553565979003906, -3.8043901920318604, -3.65342378616333, -3.502457618713379, -3.3514912128448486, -3.2005248069763184, -3.049558639526367, -2.898592233657837, -2.7476258277893066, -2.5966596603393555, -2.445693254470825, -2.294726848602295, -2.143761157989502, -1.9927948713302612, -1.8418285846710205, -1.6908621788024902, -1.5398958921432495, -1.3889296054840088, -1.2379631996154785, -1.0869969129562378, -0.9360306262969971, -0.7850643396377563, -0.6340979933738708, -0.48313167691230774, -0.33216536045074463, -0.1811990737915039, -0.030232727527618408, 0.12073361873626709, 0.2716999053955078, 0.4226662218570709, 0.573632538318634, 0.7245988845825195, 0.8755651712417603, 1.026531457901001, 1.1774978637695312, 1.328464150428772, 1.4794304370880127, 1.6303967237472534, 1.7813630104064941, 1.9323294162750244, 2.0832958221435547, 2.234261989593506, 2.385228395462036, 2.5361948013305664, 2.6871609687805176]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 7.0, 6.0, 10.0, 11.0, 17.0, 16.0, 27.0, 20.0, 26.0, 31.0, 45.0, 43.0, 48.0, 39.0, 45.0, 42.0, 53.0, 59.0, 53.0, 47.0, 41.0, 46.0, 28.0, 42.0, 32.0, 12.0, 23.0, 21.0, 16.0, 22.0, 10.0, 11.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.678226947784424, -3.570671796798706, -3.463116407394409, -3.3555612564086914, -3.2480061054229736, -3.140450954437256, -3.032895565032959, -2.925340414047241, -2.8177852630615234, -2.7102301120758057, -2.602674722671509, -2.495119571685791, -2.3875644207000732, -2.2800092697143555, -2.1724538803100586, -2.064898729324341, -1.9573434591293335, -1.8497881889343262, -1.7422330379486084, -1.634677767753601, -1.5271226167678833, -1.419567346572876, -1.3120121955871582, -1.2044569253921509, -1.0969016551971436, -0.989346444606781, -0.8817912340164185, -0.7742359638214111, -0.6666808128356934, -0.559125542640686, -0.4515703320503235, -0.34401512145996094, -0.23645997047424316, -0.12890475988388062, -0.021349534392356873, 0.08620569109916687, 0.19376090168952942, 0.30131614208221436, 0.4088713526725769, 0.5164265632629395, 0.623981773853302, 0.7315369844436646, 0.8390921950340271, 0.9466474056243896, 1.054202675819397, 1.1617579460144043, 1.269313097000122, 1.3768682479858398, 1.4844235181808472, 1.5919787883758545, 1.6995339393615723, 1.8070892095565796, 1.9146443605422974, 2.0221996307373047, 2.1297547817230225, 2.2373099327087402, 2.344865322113037, 2.452420473098755, 2.5599758625030518, 2.6675310134887695, 2.7750861644744873, 2.882641315460205, 2.990196704864502, 3.0977518558502197, 3.2053070068359375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 11.0, 6.0, 13.0, 11.0, 15.0, 35.0, 47.0, 36.0, 76.0, 77.0, 129.0, 218.0, 292.0, 509.0, 925.0, 1833.0, 4169.0, 12924.0, 94924.0, 4020271.0, 42660.0, 8474.0, 3124.0, 1458.0, 772.0, 429.0, 276.0, 177.0, 113.0, 73.0, 64.0, 35.0, 28.0, 30.0, 10.0, 14.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.203125, -1.17254638671875, -1.1419677734375, -1.11138916015625, -1.080810546875, -1.05023193359375, -1.0196533203125, -0.98907470703125, -0.95849609375, -0.92791748046875, -0.8973388671875, -0.86676025390625, -0.836181640625, -0.80560302734375, -0.7750244140625, -0.74444580078125, -0.7138671875, -0.68328857421875, -0.6527099609375, -0.62213134765625, -0.591552734375, -0.56097412109375, -0.5303955078125, -0.49981689453125, -0.46923828125, -0.43865966796875, -0.4080810546875, -0.37750244140625, -0.346923828125, -0.31634521484375, -0.2857666015625, -0.25518798828125, -0.224609375, -0.19403076171875, -0.1634521484375, -0.13287353515625, -0.102294921875, -0.07171630859375, -0.0411376953125, -0.01055908203125, 0.02001953125, 0.05059814453125, 0.0811767578125, 0.11175537109375, 0.142333984375, 0.17291259765625, 0.2034912109375, 0.23406982421875, 0.2646484375, 0.29522705078125, 0.3258056640625, 0.35638427734375, 0.386962890625, 0.41754150390625, 0.4481201171875, 0.47869873046875, 0.50927734375, 0.53985595703125, 0.5704345703125, 0.60101318359375, 0.631591796875, 0.66217041015625, 0.6927490234375, 0.72332763671875, 0.75390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 10.0, 17.0, 16.0, 23.0, 31.0, 37.0, 51.0, 53.0, 54.0, 60.0, 69.0, 54.0, 56.0, 65.0, 47.0, 57.0, 43.0, 36.0, 39.0, 38.0, 35.0, 14.0, 11.0, 16.0, 13.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19692230224609375, -0.1914520263671875, -0.18598175048828125, -0.180511474609375, -0.17504119873046875, -0.1695709228515625, -0.16410064697265625, -0.15863037109375, -0.15316009521484375, -0.1476898193359375, -0.14221954345703125, -0.136749267578125, -0.13127899169921875, -0.1258087158203125, -0.12033843994140625, -0.1148681640625, -0.10939788818359375, -0.1039276123046875, -0.09845733642578125, -0.092987060546875, -0.08751678466796875, -0.0820465087890625, -0.07657623291015625, -0.07110595703125, -0.06563568115234375, -0.0601654052734375, -0.05469512939453125, -0.049224853515625, -0.04375457763671875, -0.0382843017578125, -0.03281402587890625, -0.02734375, -0.02187347412109375, -0.0164031982421875, -0.01093292236328125, -0.005462646484375, 7.62939453125e-06, 0.0054779052734375, 0.01094818115234375, 0.01641845703125, 0.02188873291015625, 0.0273590087890625, 0.03282928466796875, 0.038299560546875, 0.04376983642578125, 0.0492401123046875, 0.05471038818359375, 0.0601806640625, 0.06565093994140625, 0.0711212158203125, 0.07659149169921875, 0.082061767578125, 0.08753204345703125, 0.0930023193359375, 0.09847259521484375, 0.10394287109375, 0.10941314697265625, 0.1148834228515625, 0.12035369873046875, 0.125823974609375, 0.13129425048828125, 0.1367645263671875, 0.14223480224609375, 0.147705078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 7.0, 5.0, 6.0, 11.0, 21.0, 15.0, 30.0, 28.0, 40.0, 50.0, 91.0, 159.0, 227.0, 391.0, 678.0, 1340.0, 2516.0, 5908.0, 17157.0, 89098.0, 3952847.0, 94298.0, 17567.0, 5991.0, 2638.0, 1341.0, 669.0, 396.0, 244.0, 122.0, 98.0, 72.0, 58.0, 38.0, 31.0, 23.0, 12.0, 10.0, 7.0, 9.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.7705078125, -0.7444000244140625, -0.718292236328125, -0.6921844482421875, -0.66607666015625, -0.6399688720703125, -0.613861083984375, -0.5877532958984375, -0.5616455078125, -0.5355377197265625, -0.509429931640625, -0.4833221435546875, -0.45721435546875, -0.4311065673828125, -0.404998779296875, -0.3788909912109375, -0.352783203125, -0.3266754150390625, -0.300567626953125, -0.2744598388671875, -0.24835205078125, -0.2222442626953125, -0.196136474609375, -0.1700286865234375, -0.1439208984375, -0.1178131103515625, -0.091705322265625, -0.0655975341796875, -0.03948974609375, -0.0133819580078125, 0.012725830078125, 0.0388336181640625, 0.06494140625, 0.0910491943359375, 0.117156982421875, 0.1432647705078125, 0.16937255859375, 0.1954803466796875, 0.221588134765625, 0.2476959228515625, 0.2738037109375, 0.2999114990234375, 0.326019287109375, 0.3521270751953125, 0.37823486328125, 0.4043426513671875, 0.430450439453125, 0.4565582275390625, 0.482666015625, 0.5087738037109375, 0.534881591796875, 0.5609893798828125, 0.58709716796875, 0.6132049560546875, 0.639312744140625, 0.6654205322265625, 0.6915283203125, 0.7176361083984375, 0.743743896484375, 0.7698516845703125, 0.79595947265625, 0.8220672607421875, 0.848175048828125, 0.8742828369140625, 0.900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 10.0, 22.0, 35.0, 40.0, 81.0, 458.0, 3070.0, 147.0, 73.0, 41.0, 21.0, 16.0, 13.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160400390625, -0.1540241241455078, -0.14764785766601562, -0.14127159118652344, -0.13489532470703125, -0.12851905822753906, -0.12214279174804688, -0.11576652526855469, -0.1093902587890625, -0.10301399230957031, -0.09663772583007812, -0.09026145935058594, -0.08388519287109375, -0.07750892639160156, -0.07113265991210938, -0.06475639343261719, -0.058380126953125, -0.05200386047363281, -0.045627593994140625, -0.03925132751464844, -0.03287506103515625, -0.026498794555664062, -0.020122528076171875, -0.013746261596679688, -0.0073699951171875, -0.0009937286376953125, 0.005382537841796875, 0.011758804321289062, 0.01813507080078125, 0.024511337280273438, 0.030887603759765625, 0.03726387023925781, 0.04364013671875, 0.05001640319824219, 0.056392669677734375, 0.06276893615722656, 0.06914520263671875, 0.07552146911621094, 0.08189773559570312, 0.08827400207519531, 0.0946502685546875, 0.10102653503417969, 0.10740280151367188, 0.11377906799316406, 0.12015533447265625, 0.12653160095214844, 0.13290786743164062, 0.1392841339111328, 0.145660400390625, 0.1520366668701172, 0.15841293334960938, 0.16478919982910156, 0.17116546630859375, 0.17754173278808594, 0.18391799926757812, 0.1902942657470703, 0.1966705322265625, 0.2030467987060547, 0.20942306518554688, 0.21579933166503906, 0.22217559814453125, 0.22855186462402344, 0.23492813110351562, 0.2413043975830078, 0.2476806640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 13.0, 14.0, 48.0, 71.0, 103.0, 139.0, 157.0, 157.0, 104.0, 70.0, 49.0, 27.0, 17.0, 10.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1545765399932861, -1.122490406036377, -1.0904042720794678, -1.0583181381225586, -1.0262320041656494, -0.9941458106040955, -0.9620596170425415, -0.9299734830856323, -0.8978873491287231, -0.865801215171814, -0.8337150812149048, -0.8016288876533508, -0.7695427536964417, -0.7374566197395325, -0.7053704261779785, -0.6732842922210693, -0.6411981582641602, -0.609112024307251, -0.5770258903503418, -0.5449396967887878, -0.5128535628318787, -0.4807674288749695, -0.4486812651157379, -0.41659510135650635, -0.38450896739959717, -0.352422833442688, -0.3203366696834564, -0.28825050592422485, -0.2561643719673157, -0.2240782231092453, -0.19199207425117493, -0.15990592539310455, -0.12781989574432373, -0.09573374688625336, -0.06364759802818298, -0.03156144917011261, 0.0005246996879577637, 0.03261084854602814, 0.06469699740409851, 0.09678314626216888, 0.12886929512023926, 0.16095544397830963, 0.19304159283638, 0.22512774169445038, 0.25721389055252075, 0.28930002450942993, 0.3213861882686615, 0.35347235202789307, 0.38555848598480225, 0.4176446199417114, 0.449730783700943, 0.48181694746017456, 0.5139030814170837, 0.5459892153739929, 0.5780754089355469, 0.610161542892456, 0.6422476768493652, 0.6743338108062744, 0.7064199447631836, 0.7385061383247375, 0.7705922722816467, 0.8026784062385559, 0.8347645998001099, 0.866850733757019, 0.8989368677139282]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 10.0, 13.0, 10.0, 21.0, 25.0, 27.0, 19.0, 27.0, 34.0, 27.0, 34.0, 27.0, 32.0, 40.0, 39.0, 39.0, 43.0, 42.0, 47.0, 42.0, 39.0, 43.0, 37.0, 24.0, 28.0, 29.0, 32.0, 14.0, 23.0, 14.0, 7.0, 16.0, 17.0, 16.0, 10.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3539687395095825, -0.34159860014915466, -0.3292284309864044, -0.31685829162597656, -0.3044881224632263, -0.29211798310279846, -0.2797478437423706, -0.26737767457962036, -0.2550075352191925, -0.24263738095760345, -0.2302672266960144, -0.21789708733558655, -0.2055269330739975, -0.19315677881240845, -0.1807866245508194, -0.16841647028923035, -0.1560463160276413, -0.14367616176605225, -0.1313060075044632, -0.11893586069345474, -0.10656571388244629, -0.09419555962085724, -0.08182540535926819, -0.06945525854825974, -0.057085104286670685, -0.04471495375037193, -0.03234480321407318, -0.01997464895248413, -0.007604498416185379, 0.004765652120113373, 0.017135806381702423, 0.029505953192710876, 0.04187610745429993, 0.05424625799059868, 0.06661640852689743, 0.07898656278848648, 0.09135670959949493, 0.10372686386108398, 0.11609701812267303, 0.12846717238426208, 0.14083731174468994, 0.153207466006279, 0.16557762026786804, 0.1779477596282959, 0.19031791388988495, 0.202688068151474, 0.21505822241306305, 0.2274283766746521, 0.23979853093624115, 0.2521686851978302, 0.26453882455825806, 0.2769089937210083, 0.28927913308143616, 0.301649272441864, 0.31401944160461426, 0.3263895809650421, 0.33875975012779236, 0.3511298894882202, 0.36350005865097046, 0.3758701980113983, 0.38824036717414856, 0.4006105065345764, 0.41298067569732666, 0.4253508150577545, 0.4377209544181824]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 5.0, 9.0, 14.0, 16.0, 25.0, 33.0, 42.0, 74.0, 108.0, 161.0, 251.0, 406.0, 625.0, 1033.0, 1751.0, 3261.0, 5711.0, 10928.0, 21609.0, 42578.0, 82811.0, 150428.0, 222523.0, 213624.0, 137223.0, 74287.0, 38020.0, 18916.0, 9753.0, 5288.0, 2826.0, 1659.0, 941.0, 564.0, 377.0, 217.0, 154.0, 94.0, 73.0, 33.0, 30.0, 21.0, 13.0, 6.0, 4.0, 6.0, 5.0, 7.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18606948852539062, -0.17963409423828125, -0.17319869995117188, -0.1667633056640625, -0.16032791137695312, -0.15389251708984375, -0.14745712280273438, -0.141021728515625, -0.13458633422851562, -0.12815093994140625, -0.12171554565429688, -0.1152801513671875, -0.10884475708007812, -0.10240936279296875, -0.09597396850585938, -0.08953857421875, -0.08310317993164062, -0.07666778564453125, -0.07023239135742188, -0.0637969970703125, -0.057361602783203125, -0.05092620849609375, -0.044490814208984375, -0.038055419921875, -0.031620025634765625, -0.02518463134765625, -0.018749237060546875, -0.0123138427734375, -0.005878448486328125, 0.00055694580078125, 0.006992340087890625, 0.013427734375, 0.019863128662109375, 0.02629852294921875, 0.032733917236328125, 0.0391693115234375, 0.045604705810546875, 0.05204010009765625, 0.058475494384765625, 0.064910888671875, 0.07134628295898438, 0.07778167724609375, 0.08421707153320312, 0.0906524658203125, 0.09708786010742188, 0.10352325439453125, 0.10995864868164062, 0.11639404296875, 0.12282943725585938, 0.12926483154296875, 0.13570022583007812, 0.1421356201171875, 0.14857101440429688, 0.15500640869140625, 0.16144180297851562, 0.167877197265625, 0.17431259155273438, 0.18074798583984375, 0.18718338012695312, 0.1936187744140625, 0.20005416870117188, 0.20648956298828125, 0.21292495727539062, 0.2193603515625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 6.0, 11.0, 9.0, 8.0, 13.0, 17.0, 27.0, 25.0, 36.0, 47.0, 36.0, 57.0, 60.0, 60.0, 54.0, 58.0, 58.0, 52.0, 39.0, 41.0, 41.0, 41.0, 39.0, 33.0, 21.0, 24.0, 22.0, 9.0, 9.0, 8.0, 6.0, 6.0, 4.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.17624282836914062, -0.17096710205078125, -0.16569137573242188, -0.1604156494140625, -0.15513992309570312, -0.14986419677734375, -0.14458847045898438, -0.139312744140625, -0.13403701782226562, -0.12876129150390625, -0.12348556518554688, -0.1182098388671875, -0.11293411254882812, -0.10765838623046875, -0.10238265991210938, -0.09710693359375, -0.09183120727539062, -0.08655548095703125, -0.08127975463867188, -0.0760040283203125, -0.07072830200195312, -0.06545257568359375, -0.060176849365234375, -0.054901123046875, -0.049625396728515625, -0.04434967041015625, -0.039073944091796875, -0.0337982177734375, -0.028522491455078125, -0.02324676513671875, -0.017971038818359375, -0.0126953125, -0.007419586181640625, -0.00214385986328125, 0.003131866455078125, 0.0084075927734375, 0.013683319091796875, 0.01895904541015625, 0.024234771728515625, 0.029510498046875, 0.034786224365234375, 0.04006195068359375, 0.045337677001953125, 0.0506134033203125, 0.055889129638671875, 0.06116485595703125, 0.06644058227539062, 0.07171630859375, 0.07699203491210938, 0.08226776123046875, 0.08754348754882812, 0.0928192138671875, 0.09809494018554688, 0.10337066650390625, 0.10864639282226562, 0.113922119140625, 0.11919784545898438, 0.12447357177734375, 0.12974929809570312, 0.1350250244140625, 0.14030075073242188, 0.14557647705078125, 0.15085220336914062, 0.1561279296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 8.0, 16.0, 24.0, 38.0, 64.0, 78.0, 167.0, 289.0, 500.0, 881.0, 2025.0, 6477.0, 59449.0, 779118.0, 181711.0, 12093.0, 2860.0, 1159.0, 690.0, 352.0, 230.0, 133.0, 77.0, 42.0, 19.0, 14.0, 14.0, 8.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7346878051757812, -0.7081451416015625, -0.6816024780273438, -0.655059814453125, -0.6285171508789062, -0.6019744873046875, -0.5754318237304688, -0.54888916015625, -0.5223464965820312, -0.4958038330078125, -0.46926116943359375, -0.442718505859375, -0.41617584228515625, -0.3896331787109375, -0.36309051513671875, -0.3365478515625, -0.31000518798828125, -0.2834625244140625, -0.25691986083984375, -0.230377197265625, -0.20383453369140625, -0.1772918701171875, -0.15074920654296875, -0.12420654296875, -0.09766387939453125, -0.0711212158203125, -0.04457855224609375, -0.018035888671875, 0.00850677490234375, 0.0350494384765625, 0.06159210205078125, 0.088134765625, 0.11467742919921875, 0.1412200927734375, 0.16776275634765625, 0.194305419921875, 0.22084808349609375, 0.2473907470703125, 0.27393341064453125, 0.30047607421875, 0.32701873779296875, 0.3535614013671875, 0.38010406494140625, 0.406646728515625, 0.43318939208984375, 0.4597320556640625, 0.48627471923828125, 0.5128173828125, 0.5393600463867188, 0.5659027099609375, 0.5924453735351562, 0.618988037109375, 0.6455307006835938, 0.6720733642578125, 0.6986160278320312, 0.72515869140625, 0.7517013549804688, 0.7782440185546875, 0.8047866821289062, 0.831329345703125, 0.8578720092773438, 0.8844146728515625, 0.9109573364257812, 0.9375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 12.0, 10.0, 8.0, 15.0, 11.0, 12.0, 13.0, 23.0, 19.0, 32.0, 29.0, 33.0, 34.0, 37.0, 53.0, 38.0, 49.0, 54.0, 49.0, 44.0, 38.0, 49.0, 38.0, 55.0, 41.0, 29.0, 30.0, 23.0, 20.0, 22.0, 13.0, 11.0, 6.0, 13.0, 6.0, 5.0, 5.0, 1.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.63037109375, -0.609375, -0.58837890625, -0.5673828125, -0.54638671875, -0.525390625, -0.50439453125, -0.4833984375, -0.46240234375, -0.44140625, -0.42041015625, -0.3994140625, -0.37841796875, -0.357421875, -0.33642578125, -0.3154296875, -0.29443359375, -0.2734375, -0.25244140625, -0.2314453125, -0.21044921875, -0.189453125, -0.16845703125, -0.1474609375, -0.12646484375, -0.10546875, -0.08447265625, -0.0634765625, -0.04248046875, -0.021484375, -0.00048828125, 0.0205078125, 0.04150390625, 0.0625, 0.08349609375, 0.1044921875, 0.12548828125, 0.146484375, 0.16748046875, 0.1884765625, 0.20947265625, 0.23046875, 0.25146484375, 0.2724609375, 0.29345703125, 0.314453125, 0.33544921875, 0.3564453125, 0.37744140625, 0.3984375, 0.41943359375, 0.4404296875, 0.46142578125, 0.482421875, 0.50341796875, 0.5244140625, 0.54541015625, 0.56640625, 0.58740234375, 0.6083984375, 0.62939453125, 0.650390625, 0.67138671875, 0.6923828125, 0.71337890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 16.0, 29.0, 41.0, 72.0, 123.0, 263.0, 781.0, 2641.0, 13549.0, 354984.0, 651490.0, 19498.0, 3387.0, 915.0, 363.0, 175.0, 77.0, 47.0, 36.0, 18.0, 11.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77294921875, -0.7488555908203125, -0.724761962890625, -0.7006683349609375, -0.67657470703125, -0.6524810791015625, -0.628387451171875, -0.6042938232421875, -0.5802001953125, -0.5561065673828125, -0.532012939453125, -0.5079193115234375, -0.48382568359375, -0.4597320556640625, -0.435638427734375, -0.4115447998046875, -0.387451171875, -0.3633575439453125, -0.339263916015625, -0.3151702880859375, -0.29107666015625, -0.2669830322265625, -0.242889404296875, -0.2187957763671875, -0.1947021484375, -0.1706085205078125, -0.146514892578125, -0.1224212646484375, -0.09832763671875, -0.0742340087890625, -0.050140380859375, -0.0260467529296875, -0.001953125, 0.0221405029296875, 0.046234130859375, 0.0703277587890625, 0.09442138671875, 0.1185150146484375, 0.142608642578125, 0.1667022705078125, 0.1907958984375, 0.2148895263671875, 0.238983154296875, 0.2630767822265625, 0.28717041015625, 0.3112640380859375, 0.335357666015625, 0.3594512939453125, 0.383544921875, 0.4076385498046875, 0.431732177734375, 0.4558258056640625, 0.47991943359375, 0.5040130615234375, 0.528106689453125, 0.5522003173828125, 0.5762939453125, 0.6003875732421875, 0.624481201171875, 0.6485748291015625, 0.67266845703125, 0.6967620849609375, 0.720855712890625, 0.7449493408203125, 0.76904296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 11.0, 19.0, 31.0, 22.0, 38.0, 60.0, 60.0, 63.0, 79.0, 78.0, 96.0, 91.0, 72.0, 63.0, 48.0, 39.0, 24.0, 23.0, 15.0, 16.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011283159255981445, -0.0001102769747376442, -0.00010772235691547394, -0.00010516773909330368, -0.00010261312127113342, -0.00010005850344896317, -9.750388562679291e-05, -9.494926780462265e-05, -9.239464998245239e-05, -8.984003216028214e-05, -8.728541433811188e-05, -8.473079651594162e-05, -8.217617869377136e-05, -7.96215608716011e-05, -7.706694304943085e-05, -7.451232522726059e-05, -7.195770740509033e-05, -6.940308958292007e-05, -6.684847176074982e-05, -6.429385393857956e-05, -6.17392361164093e-05, -5.9184618294239044e-05, -5.663000047206879e-05, -5.407538264989853e-05, -5.152076482772827e-05, -4.8966147005558014e-05, -4.6411529183387756e-05, -4.38569113612175e-05, -4.130229353904724e-05, -3.8747675716876984e-05, -3.6193057894706726e-05, -3.363844007253647e-05, -3.108382225036621e-05, -2.8529204428195953e-05, -2.5974586606025696e-05, -2.3419968783855438e-05, -2.086535096168518e-05, -1.8310733139514923e-05, -1.5756115317344666e-05, -1.3201497495174408e-05, -1.064687967300415e-05, -8.092261850833893e-06, -5.537644028663635e-06, -2.9830262064933777e-06, -4.284083843231201e-07, 2.1262094378471375e-06, 4.680827260017395e-06, 7.235445082187653e-06, 9.79006290435791e-06, 1.2344680726528168e-05, 1.4899298548698425e-05, 1.7453916370868683e-05, 2.000853419303894e-05, 2.2563152015209198e-05, 2.5117769837379456e-05, 2.7672387659549713e-05, 3.022700548171997e-05, 3.278162330389023e-05, 3.5336241126060486e-05, 3.7890858948230743e-05, 4.0445476770401e-05, 4.300009459257126e-05, 4.5554712414741516e-05, 4.8109330236911774e-05, 5.066394805908203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 15.0, 15.0, 25.0, 42.0, 68.0, 111.0, 179.0, 337.0, 624.0, 1564.0, 4845.0, 23724.0, 474279.0, 509575.0, 24999.0, 4999.0, 1709.0, 668.0, 320.0, 179.0, 100.0, 58.0, 36.0, 27.0, 19.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.7097091674804688, -0.6894378662109375, -0.6691665649414062, -0.648895263671875, -0.6286239624023438, -0.6083526611328125, -0.5880813598632812, -0.56781005859375, -0.5475387573242188, -0.5272674560546875, -0.5069961547851562, -0.486724853515625, -0.46645355224609375, -0.4461822509765625, -0.42591094970703125, -0.4056396484375, -0.38536834716796875, -0.3650970458984375, -0.34482574462890625, -0.324554443359375, -0.30428314208984375, -0.2840118408203125, -0.26374053955078125, -0.24346923828125, -0.22319793701171875, -0.2029266357421875, -0.18265533447265625, -0.162384033203125, -0.14211273193359375, -0.1218414306640625, -0.10157012939453125, -0.081298828125, -0.06102752685546875, -0.0407562255859375, -0.02048492431640625, -0.000213623046875, 0.02005767822265625, 0.0403289794921875, 0.06060028076171875, 0.08087158203125, 0.10114288330078125, 0.1214141845703125, 0.14168548583984375, 0.161956787109375, 0.18222808837890625, 0.2024993896484375, 0.22277069091796875, 0.2430419921875, 0.26331329345703125, 0.2835845947265625, 0.30385589599609375, 0.324127197265625, 0.34439849853515625, 0.3646697998046875, 0.38494110107421875, 0.40521240234375, 0.42548370361328125, 0.4457550048828125, 0.46602630615234375, 0.486297607421875, 0.5065689086914062, 0.5268402099609375, 0.5471115112304688, 0.5673828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 11.0, 21.0, 29.0, 42.0, 92.0, 151.0, 192.0, 157.0, 128.0, 74.0, 35.0, 23.0, 22.0, 9.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.689544677734375, -0.66912841796875, -0.648712158203125, -0.6282958984375, -0.607879638671875, -0.58746337890625, -0.567047119140625, -0.546630859375, -0.526214599609375, -0.50579833984375, -0.485382080078125, -0.4649658203125, -0.444549560546875, -0.42413330078125, -0.403717041015625, -0.38330078125, -0.362884521484375, -0.34246826171875, -0.322052001953125, -0.3016357421875, -0.281219482421875, -0.26080322265625, -0.240386962890625, -0.219970703125, -0.199554443359375, -0.17913818359375, -0.158721923828125, -0.1383056640625, -0.117889404296875, -0.09747314453125, -0.077056884765625, -0.056640625, -0.036224365234375, -0.01580810546875, 0.004608154296875, 0.0250244140625, 0.045440673828125, 0.06585693359375, 0.086273193359375, 0.106689453125, 0.127105712890625, 0.14752197265625, 0.167938232421875, 0.1883544921875, 0.208770751953125, 0.22918701171875, 0.249603271484375, 0.27001953125, 0.290435791015625, 0.31085205078125, 0.331268310546875, 0.3516845703125, 0.372100830078125, 0.39251708984375, 0.412933349609375, 0.433349609375, 0.453765869140625, 0.47418212890625, 0.494598388671875, 0.5150146484375, 0.535430908203125, 0.55584716796875, 0.576263427734375, 0.5966796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 17.0, 34.0, 76.0, 108.0, 186.0, 206.0, 162.0, 111.0, 48.0, 17.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.378572463989258, -7.137697696685791, -6.896822929382324, -6.655948638916016, -6.415073871612549, -6.174199104309082, -5.933324813842773, -5.692450046539307, -5.45157527923584, -5.210700511932373, -4.969825744628906, -4.728951454162598, -4.488076686859131, -4.247201919555664, -4.0063276290893555, -3.7654528617858887, -3.524578094482422, -3.283703327178955, -3.0428287982940674, -2.8019542694091797, -2.561079502105713, -2.320204734802246, -2.0793302059173584, -1.8384555578231812, -1.597580909729004, -1.3567062616348267, -1.1158316135406494, -0.8749569654464722, -0.6340823173522949, -0.3932076692581177, -0.15233302116394043, 0.08854162693023682, 0.32941627502441406, 0.5702909231185913, 0.8111655712127686, 1.0520402193069458, 1.292914867401123, 1.5337895154953003, 1.7746641635894775, 2.0155386924743652, 2.256413459777832, 2.497288227081299, 2.7381627559661865, 2.979037284851074, 3.219912052154541, 3.460786819458008, 3.7016613483428955, 3.942535877227783, 4.18341064453125, 4.424285411834717, 4.665160179138184, 4.906034469604492, 5.146909236907959, 5.387784004211426, 5.628658294677734, 5.869533061981201, 6.110407829284668, 6.351282596588135, 6.592157363891602, 6.83303165435791, 7.073906421661377, 7.314781188964844, 7.555655479431152, 7.796530246734619, 8.037405014038086]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 5.0, 12.0, 9.0, 16.0, 15.0, 19.0, 24.0, 14.0, 32.0, 26.0, 40.0, 30.0, 30.0, 31.0, 28.0, 36.0, 42.0, 37.0, 56.0, 33.0, 40.0, 37.0, 41.0, 37.0, 36.0, 37.0, 30.0, 29.0, 26.0, 19.0, 16.0, 16.0, 13.0, 13.0, 10.0, 11.0, 10.0, 7.0, 4.0, 4.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.8540115356445312, -2.768737316131592, -2.6834630966186523, -2.598189115524292, -2.5129148960113525, -2.427640676498413, -2.3423664569854736, -2.2570924758911133, -2.171818256378174, -2.0865440368652344, -2.001269817352295, -1.915995717048645, -1.8307216167449951, -1.7454473972320557, -1.6601731777191162, -1.5748990774154663, -1.4896248579025269, -1.4043506383895874, -1.3190765380859375, -1.233802318572998, -1.1485282182693481, -1.0632539987564087, -0.977979838848114, -0.8927056789398193, -0.8074315190315247, -0.72215735912323, -0.6368831992149353, -0.5516090393066406, -0.46633484959602356, -0.3810606896877289, -0.2957864999771118, -0.21051234006881714, -0.12523818016052246, -0.039964012801647186, 0.04531015455722809, 0.13058432936668396, 0.21585848927497864, 0.3011326491832733, 0.3864068388938904, 0.47168099880218506, 0.5569551587104797, 0.6422293186187744, 0.7275034785270691, 0.8127776384353638, 0.8980518579483032, 0.9833259582519531, 1.0686001777648926, 1.153874397277832, 1.239148497581482, 1.3244227170944214, 1.4096968173980713, 1.4949710369110107, 1.5802451372146606, 1.6655193567276, 1.75079345703125, 1.8360676765441895, 1.921341896057129, 2.0066161155700684, 2.091890335083008, 2.177164316177368, 2.2624385356903076, 2.347712755203247, 2.4329869747161865, 2.518260955810547, 2.6035351753234863]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 9.0, 7.0, 18.0, 14.0, 24.0, 23.0, 38.0, 57.0, 82.0, 137.0, 193.0, 512.0, 1380.0, 6939.0, 4096548.0, 82655.0, 3781.0, 949.0, 365.0, 188.0, 94.0, 69.0, 45.0, 38.0, 22.0, 22.0, 20.0, 14.0, 8.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8935546875, -1.8359222412109375, -1.778289794921875, -1.7206573486328125, -1.66302490234375, -1.6053924560546875, -1.547760009765625, -1.4901275634765625, -1.4324951171875, -1.3748626708984375, -1.317230224609375, -1.2595977783203125, -1.20196533203125, -1.1443328857421875, -1.086700439453125, -1.0290679931640625, -0.971435546875, -0.9138031005859375, -0.856170654296875, -0.7985382080078125, -0.74090576171875, -0.6832733154296875, -0.625640869140625, -0.5680084228515625, -0.5103759765625, -0.4527435302734375, -0.395111083984375, -0.3374786376953125, -0.27984619140625, -0.2222137451171875, -0.164581298828125, -0.1069488525390625, -0.04931640625, 0.0083160400390625, 0.065948486328125, 0.1235809326171875, 0.18121337890625, 0.2388458251953125, 0.296478271484375, 0.3541107177734375, 0.4117431640625, 0.4693756103515625, 0.527008056640625, 0.5846405029296875, 0.64227294921875, 0.6999053955078125, 0.757537841796875, 0.8151702880859375, 0.872802734375, 0.9304351806640625, 0.988067626953125, 1.0457000732421875, 1.10333251953125, 1.1609649658203125, 1.218597412109375, 1.2762298583984375, 1.3338623046875, 1.3914947509765625, 1.449127197265625, 1.5067596435546875, 1.56439208984375, 1.6220245361328125, 1.679656982421875, 1.7372894287109375, 1.794921875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 10.0, 5.0, 9.0, 14.0, 16.0, 17.0, 31.0, 31.0, 48.0, 58.0, 51.0, 70.0, 67.0, 61.0, 61.0, 64.0, 59.0, 43.0, 44.0, 54.0, 36.0, 19.0, 21.0, 23.0, 19.0, 14.0, 7.0, 10.0, 8.0, 3.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18157196044921875, -0.1758880615234375, -0.17020416259765625, -0.164520263671875, -0.15883636474609375, -0.1531524658203125, -0.14746856689453125, -0.14178466796875, -0.13610076904296875, -0.1304168701171875, -0.12473297119140625, -0.119049072265625, -0.11336517333984375, -0.1076812744140625, -0.10199737548828125, -0.0963134765625, -0.09062957763671875, -0.0849456787109375, -0.07926177978515625, -0.073577880859375, -0.06789398193359375, -0.0622100830078125, -0.05652618408203125, -0.05084228515625, -0.04515838623046875, -0.0394744873046875, -0.03379058837890625, -0.028106689453125, -0.02242279052734375, -0.0167388916015625, -0.01105499267578125, -0.00537109375, 0.00031280517578125, 0.0059967041015625, 0.01168060302734375, 0.017364501953125, 0.02304840087890625, 0.0287322998046875, 0.03441619873046875, 0.04010009765625, 0.04578399658203125, 0.0514678955078125, 0.05715179443359375, 0.062835693359375, 0.06851959228515625, 0.0742034912109375, 0.07988739013671875, 0.0855712890625, 0.09125518798828125, 0.0969390869140625, 0.10262298583984375, 0.108306884765625, 0.11399078369140625, 0.1196746826171875, 0.12535858154296875, 0.13104248046875, 0.13672637939453125, 0.1424102783203125, 0.14809417724609375, 0.153778076171875, 0.15946197509765625, 0.1651458740234375, 0.17082977294921875, 0.176513671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 12.0, 17.0, 14.0, 18.0, 19.0, 20.0, 45.0, 63.0, 76.0, 92.0, 180.0, 261.0, 423.0, 830.0, 1892.0, 6209.0, 44661.0, 4102177.0, 28829.0, 4872.0, 1648.0, 712.0, 386.0, 243.0, 166.0, 123.0, 83.0, 52.0, 34.0, 27.0, 27.0, 18.0, 15.0, 8.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.0832977294921875, -1.046478271484375, -1.0096588134765625, -0.97283935546875, -0.9360198974609375, -0.899200439453125, -0.8623809814453125, -0.8255615234375, -0.7887420654296875, -0.751922607421875, -0.7151031494140625, -0.67828369140625, -0.6414642333984375, -0.604644775390625, -0.5678253173828125, -0.531005859375, -0.4941864013671875, -0.457366943359375, -0.4205474853515625, -0.38372802734375, -0.3469085693359375, -0.310089111328125, -0.2732696533203125, -0.2364501953125, -0.1996307373046875, -0.162811279296875, -0.1259918212890625, -0.08917236328125, -0.0523529052734375, -0.015533447265625, 0.0212860107421875, 0.05810546875, 0.0949249267578125, 0.131744384765625, 0.1685638427734375, 0.20538330078125, 0.2422027587890625, 0.279022216796875, 0.3158416748046875, 0.3526611328125, 0.3894805908203125, 0.426300048828125, 0.4631195068359375, 0.49993896484375, 0.5367584228515625, 0.573577880859375, 0.6103973388671875, 0.647216796875, 0.6840362548828125, 0.720855712890625, 0.7576751708984375, 0.79449462890625, 0.8313140869140625, 0.868133544921875, 0.9049530029296875, 0.9417724609375, 0.9785919189453125, 1.015411376953125, 1.0522308349609375, 1.08905029296875, 1.1258697509765625, 1.162689208984375, 1.1995086669921875, 1.236328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 8.0, 7.0, 8.0, 11.0, 27.0, 59.0, 367.0, 3437.0, 86.0, 30.0, 12.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299560546875, -0.2919025421142578, -0.2842445373535156, -0.27658653259277344, -0.26892852783203125, -0.26127052307128906, -0.2536125183105469, -0.2459545135498047, -0.2382965087890625, -0.2306385040283203, -0.22298049926757812, -0.21532249450683594, -0.20766448974609375, -0.20000648498535156, -0.19234848022460938, -0.1846904754638672, -0.177032470703125, -0.1693744659423828, -0.16171646118164062, -0.15405845642089844, -0.14640045166015625, -0.13874244689941406, -0.13108444213867188, -0.12342643737792969, -0.1157684326171875, -0.10811042785644531, -0.10045242309570312, -0.09279441833496094, -0.08513641357421875, -0.07747840881347656, -0.06982040405273438, -0.06216239929199219, -0.05450439453125, -0.04684638977050781, -0.039188385009765625, -0.03153038024902344, -0.02387237548828125, -0.016214370727539062, -0.008556365966796875, -0.0008983612060546875, 0.0067596435546875, 0.014417648315429688, 0.022075653076171875, 0.029733657836914062, 0.03739166259765625, 0.04504966735839844, 0.052707672119140625, 0.06036567687988281, 0.068023681640625, 0.07568168640136719, 0.08333969116210938, 0.09099769592285156, 0.09865570068359375, 0.10631370544433594, 0.11397171020507812, 0.12162971496582031, 0.1292877197265625, 0.1369457244873047, 0.14460372924804688, 0.15226173400878906, 0.15991973876953125, 0.16757774353027344, 0.17523574829101562, 0.1828937530517578, 0.1905517578125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 20.0, 12.0, 16.0, 29.0, 30.0, 49.0, 49.0, 59.0, 68.0, 94.0, 80.0, 75.0, 85.0, 67.0, 55.0, 40.0, 32.0, 28.0, 19.0, 18.0, 19.0, 9.0, 6.0, 8.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360433429479599, -0.34699639678001404, -0.3335593342781067, -0.32012230157852173, -0.30668526887893677, -0.2932482361793518, -0.27981117367744446, -0.2663741409778595, -0.25293707847595215, -0.239500030875206, -0.22606299817562103, -0.21262595057487488, -0.19918891787528992, -0.18575187027454376, -0.1723148226737976, -0.15887778997421265, -0.14544075727462769, -0.13200370967388153, -0.11856667697429657, -0.10512962937355042, -0.09169258922338486, -0.0782555490732193, -0.06481850147247314, -0.05138146132230759, -0.03794442117214203, -0.02450737915933132, -0.011070337146520615, 0.0023667067289352417, 0.0158037468791008, 0.029240787029266357, 0.04267783463001251, 0.05611487478017807, 0.06955191493034363, 0.08298895508050919, 0.09642599523067474, 0.1098630428314209, 0.12330008298158646, 0.13673712313175201, 0.15017417073249817, 0.16361120343208313, 0.17704825103282928, 0.19048529863357544, 0.2039223313331604, 0.21735937893390656, 0.2307964265346527, 0.24423345923423767, 0.257670521736145, 0.27110755443573, 0.28454458713531494, 0.2979816198348999, 0.31141868233680725, 0.3248557150363922, 0.3382927477359772, 0.3517298102378845, 0.3651668429374695, 0.37860387563705444, 0.3920409083366394, 0.40547794103622437, 0.4189150035381317, 0.4323520362377167, 0.44578906893730164, 0.459226131439209, 0.47266316413879395, 0.4861001968383789, 0.49953725934028625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 15.0, 10.0, 14.0, 18.0, 25.0, 20.0, 36.0, 24.0, 24.0, 28.0, 33.0, 41.0, 35.0, 44.0, 58.0, 48.0, 35.0, 48.0, 37.0, 39.0, 33.0, 32.0, 37.0, 27.0, 28.0, 32.0, 19.0, 19.0, 16.0, 18.0, 12.0, 14.0, 17.0, 9.0, 8.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.3270885944366455, -0.3178388476371765, -0.30858907103538513, -0.29933932423591614, -0.29008957743644714, -0.28083983063697815, -0.27159005403518677, -0.2623403072357178, -0.2530905604362488, -0.2438407987356186, -0.2345910519361496, -0.2253412902355194, -0.21609154343605042, -0.20684178173542023, -0.19759202003479004, -0.18834227323532104, -0.17909251153469086, -0.16984274983406067, -0.16059300303459167, -0.1513432413339615, -0.1420934945344925, -0.1328437328338623, -0.12359397858381271, -0.11434422433376312, -0.10509447008371353, -0.09584471583366394, -0.08659496158361435, -0.07734520733356476, -0.06809544563293457, -0.05884569510817528, -0.04959593713283539, -0.0403461828827858, -0.031096428632736206, -0.021846674382686615, -0.012596918269991875, -0.0033471621572971344, 0.005902592092752457, 0.015152346342802048, 0.024402104318141937, 0.03365185856819153, 0.04290161281824112, 0.05215136706829071, 0.0614011213183403, 0.07065087556838989, 0.07990063726902008, 0.08915038406848907, 0.09840014576911926, 0.10764990001916885, 0.11689965426921844, 0.12614941596984863, 0.13539916276931763, 0.14464892446994781, 0.1538986712694168, 0.163148432970047, 0.172398179769516, 0.18164794147014618, 0.19089770317077637, 0.20014746487140656, 0.20939721167087555, 0.21864697337150574, 0.22789672017097473, 0.23714648187160492, 0.2463962435722351, 0.2556459903717041, 0.2648957371711731]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 3.0, 2.0, 9.0, 6.0, 13.0, 17.0, 27.0, 57.0, 66.0, 125.0, 199.0, 335.0, 559.0, 1024.0, 2056.0, 4279.0, 9685.0, 23698.0, 61696.0, 161742.0, 348977.0, 261906.0, 104181.0, 39381.0, 15562.0, 6602.0, 2991.0, 1473.0, 774.0, 482.0, 240.0, 145.0, 89.0, 55.0, 26.0, 24.0, 9.0, 15.0, 9.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2919921875, -0.28359413146972656, -0.2751960754394531, -0.2667980194091797, -0.25839996337890625, -0.2500019073486328, -0.24160385131835938, -0.23320579528808594, -0.2248077392578125, -0.21640968322753906, -0.20801162719726562, -0.1996135711669922, -0.19121551513671875, -0.1828174591064453, -0.17441940307617188, -0.16602134704589844, -0.157623291015625, -0.14922523498535156, -0.14082717895507812, -0.1324291229248047, -0.12403106689453125, -0.11563301086425781, -0.10723495483398438, -0.09883689880371094, -0.0904388427734375, -0.08204078674316406, -0.07364273071289062, -0.06524467468261719, -0.05684661865234375, -0.04844856262207031, -0.040050506591796875, -0.03165245056152344, -0.02325439453125, -0.014856338500976562, -0.006458282470703125, 0.0019397735595703125, 0.01033782958984375, 0.018735885620117188, 0.027133941650390625, 0.03553199768066406, 0.0439300537109375, 0.05232810974121094, 0.060726165771484375, 0.06912422180175781, 0.07752227783203125, 0.08592033386230469, 0.09431838989257812, 0.10271644592285156, 0.111114501953125, 0.11951255798339844, 0.12791061401367188, 0.1363086700439453, 0.14470672607421875, 0.1531047821044922, 0.16150283813476562, 0.16990089416503906, 0.1782989501953125, 0.18669700622558594, 0.19509506225585938, 0.2034931182861328, 0.21189117431640625, 0.2202892303466797, 0.22868728637695312, 0.23708534240722656, 0.2454833984375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 10.0, 6.0, 7.0, 15.0, 15.0, 23.0, 23.0, 32.0, 35.0, 46.0, 47.0, 60.0, 59.0, 63.0, 48.0, 52.0, 60.0, 61.0, 62.0, 45.0, 40.0, 28.0, 32.0, 25.0, 20.0, 17.0, 15.0, 11.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17270278930664062, -0.16693878173828125, -0.16117477416992188, -0.1554107666015625, -0.14964675903320312, -0.14388275146484375, -0.13811874389648438, -0.132354736328125, -0.12659072875976562, -0.12082672119140625, -0.11506271362304688, -0.1092987060546875, -0.10353469848632812, -0.09777069091796875, -0.09200668334960938, -0.08624267578125, -0.08047866821289062, -0.07471466064453125, -0.06895065307617188, -0.0631866455078125, -0.057422637939453125, -0.05165863037109375, -0.045894622802734375, -0.040130615234375, -0.034366607666015625, -0.02860260009765625, -0.022838592529296875, -0.0170745849609375, -0.011310577392578125, -0.00554656982421875, 0.000217437744140625, 0.0059814453125, 0.011745452880859375, 0.01750946044921875, 0.023273468017578125, 0.0290374755859375, 0.034801483154296875, 0.04056549072265625, 0.046329498291015625, 0.052093505859375, 0.057857513427734375, 0.06362152099609375, 0.06938552856445312, 0.0751495361328125, 0.08091354370117188, 0.08667755126953125, 0.09244155883789062, 0.09820556640625, 0.10396957397460938, 0.10973358154296875, 0.11549758911132812, 0.1212615966796875, 0.12702560424804688, 0.13278961181640625, 0.13855361938476562, 0.144317626953125, 0.15008163452148438, 0.15584564208984375, 0.16160964965820312, 0.1673736572265625, 0.17313766479492188, 0.17890167236328125, 0.18466567993164062, 0.1904296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 3.0, 10.0, 8.0, 15.0, 24.0, 31.0, 40.0, 56.0, 94.0, 135.0, 248.0, 330.0, 555.0, 827.0, 1509.0, 3538.0, 14075.0, 150825.0, 773466.0, 86467.0, 9930.0, 2815.0, 1357.0, 746.0, 479.0, 309.0, 205.0, 162.0, 86.0, 63.0, 43.0, 25.0, 17.0, 18.0, 9.0, 8.0, 4.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.66162109375, -0.6423873901367188, -0.6231536865234375, -0.6039199829101562, -0.584686279296875, -0.5654525756835938, -0.5462188720703125, -0.5269851684570312, -0.50775146484375, -0.48851776123046875, -0.4692840576171875, -0.45005035400390625, -0.430816650390625, -0.41158294677734375, -0.3923492431640625, -0.37311553955078125, -0.3538818359375, -0.33464813232421875, -0.3154144287109375, -0.29618072509765625, -0.276947021484375, -0.25771331787109375, -0.2384796142578125, -0.21924591064453125, -0.20001220703125, -0.18077850341796875, -0.1615447998046875, -0.14231109619140625, -0.123077392578125, -0.10384368896484375, -0.0846099853515625, -0.06537628173828125, -0.046142578125, -0.02690887451171875, -0.0076751708984375, 0.01155853271484375, 0.030792236328125, 0.05002593994140625, 0.0692596435546875, 0.08849334716796875, 0.10772705078125, 0.12696075439453125, 0.1461944580078125, 0.16542816162109375, 0.184661865234375, 0.20389556884765625, 0.2231292724609375, 0.24236297607421875, 0.2615966796875, 0.28083038330078125, 0.3000640869140625, 0.31929779052734375, 0.338531494140625, 0.35776519775390625, 0.3769989013671875, 0.39623260498046875, 0.41546630859375, 0.43470001220703125, 0.4539337158203125, 0.47316741943359375, 0.492401123046875, 0.5116348266601562, 0.5308685302734375, 0.5501022338867188, 0.5693359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 2.0, 3.0, 4.0, 7.0, 6.0, 21.0, 14.0, 22.0, 24.0, 28.0, 44.0, 24.0, 38.0, 41.0, 54.0, 52.0, 41.0, 54.0, 45.0, 46.0, 43.0, 41.0, 45.0, 44.0, 43.0, 36.0, 29.0, 27.0, 13.0, 20.0, 19.0, 11.0, 22.0, 9.0, 11.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.669921875, -0.6458206176757812, -0.6217193603515625, -0.5976181030273438, -0.573516845703125, -0.5494155883789062, -0.5253143310546875, -0.5012130737304688, -0.47711181640625, -0.45301055908203125, -0.4289093017578125, -0.40480804443359375, -0.380706787109375, -0.35660552978515625, -0.3325042724609375, -0.30840301513671875, -0.2843017578125, -0.26020050048828125, -0.2360992431640625, -0.21199798583984375, -0.187896728515625, -0.16379547119140625, -0.1396942138671875, -0.11559295654296875, -0.09149169921875, -0.06739044189453125, -0.0432891845703125, -0.01918792724609375, 0.004913330078125, 0.02901458740234375, 0.0531158447265625, 0.07721710205078125, 0.101318359375, 0.12541961669921875, 0.1495208740234375, 0.17362213134765625, 0.197723388671875, 0.22182464599609375, 0.2459259033203125, 0.27002716064453125, 0.29412841796875, 0.31822967529296875, 0.3423309326171875, 0.36643218994140625, 0.390533447265625, 0.41463470458984375, 0.4387359619140625, 0.46283721923828125, 0.4869384765625, 0.5110397338867188, 0.5351409912109375, 0.5592422485351562, 0.583343505859375, 0.6074447631835938, 0.6315460205078125, 0.6556472778320312, 0.67974853515625, 0.7038497924804688, 0.7279510498046875, 0.7520523071289062, 0.776153564453125, 0.8002548217773438, 0.8243560791015625, 0.8484573364257812, 0.87255859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 6.0, 9.0, 12.0, 20.0, 27.0, 39.0, 77.0, 96.0, 208.0, 410.0, 915.0, 3829.0, 43632.0, 895610.0, 95672.0, 5655.0, 1279.0, 471.0, 218.0, 130.0, 81.0, 45.0, 37.0, 25.0, 6.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.650390625, -0.633544921875, -0.61669921875, -0.599853515625, -0.5830078125, -0.566162109375, -0.54931640625, -0.532470703125, -0.515625, -0.498779296875, -0.48193359375, -0.465087890625, -0.4482421875, -0.431396484375, -0.41455078125, -0.397705078125, -0.380859375, -0.364013671875, -0.34716796875, -0.330322265625, -0.3134765625, -0.296630859375, -0.27978515625, -0.262939453125, -0.24609375, -0.229248046875, -0.21240234375, -0.195556640625, -0.1787109375, -0.161865234375, -0.14501953125, -0.128173828125, -0.111328125, -0.094482421875, -0.07763671875, -0.060791015625, -0.0439453125, -0.027099609375, -0.01025390625, 0.006591796875, 0.0234375, 0.040283203125, 0.05712890625, 0.073974609375, 0.0908203125, 0.107666015625, 0.12451171875, 0.141357421875, 0.158203125, 0.175048828125, 0.19189453125, 0.208740234375, 0.2255859375, 0.242431640625, 0.25927734375, 0.276123046875, 0.29296875, 0.309814453125, 0.32666015625, 0.343505859375, 0.3603515625, 0.377197265625, 0.39404296875, 0.410888671875, 0.427734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 9.0, 6.0, 9.0, 16.0, 21.0, 23.0, 39.0, 75.0, 142.0, 201.0, 178.0, 105.0, 54.0, 36.0, 19.0, 16.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013971328735351562, -0.00013558007776737213, -0.00013144686818122864, -0.00012731365859508514, -0.00012318044900894165, -0.00011904723942279816, -0.00011491402983665466, -0.00011078082025051117, -0.00010664761066436768, -0.00010251440107822418, -9.838119149208069e-05, -9.42479819059372e-05, -9.01147723197937e-05, -8.598156273365021e-05, -8.184835314750671e-05, -7.771514356136322e-05, -7.358193397521973e-05, -6.944872438907623e-05, -6.531551480293274e-05, -6.118230521678925e-05, -5.704909563064575e-05, -5.291588604450226e-05, -4.8782676458358765e-05, -4.464946687221527e-05, -4.051625728607178e-05, -3.6383047699928284e-05, -3.224983811378479e-05, -2.8116628527641296e-05, -2.3983418941497803e-05, -1.985020935535431e-05, -1.5716999769210815e-05, -1.1583790183067322e-05, -7.450580596923828e-06, -3.3173710107803345e-06, 8.158385753631592e-07, 4.949048161506653e-06, 9.082257747650146e-06, 1.321546733379364e-05, 1.7348676919937134e-05, 2.1481886506080627e-05, 2.561509609222412e-05, 2.9748305678367615e-05, 3.388151526451111e-05, 3.80147248506546e-05, 4.2147934436798096e-05, 4.628114402294159e-05, 5.041435360908508e-05, 5.454756319522858e-05, 5.868077278137207e-05, 6.281398236751556e-05, 6.694719195365906e-05, 7.108040153980255e-05, 7.521361112594604e-05, 7.934682071208954e-05, 8.348003029823303e-05, 8.761323988437653e-05, 9.174644947052002e-05, 9.587965905666351e-05, 0.00010001286864280701, 0.0001041460782289505, 0.000108279287815094, 0.00011241249740123749, 0.00011654570698738098, 0.00012067891657352448, 0.00012481212615966797]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 14.0, 11.0, 22.0, 23.0, 30.0, 51.0, 66.0, 109.0, 174.0, 327.0, 560.0, 1207.0, 2684.0, 8252.0, 39104.0, 397253.0, 534426.0, 48889.0, 9508.0, 3053.0, 1253.0, 655.0, 332.0, 186.0, 128.0, 72.0, 47.0, 31.0, 17.0, 22.0, 9.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.396240234375, -0.3855476379394531, -0.37485504150390625, -0.3641624450683594, -0.3534698486328125, -0.3427772521972656, -0.33208465576171875, -0.3213920593261719, -0.310699462890625, -0.3000068664550781, -0.28931427001953125, -0.2786216735839844, -0.2679290771484375, -0.2572364807128906, -0.24654388427734375, -0.23585128784179688, -0.22515869140625, -0.21446609497070312, -0.20377349853515625, -0.19308090209960938, -0.1823883056640625, -0.17169570922851562, -0.16100311279296875, -0.15031051635742188, -0.139617919921875, -0.12892532348632812, -0.11823272705078125, -0.10754013061523438, -0.0968475341796875, -0.08615493774414062, -0.07546234130859375, -0.06476974487304688, -0.0540771484375, -0.043384552001953125, -0.03269195556640625, -0.021999359130859375, -0.0113067626953125, -0.000614166259765625, 0.01007843017578125, 0.020771026611328125, 0.031463623046875, 0.042156219482421875, 0.05284881591796875, 0.06354141235351562, 0.0742340087890625, 0.08492660522460938, 0.09561920166015625, 0.10631179809570312, 0.11700439453125, 0.12769699096679688, 0.13838958740234375, 0.14908218383789062, 0.1597747802734375, 0.17046737670898438, 0.18115997314453125, 0.19185256958007812, 0.202545166015625, 0.21323776245117188, 0.22393035888671875, 0.23462295532226562, 0.2453155517578125, 0.2560081481933594, 0.26670074462890625, 0.2773933410644531, 0.2880859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 5.0, 6.0, 15.0, 12.0, 24.0, 24.0, 31.0, 38.0, 39.0, 54.0, 89.0, 82.0, 109.0, 79.0, 84.0, 59.0, 62.0, 39.0, 37.0, 26.0, 20.0, 17.0, 9.0, 3.0, 14.0, 4.0, 5.0, 0.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.22855567932128906, -0.22066116333007812, -0.2127666473388672, -0.20487213134765625, -0.1969776153564453, -0.18908309936523438, -0.18118858337402344, -0.1732940673828125, -0.16539955139160156, -0.15750503540039062, -0.1496105194091797, -0.14171600341796875, -0.1338214874267578, -0.12592697143554688, -0.11803245544433594, -0.110137939453125, -0.10224342346191406, -0.09434890747070312, -0.08645439147949219, -0.07855987548828125, -0.07066535949707031, -0.06277084350585938, -0.05487632751464844, -0.0469818115234375, -0.03908729553222656, -0.031192779541015625, -0.023298263549804688, -0.01540374755859375, -0.0075092315673828125, 0.000385284423828125, 0.008279800415039062, 0.01617431640625, 0.024068832397460938, 0.031963348388671875, 0.03985786437988281, 0.04775238037109375, 0.05564689636230469, 0.06354141235351562, 0.07143592834472656, 0.0793304443359375, 0.08722496032714844, 0.09511947631835938, 0.10301399230957031, 0.11090850830078125, 0.11880302429199219, 0.12669754028320312, 0.13459205627441406, 0.142486572265625, 0.15038108825683594, 0.15827560424804688, 0.1661701202392578, 0.17406463623046875, 0.1819591522216797, 0.18985366821289062, 0.19774818420410156, 0.2056427001953125, 0.21353721618652344, 0.22143173217773438, 0.2293262481689453, 0.23722076416015625, 0.2451152801513672, 0.2530097961425781, 0.26090431213378906, 0.268798828125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 0.0, 4.0, 16.0, 51.0, 241.0, 434.0, 190.0, 48.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.789283752441406, -19.3896427154541, -18.99000358581543, -18.590362548828125, -18.19072151184082, -17.79108238220215, -17.391441345214844, -16.99180030822754, -16.592161178588867, -16.192520141601562, -15.792880058288574, -15.393239974975586, -14.993599891662598, -14.59395980834961, -14.194318771362305, -13.794678688049316, -13.395037651062012, -12.995397567749023, -12.595756530761719, -12.19611644744873, -11.796476364135742, -11.396835327148438, -10.99719524383545, -10.597555160522461, -10.197914123535156, -9.798274040222168, -9.398633003234863, -8.998992919921875, -8.599352836608887, -8.199712753295898, -7.800071716308594, -7.4004316329956055, -7.000791549682617, -6.601150989532471, -6.201510906219482, -5.801870346069336, -5.402230262756348, -5.002589702606201, -4.602949142456055, -4.203309059143066, -3.80366849899292, -3.4040281772613525, -3.004387855529785, -2.6047472953796387, -2.2051069736480713, -1.805466651916504, -1.4058260917663574, -1.00618577003479, -0.6065454483032227, -0.2069050669670105, 0.19273531436920166, 0.5923757553100586, 0.992016077041626, 1.3916563987731934, 1.7912969589233398, 2.1909372806549072, 2.5905776023864746, 2.990217924118042, 3.3898582458496094, 3.789498805999756, 4.189139366149902, 4.588779449462891, 4.988420009613037, 5.388060569763184, 5.787700653076172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 10.0, 11.0, 12.0, 13.0, 23.0, 14.0, 27.0, 22.0, 52.0, 39.0, 33.0, 44.0, 58.0, 47.0, 57.0, 52.0, 53.0, 39.0, 43.0, 56.0, 26.0, 33.0, 30.0, 36.0, 24.0, 21.0, 20.0, 13.0, 18.0, 11.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0], "bins": [-4.043496131896973, -3.9377517700195312, -3.83200740814209, -3.7262630462646484, -3.620518445968628, -3.5147740840911865, -3.409029722213745, -3.3032853603363037, -3.197540760040283, -3.091796398162842, -2.9860520362854004, -2.880307674407959, -2.7745630741119385, -2.668818712234497, -2.5630743503570557, -2.4573299884796143, -2.351585626602173, -2.2458412647247314, -2.14009690284729, -2.0343523025512695, -1.9286079406738281, -1.8228635787963867, -1.7171192169189453, -1.611374855041504, -1.505630373954773, -1.3998860120773315, -1.2941415309906006, -1.1883971691131592, -1.0826528072357178, -0.9769083261489868, -0.8711639642715454, -0.7654195427894592, -0.659675121307373, -0.5539306998252869, -0.44818630814552307, -0.3424419164657593, -0.2366974949836731, -0.13095307350158691, -0.025208711624145508, 0.08053570985794067, 0.18628013134002686, 0.29202455282211304, 0.39776894450187683, 0.5035133361816406, 0.6092577576637268, 0.715002179145813, 0.8207465410232544, 0.9264909625053406, 1.0322353839874268, 1.1379797458648682, 1.2437242269515991, 1.3494685888290405, 1.4552130699157715, 1.560957431793213, 1.6667017936706543, 1.7724461555480957, 1.8781906366348267, 1.983934998512268, 2.089679479598999, 2.1954238414764404, 2.301168203353882, 2.4069128036499023, 2.5126571655273438, 2.618401527404785, 2.7241458892822266]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 11.0, 18.0, 20.0, 28.0, 30.0, 46.0, 69.0, 106.0, 139.0, 216.0, 281.0, 405.0, 805.0, 1791.0, 5526.0, 32924.0, 4059632.0, 78694.0, 8547.0, 2385.0, 940.0, 565.0, 309.0, 227.0, 148.0, 120.0, 83.0, 55.0, 41.0, 27.0, 26.0, 10.0, 11.0, 6.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.068359375, -1.0375213623046875, -1.006683349609375, -0.9758453369140625, -0.94500732421875, -0.9141693115234375, -0.883331298828125, -0.8524932861328125, -0.8216552734375, -0.7908172607421875, -0.759979248046875, -0.7291412353515625, -0.69830322265625, -0.6674652099609375, -0.636627197265625, -0.6057891845703125, -0.574951171875, -0.5441131591796875, -0.513275146484375, -0.4824371337890625, -0.45159912109375, -0.4207611083984375, -0.389923095703125, -0.3590850830078125, -0.3282470703125, -0.2974090576171875, -0.266571044921875, -0.2357330322265625, -0.20489501953125, -0.1740570068359375, -0.143218994140625, -0.1123809814453125, -0.08154296875, -0.0507049560546875, -0.019866943359375, 0.0109710693359375, 0.04180908203125, 0.0726470947265625, 0.103485107421875, 0.1343231201171875, 0.1651611328125, 0.1959991455078125, 0.226837158203125, 0.2576751708984375, 0.28851318359375, 0.3193511962890625, 0.350189208984375, 0.3810272216796875, 0.411865234375, 0.4427032470703125, 0.473541259765625, 0.5043792724609375, 0.53521728515625, 0.5660552978515625, 0.596893310546875, 0.6277313232421875, 0.6585693359375, 0.6894073486328125, 0.720245361328125, 0.7510833740234375, 0.78192138671875, 0.8127593994140625, 0.843597412109375, 0.8744354248046875, 0.9052734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 13.0, 6.0, 12.0, 20.0, 23.0, 32.0, 31.0, 51.0, 52.0, 59.0, 64.0, 73.0, 63.0, 66.0, 91.0, 58.0, 67.0, 35.0, 53.0, 29.0, 27.0, 22.0, 15.0, 11.0, 8.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221435546875, -0.2147083282470703, -0.20798110961914062, -0.20125389099121094, -0.19452667236328125, -0.18779945373535156, -0.18107223510742188, -0.1743450164794922, -0.1676177978515625, -0.1608905792236328, -0.15416336059570312, -0.14743614196777344, -0.14070892333984375, -0.13398170471191406, -0.12725448608398438, -0.12052726745605469, -0.113800048828125, -0.10707283020019531, -0.10034561157226562, -0.09361839294433594, -0.08689117431640625, -0.08016395568847656, -0.07343673706054688, -0.06670951843261719, -0.0599822998046875, -0.05325508117675781, -0.046527862548828125, -0.03980064392089844, -0.03307342529296875, -0.026346206665039062, -0.019618988037109375, -0.012891769409179688, -0.00616455078125, 0.0005626678466796875, 0.007289886474609375, 0.014017105102539062, 0.02074432373046875, 0.027471542358398438, 0.034198760986328125, 0.04092597961425781, 0.0476531982421875, 0.05438041687011719, 0.061107635498046875, 0.06783485412597656, 0.07456207275390625, 0.08128929138183594, 0.08801651000976562, 0.09474372863769531, 0.101470947265625, 0.10819816589355469, 0.11492538452148438, 0.12165260314941406, 0.12837982177734375, 0.13510704040527344, 0.14183425903320312, 0.1485614776611328, 0.1552886962890625, 0.1620159149169922, 0.16874313354492188, 0.17547035217285156, 0.18219757080078125, 0.18892478942871094, 0.19565200805664062, 0.2023792266845703, 0.2091064453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 18.0, 20.0, 22.0, 40.0, 47.0, 63.0, 106.0, 158.0, 189.0, 315.0, 493.0, 771.0, 1311.0, 2896.0, 8133.0, 37223.0, 3742097.0, 365999.0, 22988.0, 5936.0, 2306.0, 1191.0, 636.0, 439.0, 265.0, 176.0, 119.0, 84.0, 51.0, 42.0, 37.0, 20.0, 20.0, 12.0, 14.0, 4.0, 9.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7109375, -0.6893081665039062, -0.6676788330078125, -0.6460494995117188, -0.624420166015625, -0.6027908325195312, -0.5811614990234375, -0.5595321655273438, -0.53790283203125, -0.5162734985351562, -0.4946441650390625, -0.47301483154296875, -0.451385498046875, -0.42975616455078125, -0.4081268310546875, -0.38649749755859375, -0.3648681640625, -0.34323883056640625, -0.3216094970703125, -0.29998016357421875, -0.278350830078125, -0.25672149658203125, -0.2350921630859375, -0.21346282958984375, -0.19183349609375, -0.17020416259765625, -0.1485748291015625, -0.12694549560546875, -0.105316162109375, -0.08368682861328125, -0.0620574951171875, -0.04042816162109375, -0.018798828125, 0.00283050537109375, 0.0244598388671875, 0.04608917236328125, 0.067718505859375, 0.08934783935546875, 0.1109771728515625, 0.13260650634765625, 0.15423583984375, 0.17586517333984375, 0.1974945068359375, 0.21912384033203125, 0.240753173828125, 0.26238250732421875, 0.2840118408203125, 0.30564117431640625, 0.3272705078125, 0.34889984130859375, 0.3705291748046875, 0.39215850830078125, 0.413787841796875, 0.43541717529296875, 0.4570465087890625, 0.47867584228515625, 0.50030517578125, 0.5219345092773438, 0.5435638427734375, 0.5651931762695312, 0.586822509765625, 0.6084518432617188, 0.6300811767578125, 0.6517105102539062, 0.67333984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 11.0, 9.0, 8.0, 13.0, 35.0, 67.0, 162.0, 2738.0, 776.0, 139.0, 51.0, 29.0, 12.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.389404296875, -0.3788490295410156, -0.36829376220703125, -0.3577384948730469, -0.3471832275390625, -0.3366279602050781, -0.32607269287109375, -0.3155174255371094, -0.304962158203125, -0.2944068908691406, -0.28385162353515625, -0.2732963562011719, -0.2627410888671875, -0.2521858215332031, -0.24163055419921875, -0.23107528686523438, -0.22052001953125, -0.20996475219726562, -0.19940948486328125, -0.18885421752929688, -0.1782989501953125, -0.16774368286132812, -0.15718841552734375, -0.14663314819335938, -0.136077880859375, -0.12552261352539062, -0.11496734619140625, -0.10441207885742188, -0.0938568115234375, -0.08330154418945312, -0.07274627685546875, -0.062191009521484375, -0.0516357421875, -0.041080474853515625, -0.03052520751953125, -0.019969940185546875, -0.0094146728515625, 0.001140594482421875, 0.01169586181640625, 0.022251129150390625, 0.032806396484375, 0.043361663818359375, 0.05391693115234375, 0.06447219848632812, 0.0750274658203125, 0.08558273315429688, 0.09613800048828125, 0.10669326782226562, 0.11724853515625, 0.12780380249023438, 0.13835906982421875, 0.14891433715820312, 0.1594696044921875, 0.17002487182617188, 0.18058013916015625, 0.19113540649414062, 0.201690673828125, 0.21224594116210938, 0.22280120849609375, 0.23335647583007812, 0.2439117431640625, 0.2544670104980469, 0.26502227783203125, 0.2755775451660156, 0.2861328125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 7.0, 15.0, 30.0, 44.0, 82.0, 104.0, 137.0, 146.0, 141.0, 85.0, 66.0, 54.0, 27.0, 14.0, 10.0, 7.0, 8.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.486642837524414, -1.4486401081085205, -1.410637378692627, -1.3726346492767334, -1.3346319198608398, -1.2966291904449463, -1.2586264610290527, -1.2206237316131592, -1.1826210021972656, -1.144618272781372, -1.1066155433654785, -1.068612813949585, -1.0306100845336914, -0.9926073551177979, -0.9546045660972595, -0.916601836681366, -0.8785990476608276, -0.8405963182449341, -0.8025935888290405, -0.764590859413147, -0.7265881299972534, -0.6885854005813599, -0.6505826115608215, -0.612579882144928, -0.5745771527290344, -0.5365744233131409, -0.4985716938972473, -0.46056893467903137, -0.4225662052631378, -0.38456347584724426, -0.3465607166290283, -0.30855798721313477, -0.2705552577972412, -0.23255252838134766, -0.1945497840642929, -0.15654703974723816, -0.1185443103313446, -0.08054158091545105, -0.0425388365983963, -0.004536092281341553, 0.033466637134552, 0.07146937400102615, 0.1094721108675003, 0.14747485518455505, 0.1854775846004486, 0.22348031401634216, 0.2614830732345581, 0.29948580265045166, 0.3374885320663452, 0.37549126148223877, 0.4134939908981323, 0.45149675011634827, 0.4894994795322418, 0.527502179145813, 0.5655049681663513, 0.6035076975822449, 0.6415104269981384, 0.679513156414032, 0.7175158858299255, 0.7555186152458191, 0.7935214042663574, 0.831524133682251, 0.8695268630981445, 0.9075295925140381, 0.9455323219299316]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 5.0, 10.0, 17.0, 15.0, 11.0, 32.0, 30.0, 40.0, 61.0, 51.0, 69.0, 61.0, 67.0, 76.0, 78.0, 67.0, 75.0, 49.0, 41.0, 35.0, 19.0, 29.0, 18.0, 15.0, 16.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7889304161071777, -0.761100709438324, -0.7332710027694702, -0.7054412364959717, -0.6776115298271179, -0.6497818231582642, -0.6219521164894104, -0.5941224098205566, -0.5662926435470581, -0.5384629368782043, -0.5106332302093506, -0.48280349373817444, -0.4549737572669983, -0.42714405059814453, -0.39931434392929077, -0.3714846074581146, -0.34365490078926086, -0.3158251941204071, -0.28799545764923096, -0.2601657509803772, -0.23233601450920105, -0.2045063078403473, -0.17667658627033234, -0.14884686470031738, -0.12101714313030243, -0.09318742156028748, -0.06535769999027252, -0.037527985870838165, -0.009698264300823212, 0.018131449818611145, 0.0459611713886261, 0.07379089295864105, 0.101620614528656, 0.12945033609867096, 0.1572800576686859, 0.18510976433753967, 0.21293950080871582, 0.24076920747756958, 0.26859891414642334, 0.2964286506175995, 0.32425838708877563, 0.3520880937576294, 0.37991783022880554, 0.4077475368976593, 0.43557727336883545, 0.4634069800376892, 0.49123668670654297, 0.5190664529800415, 0.5468961000442505, 0.5747258067131042, 0.602555513381958, 0.6303852796554565, 0.6582149863243103, 0.6860446929931641, 0.7138743996620178, 0.7417041063308716, 0.7695338726043701, 0.7973635792732239, 0.8251932859420776, 0.8530230522155762, 0.8808527588844299, 0.9086824655532837, 0.9365121722221375, 0.9643418788909912, 0.9921716451644897]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 12.0, 24.0, 22.0, 63.0, 72.0, 148.0, 216.0, 345.0, 609.0, 1128.0, 2253.0, 4828.0, 10599.0, 25409.0, 60910.0, 148841.0, 357407.0, 257998.0, 102674.0, 42756.0, 17470.0, 7547.0, 3443.0, 1710.0, 824.0, 454.0, 304.0, 159.0, 104.0, 77.0, 45.0, 30.0, 16.0, 14.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31201171875, -0.3007850646972656, -0.28955841064453125, -0.2783317565917969, -0.2671051025390625, -0.2558784484863281, -0.24465179443359375, -0.23342514038085938, -0.222198486328125, -0.21097183227539062, -0.19974517822265625, -0.18851852416992188, -0.1772918701171875, -0.16606521606445312, -0.15483856201171875, -0.14361190795898438, -0.13238525390625, -0.12115859985351562, -0.10993194580078125, -0.09870529174804688, -0.0874786376953125, -0.07625198364257812, -0.06502532958984375, -0.053798675537109375, -0.042572021484375, -0.031345367431640625, -0.02011871337890625, -0.008892059326171875, 0.0023345947265625, 0.013561248779296875, 0.02478790283203125, 0.036014556884765625, 0.0472412109375, 0.058467864990234375, 0.06969451904296875, 0.08092117309570312, 0.0921478271484375, 0.10337448120117188, 0.11460113525390625, 0.12582778930664062, 0.137054443359375, 0.14828109741210938, 0.15950775146484375, 0.17073440551757812, 0.1819610595703125, 0.19318771362304688, 0.20441436767578125, 0.21564102172851562, 0.22686767578125, 0.23809432983398438, 0.24932098388671875, 0.2605476379394531, 0.2717742919921875, 0.2830009460449219, 0.29422760009765625, 0.3054542541503906, 0.316680908203125, 0.3279075622558594, 0.33913421630859375, 0.3503608703613281, 0.3615875244140625, 0.3728141784667969, 0.38404083251953125, 0.3952674865722656, 0.406494140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 5.0, 14.0, 13.0, 12.0, 15.0, 23.0, 26.0, 35.0, 21.0, 37.0, 46.0, 45.0, 54.0, 60.0, 50.0, 52.0, 58.0, 55.0, 59.0, 32.0, 52.0, 49.0, 32.0, 30.0, 24.0, 26.0, 19.0, 8.0, 10.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.18852996826171875, -0.1830902099609375, -0.17765045166015625, -0.172210693359375, -0.16677093505859375, -0.1613311767578125, -0.15589141845703125, -0.15045166015625, -0.14501190185546875, -0.1395721435546875, -0.13413238525390625, -0.128692626953125, -0.12325286865234375, -0.1178131103515625, -0.11237335205078125, -0.10693359375, -0.10149383544921875, -0.0960540771484375, -0.09061431884765625, -0.085174560546875, -0.07973480224609375, -0.0742950439453125, -0.06885528564453125, -0.06341552734375, -0.05797576904296875, -0.0525360107421875, -0.04709625244140625, -0.041656494140625, -0.03621673583984375, -0.0307769775390625, -0.02533721923828125, -0.0198974609375, -0.01445770263671875, -0.0090179443359375, -0.00357818603515625, 0.001861572265625, 0.00730133056640625, 0.0127410888671875, 0.01818084716796875, 0.02362060546875, 0.02906036376953125, 0.0345001220703125, 0.03993988037109375, 0.045379638671875, 0.05081939697265625, 0.0562591552734375, 0.06169891357421875, 0.067138671875, 0.07257843017578125, 0.0780181884765625, 0.08345794677734375, 0.088897705078125, 0.09433746337890625, 0.0997772216796875, 0.10521697998046875, 0.11065673828125, 0.11609649658203125, 0.1215362548828125, 0.12697601318359375, 0.132415771484375, 0.13785552978515625, 0.1432952880859375, 0.14873504638671875, 0.1541748046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 8.0, 11.0, 18.0, 12.0, 28.0, 37.0, 47.0, 76.0, 105.0, 138.0, 250.0, 421.0, 706.0, 1586.0, 4358.0, 23477.0, 331090.0, 637429.0, 38694.0, 6014.0, 1818.0, 872.0, 474.0, 266.0, 204.0, 131.0, 75.0, 57.0, 34.0, 33.0, 18.0, 18.0, 9.0, 8.0, 7.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.84716796875, -0.8199386596679688, -0.7927093505859375, -0.7654800415039062, -0.738250732421875, -0.7110214233398438, -0.6837921142578125, -0.6565628051757812, -0.62933349609375, -0.6021041870117188, -0.5748748779296875, -0.5476455688476562, -0.520416259765625, -0.49318695068359375, -0.4659576416015625, -0.43872833251953125, -0.4114990234375, -0.38426971435546875, -0.3570404052734375, -0.32981109619140625, -0.302581787109375, -0.27535247802734375, -0.2481231689453125, -0.22089385986328125, -0.19366455078125, -0.16643524169921875, -0.1392059326171875, -0.11197662353515625, -0.084747314453125, -0.05751800537109375, -0.0302886962890625, -0.00305938720703125, 0.024169921875, 0.05139923095703125, 0.0786285400390625, 0.10585784912109375, 0.133087158203125, 0.16031646728515625, 0.1875457763671875, 0.21477508544921875, 0.24200439453125, 0.26923370361328125, 0.2964630126953125, 0.32369232177734375, 0.350921630859375, 0.37815093994140625, 0.4053802490234375, 0.43260955810546875, 0.4598388671875, 0.48706817626953125, 0.5142974853515625, 0.5415267944335938, 0.568756103515625, 0.5959854125976562, 0.6232147216796875, 0.6504440307617188, 0.67767333984375, 0.7049026489257812, 0.7321319580078125, 0.7593612670898438, 0.786590576171875, 0.8138198852539062, 0.8410491943359375, 0.8682785034179688, 0.8955078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 3.0, 6.0, 7.0, 13.0, 17.0, 17.0, 27.0, 31.0, 29.0, 37.0, 55.0, 62.0, 70.0, 67.0, 70.0, 71.0, 80.0, 63.0, 50.0, 48.0, 41.0, 33.0, 25.0, 19.0, 12.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.916778564453125, -0.88677978515625, -0.856781005859375, -0.8267822265625, -0.796783447265625, -0.76678466796875, -0.736785888671875, -0.706787109375, -0.676788330078125, -0.64678955078125, -0.616790771484375, -0.5867919921875, -0.556793212890625, -0.52679443359375, -0.496795654296875, -0.466796875, -0.436798095703125, -0.40679931640625, -0.376800537109375, -0.3468017578125, -0.316802978515625, -0.28680419921875, -0.256805419921875, -0.226806640625, -0.196807861328125, -0.16680908203125, -0.136810302734375, -0.1068115234375, -0.076812744140625, -0.04681396484375, -0.016815185546875, 0.01318359375, 0.043182373046875, 0.07318115234375, 0.103179931640625, 0.1331787109375, 0.163177490234375, 0.19317626953125, 0.223175048828125, 0.253173828125, 0.283172607421875, 0.31317138671875, 0.343170166015625, 0.3731689453125, 0.403167724609375, 0.43316650390625, 0.463165283203125, 0.4931640625, 0.523162841796875, 0.55316162109375, 0.583160400390625, 0.6131591796875, 0.643157958984375, 0.67315673828125, 0.703155517578125, 0.733154296875, 0.763153076171875, 0.79315185546875, 0.823150634765625, 0.8531494140625, 0.883148193359375, 0.91314697265625, 0.943145751953125, 0.97314453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 9.0, 9.0, 18.0, 36.0, 93.0, 157.0, 350.0, 875.0, 3410.0, 31486.0, 754889.0, 242754.0, 11513.0, 1884.0, 572.0, 228.0, 118.0, 65.0, 35.0, 24.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.4774436950683594, -0.46514129638671875, -0.4528388977050781, -0.4405364990234375, -0.4282341003417969, -0.41593170166015625, -0.4036293029785156, -0.391326904296875, -0.3790245056152344, -0.36672210693359375, -0.3544197082519531, -0.3421173095703125, -0.3298149108886719, -0.31751251220703125, -0.3052101135253906, -0.29290771484375, -0.2806053161621094, -0.26830291748046875, -0.2560005187988281, -0.2436981201171875, -0.23139572143554688, -0.21909332275390625, -0.20679092407226562, -0.194488525390625, -0.18218612670898438, -0.16988372802734375, -0.15758132934570312, -0.1452789306640625, -0.13297653198242188, -0.12067413330078125, -0.10837173461914062, -0.0960693359375, -0.08376693725585938, -0.07146453857421875, -0.059162139892578125, -0.0468597412109375, -0.034557342529296875, -0.02225494384765625, -0.009952545166015625, 0.002349853515625, 0.014652252197265625, 0.02695465087890625, 0.039257049560546875, 0.0515594482421875, 0.06386184692382812, 0.07616424560546875, 0.08846664428710938, 0.10076904296875, 0.11307144165039062, 0.12537384033203125, 0.13767623901367188, 0.1499786376953125, 0.16228103637695312, 0.17458343505859375, 0.18688583374023438, 0.199188232421875, 0.21149063110351562, 0.22379302978515625, 0.23609542846679688, 0.2483978271484375, 0.2607002258300781, 0.27300262451171875, 0.2853050231933594, 0.297607421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 9.0, 7.0, 14.0, 21.0, 26.0, 25.0, 42.0, 37.0, 55.0, 63.0, 124.0, 141.0, 111.0, 52.0, 31.0, 44.0, 29.0, 27.0, 32.0, 22.0, 18.0, 10.0, 14.0, 6.0, 4.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.250640869140625e-05, -8.955877274274826e-05, -8.661113679409027e-05, -8.366350084543228e-05, -8.071586489677429e-05, -7.77682289481163e-05, -7.482059299945831e-05, -7.187295705080032e-05, -6.892532110214233e-05, -6.597768515348434e-05, -6.303004920482635e-05, -6.0082413256168365e-05, -5.7134777307510376e-05, -5.4187141358852386e-05, -5.12395054101944e-05, -4.829186946153641e-05, -4.534423351287842e-05, -4.239659756422043e-05, -3.944896161556244e-05, -3.650132566690445e-05, -3.355368971824646e-05, -3.060605376958847e-05, -2.765841782093048e-05, -2.471078187227249e-05, -2.1763145923614502e-05, -1.8815509974956512e-05, -1.5867874026298523e-05, -1.2920238077640533e-05, -9.972602128982544e-06, -7.0249661803245544e-06, -4.077330231666565e-06, -1.1296942830085754e-06, 1.817941665649414e-06, 4.7655776143074036e-06, 7.713213562965393e-06, 1.0660849511623383e-05, 1.3608485460281372e-05, 1.655612140893936e-05, 1.950375735759735e-05, 2.245139330625534e-05, 2.539902925491333e-05, 2.834666520357132e-05, 3.129430115222931e-05, 3.42419371008873e-05, 3.718957304954529e-05, 4.013720899820328e-05, 4.308484494686127e-05, 4.6032480895519257e-05, 4.8980116844177246e-05, 5.1927752792835236e-05, 5.4875388741493225e-05, 5.7823024690151215e-05, 6.0770660638809204e-05, 6.37182965874672e-05, 6.666593253612518e-05, 6.961356848478317e-05, 7.256120443344116e-05, 7.550884038209915e-05, 7.845647633075714e-05, 8.140411227941513e-05, 8.435174822807312e-05, 8.729938417673111e-05, 9.02470201253891e-05, 9.319465607404709e-05, 9.614229202270508e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 13.0, 12.0, 18.0, 43.0, 85.0, 142.0, 294.0, 718.0, 2026.0, 8993.0, 151272.0, 837154.0, 41084.0, 4496.0, 1211.0, 501.0, 239.0, 108.0, 54.0, 35.0, 16.0, 14.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.35398101806640625, -0.3410186767578125, -0.32805633544921875, -0.315093994140625, -0.30213165283203125, -0.2891693115234375, -0.27620697021484375, -0.26324462890625, -0.25028228759765625, -0.2373199462890625, -0.22435760498046875, -0.211395263671875, -0.19843292236328125, -0.1854705810546875, -0.17250823974609375, -0.1595458984375, -0.14658355712890625, -0.1336212158203125, -0.12065887451171875, -0.107696533203125, -0.09473419189453125, -0.0817718505859375, -0.06880950927734375, -0.05584716796875, -0.04288482666015625, -0.0299224853515625, -0.01696014404296875, -0.003997802734375, 0.00896453857421875, 0.0219268798828125, 0.03488922119140625, 0.0478515625, 0.06081390380859375, 0.0737762451171875, 0.08673858642578125, 0.099700927734375, 0.11266326904296875, 0.1256256103515625, 0.13858795166015625, 0.15155029296875, 0.16451263427734375, 0.1774749755859375, 0.19043731689453125, 0.203399658203125, 0.21636199951171875, 0.2293243408203125, 0.24228668212890625, 0.2552490234375, 0.26821136474609375, 0.2811737060546875, 0.29413604736328125, 0.307098388671875, 0.32006072998046875, 0.3330230712890625, 0.34598541259765625, 0.35894775390625, 0.37191009521484375, 0.3848724365234375, 0.39783477783203125, 0.410797119140625, 0.42375946044921875, 0.4367218017578125, 0.44968414306640625, 0.462646484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 10.0, 9.0, 17.0, 35.0, 65.0, 88.0, 138.0, 139.0, 145.0, 117.0, 84.0, 57.0, 31.0, 30.0, 13.0, 5.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.3206329345703125, -0.308746337890625, -0.2968597412109375, -0.28497314453125, -0.2730865478515625, -0.261199951171875, -0.2493133544921875, -0.2374267578125, -0.2255401611328125, -0.213653564453125, -0.2017669677734375, -0.18988037109375, -0.1779937744140625, -0.166107177734375, -0.1542205810546875, -0.142333984375, -0.1304473876953125, -0.118560791015625, -0.1066741943359375, -0.09478759765625, -0.0829010009765625, -0.071014404296875, -0.0591278076171875, -0.0472412109375, -0.0353546142578125, -0.023468017578125, -0.0115814208984375, 0.00030517578125, 0.0121917724609375, 0.024078369140625, 0.0359649658203125, 0.0478515625, 0.0597381591796875, 0.071624755859375, 0.0835113525390625, 0.09539794921875, 0.1072845458984375, 0.119171142578125, 0.1310577392578125, 0.1429443359375, 0.1548309326171875, 0.166717529296875, 0.1786041259765625, 0.19049072265625, 0.2023773193359375, 0.214263916015625, 0.2261505126953125, 0.238037109375, 0.2499237060546875, 0.261810302734375, 0.2736968994140625, 0.28558349609375, 0.2974700927734375, 0.309356689453125, 0.3212432861328125, 0.3331298828125, 0.3450164794921875, 0.356903076171875, 0.3687896728515625, 0.38067626953125, 0.3925628662109375, 0.404449462890625, 0.4163360595703125, 0.42822265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 20.0, 16.0, 46.0, 87.0, 168.0, 201.0, 219.0, 126.0, 71.0, 23.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.497528076171875, -5.284073829650879, -5.070620059967041, -4.857165813446045, -4.643712043762207, -4.430257797241211, -4.216803550720215, -4.003349304199219, -3.789895534515381, -3.576441526412964, -3.362987518310547, -3.149533271789551, -2.936079263687134, -2.722625255584717, -2.5091710090637207, -2.2957170009613037, -2.0822629928588867, -1.8688089847564697, -1.6553548574447632, -1.4419007301330566, -1.2284467220306396, -1.0149927139282227, -0.8015385866165161, -0.5880844593048096, -0.3746304512023926, -0.1611763834953308, 0.05227768421173096, 0.2657317519187927, 0.4791858196258545, 0.6926398277282715, 0.906093955039978, 1.1195480823516846, 1.3330020904541016, 1.5464560985565186, 1.759910225868225, 1.9733643531799316, 2.1868183612823486, 2.4002723693847656, 2.6137266159057617, 2.8271806240081787, 3.0406346321105957, 3.2540886402130127, 3.4675426483154297, 3.680996894836426, 3.8944509029388428, 4.10790491104126, 4.321359157562256, 4.534812927246094, 4.74826717376709, 4.961721420288086, 5.175175189971924, 5.38862943649292, 5.602083206176758, 5.815537452697754, 6.02899169921875, 6.242445945739746, 6.455899715423584, 6.66935396194458, 6.882807731628418, 7.096261978149414, 7.30971622467041, 7.523169994354248, 7.736624240875244, 7.950078010559082, 8.163532257080078]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 12.0, 18.0, 13.0, 25.0, 35.0, 36.0, 35.0, 46.0, 55.0, 50.0, 51.0, 75.0, 87.0, 68.0, 61.0, 61.0, 44.0, 48.0, 31.0, 28.0, 21.0, 21.0, 21.0, 9.0, 6.0, 7.0, 3.0, 9.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.309183120727539, -2.1841118335723877, -2.0590405464172363, -1.9339690208435059, -1.8088977336883545, -1.6838264465332031, -1.5587550401687622, -1.4336836338043213, -1.30861234664917, -1.1835410594940186, -1.0584696531295776, -0.9333983063697815, -0.8083269596099854, -0.6832556128501892, -0.5581842660903931, -0.4331129193305969, -0.3080415725708008, -0.18297022581100464, -0.057898879051208496, 0.06717246770858765, 0.1922438144683838, 0.31731516122817993, 0.4423865079879761, 0.5674578547477722, 0.6925292015075684, 0.8176005482673645, 0.9426718950271606, 1.0677433013916016, 1.192814588546753, 1.3178858757019043, 1.4429572820663452, 1.5680286884307861, 1.6930994987487793, 1.8181707859039307, 1.9432421922683716, 2.0683135986328125, 2.193384885787964, 2.3184561729431152, 2.4435276985168457, 2.568598985671997, 2.6936702728271484, 2.8187415599823, 2.943812847137451, 3.0688843727111816, 3.193955659866333, 3.3190269470214844, 3.444098472595215, 3.569169759750366, 3.6942410469055176, 3.819312334060669, 3.9443836212158203, 4.069455146789551, 4.194526672363281, 4.3195977210998535, 4.444669246673584, 4.569740295410156, 4.694811820983887, 4.819883346557617, 4.9449543952941895, 5.07002592086792, 5.195096969604492, 5.320168495178223, 5.445240020751953, 5.570311069488525, 5.695382595062256]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 11.0, 22.0, 30.0, 42.0, 82.0, 130.0, 202.0, 329.0, 533.0, 866.0, 1613.0, 2944.0, 6139.0, 13825.0, 35502.0, 114275.0, 732187.0, 2844175.0, 325406.0, 70742.0, 24453.0, 10118.0, 4790.0, 2453.0, 1356.0, 749.0, 471.0, 288.0, 183.0, 107.0, 84.0, 44.0, 35.0, 21.0, 16.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.25, -0.24147415161132812, -0.23294830322265625, -0.22442245483398438, -0.2158966064453125, -0.20737075805664062, -0.19884490966796875, -0.19031906127929688, -0.181793212890625, -0.17326736450195312, -0.16474151611328125, -0.15621566772460938, -0.1476898193359375, -0.13916397094726562, -0.13063812255859375, -0.12211227416992188, -0.11358642578125, -0.10506057739257812, -0.09653472900390625, -0.08800888061523438, -0.0794830322265625, -0.07095718383789062, -0.06243133544921875, -0.053905487060546875, -0.045379638671875, -0.036853790283203125, -0.02832794189453125, -0.019802093505859375, -0.0112762451171875, -0.002750396728515625, 0.00577545166015625, 0.014301300048828125, 0.0228271484375, 0.031352996826171875, 0.03987884521484375, 0.048404693603515625, 0.0569305419921875, 0.06545639038085938, 0.07398223876953125, 0.08250808715820312, 0.091033935546875, 0.09955978393554688, 0.10808563232421875, 0.11661148071289062, 0.1251373291015625, 0.13366317749023438, 0.14218902587890625, 0.15071487426757812, 0.15924072265625, 0.16776657104492188, 0.17629241943359375, 0.18481826782226562, 0.1933441162109375, 0.20186996459960938, 0.21039581298828125, 0.21892166137695312, 0.227447509765625, 0.23597335815429688, 0.24449920654296875, 0.2530250549316406, 0.2615509033203125, 0.2700767517089844, 0.27860260009765625, 0.2871284484863281, 0.295654296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 11.0, 17.0, 30.0, 34.0, 44.0, 77.0, 90.0, 101.0, 122.0, 121.0, 94.0, 79.0, 68.0, 49.0, 34.0, 16.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2060546875, -0.19619369506835938, -0.18633270263671875, -0.17647171020507812, -0.1666107177734375, -0.15674972534179688, -0.14688873291015625, -0.13702774047851562, -0.127166748046875, -0.11730575561523438, -0.10744476318359375, -0.09758377075195312, -0.0877227783203125, -0.07786178588867188, -0.06800079345703125, -0.058139801025390625, -0.04827880859375, -0.038417816162109375, -0.02855682373046875, -0.018695831298828125, -0.0088348388671875, 0.001026153564453125, 0.01088714599609375, 0.020748138427734375, 0.030609130859375, 0.040470123291015625, 0.05033111572265625, 0.060192108154296875, 0.0700531005859375, 0.07991409301757812, 0.08977508544921875, 0.09963607788085938, 0.1094970703125, 0.11935806274414062, 0.12921905517578125, 0.13908004760742188, 0.1489410400390625, 0.15880203247070312, 0.16866302490234375, 0.17852401733398438, 0.188385009765625, 0.19824600219726562, 0.20810699462890625, 0.21796798706054688, 0.2278289794921875, 0.23768997192382812, 0.24755096435546875, 0.2574119567871094, 0.26727294921875, 0.2771339416503906, 0.28699493408203125, 0.2968559265136719, 0.3067169189453125, 0.3165779113769531, 0.32643890380859375, 0.3362998962402344, 0.346160888671875, 0.3560218811035156, 0.36588287353515625, 0.3757438659667969, 0.3856048583984375, 0.3954658508300781, 0.40532684326171875, 0.4151878356933594, 0.425048828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 17.0, 20.0, 26.0, 36.0, 55.0, 113.0, 170.0, 336.0, 668.0, 1492.0, 3466.0, 9229.0, 29392.0, 136419.0, 2388922.0, 1476962.0, 107215.0, 25418.0, 8236.0, 3228.0, 1403.0, 638.0, 314.0, 179.0, 97.0, 56.0, 63.0, 29.0, 17.0, 9.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.375732421875, -0.36358642578125, -0.3514404296875, -0.33929443359375, -0.3271484375, -0.31500244140625, -0.3028564453125, -0.29071044921875, -0.278564453125, -0.26641845703125, -0.2542724609375, -0.24212646484375, -0.22998046875, -0.21783447265625, -0.2056884765625, -0.19354248046875, -0.181396484375, -0.16925048828125, -0.1571044921875, -0.14495849609375, -0.1328125, -0.12066650390625, -0.1085205078125, -0.09637451171875, -0.084228515625, -0.07208251953125, -0.0599365234375, -0.04779052734375, -0.03564453125, -0.02349853515625, -0.0113525390625, 0.00079345703125, 0.012939453125, 0.02508544921875, 0.0372314453125, 0.04937744140625, 0.0615234375, 0.07366943359375, 0.0858154296875, 0.09796142578125, 0.110107421875, 0.12225341796875, 0.1343994140625, 0.14654541015625, 0.15869140625, 0.17083740234375, 0.1829833984375, 0.19512939453125, 0.207275390625, 0.21942138671875, 0.2315673828125, 0.24371337890625, 0.255859375, 0.26800537109375, 0.2801513671875, 0.29229736328125, 0.304443359375, 0.31658935546875, 0.3287353515625, 0.34088134765625, 0.35302734375, 0.36517333984375, 0.3773193359375, 0.38946533203125, 0.401611328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 5.0, 8.0, 12.0, 14.0, 16.0, 18.0, 52.0, 40.0, 62.0, 78.0, 129.0, 203.0, 349.0, 606.0, 854.0, 612.0, 338.0, 211.0, 117.0, 95.0, 54.0, 54.0, 37.0, 17.0, 14.0, 22.0, 11.0, 6.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.327392578125, -0.3162879943847656, -0.30518341064453125, -0.2940788269042969, -0.2829742431640625, -0.2718696594238281, -0.26076507568359375, -0.24966049194335938, -0.238555908203125, -0.22745132446289062, -0.21634674072265625, -0.20524215698242188, -0.1941375732421875, -0.18303298950195312, -0.17192840576171875, -0.16082382202148438, -0.14971923828125, -0.13861465454101562, -0.12751007080078125, -0.11640548706054688, -0.1053009033203125, -0.09419631958007812, -0.08309173583984375, -0.07198715209960938, -0.060882568359375, -0.049777984619140625, -0.03867340087890625, -0.027568817138671875, -0.0164642333984375, -0.005359649658203125, 0.00574493408203125, 0.016849517822265625, 0.0279541015625, 0.039058685302734375, 0.05016326904296875, 0.061267852783203125, 0.0723724365234375, 0.08347702026367188, 0.09458160400390625, 0.10568618774414062, 0.116790771484375, 0.12789535522460938, 0.13899993896484375, 0.15010452270507812, 0.1612091064453125, 0.17231369018554688, 0.18341827392578125, 0.19452285766601562, 0.20562744140625, 0.21673202514648438, 0.22783660888671875, 0.23894119262695312, 0.2500457763671875, 0.2611503601074219, 0.27225494384765625, 0.2833595275878906, 0.294464111328125, 0.3055686950683594, 0.31667327880859375, 0.3277778625488281, 0.3388824462890625, 0.3499870300292969, 0.36109161376953125, 0.3721961975097656, 0.38330078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 24.0, 36.0, 99.0, 174.0, 209.0, 171.0, 129.0, 57.0, 29.0, 16.0, 10.0, 2.0, 6.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.644477367401123, -2.50160551071167, -2.3587334156036377, -2.2158615589141846, -2.0729897022247314, -1.9301177263259888, -1.787245750427246, -1.644373893737793, -1.5015019178390503, -1.3586299419403076, -1.2157580852508545, -1.0728861093521118, -0.9300141930580139, -0.787142276763916, -0.6442703008651733, -0.5013984441757202, -0.35852646827697754, -0.21565453708171844, -0.07278260588645935, 0.07008934020996094, 0.21296125650405884, 0.35583317279815674, 0.4987051486968994, 0.6415770053863525, 0.7844489812850952, 0.9273208975791931, 1.070192813873291, 1.2130647897720337, 1.3559367656707764, 1.4988086223602295, 1.6416805982589722, 1.7845524549484253, 1.927424430847168, 2.070296287536621, 2.2131683826446533, 2.3560402393341064, 2.4989120960235596, 2.641784191131592, 2.784656047821045, 2.927527904510498, 3.070399761199951, 3.2132716178894043, 3.3561437129974365, 3.4990155696868896, 3.6418874263763428, 3.784759521484375, 3.927631378173828, 4.070503234863281, 4.213375091552734, 4.3562469482421875, 4.499118804931641, 4.641990661621094, 4.784862995147705, 4.927734851837158, 5.070606708526611, 5.2134785652160645, 5.356350898742676, 5.499222755432129, 5.642094612121582, 5.784966468811035, 5.9278388023376465, 6.0707106590271, 6.213582515716553, 6.356454372406006, 6.499326229095459]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 14.0, 11.0, 24.0, 23.0, 33.0, 32.0, 43.0, 53.0, 65.0, 69.0, 71.0, 83.0, 77.0, 68.0, 56.0, 61.0, 40.0, 46.0, 38.0, 20.0, 30.0, 15.0, 11.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1088404655456543, -3.023874282836914, -2.938908100128174, -2.8539416790008545, -2.7689754962921143, -2.684009313583374, -2.5990428924560547, -2.5140767097473145, -2.429110527038574, -2.344144344329834, -2.2591781616210938, -2.1742117404937744, -2.089245557785034, -2.004279375076294, -1.9193130731582642, -1.8343467712402344, -1.7493805885314941, -1.664414405822754, -1.5794481039047241, -1.4944818019866943, -1.409515619277954, -1.3245494365692139, -1.239583134651184, -1.1546168327331543, -1.069650650024414, -0.984684407711029, -0.899718165397644, -0.814751923084259, -0.729785680770874, -0.644819438457489, -0.559853196144104, -0.474886953830719, -0.389920711517334, -0.304954469203949, -0.21998822689056396, -0.13502198457717896, -0.050055742263793945, 0.034910500049591064, 0.11987674236297607, 0.20484298467636108, 0.2898092269897461, 0.3747754693031311, 0.4597417116165161, 0.5447079539299011, 0.6296741962432861, 0.7146404385566711, 0.7996066808700562, 0.8845729231834412, 0.9695391654968262, 1.0545053482055664, 1.1394716501235962, 1.224437952041626, 1.3094041347503662, 1.3943703174591064, 1.4793366193771362, 1.564302921295166, 1.6492691040039062, 1.7342352867126465, 1.8192015886306763, 1.904167890548706, 1.9891340732574463, 2.0741002559661865, 2.159066677093506, 2.244032859802246, 2.3289990425109863]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 2.0, 8.0, 7.0, 11.0, 19.0, 30.0, 51.0, 70.0, 101.0, 165.0, 248.0, 376.0, 551.0, 910.0, 1627.0, 2721.0, 4889.0, 9601.0, 19709.0, 43188.0, 107464.0, 358771.0, 322380.0, 97372.0, 39610.0, 18335.0, 9106.0, 4643.0, 2652.0, 1428.0, 876.0, 554.0, 391.0, 244.0, 149.0, 95.0, 59.0, 45.0, 32.0, 20.0, 14.0, 9.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.27530670166015625, -0.2654571533203125, -0.25560760498046875, -0.245758056640625, -0.23590850830078125, -0.2260589599609375, -0.21620941162109375, -0.20635986328125, -0.19651031494140625, -0.1866607666015625, -0.17681121826171875, -0.166961669921875, -0.15711212158203125, -0.1472625732421875, -0.13741302490234375, -0.1275634765625, -0.11771392822265625, -0.1078643798828125, -0.09801483154296875, -0.088165283203125, -0.07831573486328125, -0.0684661865234375, -0.05861663818359375, -0.04876708984375, -0.03891754150390625, -0.0290679931640625, -0.01921844482421875, -0.009368896484375, 0.00048065185546875, 0.0103302001953125, 0.02017974853515625, 0.030029296875, 0.03987884521484375, 0.0497283935546875, 0.05957794189453125, 0.069427490234375, 0.07927703857421875, 0.0891265869140625, 0.09897613525390625, 0.10882568359375, 0.11867523193359375, 0.1285247802734375, 0.13837432861328125, 0.148223876953125, 0.15807342529296875, 0.1679229736328125, 0.17777252197265625, 0.1876220703125, 0.19747161865234375, 0.2073211669921875, 0.21717071533203125, 0.227020263671875, 0.23686981201171875, 0.2467193603515625, 0.25656890869140625, 0.26641845703125, 0.27626800537109375, 0.2861175537109375, 0.29596710205078125, 0.305816650390625, 0.31566619873046875, 0.3255157470703125, 0.33536529541015625, 0.34521484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 12.0, 18.0, 20.0, 25.0, 39.0, 30.0, 40.0, 50.0, 51.0, 56.0, 65.0, 66.0, 67.0, 71.0, 55.0, 58.0, 41.0, 45.0, 39.0, 31.0, 25.0, 19.0, 12.0, 12.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1663227081298828, -0.16077041625976562, -0.15521812438964844, -0.14966583251953125, -0.14411354064941406, -0.13856124877929688, -0.1330089569091797, -0.1274566650390625, -0.12190437316894531, -0.11635208129882812, -0.11079978942871094, -0.10524749755859375, -0.09969520568847656, -0.09414291381835938, -0.08859062194824219, -0.083038330078125, -0.07748603820800781, -0.07193374633789062, -0.06638145446777344, -0.06082916259765625, -0.05527687072753906, -0.049724578857421875, -0.04417228698730469, -0.0386199951171875, -0.03306770324707031, -0.027515411376953125, -0.021963119506835938, -0.01641082763671875, -0.010858535766601562, -0.005306243896484375, 0.0002460479736328125, 0.00579833984375, 0.011350631713867188, 0.016902923583984375, 0.022455215454101562, 0.02800750732421875, 0.03355979919433594, 0.039112091064453125, 0.04466438293457031, 0.0502166748046875, 0.05576896667480469, 0.061321258544921875, 0.06687355041503906, 0.07242584228515625, 0.07797813415527344, 0.08353042602539062, 0.08908271789550781, 0.094635009765625, 0.10018730163574219, 0.10573959350585938, 0.11129188537597656, 0.11684417724609375, 0.12239646911621094, 0.12794876098632812, 0.1335010528564453, 0.1390533447265625, 0.1446056365966797, 0.15015792846679688, 0.15571022033691406, 0.16126251220703125, 0.16681480407714844, 0.17236709594726562, 0.1779193878173828, 0.1834716796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 8.0, 9.0, 20.0, 18.0, 39.0, 42.0, 104.0, 139.0, 223.0, 397.0, 877.0, 2331.0, 10240.0, 151502.0, 841687.0, 33415.0, 4547.0, 1445.0, 629.0, 334.0, 177.0, 113.0, 61.0, 55.0, 45.0, 14.0, 16.0, 15.0, 5.0, 4.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.894744873046875, -0.86517333984375, -0.835601806640625, -0.8060302734375, -0.776458740234375, -0.74688720703125, -0.717315673828125, -0.687744140625, -0.658172607421875, -0.62860107421875, -0.599029541015625, -0.5694580078125, -0.539886474609375, -0.51031494140625, -0.480743408203125, -0.451171875, -0.421600341796875, -0.39202880859375, -0.362457275390625, -0.3328857421875, -0.303314208984375, -0.27374267578125, -0.244171142578125, -0.214599609375, -0.185028076171875, -0.15545654296875, -0.125885009765625, -0.0963134765625, -0.066741943359375, -0.03717041015625, -0.007598876953125, 0.02197265625, 0.051544189453125, 0.08111572265625, 0.110687255859375, 0.1402587890625, 0.169830322265625, 0.19940185546875, 0.228973388671875, 0.258544921875, 0.288116455078125, 0.31768798828125, 0.347259521484375, 0.3768310546875, 0.406402587890625, 0.43597412109375, 0.465545654296875, 0.4951171875, 0.524688720703125, 0.55426025390625, 0.583831787109375, 0.6134033203125, 0.642974853515625, 0.67254638671875, 0.702117919921875, 0.731689453125, 0.761260986328125, 0.79083251953125, 0.820404052734375, 0.8499755859375, 0.879547119140625, 0.90911865234375, 0.938690185546875, 0.96826171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 8.0, 11.0, 18.0, 24.0, 17.0, 26.0, 28.0, 44.0, 27.0, 42.0, 45.0, 65.0, 68.0, 63.0, 63.0, 62.0, 53.0, 45.0, 47.0, 45.0, 38.0, 31.0, 22.0, 23.0, 16.0, 18.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68505859375, -0.6613693237304688, -0.6376800537109375, -0.6139907836914062, -0.590301513671875, -0.5666122436523438, -0.5429229736328125, -0.5192337036132812, -0.49554443359375, -0.47185516357421875, -0.4481658935546875, -0.42447662353515625, -0.400787353515625, -0.37709808349609375, -0.3534088134765625, -0.32971954345703125, -0.3060302734375, -0.28234100341796875, -0.2586517333984375, -0.23496246337890625, -0.211273193359375, -0.18758392333984375, -0.1638946533203125, -0.14020538330078125, -0.11651611328125, -0.09282684326171875, -0.0691375732421875, -0.04544830322265625, -0.021759033203125, 0.00193023681640625, 0.0256195068359375, 0.04930877685546875, 0.072998046875, 0.09668731689453125, 0.1203765869140625, 0.14406585693359375, 0.167755126953125, 0.19144439697265625, 0.2151336669921875, 0.23882293701171875, 0.26251220703125, 0.28620147705078125, 0.3098907470703125, 0.33358001708984375, 0.357269287109375, 0.38095855712890625, 0.4046478271484375, 0.42833709716796875, 0.4520263671875, 0.47571563720703125, 0.4994049072265625, 0.5230941772460938, 0.546783447265625, 0.5704727172851562, 0.5941619873046875, 0.6178512573242188, 0.64154052734375, 0.6652297973632812, 0.6889190673828125, 0.7126083374023438, 0.736297607421875, 0.7599868774414062, 0.7836761474609375, 0.8073654174804688, 0.8310546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 3.0, 9.0, 5.0, 14.0, 19.0, 23.0, 45.0, 62.0, 110.0, 175.0, 362.0, 847.0, 3310.0, 22728.0, 598785.0, 398626.0, 18903.0, 3019.0, 778.0, 327.0, 160.0, 82.0, 49.0, 37.0, 19.0, 19.0, 7.0, 15.0, 2.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3642578125, -0.3524932861328125, -0.340728759765625, -0.3289642333984375, -0.31719970703125, -0.3054351806640625, -0.293670654296875, -0.2819061279296875, -0.2701416015625, -0.2583770751953125, -0.246612548828125, -0.2348480224609375, -0.22308349609375, -0.2113189697265625, -0.199554443359375, -0.1877899169921875, -0.176025390625, -0.1642608642578125, -0.152496337890625, -0.1407318115234375, -0.12896728515625, -0.1172027587890625, -0.105438232421875, -0.0936737060546875, -0.0819091796875, -0.0701446533203125, -0.058380126953125, -0.0466156005859375, -0.03485107421875, -0.0230865478515625, -0.011322021484375, 0.0004425048828125, 0.01220703125, 0.0239715576171875, 0.035736083984375, 0.0475006103515625, 0.05926513671875, 0.0710296630859375, 0.082794189453125, 0.0945587158203125, 0.1063232421875, 0.1180877685546875, 0.129852294921875, 0.1416168212890625, 0.15338134765625, 0.1651458740234375, 0.176910400390625, 0.1886749267578125, 0.200439453125, 0.2122039794921875, 0.223968505859375, 0.2357330322265625, 0.24749755859375, 0.2592620849609375, 0.271026611328125, 0.2827911376953125, 0.2945556640625, 0.3063201904296875, 0.318084716796875, 0.3298492431640625, 0.34161376953125, 0.3533782958984375, 0.365142822265625, 0.3769073486328125, 0.388671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 3.0, 10.0, 10.0, 14.0, 13.0, 5.0, 14.0, 11.0, 21.0, 19.0, 32.0, 40.0, 79.0, 102.0, 106.0, 111.0, 88.0, 69.0, 40.0, 28.0, 30.0, 23.0, 16.0, 13.0, 15.0, 7.0, 13.0, 11.0, 11.0, 7.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.212162017822266e-05, -7.000472396612167e-05, -6.788782775402069e-05, -6.577093154191971e-05, -6.365403532981873e-05, -6.153713911771774e-05, -5.942024290561676e-05, -5.730334669351578e-05, -5.5186450481414795e-05, -5.306955426931381e-05, -5.095265805721283e-05, -4.883576184511185e-05, -4.6718865633010864e-05, -4.460196942090988e-05, -4.24850732088089e-05, -4.0368176996707916e-05, -3.8251280784606934e-05, -3.613438457250595e-05, -3.401748836040497e-05, -3.1900592148303986e-05, -2.9783695936203003e-05, -2.766679972410202e-05, -2.5549903512001038e-05, -2.3433007299900055e-05, -2.1316111087799072e-05, -1.919921487569809e-05, -1.7082318663597107e-05, -1.4965422451496124e-05, -1.2848526239395142e-05, -1.0731630027294159e-05, -8.614733815193176e-06, -6.497837603092194e-06, -4.380941390991211e-06, -2.2640451788902283e-06, -1.471489667892456e-07, 1.969747245311737e-06, 4.08664345741272e-06, 6.203539669513702e-06, 8.320435881614685e-06, 1.0437332093715668e-05, 1.255422830581665e-05, 1.4671124517917633e-05, 1.6788020730018616e-05, 1.89049169421196e-05, 2.102181315422058e-05, 2.3138709366321564e-05, 2.5255605578422546e-05, 2.737250179052353e-05, 2.9489398002624512e-05, 3.1606294214725494e-05, 3.372319042682648e-05, 3.584008663892746e-05, 3.795698285102844e-05, 4.0073879063129425e-05, 4.219077527523041e-05, 4.430767148733139e-05, 4.642456769943237e-05, 4.8541463911533356e-05, 5.065836012363434e-05, 5.277525633573532e-05, 5.4892152547836304e-05, 5.7009048759937286e-05, 5.912594497203827e-05, 6.124284118413925e-05, 6.335973739624023e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 11.0, 13.0, 16.0, 18.0, 29.0, 48.0, 62.0, 102.0, 165.0, 231.0, 378.0, 772.0, 1487.0, 3791.0, 12822.0, 83157.0, 735016.0, 179788.0, 21291.0, 5191.0, 1953.0, 850.0, 470.0, 329.0, 171.0, 108.0, 67.0, 36.0, 45.0, 26.0, 20.0, 11.0, 22.0, 8.0, 8.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.26025390625, -0.2525215148925781, -0.24478912353515625, -0.23705673217773438, -0.2293243408203125, -0.22159194946289062, -0.21385955810546875, -0.20612716674804688, -0.198394775390625, -0.19066238403320312, -0.18292999267578125, -0.17519760131835938, -0.1674652099609375, -0.15973281860351562, -0.15200042724609375, -0.14426803588867188, -0.13653564453125, -0.12880325317382812, -0.12107086181640625, -0.11333847045898438, -0.1056060791015625, -0.09787368774414062, -0.09014129638671875, -0.08240890502929688, -0.074676513671875, -0.06694412231445312, -0.05921173095703125, -0.051479339599609375, -0.0437469482421875, -0.036014556884765625, -0.02828216552734375, -0.020549774169921875, -0.0128173828125, -0.005084991455078125, 0.00264739990234375, 0.010379791259765625, 0.0181121826171875, 0.025844573974609375, 0.03357696533203125, 0.041309356689453125, 0.049041748046875, 0.056774139404296875, 0.06450653076171875, 0.07223892211914062, 0.0799713134765625, 0.08770370483398438, 0.09543609619140625, 0.10316848754882812, 0.11090087890625, 0.11863327026367188, 0.12636566162109375, 0.13409805297851562, 0.1418304443359375, 0.14956283569335938, 0.15729522705078125, 0.16502761840820312, 0.172760009765625, 0.18049240112304688, 0.18822479248046875, 0.19595718383789062, 0.2036895751953125, 0.21142196655273438, 0.21915435791015625, 0.22688674926757812, 0.234619140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 11.0, 9.0, 23.0, 23.0, 40.0, 45.0, 70.0, 86.0, 89.0, 93.0, 102.0, 79.0, 65.0, 67.0, 37.0, 30.0, 28.0, 18.0, 19.0, 17.0, 8.0, 3.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.2677001953125, -0.260498046875, -0.2532958984375, -0.24609375, -0.2388916015625, -0.231689453125, -0.2244873046875, -0.21728515625, -0.2100830078125, -0.202880859375, -0.1956787109375, -0.1884765625, -0.1812744140625, -0.174072265625, -0.1668701171875, -0.15966796875, -0.1524658203125, -0.145263671875, -0.1380615234375, -0.130859375, -0.1236572265625, -0.116455078125, -0.1092529296875, -0.10205078125, -0.0948486328125, -0.087646484375, -0.0804443359375, -0.0732421875, -0.0660400390625, -0.058837890625, -0.0516357421875, -0.04443359375, -0.0372314453125, -0.030029296875, -0.0228271484375, -0.015625, -0.0084228515625, -0.001220703125, 0.0059814453125, 0.01318359375, 0.0203857421875, 0.027587890625, 0.0347900390625, 0.0419921875, 0.0491943359375, 0.056396484375, 0.0635986328125, 0.07080078125, 0.0780029296875, 0.085205078125, 0.0924072265625, 0.099609375, 0.1068115234375, 0.114013671875, 0.1212158203125, 0.12841796875, 0.1356201171875, 0.142822265625, 0.1500244140625, 0.1572265625, 0.1644287109375, 0.171630859375, 0.1788330078125, 0.18603515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 25.0, 41.0, 95.0, 193.0, 264.0, 181.0, 99.0, 46.0, 19.0, 13.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.951864242553711, -6.775482177734375, -6.599099636077881, -6.422717094421387, -6.246335029602051, -6.069952964782715, -5.893570423126221, -5.717187881469727, -5.540805816650391, -5.364423751831055, -5.1880412101745605, -5.011658668518066, -4.8352766036987305, -4.6588945388793945, -4.4825119972229, -4.306129455566406, -4.12974739074707, -3.9533650875091553, -3.7769827842712402, -3.600600481033325, -3.42421817779541, -3.247835874557495, -3.07145357131958, -2.895071268081665, -2.71868896484375, -2.542306661605835, -2.36592435836792, -2.189542055130005, -2.01315975189209, -1.8367774486541748, -1.6603951454162598, -1.4840128421783447, -1.307631015777588, -1.1312487125396729, -0.9548664093017578, -0.7784841060638428, -0.6021018028259277, -0.4257194995880127, -0.24933719635009766, -0.07295489311218262, 0.10342741012573242, 0.27980971336364746, 0.4561920166015625, 0.6325743198394775, 0.8089566230773926, 0.9853389263153076, 1.1617212295532227, 1.3381035327911377, 1.5144858360290527, 1.6908681392669678, 1.8672504425048828, 2.043632745742798, 2.220015048980713, 2.396397352218628, 2.572779655456543, 2.749161958694458, 2.925544261932373, 3.101926565170288, 3.278308868408203, 3.454691171646118, 3.631073474884033, 3.8074557781219482, 3.9838380813598633, 4.160220146179199, 4.336602687835693]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 13.0, 13.0, 8.0, 19.0, 14.0, 20.0, 23.0, 29.0, 35.0, 29.0, 41.0, 32.0, 41.0, 56.0, 58.0, 69.0, 50.0, 51.0, 42.0, 44.0, 42.0, 49.0, 24.0, 32.0, 28.0, 22.0, 19.0, 15.0, 20.0, 12.0, 7.0, 9.0, 7.0, 1.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.7267675399780273, -2.6436541080474854, -2.5605406761169434, -2.4774270057678223, -2.3943135738372803, -2.3112001419067383, -2.2280867099761963, -2.1449732780456543, -2.061859607696533, -1.9787461757659912, -1.8956326246261597, -1.8125191926956177, -1.7294056415557861, -1.6462922096252441, -1.5631787776947021, -1.4800653457641602, -1.3969519138336182, -1.3138384819030762, -1.2307249307632446, -1.1476114988327026, -1.064497947692871, -0.9813845157623291, -0.8982710838317871, -0.8151575922966003, -0.7320441007614136, -0.6489306092262268, -0.56581711769104, -0.48270368576049805, -0.3995901942253113, -0.3164767026901245, -0.23336324095726013, -0.15024977922439575, -0.06713652610778809, 0.015976950526237488, 0.09909042716026306, 0.18220390379428864, 0.2653173804283142, 0.348430871963501, 0.43154433369636536, 0.5146577954292297, 0.5977712869644165, 0.6808847784996033, 0.76399827003479, 0.847111701965332, 0.9302251935005188, 1.0133386850357056, 1.0964521169662476, 1.179565668106079, 1.262679100036621, 1.345792531967163, 1.4289060831069946, 1.5120195150375366, 1.5951330661773682, 1.6782464981079102, 1.7613599300384521, 1.8444733619689941, 1.9275869131088257, 2.0107004642486572, 2.093813896179199, 2.176927328109741, 2.260040760040283, 2.3431544303894043, 2.4262678623199463, 2.5093812942504883, 2.5924947261810303]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 9.0, 5.0, 9.0, 16.0, 16.0, 26.0, 33.0, 43.0, 71.0, 85.0, 140.0, 251.0, 665.0, 3257.0, 37980.0, 3972004.0, 170060.0, 7539.0, 1135.0, 361.0, 181.0, 88.0, 90.0, 48.0, 37.0, 28.0, 26.0, 17.0, 15.0, 11.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8544845581054688, -0.8266448974609375, -0.7988052368164062, -0.770965576171875, -0.7431259155273438, -0.7152862548828125, -0.6874465942382812, -0.65960693359375, -0.6317672729492188, -0.6039276123046875, -0.5760879516601562, -0.548248291015625, -0.5204086303710938, -0.4925689697265625, -0.46472930908203125, -0.4368896484375, -0.40904998779296875, -0.3812103271484375, -0.35337066650390625, -0.325531005859375, -0.29769134521484375, -0.2698516845703125, -0.24201202392578125, -0.21417236328125, -0.18633270263671875, -0.1584930419921875, -0.13065338134765625, -0.102813720703125, -0.07497406005859375, -0.0471343994140625, -0.01929473876953125, 0.008544921875, 0.03638458251953125, 0.0642242431640625, 0.09206390380859375, 0.119903564453125, 0.14774322509765625, 0.1755828857421875, 0.20342254638671875, 0.23126220703125, 0.25910186767578125, 0.2869415283203125, 0.31478118896484375, 0.342620849609375, 0.37046051025390625, 0.3983001708984375, 0.42613983154296875, 0.4539794921875, 0.48181915283203125, 0.5096588134765625, 0.5374984741210938, 0.565338134765625, 0.5931777954101562, 0.6210174560546875, 0.6488571166992188, 0.67669677734375, 0.7045364379882812, 0.7323760986328125, 0.7602157592773438, 0.788055419921875, 0.8158950805664062, 0.8437347412109375, 0.8715744018554688, 0.8994140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 6.0, 18.0, 32.0, 31.0, 46.0, 61.0, 62.0, 75.0, 65.0, 71.0, 96.0, 59.0, 71.0, 64.0, 61.0, 50.0, 40.0, 32.0, 19.0, 13.0, 13.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1333465576171875, -0.126800537109375, -0.1202545166015625, -0.11370849609375, -0.1071624755859375, -0.100616455078125, -0.0940704345703125, -0.0875244140625, -0.0809783935546875, -0.074432373046875, -0.0678863525390625, -0.06134033203125, -0.0547943115234375, -0.048248291015625, -0.0417022705078125, -0.03515625, -0.0286102294921875, -0.022064208984375, -0.0155181884765625, -0.00897216796875, -0.0024261474609375, 0.004119873046875, 0.0106658935546875, 0.0172119140625, 0.0237579345703125, 0.030303955078125, 0.0368499755859375, 0.04339599609375, 0.0499420166015625, 0.056488037109375, 0.0630340576171875, 0.069580078125, 0.0761260986328125, 0.082672119140625, 0.0892181396484375, 0.09576416015625, 0.1023101806640625, 0.108856201171875, 0.1154022216796875, 0.1219482421875, 0.1284942626953125, 0.135040283203125, 0.1415863037109375, 0.14813232421875, 0.1546783447265625, 0.161224365234375, 0.1677703857421875, 0.17431640625, 0.1808624267578125, 0.187408447265625, 0.1939544677734375, 0.20050048828125, 0.2070465087890625, 0.213592529296875, 0.2201385498046875, 0.2266845703125, 0.2332305908203125, 0.239776611328125, 0.2463226318359375, 0.25286865234375, 0.2594146728515625, 0.265960693359375, 0.2725067138671875, 0.279052734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 25.0, 19.0, 39.0, 41.0, 101.0, 166.0, 287.0, 529.0, 965.0, 2004.0, 4233.0, 9279.0, 22245.0, 65106.0, 312343.0, 2961309.0, 661266.0, 99987.0, 30930.0, 12280.0, 5592.0, 2578.0, 1332.0, 635.0, 344.0, 219.0, 127.0, 93.0, 56.0, 37.0, 30.0, 18.0, 13.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21923828125, -0.2110137939453125, -0.202789306640625, -0.1945648193359375, -0.18634033203125, -0.1781158447265625, -0.169891357421875, -0.1616668701171875, -0.1534423828125, -0.1452178955078125, -0.136993408203125, -0.1287689208984375, -0.12054443359375, -0.1123199462890625, -0.104095458984375, -0.0958709716796875, -0.087646484375, -0.0794219970703125, -0.071197509765625, -0.0629730224609375, -0.05474853515625, -0.0465240478515625, -0.038299560546875, -0.0300750732421875, -0.0218505859375, -0.0136260986328125, -0.005401611328125, 0.0028228759765625, 0.01104736328125, 0.0192718505859375, 0.027496337890625, 0.0357208251953125, 0.0439453125, 0.0521697998046875, 0.060394287109375, 0.0686187744140625, 0.07684326171875, 0.0850677490234375, 0.093292236328125, 0.1015167236328125, 0.1097412109375, 0.1179656982421875, 0.126190185546875, 0.1344146728515625, 0.14263916015625, 0.1508636474609375, 0.159088134765625, 0.1673126220703125, 0.175537109375, 0.1837615966796875, 0.191986083984375, 0.2002105712890625, 0.20843505859375, 0.2166595458984375, 0.224884033203125, 0.2331085205078125, 0.2413330078125, 0.2495574951171875, 0.257781982421875, 0.2660064697265625, 0.27423095703125, 0.2824554443359375, 0.290679931640625, 0.2989044189453125, 0.30712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 4.0, 8.0, 13.0, 12.0, 18.0, 36.0, 41.0, 55.0, 94.0, 153.0, 265.0, 527.0, 997.0, 796.0, 416.0, 218.0, 126.0, 77.0, 44.0, 44.0, 30.0, 18.0, 25.0, 10.0, 9.0, 5.0, 5.0, 1.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.30149078369140625, -0.2902374267578125, -0.27898406982421875, -0.267730712890625, -0.25647735595703125, -0.2452239990234375, -0.23397064208984375, -0.22271728515625, -0.21146392822265625, -0.2002105712890625, -0.18895721435546875, -0.177703857421875, -0.16645050048828125, -0.1551971435546875, -0.14394378662109375, -0.1326904296875, -0.12143707275390625, -0.1101837158203125, -0.09893035888671875, -0.087677001953125, -0.07642364501953125, -0.0651702880859375, -0.05391693115234375, -0.04266357421875, -0.03141021728515625, -0.0201568603515625, -0.00890350341796875, 0.002349853515625, 0.01360321044921875, 0.0248565673828125, 0.03610992431640625, 0.04736328125, 0.05861663818359375, 0.0698699951171875, 0.08112335205078125, 0.092376708984375, 0.10363006591796875, 0.1148834228515625, 0.12613677978515625, 0.13739013671875, 0.14864349365234375, 0.1598968505859375, 0.17115020751953125, 0.182403564453125, 0.19365692138671875, 0.2049102783203125, 0.21616363525390625, 0.2274169921875, 0.23867034912109375, 0.2499237060546875, 0.26117706298828125, 0.272430419921875, 0.28368377685546875, 0.2949371337890625, 0.30619049072265625, 0.31744384765625, 0.32869720458984375, 0.3399505615234375, 0.35120391845703125, 0.362457275390625, 0.37371063232421875, 0.3849639892578125, 0.39621734619140625, 0.407470703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 11.0, 30.0, 75.0, 141.0, 238.0, 225.0, 121.0, 66.0, 38.0, 20.0, 10.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3747329711914062, -2.2547757625579834, -2.1348185539245605, -2.0148611068725586, -1.8949040174484253, -1.774946689605713, -1.65498948097229, -1.5350322723388672, -1.4150750637054443, -1.2951178550720215, -1.175160527229309, -1.0552033185958862, -0.9352461099624634, -0.8152888417243958, -0.6953315734863281, -0.5753743648529053, -0.45541703701019287, -0.33545979857444763, -0.2155025452375412, -0.09554529190063477, 0.024411946535110474, 0.1443691849708557, 0.26432645320892334, 0.3842836618423462, 0.5042409300804138, 0.6241981983184814, 0.7441554069519043, 0.8641126751899719, 0.9840699434280396, 1.1040271520614624, 1.2239844799041748, 1.3439416885375977, 1.4638988971710205, 1.5838561058044434, 1.7038134336471558, 1.8237706422805786, 1.9437278509140015, 2.063685178756714, 2.1836423873901367, 2.3035995960235596, 2.4235568046569824, 2.5435140132904053, 2.663471221923828, 2.78342866897583, 2.903385877609253, 3.023343086242676, 3.1433002948760986, 3.2632575035095215, 3.3832149505615234, 3.5031721591949463, 3.623129367828369, 3.743086814880371, 3.863044023513794, 3.983001232147217, 4.102958679199219, 4.2229156494140625, 4.342872619628906, 4.462830066680908, 4.582787036895752, 4.702744483947754, 4.822701454162598, 4.9426589012146, 5.062616348266602, 5.182573318481445, 5.302530765533447]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 10.0, 11.0, 11.0, 20.0, 20.0, 16.0, 20.0, 17.0, 22.0, 33.0, 30.0, 39.0, 31.0, 33.0, 46.0, 45.0, 56.0, 47.0, 48.0, 35.0, 52.0, 37.0, 37.0, 42.0, 25.0, 27.0, 27.0, 25.0, 24.0, 11.0, 21.0, 14.0, 12.0, 14.0, 8.0, 2.0, 2.0, 3.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4438083171844482, -1.4006273746490479, -1.357446551322937, -1.3142656087875366, -1.2710846662521362, -1.2279038429260254, -1.184722900390625, -1.1415419578552246, -1.0983610153198242, -1.0551800727844238, -1.011999249458313, -0.9688183069229126, -0.9256373643875122, -0.8824564814567566, -0.839275598526001, -0.7960946559906006, -0.7529138326644897, -0.7097329497337341, -0.6665520071983337, -0.6233711242675781, -0.5801901817321777, -0.5370092988014221, -0.4938284158706665, -0.4506475031375885, -0.4074665904045105, -0.3642856776714325, -0.3211047649383545, -0.2779238820075989, -0.23474296927452087, -0.19156205654144287, -0.14838117361068726, -0.10520026087760925, -0.0620194673538208, -0.018838562071323395, 0.02434234321117401, 0.06752324104309082, 0.11070415377616882, 0.15388506650924683, 0.19706594944000244, 0.24024686217308044, 0.28342777490615845, 0.32660868763923645, 0.36978960037231445, 0.41297048330307007, 0.45615139603614807, 0.4993323087692261, 0.5425131916999817, 0.5856940746307373, 0.6288750171661377, 0.6720559000968933, 0.7152368426322937, 0.7584177255630493, 0.8015986680984497, 0.8447795510292053, 0.8879604339599609, 0.9311413764953613, 0.9743222594261169, 1.0175031423568726, 1.060684084892273, 1.1038649082183838, 1.1470458507537842, 1.1902267932891846, 1.233407735824585, 1.2765885591506958, 1.3197695016860962]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 11.0, 14.0, 12.0, 31.0, 44.0, 75.0, 129.0, 197.0, 323.0, 541.0, 966.0, 1764.0, 3374.0, 6820.0, 15219.0, 38180.0, 123211.0, 460620.0, 280041.0, 70587.0, 24961.0, 10673.0, 5049.0, 2512.0, 1332.0, 741.0, 439.0, 255.0, 156.0, 97.0, 72.0, 37.0, 30.0, 16.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35107421875, -0.3412628173828125, -0.331451416015625, -0.3216400146484375, -0.31182861328125, -0.3020172119140625, -0.292205810546875, -0.2823944091796875, -0.2725830078125, -0.2627716064453125, -0.252960205078125, -0.2431488037109375, -0.23333740234375, -0.2235260009765625, -0.213714599609375, -0.2039031982421875, -0.194091796875, -0.1842803955078125, -0.174468994140625, -0.1646575927734375, -0.15484619140625, -0.1450347900390625, -0.135223388671875, -0.1254119873046875, -0.1156005859375, -0.1057891845703125, -0.095977783203125, -0.0861663818359375, -0.07635498046875, -0.0665435791015625, -0.056732177734375, -0.0469207763671875, -0.037109375, -0.0272979736328125, -0.017486572265625, -0.0076751708984375, 0.00213623046875, 0.0119476318359375, 0.021759033203125, 0.0315704345703125, 0.0413818359375, 0.0511932373046875, 0.061004638671875, 0.0708160400390625, 0.08062744140625, 0.0904388427734375, 0.100250244140625, 0.1100616455078125, 0.119873046875, 0.1296844482421875, 0.139495849609375, 0.1493072509765625, 0.15911865234375, 0.1689300537109375, 0.178741455078125, 0.1885528564453125, 0.1983642578125, 0.2081756591796875, 0.217987060546875, 0.2277984619140625, 0.23760986328125, 0.2474212646484375, 0.257232666015625, 0.2670440673828125, 0.27685546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 11.0, 6.0, 10.0, 10.0, 12.0, 21.0, 22.0, 30.0, 34.0, 32.0, 47.0, 36.0, 41.0, 55.0, 52.0, 56.0, 63.0, 57.0, 43.0, 64.0, 51.0, 38.0, 34.0, 41.0, 26.0, 24.0, 28.0, 18.0, 13.0, 10.0, 7.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12408447265625, -0.1192178726196289, -0.11435127258300781, -0.10948467254638672, -0.10461807250976562, -0.09975147247314453, -0.09488487243652344, -0.09001827239990234, -0.08515167236328125, -0.08028507232666016, -0.07541847229003906, -0.07055187225341797, -0.06568527221679688, -0.06081867218017578, -0.05595207214355469, -0.051085472106933594, -0.0462188720703125, -0.041352272033691406, -0.03648567199707031, -0.03161907196044922, -0.026752471923828125, -0.02188587188720703, -0.017019271850585938, -0.012152671813964844, -0.00728607177734375, -0.0024194717407226562, 0.0024471282958984375, 0.007313728332519531, 0.012180328369140625, 0.01704692840576172, 0.021913528442382812, 0.026780128479003906, 0.031646728515625, 0.036513328552246094, 0.04137992858886719, 0.04624652862548828, 0.051113128662109375, 0.05597972869873047, 0.06084632873535156, 0.06571292877197266, 0.07057952880859375, 0.07544612884521484, 0.08031272888183594, 0.08517932891845703, 0.09004592895507812, 0.09491252899169922, 0.09977912902832031, 0.1046457290649414, 0.1095123291015625, 0.1143789291381836, 0.11924552917480469, 0.12411212921142578, 0.12897872924804688, 0.13384532928466797, 0.13871192932128906, 0.14357852935791016, 0.14844512939453125, 0.15331172943115234, 0.15817832946777344, 0.16304492950439453, 0.16791152954101562, 0.17277812957763672, 0.1776447296142578, 0.1825113296508789, 0.1873779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 7.0, 7.0, 6.0, 18.0, 23.0, 27.0, 63.0, 65.0, 114.0, 166.0, 322.0, 560.0, 1213.0, 3269.0, 13505.0, 97081.0, 803404.0, 107754.0, 14733.0, 3501.0, 1314.0, 568.0, 304.0, 169.0, 113.0, 67.0, 47.0, 40.0, 24.0, 20.0, 11.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5255203247070312, -0.5070953369140625, -0.48867034912109375, -0.470245361328125, -0.45182037353515625, -0.4333953857421875, -0.41497039794921875, -0.39654541015625, -0.37812042236328125, -0.3596954345703125, -0.34127044677734375, -0.322845458984375, -0.30442047119140625, -0.2859954833984375, -0.26757049560546875, -0.2491455078125, -0.23072052001953125, -0.2122955322265625, -0.19387054443359375, -0.175445556640625, -0.15702056884765625, -0.1385955810546875, -0.12017059326171875, -0.10174560546875, -0.08332061767578125, -0.0648956298828125, -0.04647064208984375, -0.028045654296875, -0.00962066650390625, 0.0088043212890625, 0.02722930908203125, 0.045654296875, 0.06407928466796875, 0.0825042724609375, 0.10092926025390625, 0.119354248046875, 0.13777923583984375, 0.1562042236328125, 0.17462921142578125, 0.19305419921875, 0.21147918701171875, 0.2299041748046875, 0.24832916259765625, 0.266754150390625, 0.28517913818359375, 0.3036041259765625, 0.32202911376953125, 0.3404541015625, 0.35887908935546875, 0.3773040771484375, 0.39572906494140625, 0.414154052734375, 0.43257904052734375, 0.4510040283203125, 0.46942901611328125, 0.48785400390625, 0.5062789916992188, 0.5247039794921875, 0.5431289672851562, 0.561553955078125, 0.5799789428710938, 0.5984039306640625, 0.6168289184570312, 0.63525390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 8.0, 10.0, 15.0, 12.0, 11.0, 12.0, 18.0, 15.0, 16.0, 30.0, 35.0, 26.0, 29.0, 33.0, 39.0, 52.0, 39.0, 48.0, 43.0, 50.0, 44.0, 45.0, 38.0, 44.0, 36.0, 31.0, 35.0, 29.0, 16.0, 12.0, 13.0, 14.0, 12.0, 11.0, 13.0, 10.0, 6.0, 11.0, 4.0, 1.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49169921875, -0.47662353515625, -0.4615478515625, -0.44647216796875, -0.431396484375, -0.41632080078125, -0.4012451171875, -0.38616943359375, -0.37109375, -0.35601806640625, -0.3409423828125, -0.32586669921875, -0.310791015625, -0.29571533203125, -0.2806396484375, -0.26556396484375, -0.25048828125, -0.23541259765625, -0.2203369140625, -0.20526123046875, -0.190185546875, -0.17510986328125, -0.1600341796875, -0.14495849609375, -0.1298828125, -0.11480712890625, -0.0997314453125, -0.08465576171875, -0.069580078125, -0.05450439453125, -0.0394287109375, -0.02435302734375, -0.00927734375, 0.00579833984375, 0.0208740234375, 0.03594970703125, 0.051025390625, 0.06610107421875, 0.0811767578125, 0.09625244140625, 0.111328125, 0.12640380859375, 0.1414794921875, 0.15655517578125, 0.171630859375, 0.18670654296875, 0.2017822265625, 0.21685791015625, 0.23193359375, 0.24700927734375, 0.2620849609375, 0.27716064453125, 0.292236328125, 0.30731201171875, 0.3223876953125, 0.33746337890625, 0.3525390625, 0.36761474609375, 0.3826904296875, 0.39776611328125, 0.412841796875, 0.42791748046875, 0.4429931640625, 0.45806884765625, 0.47314453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 11.0, 8.0, 18.0, 29.0, 50.0, 110.0, 234.0, 708.0, 3475.0, 58670.0, 950600.0, 31041.0, 2541.0, 610.0, 216.0, 83.0, 55.0, 25.0, 4.0, 12.0, 11.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.421875, -0.40648651123046875, -0.3910980224609375, -0.37570953369140625, -0.360321044921875, -0.34493255615234375, -0.3295440673828125, -0.31415557861328125, -0.29876708984375, -0.28337860107421875, -0.2679901123046875, -0.25260162353515625, -0.237213134765625, -0.22182464599609375, -0.2064361572265625, -0.19104766845703125, -0.1756591796875, -0.16027069091796875, -0.1448822021484375, -0.12949371337890625, -0.114105224609375, -0.09871673583984375, -0.0833282470703125, -0.06793975830078125, -0.05255126953125, -0.03716278076171875, -0.0217742919921875, -0.00638580322265625, 0.009002685546875, 0.02439117431640625, 0.0397796630859375, 0.05516815185546875, 0.070556640625, 0.08594512939453125, 0.1013336181640625, 0.11672210693359375, 0.132110595703125, 0.14749908447265625, 0.1628875732421875, 0.17827606201171875, 0.19366455078125, 0.20905303955078125, 0.2244415283203125, 0.23983001708984375, 0.255218505859375, 0.27060699462890625, 0.2859954833984375, 0.30138397216796875, 0.3167724609375, 0.33216094970703125, 0.3475494384765625, 0.36293792724609375, 0.378326416015625, 0.39371490478515625, 0.4091033935546875, 0.42449188232421875, 0.43988037109375, 0.45526885986328125, 0.4706573486328125, 0.48604583740234375, 0.501434326171875, 0.5168228149414062, 0.5322113037109375, 0.5475997924804688, 0.56298828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 11.0, 14.0, 11.0, 28.0, 10.0, 25.0, 38.0, 39.0, 60.0, 59.0, 74.0, 80.0, 81.0, 73.0, 65.0, 51.0, 47.0, 26.0, 28.0, 19.0, 23.0, 21.0, 14.0, 15.0, 13.0, 2.0, 6.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.225969314575195e-05, -4.1008926928043365e-05, -3.975816071033478e-05, -3.850739449262619e-05, -3.72566282749176e-05, -3.6005862057209015e-05, -3.475509583950043e-05, -3.350432962179184e-05, -3.225356340408325e-05, -3.1002797186374664e-05, -2.9752030968666077e-05, -2.850126475095749e-05, -2.72504985332489e-05, -2.5999732315540314e-05, -2.4748966097831726e-05, -2.349819988012314e-05, -2.224743366241455e-05, -2.0996667444705963e-05, -1.9745901226997375e-05, -1.8495135009288788e-05, -1.72443687915802e-05, -1.5993602573871613e-05, -1.4742836356163025e-05, -1.3492070138454437e-05, -1.224130392074585e-05, -1.0990537703037262e-05, -9.739771485328674e-06, -8.489005267620087e-06, -7.238239049911499e-06, -5.987472832202911e-06, -4.736706614494324e-06, -3.485940396785736e-06, -2.2351741790771484e-06, -9.844079613685608e-07, 2.6635825634002686e-07, 1.5171244740486145e-06, 2.767890691757202e-06, 4.01865690946579e-06, 5.2694231271743774e-06, 6.520189344882965e-06, 7.770955562591553e-06, 9.02172178030014e-06, 1.0272487998008728e-05, 1.1523254215717316e-05, 1.2774020433425903e-05, 1.4024786651134491e-05, 1.527555286884308e-05, 1.6526319086551666e-05, 1.7777085304260254e-05, 1.902785152196884e-05, 2.027861773967743e-05, 2.1529383957386017e-05, 2.2780150175094604e-05, 2.4030916392803192e-05, 2.528168261051178e-05, 2.6532448828220367e-05, 2.7783215045928955e-05, 2.9033981263637543e-05, 3.028474748134613e-05, 3.153551369905472e-05, 3.2786279916763306e-05, 3.403704613447189e-05, 3.528781235218048e-05, 3.653857856988907e-05, 3.7789344787597656e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 8.0, 7.0, 17.0, 19.0, 25.0, 41.0, 84.0, 126.0, 218.0, 415.0, 938.0, 2125.0, 6542.0, 34683.0, 573705.0, 391022.0, 29068.0, 5820.0, 1946.0, 819.0, 386.0, 228.0, 119.0, 61.0, 39.0, 24.0, 17.0, 23.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.314208984375, -0.30634498596191406, -0.2984809875488281, -0.2906169891357422, -0.28275299072265625, -0.2748889923095703, -0.2670249938964844, -0.25916099548339844, -0.2512969970703125, -0.24343299865722656, -0.23556900024414062, -0.2277050018310547, -0.21984100341796875, -0.2119770050048828, -0.20411300659179688, -0.19624900817871094, -0.188385009765625, -0.18052101135253906, -0.17265701293945312, -0.1647930145263672, -0.15692901611328125, -0.1490650177001953, -0.14120101928710938, -0.13333702087402344, -0.1254730224609375, -0.11760902404785156, -0.10974502563476562, -0.10188102722167969, -0.09401702880859375, -0.08615303039550781, -0.07828903198242188, -0.07042503356933594, -0.06256103515625, -0.05469703674316406, -0.046833038330078125, -0.03896903991699219, -0.03110504150390625, -0.023241043090820312, -0.015377044677734375, -0.0075130462646484375, 0.0003509521484375, 0.008214950561523438, 0.016078948974609375, 0.023942947387695312, 0.03180694580078125, 0.03967094421386719, 0.047534942626953125, 0.05539894104003906, 0.063262939453125, 0.07112693786621094, 0.07899093627929688, 0.08685493469238281, 0.09471893310546875, 0.10258293151855469, 0.11044692993164062, 0.11831092834472656, 0.1261749267578125, 0.13403892517089844, 0.14190292358398438, 0.1497669219970703, 0.15763092041015625, 0.1654949188232422, 0.17335891723632812, 0.18122291564941406, 0.1890869140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 10.0, 8.0, 9.0, 13.0, 29.0, 30.0, 35.0, 35.0, 60.0, 80.0, 90.0, 84.0, 104.0, 78.0, 76.0, 61.0, 48.0, 31.0, 32.0, 20.0, 13.0, 10.0, 6.0, 6.0, 10.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14404296875, -0.13826370239257812, -0.13248443603515625, -0.12670516967773438, -0.1209259033203125, -0.11514663696289062, -0.10936737060546875, -0.10358810424804688, -0.097808837890625, -0.09202957153320312, -0.08625030517578125, -0.08047103881835938, -0.0746917724609375, -0.06891250610351562, -0.06313323974609375, -0.057353973388671875, -0.05157470703125, -0.045795440673828125, -0.04001617431640625, -0.034236907958984375, -0.0284576416015625, -0.022678375244140625, -0.01689910888671875, -0.011119842529296875, -0.005340576171875, 0.000438690185546875, 0.00621795654296875, 0.011997222900390625, 0.0177764892578125, 0.023555755615234375, 0.02933502197265625, 0.035114288330078125, 0.0408935546875, 0.046672821044921875, 0.05245208740234375, 0.058231353759765625, 0.0640106201171875, 0.06978988647460938, 0.07556915283203125, 0.08134841918945312, 0.087127685546875, 0.09290695190429688, 0.09868621826171875, 0.10446548461914062, 0.1102447509765625, 0.11602401733398438, 0.12180328369140625, 0.12758255004882812, 0.13336181640625, 0.13914108276367188, 0.14492034912109375, 0.15069961547851562, 0.1564788818359375, 0.16225814819335938, 0.16803741455078125, 0.17381668090820312, 0.179595947265625, 0.18537521362304688, 0.19115447998046875, 0.19693374633789062, 0.2027130126953125, 0.20849227905273438, 0.21427154541015625, 0.22005081176757812, 0.225830078125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 18.0, 42.0, 80.0, 132.0, 213.0, 233.0, 122.0, 65.0, 35.0, 20.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.564204692840576, -4.437135219573975, -4.310065746307373, -4.182995796203613, -4.055926322937012, -3.92885684967041, -3.8017873764038086, -3.674717903137207, -3.5476481914520264, -3.420578718185425, -3.293509006500244, -3.1664395332336426, -3.039370059967041, -2.9123003482818604, -2.785230875015259, -2.658161163330078, -2.5310916900634766, -2.404022216796875, -2.2769525051116943, -2.1498830318450928, -2.022813320159912, -1.8957438468933105, -1.768674373626709, -1.6416047811508179, -1.5145351886749268, -1.3874655961990356, -1.2603960037231445, -1.133326530456543, -1.0062569379806519, -0.8791873455047607, -0.7521178126335144, -0.6250482797622681, -0.49797916412353516, -0.37090960144996643, -0.2438400387763977, -0.11677047610282898, 0.010299086570739746, 0.13736867904663086, 0.2644382119178772, 0.39150774478912354, 0.5185773372650146, 0.6456469297409058, 0.7727164626121521, 0.8997859954833984, 1.0268555879592896, 1.1539251804351807, 1.2809946537017822, 1.4080642461776733, 1.5351338386535645, 1.6622034311294556, 1.7892730236053467, 1.9163424968719482, 2.043412208557129, 2.1704816818237305, 2.297551155090332, 2.4246206283569336, 2.5516903400421143, 2.678759813308716, 2.8058295249938965, 2.932898998260498, 3.0599684715270996, 3.1870381832122803, 3.314107656478882, 3.4411773681640625, 3.568246841430664]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 5.0, 4.0, 11.0, 7.0, 11.0, 22.0, 7.0, 29.0, 20.0, 20.0, 30.0, 23.0, 43.0, 29.0, 39.0, 44.0, 62.0, 51.0, 61.0, 59.0, 51.0, 42.0, 41.0, 48.0, 40.0, 24.0, 34.0, 20.0, 31.0, 19.0, 6.0, 11.0, 10.0, 11.0, 6.0, 9.0, 9.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.350809097290039, -2.2788524627685547, -2.2068960666656494, -2.134939432144165, -2.0629830360412598, -1.9910264015197754, -1.9190698862075806, -1.8471133708953857, -1.7751567363739014, -1.7032002210617065, -1.6312437057495117, -1.5592870712280273, -1.4873305559158325, -1.4153740406036377, -1.3434175252914429, -1.271461009979248, -1.1995044946670532, -1.1275479793548584, -1.0555914640426636, -0.983634889125824, -0.9116783142089844, -0.8397217988967896, -0.7677652835845947, -0.6958087086677551, -0.6238521933555603, -0.5518956780433655, -0.4799391031265259, -0.40798258781433105, -0.33602604269981384, -0.26406949758529663, -0.1921129822731018, -0.12015640735626221, -0.04819989204406738, 0.023756645619869232, 0.09571318328380585, 0.16766971349716187, 0.23962625861167908, 0.3115828037261963, 0.3835393190383911, 0.4554958939552307, 0.5274524092674255, 0.5994089245796204, 0.67136549949646, 0.7433220148086548, 0.8152785301208496, 0.8872351050376892, 0.959191620349884, 1.0311481952667236, 1.1031047105789185, 1.1750612258911133, 1.247017741203308, 1.318974256515503, 1.3909308910369873, 1.4628874063491821, 1.534843921661377, 1.6068005561828613, 1.6787569522857666, 1.7507134675979614, 1.8226699829101562, 1.8946266174316406, 1.9665831327438354, 2.0385396480560303, 2.1104960441589355, 2.18245267868042, 2.2544093132019043]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 19.0, 15.0, 26.0, 28.0, 44.0, 81.0, 109.0, 167.0, 305.0, 533.0, 991.0, 1884.0, 3791.0, 8689.0, 21041.0, 63112.0, 267863.0, 1688217.0, 1754006.0, 279916.0, 65071.0, 21652.0, 8850.0, 3845.0, 1815.0, 946.0, 508.0, 259.0, 147.0, 128.0, 61.0, 54.0, 25.0, 23.0, 15.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2010498046875, -0.1954669952392578, -0.18988418579101562, -0.18430137634277344, -0.17871856689453125, -0.17313575744628906, -0.16755294799804688, -0.1619701385498047, -0.1563873291015625, -0.1508045196533203, -0.14522171020507812, -0.13963890075683594, -0.13405609130859375, -0.12847328186035156, -0.12289047241210938, -0.11730766296386719, -0.111724853515625, -0.10614204406738281, -0.10055923461914062, -0.09497642517089844, -0.08939361572265625, -0.08381080627441406, -0.07822799682617188, -0.07264518737792969, -0.0670623779296875, -0.06147956848144531, -0.055896759033203125, -0.05031394958496094, -0.04473114013671875, -0.03914833068847656, -0.033565521240234375, -0.027982711791992188, -0.02239990234375, -0.016817092895507812, -0.011234283447265625, -0.0056514739990234375, -6.866455078125e-05, 0.0055141448974609375, 0.011096954345703125, 0.016679763793945312, 0.0222625732421875, 0.027845382690429688, 0.033428192138671875, 0.03901100158691406, 0.04459381103515625, 0.05017662048339844, 0.055759429931640625, 0.06134223937988281, 0.066925048828125, 0.07250785827636719, 0.07809066772460938, 0.08367347717285156, 0.08925628662109375, 0.09483909606933594, 0.10042190551757812, 0.10600471496582031, 0.1115875244140625, 0.11717033386230469, 0.12275314331054688, 0.12833595275878906, 0.13391876220703125, 0.13950157165527344, 0.14508438110351562, 0.1506671905517578, 0.15625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 11.0, 13.0, 16.0, 24.0, 35.0, 32.0, 53.0, 37.0, 53.0, 54.0, 55.0, 60.0, 70.0, 63.0, 57.0, 67.0, 54.0, 37.0, 40.0, 34.0, 37.0, 21.0, 21.0, 11.0, 9.0, 6.0, 5.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.13235092163085938, -0.12737274169921875, -0.12239456176757812, -0.1174163818359375, -0.11243820190429688, -0.10746002197265625, -0.10248184204101562, -0.097503662109375, -0.09252548217773438, -0.08754730224609375, -0.08256912231445312, -0.0775909423828125, -0.07261276245117188, -0.06763458251953125, -0.06265640258789062, -0.05767822265625, -0.052700042724609375, -0.04772186279296875, -0.042743682861328125, -0.0377655029296875, -0.032787322998046875, -0.02780914306640625, -0.022830963134765625, -0.017852783203125, -0.012874603271484375, -0.00789642333984375, -0.002918243408203125, 0.0020599365234375, 0.007038116455078125, 0.01201629638671875, 0.016994476318359375, 0.02197265625, 0.026950836181640625, 0.03192901611328125, 0.036907196044921875, 0.0418853759765625, 0.046863555908203125, 0.05184173583984375, 0.056819915771484375, 0.061798095703125, 0.06677627563476562, 0.07175445556640625, 0.07673263549804688, 0.0817108154296875, 0.08668899536132812, 0.09166717529296875, 0.09664535522460938, 0.10162353515625, 0.10660171508789062, 0.11157989501953125, 0.11655807495117188, 0.1215362548828125, 0.12651443481445312, 0.13149261474609375, 0.13647079467773438, 0.141448974609375, 0.14642715454101562, 0.15140533447265625, 0.15638351440429688, 0.1613616943359375, 0.16633987426757812, 0.17131805419921875, 0.17629623413085938, 0.1812744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 18.0, 15.0, 23.0, 34.0, 42.0, 64.0, 91.0, 168.0, 290.0, 447.0, 832.0, 1589.0, 3517.0, 8255.0, 22268.0, 70737.0, 314877.0, 2468294.0, 1075450.0, 156252.0, 43232.0, 15232.0, 6397.0, 2928.0, 1334.0, 704.0, 427.0, 224.0, 154.0, 110.0, 66.0, 49.0, 42.0, 34.0, 17.0, 10.0, 12.0, 11.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20166015625, -0.1946544647216797, -0.18764877319335938, -0.18064308166503906, -0.17363739013671875, -0.16663169860839844, -0.15962600708007812, -0.1526203155517578, -0.1456146240234375, -0.1386089324951172, -0.13160324096679688, -0.12459754943847656, -0.11759185791015625, -0.11058616638183594, -0.10358047485351562, -0.09657478332519531, -0.089569091796875, -0.08256340026855469, -0.07555770874023438, -0.06855201721191406, -0.06154632568359375, -0.05454063415527344, -0.047534942626953125, -0.04052925109863281, -0.0335235595703125, -0.026517868041992188, -0.019512176513671875, -0.012506484985351562, -0.00550079345703125, 0.0015048980712890625, 0.008510589599609375, 0.015516281127929688, 0.02252197265625, 0.029527664184570312, 0.036533355712890625, 0.04353904724121094, 0.05054473876953125, 0.05755043029785156, 0.06455612182617188, 0.07156181335449219, 0.0785675048828125, 0.08557319641113281, 0.09257888793945312, 0.09958457946777344, 0.10659027099609375, 0.11359596252441406, 0.12060165405273438, 0.1276073455810547, 0.134613037109375, 0.1416187286376953, 0.14862442016601562, 0.15563011169433594, 0.16263580322265625, 0.16964149475097656, 0.17664718627929688, 0.1836528778076172, 0.1906585693359375, 0.1976642608642578, 0.20466995239257812, 0.21167564392089844, 0.21868133544921875, 0.22568702697753906, 0.23269271850585938, 0.2396984100341797, 0.2467041015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 12.0, 11.0, 9.0, 21.0, 25.0, 42.0, 36.0, 53.0, 82.0, 94.0, 147.0, 249.0, 326.0, 544.0, 614.0, 552.0, 374.0, 266.0, 165.0, 116.0, 78.0, 59.0, 41.0, 35.0, 22.0, 16.0, 15.0, 20.0, 13.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.293212890625, -0.2839317321777344, -0.27465057373046875, -0.2653694152832031, -0.2560882568359375, -0.24680709838867188, -0.23752593994140625, -0.22824478149414062, -0.218963623046875, -0.20968246459960938, -0.20040130615234375, -0.19112014770507812, -0.1818389892578125, -0.17255783081054688, -0.16327667236328125, -0.15399551391601562, -0.14471435546875, -0.13543319702148438, -0.12615203857421875, -0.11687088012695312, -0.1075897216796875, -0.09830856323242188, -0.08902740478515625, -0.07974624633789062, -0.070465087890625, -0.061183929443359375, -0.05190277099609375, -0.042621612548828125, -0.0333404541015625, -0.024059295654296875, -0.01477813720703125, -0.005496978759765625, 0.0037841796875, 0.013065338134765625, 0.02234649658203125, 0.031627655029296875, 0.0409088134765625, 0.050189971923828125, 0.05947113037109375, 0.06875228881835938, 0.078033447265625, 0.08731460571289062, 0.09659576416015625, 0.10587692260742188, 0.1151580810546875, 0.12443923950195312, 0.13372039794921875, 0.14300155639648438, 0.15228271484375, 0.16156387329101562, 0.17084503173828125, 0.18012619018554688, 0.1894073486328125, 0.19868850708007812, 0.20796966552734375, 0.21725082397460938, 0.226531982421875, 0.23581314086914062, 0.24509429931640625, 0.2543754577636719, 0.2636566162109375, 0.2729377746582031, 0.28221893310546875, 0.2915000915527344, 0.30078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 12.0, 18.0, 79.0, 182.0, 264.0, 264.0, 102.0, 40.0, 11.0, 13.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.816314220428467, -3.6478524208068848, -3.4793903827667236, -3.3109283447265625, -3.1424665451049805, -2.9740047454833984, -2.8055427074432373, -2.637080669403076, -2.468618869781494, -2.300157070159912, -2.131695032119751, -1.9632331132888794, -1.7947711944580078, -1.6263092756271362, -1.4578473567962646, -1.289385437965393, -1.1209235191345215, -0.9524616003036499, -0.7839996814727783, -0.6155377626419067, -0.44707584381103516, -0.2786139249801636, -0.11015200614929199, 0.05830991268157959, 0.22677183151245117, 0.39523375034332275, 0.5636956691741943, 0.7321575880050659, 0.9006195068359375, 1.069081425666809, 1.2375433444976807, 1.4060052633285522, 1.5744667053222656, 1.7429286241531372, 1.9113905429840088, 2.07985258102417, 2.248314380645752, 2.416776180267334, 2.585238218307495, 2.7537002563476562, 2.9221620559692383, 3.0906238555908203, 3.2590858936309814, 3.4275479316711426, 3.5960097312927246, 3.7644715309143066, 3.9329335689544678, 4.101395606994629, 4.269857406616211, 4.438319206237793, 4.606781005859375, 4.775243282318115, 4.943705081939697, 5.112166881561279, 5.2806291580200195, 5.449090957641602, 5.617552757263184, 5.786014556884766, 5.954476356506348, 6.122938632965088, 6.29140043258667, 6.459862232208252, 6.628324508666992, 6.796786308288574, 6.965248107910156]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 3.0, 6.0, 6.0, 3.0, 16.0, 12.0, 13.0, 25.0, 24.0, 24.0, 32.0, 54.0, 34.0, 53.0, 46.0, 58.0, 56.0, 67.0, 56.0, 53.0, 48.0, 51.0, 44.0, 33.0, 33.0, 35.0, 20.0, 18.0, 16.0, 14.0, 11.0, 6.0, 8.0, 1.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9549334049224854, -1.8999918699264526, -1.84505033493042, -1.7901086807250977, -1.735167145729065, -1.6802256107330322, -1.62528395652771, -1.5703424215316772, -1.5154008865356445, -1.4604593515396118, -1.405517816543579, -1.3505761623382568, -1.2956346273422241, -1.2406930923461914, -1.1857514381408691, -1.1308099031448364, -1.0758683681488037, -1.020926833152771, -0.9659852385520935, -0.911043643951416, -0.8561021089553833, -0.8011605739593506, -0.7462189793586731, -0.6912773847579956, -0.6363358497619629, -0.5813943147659302, -0.5264527201652527, -0.4715111553668976, -0.4165695905685425, -0.3616280257701874, -0.3066864609718323, -0.2517448961734772, -0.19680333137512207, -0.14186176657676697, -0.08692020177841187, -0.03197863698005676, 0.02296292781829834, 0.07790449261665344, 0.13284605741500854, 0.18778762221336365, 0.24272918701171875, 0.29767075181007385, 0.35261231660842896, 0.40755388140678406, 0.46249544620513916, 0.5174369812011719, 0.5723785758018494, 0.6273201704025269, 0.6822617053985596, 0.7372032403945923, 0.7921448349952698, 0.8470864295959473, 0.90202796459198, 0.9569694995880127, 1.011911153793335, 1.0668526887893677, 1.1217942237854004, 1.176735758781433, 1.2316772937774658, 1.286618947982788, 1.3415604829788208, 1.3965020179748535, 1.4514436721801758, 1.5063852071762085, 1.5613267421722412]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 18.0, 39.0, 58.0, 75.0, 126.0, 214.0, 404.0, 695.0, 1348.0, 2730.0, 5830.0, 13473.0, 33998.0, 91163.0, 259671.0, 391909.0, 152623.0, 55616.0, 21469.0, 8929.0, 3980.0, 1947.0, 1032.0, 474.0, 273.0, 176.0, 116.0, 50.0, 35.0, 24.0, 18.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260498046875, -0.2512779235839844, -0.24205780029296875, -0.23283767700195312, -0.2236175537109375, -0.21439743041992188, -0.20517730712890625, -0.19595718383789062, -0.186737060546875, -0.17751693725585938, -0.16829681396484375, -0.15907669067382812, -0.1498565673828125, -0.14063644409179688, -0.13141632080078125, -0.12219619750976562, -0.11297607421875, -0.10375595092773438, -0.09453582763671875, -0.08531570434570312, -0.0760955810546875, -0.06687545776367188, -0.05765533447265625, -0.048435211181640625, -0.039215087890625, -0.029994964599609375, -0.02077484130859375, -0.011554718017578125, -0.0023345947265625, 0.006885528564453125, 0.01610565185546875, 0.025325775146484375, 0.0345458984375, 0.043766021728515625, 0.05298614501953125, 0.062206268310546875, 0.0714263916015625, 0.08064651489257812, 0.08986663818359375, 0.09908676147460938, 0.108306884765625, 0.11752700805664062, 0.12674713134765625, 0.13596725463867188, 0.1451873779296875, 0.15440750122070312, 0.16362762451171875, 0.17284774780273438, 0.18206787109375, 0.19128799438476562, 0.20050811767578125, 0.20972824096679688, 0.2189483642578125, 0.22816848754882812, 0.23738861083984375, 0.24660873413085938, 0.255828857421875, 0.2650489807128906, 0.27426910400390625, 0.2834892272949219, 0.2927093505859375, 0.3019294738769531, 0.31114959716796875, 0.3203697204589844, 0.32958984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 9.0, 7.0, 12.0, 15.0, 24.0, 29.0, 29.0, 41.0, 31.0, 37.0, 33.0, 50.0, 45.0, 41.0, 50.0, 45.0, 53.0, 50.0, 38.0, 36.0, 44.0, 37.0, 33.0, 33.0, 20.0, 32.0, 16.0, 22.0, 12.0, 16.0, 11.0, 4.0, 7.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.111328125, -0.10741996765136719, -0.10351181030273438, -0.09960365295410156, -0.09569549560546875, -0.09178733825683594, -0.08787918090820312, -0.08397102355957031, -0.0800628662109375, -0.07615470886230469, -0.07224655151367188, -0.06833839416503906, -0.06443023681640625, -0.06052207946777344, -0.056613922119140625, -0.05270576477050781, -0.048797607421875, -0.04488945007324219, -0.040981292724609375, -0.03707313537597656, -0.03316497802734375, -0.029256820678710938, -0.025348663330078125, -0.021440505981445312, -0.0175323486328125, -0.013624191284179688, -0.009716033935546875, -0.0058078765869140625, -0.00189971923828125, 0.0020084381103515625, 0.005916595458984375, 0.009824752807617188, 0.01373291015625, 0.017641067504882812, 0.021549224853515625, 0.025457382202148438, 0.02936553955078125, 0.03327369689941406, 0.037181854248046875, 0.04109001159667969, 0.0449981689453125, 0.04890632629394531, 0.052814483642578125, 0.05672264099121094, 0.06063079833984375, 0.06453895568847656, 0.06844711303710938, 0.07235527038574219, 0.076263427734375, 0.08017158508300781, 0.08407974243164062, 0.08798789978027344, 0.09189605712890625, 0.09580421447753906, 0.09971237182617188, 0.10362052917480469, 0.1075286865234375, 0.11143684387207031, 0.11534500122070312, 0.11925315856933594, 0.12316131591796875, 0.12706947326660156, 0.13097763061523438, 0.1348857879638672, 0.1387939453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 7.0, 1.0, 10.0, 5.0, 12.0, 15.0, 22.0, 26.0, 37.0, 84.0, 158.0, 265.0, 439.0, 882.0, 2072.0, 6915.0, 59487.0, 883241.0, 82260.0, 8061.0, 2342.0, 975.0, 516.0, 287.0, 156.0, 106.0, 48.0, 32.0, 21.0, 19.0, 15.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89111328125, -0.863739013671875, -0.83636474609375, -0.808990478515625, -0.7816162109375, -0.754241943359375, -0.72686767578125, -0.699493408203125, -0.672119140625, -0.644744873046875, -0.61737060546875, -0.589996337890625, -0.5626220703125, -0.535247802734375, -0.50787353515625, -0.480499267578125, -0.453125, -0.425750732421875, -0.39837646484375, -0.371002197265625, -0.3436279296875, -0.316253662109375, -0.28887939453125, -0.261505126953125, -0.234130859375, -0.206756591796875, -0.17938232421875, -0.152008056640625, -0.1246337890625, -0.097259521484375, -0.06988525390625, -0.042510986328125, -0.01513671875, 0.012237548828125, 0.03961181640625, 0.066986083984375, 0.0943603515625, 0.121734619140625, 0.14910888671875, 0.176483154296875, 0.203857421875, 0.231231689453125, 0.25860595703125, 0.285980224609375, 0.3133544921875, 0.340728759765625, 0.36810302734375, 0.395477294921875, 0.4228515625, 0.450225830078125, 0.47760009765625, 0.504974365234375, 0.5323486328125, 0.559722900390625, 0.58709716796875, 0.614471435546875, 0.641845703125, 0.669219970703125, 0.69659423828125, 0.723968505859375, 0.7513427734375, 0.778717041015625, 0.80609130859375, 0.833465576171875, 0.86083984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 3.0, 6.0, 8.0, 4.0, 11.0, 19.0, 14.0, 14.0, 19.0, 26.0, 22.0, 38.0, 33.0, 30.0, 28.0, 47.0, 41.0, 36.0, 48.0, 51.0, 43.0, 48.0, 47.0, 47.0, 45.0, 29.0, 36.0, 33.0, 27.0, 20.0, 19.0, 19.0, 18.0, 8.0, 7.0, 10.0, 14.0, 5.0, 4.0, 7.0, 5.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5356826782226562, -0.5176544189453125, -0.49962615966796875, -0.481597900390625, -0.46356964111328125, -0.4455413818359375, -0.42751312255859375, -0.40948486328125, -0.39145660400390625, -0.3734283447265625, -0.35540008544921875, -0.337371826171875, -0.31934356689453125, -0.3013153076171875, -0.28328704833984375, -0.2652587890625, -0.24723052978515625, -0.2292022705078125, -0.21117401123046875, -0.193145751953125, -0.17511749267578125, -0.1570892333984375, -0.13906097412109375, -0.12103271484375, -0.10300445556640625, -0.0849761962890625, -0.06694793701171875, -0.048919677734375, -0.03089141845703125, -0.0128631591796875, 0.00516510009765625, 0.023193359375, 0.04122161865234375, 0.0592498779296875, 0.07727813720703125, 0.095306396484375, 0.11333465576171875, 0.1313629150390625, 0.14939117431640625, 0.16741943359375, 0.18544769287109375, 0.2034759521484375, 0.22150421142578125, 0.239532470703125, 0.25756072998046875, 0.2755889892578125, 0.29361724853515625, 0.3116455078125, 0.32967376708984375, 0.3477020263671875, 0.36573028564453125, 0.383758544921875, 0.40178680419921875, 0.4198150634765625, 0.43784332275390625, 0.45587158203125, 0.47389984130859375, 0.4919281005859375, 0.5099563598632812, 0.527984619140625, 0.5460128784179688, 0.5640411376953125, 0.5820693969726562, 0.60009765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 14.0, 17.0, 16.0, 31.0, 38.0, 74.0, 99.0, 221.0, 467.0, 1192.0, 4269.0, 29781.0, 682211.0, 306369.0, 18682.0, 3255.0, 934.0, 376.0, 164.0, 106.0, 74.0, 37.0, 32.0, 25.0, 12.0, 9.0, 13.0, 7.0, 3.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.272216796875, -0.2641868591308594, -0.25615692138671875, -0.24812698364257812, -0.2400970458984375, -0.23206710815429688, -0.22403717041015625, -0.21600723266601562, -0.207977294921875, -0.19994735717773438, -0.19191741943359375, -0.18388748168945312, -0.1758575439453125, -0.16782760620117188, -0.15979766845703125, -0.15176773071289062, -0.14373779296875, -0.13570785522460938, -0.12767791748046875, -0.11964797973632812, -0.1116180419921875, -0.10358810424804688, -0.09555816650390625, -0.08752822875976562, -0.079498291015625, -0.07146835327148438, -0.06343841552734375, -0.055408477783203125, -0.0473785400390625, -0.039348602294921875, -0.03131866455078125, -0.023288726806640625, -0.0152587890625, -0.007228851318359375, 0.00080108642578125, 0.008831024169921875, 0.0168609619140625, 0.024890899658203125, 0.03292083740234375, 0.040950775146484375, 0.048980712890625, 0.057010650634765625, 0.06504058837890625, 0.07307052612304688, 0.0811004638671875, 0.08913040161132812, 0.09716033935546875, 0.10519027709960938, 0.11322021484375, 0.12125015258789062, 0.12928009033203125, 0.13731002807617188, 0.1453399658203125, 0.15336990356445312, 0.16139984130859375, 0.16942977905273438, 0.177459716796875, 0.18548965454101562, 0.19351959228515625, 0.20154953002929688, 0.2095794677734375, 0.21760940551757812, 0.22563934326171875, 0.23366928100585938, 0.24169921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 11.0, 11.0, 9.0, 13.0, 12.0, 19.0, 15.0, 21.0, 20.0, 26.0, 29.0, 33.0, 44.0, 59.0, 69.0, 88.0, 80.0, 79.0, 59.0, 54.0, 30.0, 22.0, 34.0, 28.0, 24.0, 15.0, 9.0, 10.0, 23.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.1975250244140625e-05, -5.04031777381897e-05, -4.883110523223877e-05, -4.725903272628784e-05, -4.5686960220336914e-05, -4.4114887714385986e-05, -4.254281520843506e-05, -4.097074270248413e-05, -3.93986701965332e-05, -3.7826597690582275e-05, -3.625452518463135e-05, -3.468245267868042e-05, -3.311038017272949e-05, -3.1538307666778564e-05, -2.9966235160827637e-05, -2.839416265487671e-05, -2.682209014892578e-05, -2.5250017642974854e-05, -2.3677945137023926e-05, -2.2105872631072998e-05, -2.053380012512207e-05, -1.8961727619171143e-05, -1.7389655113220215e-05, -1.5817582607269287e-05, -1.424551010131836e-05, -1.2673437595367432e-05, -1.1101365089416504e-05, -9.529292583465576e-06, -7.957220077514648e-06, -6.385147571563721e-06, -4.813075065612793e-06, -3.2410025596618652e-06, -1.6689300537109375e-06, -9.685754776000977e-08, 1.475214958190918e-06, 3.0472874641418457e-06, 4.6193599700927734e-06, 6.191432476043701e-06, 7.763504981994629e-06, 9.335577487945557e-06, 1.0907649993896484e-05, 1.2479722499847412e-05, 1.405179500579834e-05, 1.5623867511749268e-05, 1.7195940017700195e-05, 1.8768012523651123e-05, 2.034008502960205e-05, 2.191215753555298e-05, 2.3484230041503906e-05, 2.5056302547454834e-05, 2.6628375053405762e-05, 2.820044755935669e-05, 2.9772520065307617e-05, 3.1344592571258545e-05, 3.291666507720947e-05, 3.44887375831604e-05, 3.606081008911133e-05, 3.7632882595062256e-05, 3.9204955101013184e-05, 4.077702760696411e-05, 4.234910011291504e-05, 4.392117261886597e-05, 4.5493245124816895e-05, 4.706531763076782e-05, 4.863739013671875e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 16.0, 12.0, 17.0, 22.0, 42.0, 44.0, 63.0, 104.0, 208.0, 403.0, 702.0, 1621.0, 4292.0, 17055.0, 165021.0, 784484.0, 59825.0, 9325.0, 2860.0, 1155.0, 533.0, 283.0, 137.0, 91.0, 70.0, 56.0, 29.0, 20.0, 19.0, 11.0, 12.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.23367691040039062, -0.22724151611328125, -0.22080612182617188, -0.2143707275390625, -0.20793533325195312, -0.20149993896484375, -0.19506454467773438, -0.188629150390625, -0.18219375610351562, -0.17575836181640625, -0.16932296752929688, -0.1628875732421875, -0.15645217895507812, -0.15001678466796875, -0.14358139038085938, -0.13714599609375, -0.13071060180664062, -0.12427520751953125, -0.11783981323242188, -0.1114044189453125, -0.10496902465820312, -0.09853363037109375, -0.09209823608398438, -0.085662841796875, -0.07922744750976562, -0.07279205322265625, -0.06635665893554688, -0.0599212646484375, -0.053485870361328125, -0.04705047607421875, -0.040615081787109375, -0.0341796875, -0.027744293212890625, -0.02130889892578125, -0.014873504638671875, -0.0084381103515625, -0.002002716064453125, 0.00443267822265625, 0.010868072509765625, 0.017303466796875, 0.023738861083984375, 0.03017425537109375, 0.036609649658203125, 0.0430450439453125, 0.049480438232421875, 0.05591583251953125, 0.062351226806640625, 0.06878662109375, 0.07522201538085938, 0.08165740966796875, 0.08809280395507812, 0.0945281982421875, 0.10096359252929688, 0.10739898681640625, 0.11383438110351562, 0.120269775390625, 0.12670516967773438, 0.13314056396484375, 0.13957595825195312, 0.1460113525390625, 0.15244674682617188, 0.15888214111328125, 0.16531753540039062, 0.1717529296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 14.0, 9.0, 16.0, 23.0, 24.0, 31.0, 53.0, 58.0, 75.0, 93.0, 95.0, 101.0, 62.0, 77.0, 52.0, 52.0, 30.0, 28.0, 25.0, 11.0, 6.0, 12.0, 14.0, 5.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.13275527954101562, -0.12744903564453125, -0.12214279174804688, -0.1168365478515625, -0.11153030395507812, -0.10622406005859375, -0.10091781616210938, -0.095611572265625, -0.09030532836914062, -0.08499908447265625, -0.07969284057617188, -0.0743865966796875, -0.06908035278320312, -0.06377410888671875, -0.058467864990234375, -0.05316162109375, -0.047855377197265625, -0.04254913330078125, -0.037242889404296875, -0.0319366455078125, -0.026630401611328125, -0.02132415771484375, -0.016017913818359375, -0.010711669921875, -0.005405426025390625, -9.918212890625e-05, 0.005207061767578125, 0.0105133056640625, 0.015819549560546875, 0.02112579345703125, 0.026432037353515625, 0.03173828125, 0.037044525146484375, 0.04235076904296875, 0.047657012939453125, 0.0529632568359375, 0.058269500732421875, 0.06357574462890625, 0.06888198852539062, 0.074188232421875, 0.07949447631835938, 0.08480072021484375, 0.09010696411132812, 0.0954132080078125, 0.10071945190429688, 0.10602569580078125, 0.11133193969726562, 0.11663818359375, 0.12194442749023438, 0.12725067138671875, 0.13255691528320312, 0.1378631591796875, 0.14316940307617188, 0.14847564697265625, 0.15378189086914062, 0.159088134765625, 0.16439437866210938, 0.16970062255859375, 0.17500686645507812, 0.1803131103515625, 0.18561935424804688, 0.19092559814453125, 0.19623184204101562, 0.2015380859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 9.0, 9.0, 32.0, 62.0, 134.0, 214.0, 233.0, 139.0, 82.0, 37.0, 19.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.208428859710693, -4.077207088470459, -3.9459850788116455, -3.814763307571411, -3.6835412979125977, -3.5523195266723633, -3.421097755432129, -3.2898759841918945, -3.158653974533081, -3.0274322032928467, -2.896210193634033, -2.764988422393799, -2.6337666511535645, -2.502544641494751, -2.3713228702545166, -2.240100860595703, -2.1088790893554688, -1.9776571989059448, -1.846435308456421, -1.7152135372161865, -1.5839916467666626, -1.4527697563171387, -1.3215479850769043, -1.1903260946273804, -1.0591042041778564, -0.9278823137283325, -0.7966604828834534, -0.6654386520385742, -0.5342167615890503, -0.40299487113952637, -0.2717730402946472, -0.14055120944976807, -0.009329795837402344, 0.1218920648097992, 0.25311392545700073, 0.38433578610420227, 0.5155576467514038, 0.6467795372009277, 0.7780013680458069, 0.909223198890686, 1.04044508934021, 1.1716669797897339, 1.3028888702392578, 1.4341106414794922, 1.5653325319290161, 1.69655442237854, 1.8277761936187744, 1.9589980840682983, 2.0902199745178223, 2.2214417457580566, 2.35266375541687, 2.4838855266571045, 2.615107536315918, 2.7463293075561523, 2.8775510787963867, 3.008772850036621, 3.1399948596954346, 3.271216630935669, 3.4024386405944824, 3.533660411834717, 3.664882183074951, 3.7961041927337646, 3.927325963973999, 4.0585479736328125, 4.189769744873047]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 9.0, 11.0, 13.0, 14.0, 14.0, 20.0, 14.0, 20.0, 23.0, 30.0, 25.0, 30.0, 54.0, 57.0, 63.0, 65.0, 71.0, 60.0, 44.0, 44.0, 40.0, 25.0, 27.0, 40.0, 29.0, 31.0, 14.0, 28.0, 16.0, 13.0, 8.0, 8.0, 7.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.5427541732788086, -2.4759275913238525, -2.4091010093688965, -2.3422744274139404, -2.2754478454589844, -2.2086212635040283, -2.1417946815490723, -2.074967861175537, -2.00814151763916, -1.941314935684204, -1.874488353729248, -1.807661771774292, -1.740835189819336, -1.6740086078643799, -1.6071819067001343, -1.5403553247451782, -1.4735286235809326, -1.4067020416259766, -1.3398754596710205, -1.2730488777160645, -1.2062222957611084, -1.1393957138061523, -1.0725690126419067, -1.0057424306869507, -0.9389158487319946, -0.8720892667770386, -0.8052626848220825, -0.7384360432624817, -0.6716094613075256, -0.6047828793525696, -0.5379562377929688, -0.4711296558380127, -0.4043029546737671, -0.33747637271881104, -0.2706497609615326, -0.20382316410541534, -0.1369965672492981, -0.07016998529434204, -0.0033433735370635986, 0.06348323822021484, 0.1303098201751709, 0.19713641703128815, 0.2639630138874054, 0.33078962564468384, 0.3976162075996399, 0.46444278955459595, 0.5312694311141968, 0.5980960130691528, 0.6649225950241089, 0.7317491769790649, 0.798575758934021, 0.8654024004936218, 0.9322289824485779, 0.9990555644035339, 1.0658822059631348, 1.1327087879180908, 1.1995353698730469, 1.266361951828003, 1.333188533782959, 1.400015115737915, 1.466841697692871, 1.5336682796478271, 1.6004949808120728, 1.6673215627670288, 1.7341481447219849]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 14.0, 23.0, 34.0, 46.0, 46.0, 88.0, 186.0, 344.0, 1000.0, 3561.0, 18243.0, 178776.0, 3371254.0, 574292.0, 37526.0, 6461.0, 1521.0, 402.0, 125.0, 100.0, 46.0, 50.0, 35.0, 20.0, 18.0, 7.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3242759704589844, -0.31334686279296875, -0.3024177551269531, -0.2914886474609375, -0.2805595397949219, -0.26963043212890625, -0.2587013244628906, -0.247772216796875, -0.23684310913085938, -0.22591400146484375, -0.21498489379882812, -0.2040557861328125, -0.19312667846679688, -0.18219757080078125, -0.17126846313476562, -0.16033935546875, -0.14941024780273438, -0.13848114013671875, -0.12755203247070312, -0.1166229248046875, -0.10569381713867188, -0.09476470947265625, -0.08383560180664062, -0.072906494140625, -0.061977386474609375, -0.05104827880859375, -0.040119171142578125, -0.0291900634765625, -0.018260955810546875, -0.00733184814453125, 0.003597259521484375, 0.0145263671875, 0.025455474853515625, 0.03638458251953125, 0.047313690185546875, 0.0582427978515625, 0.06917190551757812, 0.08010101318359375, 0.09103012084960938, 0.101959228515625, 0.11288833618164062, 0.12381744384765625, 0.13474655151367188, 0.1456756591796875, 0.15660476684570312, 0.16753387451171875, 0.17846298217773438, 0.18939208984375, 0.20032119750976562, 0.21125030517578125, 0.22217941284179688, 0.2331085205078125, 0.24403762817382812, 0.25496673583984375, 0.2658958435058594, 0.276824951171875, 0.2877540588378906, 0.29868316650390625, 0.3096122741699219, 0.3205413818359375, 0.3314704895019531, 0.34239959716796875, 0.3533287048339844, 0.3642578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 19.0, 23.0, 32.0, 46.0, 79.0, 81.0, 96.0, 81.0, 86.0, 95.0, 99.0, 75.0, 60.0, 44.0, 25.0, 28.0, 9.0, 9.0, 8.0, 4.0, 1.0], "bins": [-0.38427734375, -0.37678050994873047, -0.36928367614746094, -0.3617868423461914, -0.3542900085449219, -0.34679317474365234, -0.3392963409423828, -0.3317995071411133, -0.32430267333984375, -0.3168058395385742, -0.3093090057373047, -0.30181217193603516, -0.2943153381347656, -0.2868185043334961, -0.27932167053222656, -0.27182483673095703, -0.2643280029296875, -0.25683116912841797, -0.24933433532714844, -0.2418375015258789, -0.23434066772460938, -0.22684383392333984, -0.2193470001220703, -0.21185016632080078, -0.20435333251953125, -0.19685649871826172, -0.1893596649169922, -0.18186283111572266, -0.17436599731445312, -0.1668691635131836, -0.15937232971191406, -0.15187549591064453, -0.144378662109375, -0.13688182830810547, -0.12938499450683594, -0.1218881607055664, -0.11439132690429688, -0.10689449310302734, -0.09939765930175781, -0.09190082550048828, -0.08440399169921875, -0.07690715789794922, -0.06941032409667969, -0.061913490295410156, -0.054416656494140625, -0.046919822692871094, -0.03942298889160156, -0.03192615509033203, -0.0244293212890625, -0.01693248748779297, -0.009435653686523438, -0.0019388198852539062, 0.005558013916015625, 0.013054847717285156, 0.020551681518554688, 0.02804851531982422, 0.03554534912109375, 0.04304218292236328, 0.05053901672363281, 0.058035850524902344, 0.06553268432617188, 0.0730295181274414, 0.08052635192871094, 0.08802318572998047, 0.09552001953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 10.0, 18.0, 20.0, 35.0, 44.0, 64.0, 104.0, 143.0, 237.0, 367.0, 697.0, 1416.0, 2890.0, 6488.0, 16230.0, 48863.0, 192786.0, 1692093.0, 1940628.0, 211703.0, 50526.0, 16531.0, 6404.0, 2764.0, 1337.0, 710.0, 443.0, 239.0, 138.0, 107.0, 63.0, 51.0, 29.0, 24.0, 13.0, 11.0, 6.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.2412109375, -0.23432540893554688, -0.22743988037109375, -0.22055435180664062, -0.2136688232421875, -0.20678329467773438, -0.19989776611328125, -0.19301223754882812, -0.186126708984375, -0.17924118041992188, -0.17235565185546875, -0.16547012329101562, -0.1585845947265625, -0.15169906616210938, -0.14481353759765625, -0.13792800903320312, -0.13104248046875, -0.12415695190429688, -0.11727142333984375, -0.11038589477539062, -0.1035003662109375, -0.09661483764648438, -0.08972930908203125, -0.08284378051757812, -0.075958251953125, -0.06907272338867188, -0.06218719482421875, -0.055301666259765625, -0.0484161376953125, -0.041530609130859375, -0.03464508056640625, -0.027759552001953125, -0.0208740234375, -0.013988494873046875, -0.00710296630859375, -0.000217437744140625, 0.0066680908203125, 0.013553619384765625, 0.02043914794921875, 0.027324676513671875, 0.034210205078125, 0.041095733642578125, 0.04798126220703125, 0.054866790771484375, 0.0617523193359375, 0.06863784790039062, 0.07552337646484375, 0.08240890502929688, 0.08929443359375, 0.09617996215820312, 0.10306549072265625, 0.10995101928710938, 0.1168365478515625, 0.12372207641601562, 0.13060760498046875, 0.13749313354492188, 0.144378662109375, 0.15126419067382812, 0.15814971923828125, 0.16503524780273438, 0.1719207763671875, 0.17880630493164062, 0.18569183349609375, 0.19257736206054688, 0.199462890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 22.0, 22.0, 37.0, 42.0, 62.0, 75.0, 138.0, 177.0, 248.0, 388.0, 550.0, 603.0, 515.0, 355.0, 217.0, 163.0, 111.0, 65.0, 56.0, 39.0, 22.0, 21.0, 24.0, 8.0, 12.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.2640037536621094, -0.25530242919921875, -0.24660110473632812, -0.2378997802734375, -0.22919845581054688, -0.22049713134765625, -0.21179580688476562, -0.203094482421875, -0.19439315795898438, -0.18569183349609375, -0.17699050903320312, -0.1682891845703125, -0.15958786010742188, -0.15088653564453125, -0.14218521118164062, -0.13348388671875, -0.12478256225585938, -0.11608123779296875, -0.10737991333007812, -0.0986785888671875, -0.08997726440429688, -0.08127593994140625, -0.07257461547851562, -0.063873291015625, -0.055171966552734375, -0.04647064208984375, -0.037769317626953125, -0.0290679931640625, -0.020366668701171875, -0.01166534423828125, -0.002964019775390625, 0.0057373046875, 0.014438629150390625, 0.02313995361328125, 0.031841278076171875, 0.0405426025390625, 0.049243927001953125, 0.05794525146484375, 0.06664657592773438, 0.075347900390625, 0.08404922485351562, 0.09275054931640625, 0.10145187377929688, 0.1101531982421875, 0.11885452270507812, 0.12755584716796875, 0.13625717163085938, 0.14495849609375, 0.15365982055664062, 0.16236114501953125, 0.17106246948242188, 0.1797637939453125, 0.18846511840820312, 0.19716644287109375, 0.20586776733398438, 0.214569091796875, 0.22327041625976562, 0.23197174072265625, 0.24067306518554688, 0.2493743896484375, 0.2580757141113281, 0.26677703857421875, 0.2754783630371094, 0.2841796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 10.0, 5.0, 16.0, 50.0, 113.0, 248.0, 270.0, 182.0, 51.0, 26.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2951178550720215, -5.141499996185303, -4.987882137298584, -4.834264278411865, -4.6806464195251465, -4.527028560638428, -4.373410701751709, -4.219792366027832, -4.066174507141113, -3.9125566482543945, -3.758938789367676, -3.605320930480957, -3.4517030715942383, -3.2980852127075195, -3.1444671154022217, -2.990849256515503, -2.8372316360473633, -2.6836137771606445, -2.529995918273926, -2.376378059387207, -2.2227602005004883, -2.0691423416137695, -1.9155242443084717, -1.761906385421753, -1.6082885265350342, -1.4546706676483154, -1.3010528087615967, -1.1474348306655884, -0.9938169717788696, -0.8401991128921509, -0.6865811944007874, -0.5329632759094238, -0.3793454170227051, -0.22572752833366394, -0.0721096396446228, 0.08150824904441833, 0.23512613773345947, 0.3887439966201782, 0.5423619151115417, 0.6959798336029053, 0.849597692489624, 1.0032155513763428, 1.1568334102630615, 1.3104513883590698, 1.4640692472457886, 1.6176871061325073, 1.7713050842285156, 1.9249229431152344, 2.078540802001953, 2.232158660888672, 2.3857765197753906, 2.5393943786621094, 2.693012237548828, 2.846630096435547, 3.0002481937408447, 3.1538660526275635, 3.3074839115142822, 3.461101770401001, 3.6147196292877197, 3.7683374881744385, 3.9219555854797363, 4.075573444366455, 4.229191303253174, 4.382809162139893, 4.536427021026611]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 9.0, 8.0, 17.0, 19.0, 20.0, 23.0, 38.0, 43.0, 49.0, 55.0, 82.0, 57.0, 59.0, 74.0, 64.0, 65.0, 53.0, 47.0, 46.0, 32.0, 34.0, 27.0, 22.0, 13.0, 12.0, 12.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6164495944976807, -1.5438990592956543, -1.4713484048843384, -1.398797869682312, -1.326247215270996, -1.2536966800689697, -1.1811461448669434, -1.108595609664917, -1.036044955253601, -0.9634943604469299, -0.8909437656402588, -0.8183932304382324, -0.7458426356315613, -0.6732920408248901, -0.6007415056228638, -0.5281909108161926, -0.4556403160095215, -0.38308972120285034, -0.3105391561985016, -0.23798857629299164, -0.1654379963874817, -0.09288740158081055, -0.020336836576461792, 0.05221372842788696, 0.1247643232345581, 0.19731490314006805, 0.269865483045578, 0.34241604804992676, 0.4149666428565979, 0.48751723766326904, 0.5600677728652954, 0.6326183676719666, 0.7051692008972168, 0.7777197957038879, 0.8502703905105591, 0.9228209257125854, 0.9953715205192566, 1.0679221153259277, 1.140472650527954, 1.2130231857299805, 1.2855738401412964, 1.3581243753433228, 1.4306750297546387, 1.503225564956665, 1.5757761001586914, 1.6483267545700073, 1.7208772897720337, 1.7934279441833496, 1.865978479385376, 1.9385290145874023, 2.0110795497894287, 2.083630323410034, 2.1561808586120605, 2.228731393814087, 2.3012819290161133, 2.3738324642181396, 2.446382999420166, 2.5189335346221924, 2.5914840698242188, 2.664034843444824, 2.7365853786468506, 2.809135913848877, 2.8816864490509033, 2.9542369842529297, 3.026787757873535]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 10.0, 13.0, 12.0, 21.0, 28.0, 54.0, 86.0, 114.0, 216.0, 340.0, 574.0, 1029.0, 1701.0, 3379.0, 6416.0, 13016.0, 29270.0, 80410.0, 313437.0, 416502.0, 111884.0, 37436.0, 16122.0, 7529.0, 3994.0, 2144.0, 1162.0, 672.0, 375.0, 220.0, 138.0, 82.0, 41.0, 45.0, 29.0, 12.0, 11.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.267822265625, -0.2597389221191406, -0.25165557861328125, -0.24357223510742188, -0.2354888916015625, -0.22740554809570312, -0.21932220458984375, -0.21123886108398438, -0.203155517578125, -0.19507217407226562, -0.18698883056640625, -0.17890548706054688, -0.1708221435546875, -0.16273880004882812, -0.15465545654296875, -0.14657211303710938, -0.13848876953125, -0.13040542602539062, -0.12232208251953125, -0.11423873901367188, -0.1061553955078125, -0.09807205200195312, -0.08998870849609375, -0.08190536499023438, -0.073822021484375, -0.06573867797851562, -0.05765533447265625, -0.049571990966796875, -0.0414886474609375, -0.033405303955078125, -0.02532196044921875, -0.017238616943359375, -0.0091552734375, -0.001071929931640625, 0.00701141357421875, 0.015094757080078125, 0.0231781005859375, 0.031261444091796875, 0.03934478759765625, 0.047428131103515625, 0.055511474609375, 0.06359481811523438, 0.07167816162109375, 0.07976150512695312, 0.0878448486328125, 0.09592819213867188, 0.10401153564453125, 0.11209487915039062, 0.12017822265625, 0.12826156616210938, 0.13634490966796875, 0.14442825317382812, 0.1525115966796875, 0.16059494018554688, 0.16867828369140625, 0.17676162719726562, 0.184844970703125, 0.19292831420898438, 0.20101165771484375, 0.20909500122070312, 0.2171783447265625, 0.22526168823242188, 0.23334503173828125, 0.24142837524414062, 0.24951171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 8.0, 3.0, 6.0, 9.0, 12.0, 12.0, 23.0, 13.0, 18.0, 20.0, 32.0, 30.0, 41.0, 41.0, 46.0, 40.0, 50.0, 46.0, 50.0, 44.0, 34.0, 44.0, 54.0, 43.0, 44.0, 39.0, 30.0, 19.0, 23.0, 19.0, 15.0, 16.0, 13.0, 13.0, 13.0, 6.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.12109375, -0.11753368377685547, -0.11397361755371094, -0.1104135513305664, -0.10685348510742188, -0.10329341888427734, -0.09973335266113281, -0.09617328643798828, -0.09261322021484375, -0.08905315399169922, -0.08549308776855469, -0.08193302154541016, -0.07837295532226562, -0.0748128890991211, -0.07125282287597656, -0.06769275665283203, -0.0641326904296875, -0.06057262420654297, -0.05701255798339844, -0.053452491760253906, -0.049892425537109375, -0.046332359313964844, -0.04277229309082031, -0.03921222686767578, -0.03565216064453125, -0.03209209442138672, -0.028532028198242188, -0.024971961975097656, -0.021411895751953125, -0.017851829528808594, -0.014291763305664062, -0.010731697082519531, -0.007171630859375, -0.0036115646362304688, -5.14984130859375e-05, 0.0035085678100585938, 0.007068634033203125, 0.010628700256347656, 0.014188766479492188, 0.01774883270263672, 0.02130889892578125, 0.02486896514892578, 0.028429031372070312, 0.031989097595214844, 0.035549163818359375, 0.039109230041503906, 0.04266929626464844, 0.04622936248779297, 0.0497894287109375, 0.05334949493408203, 0.05690956115722656, 0.060469627380371094, 0.06402969360351562, 0.06758975982666016, 0.07114982604980469, 0.07470989227294922, 0.07826995849609375, 0.08183002471923828, 0.08539009094238281, 0.08895015716552734, 0.09251022338867188, 0.0960702896118164, 0.09963035583496094, 0.10319042205810547, 0.10675048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 13.0, 11.0, 16.0, 24.0, 47.0, 71.0, 124.0, 208.0, 362.0, 761.0, 2216.0, 10468.0, 195567.0, 811767.0, 21360.0, 3267.0, 1102.0, 507.0, 267.0, 154.0, 75.0, 48.0, 31.0, 23.0, 14.0, 11.0, 9.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.919921875, -0.8937606811523438, -0.8675994873046875, -0.8414382934570312, -0.815277099609375, -0.7891159057617188, -0.7629547119140625, -0.7367935180664062, -0.71063232421875, -0.6844711303710938, -0.6583099365234375, -0.6321487426757812, -0.605987548828125, -0.5798263549804688, -0.5536651611328125, -0.5275039672851562, -0.5013427734375, -0.47518157958984375, -0.4490203857421875, -0.42285919189453125, -0.396697998046875, -0.37053680419921875, -0.3443756103515625, -0.31821441650390625, -0.29205322265625, -0.26589202880859375, -0.2397308349609375, -0.21356964111328125, -0.187408447265625, -0.16124725341796875, -0.1350860595703125, -0.10892486572265625, -0.082763671875, -0.05660247802734375, -0.0304412841796875, -0.00428009033203125, 0.021881103515625, 0.04804229736328125, 0.0742034912109375, 0.10036468505859375, 0.12652587890625, 0.15268707275390625, 0.1788482666015625, 0.20500946044921875, 0.231170654296875, 0.25733184814453125, 0.2834930419921875, 0.30965423583984375, 0.3358154296875, 0.36197662353515625, 0.3881378173828125, 0.41429901123046875, 0.440460205078125, 0.46662139892578125, 0.4927825927734375, 0.5189437866210938, 0.54510498046875, 0.5712661743164062, 0.5974273681640625, 0.6235885620117188, 0.649749755859375, 0.6759109497070312, 0.7020721435546875, 0.7282333374023438, 0.75439453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 11.0, 16.0, 9.0, 14.0, 17.0, 23.0, 26.0, 29.0, 32.0, 36.0, 52.0, 59.0, 55.0, 45.0, 52.0, 62.0, 61.0, 50.0, 44.0, 39.0, 33.0, 32.0, 37.0, 27.0, 19.0, 32.0, 14.0, 12.0, 12.0, 11.0, 11.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.521484375, -0.5054244995117188, -0.4893646240234375, -0.47330474853515625, -0.457244873046875, -0.44118499755859375, -0.4251251220703125, -0.40906524658203125, -0.39300537109375, -0.37694549560546875, -0.3608856201171875, -0.34482574462890625, -0.328765869140625, -0.31270599365234375, -0.2966461181640625, -0.28058624267578125, -0.2645263671875, -0.24846649169921875, -0.2324066162109375, -0.21634674072265625, -0.200286865234375, -0.18422698974609375, -0.1681671142578125, -0.15210723876953125, -0.13604736328125, -0.11998748779296875, -0.1039276123046875, -0.08786773681640625, -0.071807861328125, -0.05574798583984375, -0.0396881103515625, -0.02362823486328125, -0.007568359375, 0.00849151611328125, 0.0245513916015625, 0.04061126708984375, 0.056671142578125, 0.07273101806640625, 0.0887908935546875, 0.10485076904296875, 0.12091064453125, 0.13697052001953125, 0.1530303955078125, 0.16909027099609375, 0.185150146484375, 0.20121002197265625, 0.2172698974609375, 0.23332977294921875, 0.2493896484375, 0.26544952392578125, 0.2815093994140625, 0.29756927490234375, 0.313629150390625, 0.32968902587890625, 0.3457489013671875, 0.36180877685546875, 0.37786865234375, 0.39392852783203125, 0.4099884033203125, 0.42604827880859375, 0.442108154296875, 0.45816802978515625, 0.4742279052734375, 0.49028778076171875, 0.50634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 9.0, 9.0, 21.0, 19.0, 22.0, 32.0, 53.0, 88.0, 137.0, 162.0, 268.0, 551.0, 1006.0, 2292.0, 6869.0, 34471.0, 624995.0, 340168.0, 27157.0, 5928.0, 2085.0, 954.0, 450.0, 281.0, 173.0, 107.0, 69.0, 45.0, 37.0, 24.0, 16.0, 7.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2030029296875, -0.196441650390625, -0.18988037109375, -0.183319091796875, -0.1767578125, -0.170196533203125, -0.16363525390625, -0.157073974609375, -0.1505126953125, -0.143951416015625, -0.13739013671875, -0.130828857421875, -0.124267578125, -0.117706298828125, -0.11114501953125, -0.104583740234375, -0.0980224609375, -0.091461181640625, -0.08489990234375, -0.078338623046875, -0.07177734375, -0.065216064453125, -0.05865478515625, -0.052093505859375, -0.0455322265625, -0.038970947265625, -0.03240966796875, -0.025848388671875, -0.019287109375, -0.012725830078125, -0.00616455078125, 0.000396728515625, 0.0069580078125, 0.013519287109375, 0.02008056640625, 0.026641845703125, 0.033203125, 0.039764404296875, 0.04632568359375, 0.052886962890625, 0.0594482421875, 0.066009521484375, 0.07257080078125, 0.079132080078125, 0.085693359375, 0.092254638671875, 0.09881591796875, 0.105377197265625, 0.1119384765625, 0.118499755859375, 0.12506103515625, 0.131622314453125, 0.13818359375, 0.144744873046875, 0.15130615234375, 0.157867431640625, 0.1644287109375, 0.170989990234375, 0.17755126953125, 0.184112548828125, 0.190673828125, 0.197235107421875, 0.20379638671875, 0.210357666015625, 0.2169189453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 0.0, 4.0, 5.0, 5.0, 18.0, 13.0, 18.0, 23.0, 52.0, 89.0, 129.0, 156.0, 169.0, 109.0, 68.0, 50.0, 25.0, 12.0, 14.0, 10.0, 12.0, 7.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.96817073225975e-05, -8.703581988811493e-05, -8.438993245363235e-05, -8.174404501914978e-05, -7.90981575846672e-05, -7.645227015018463e-05, -7.380638271570206e-05, -7.116049528121948e-05, -6.851460784673691e-05, -6.586872041225433e-05, -6.322283297777176e-05, -6.0576945543289185e-05, -5.793105810880661e-05, -5.5285170674324036e-05, -5.263928323984146e-05, -4.999339580535889e-05, -4.734750837087631e-05, -4.470162093639374e-05, -4.205573350191116e-05, -3.940984606742859e-05, -3.6763958632946014e-05, -3.411807119846344e-05, -3.1472183763980865e-05, -2.882629632949829e-05, -2.6180408895015717e-05, -2.3534521460533142e-05, -2.0888634026050568e-05, -1.8242746591567993e-05, -1.559685915708542e-05, -1.2950971722602844e-05, -1.030508428812027e-05, -7.659196853637695e-06, -5.013309419155121e-06, -2.3674219846725464e-06, 2.784654498100281e-07, 2.9243528842926025e-06, 5.570240318775177e-06, 8.216127753257751e-06, 1.0862015187740326e-05, 1.35079026222229e-05, 1.6153790056705475e-05, 1.879967749118805e-05, 2.1445564925670624e-05, 2.4091452360153198e-05, 2.6737339794635773e-05, 2.9383227229118347e-05, 3.202911466360092e-05, 3.4675002098083496e-05, 3.732088953256607e-05, 3.9966776967048645e-05, 4.261266440153122e-05, 4.5258551836013794e-05, 4.790443927049637e-05, 5.055032670497894e-05, 5.319621413946152e-05, 5.584210157394409e-05, 5.8487989008426666e-05, 6.113387644290924e-05, 6.377976387739182e-05, 6.642565131187439e-05, 6.907153874635696e-05, 7.171742618083954e-05, 7.436331361532211e-05, 7.700920104980469e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 11.0, 11.0, 21.0, 32.0, 19.0, 43.0, 76.0, 106.0, 175.0, 287.0, 562.0, 1186.0, 2868.0, 9577.0, 61208.0, 813484.0, 136966.0, 14820.0, 3926.0, 1526.0, 668.0, 353.0, 206.0, 131.0, 80.0, 61.0, 26.0, 37.0, 19.0, 14.0, 13.0, 5.0, 3.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16248130798339844, -0.15638351440429688, -0.1502857208251953, -0.14418792724609375, -0.1380901336669922, -0.13199234008789062, -0.12589454650878906, -0.1197967529296875, -0.11369895935058594, -0.10760116577148438, -0.10150337219238281, -0.09540557861328125, -0.08930778503417969, -0.08320999145507812, -0.07711219787597656, -0.071014404296875, -0.06491661071777344, -0.058818817138671875, -0.05272102355957031, -0.04662322998046875, -0.04052543640136719, -0.034427642822265625, -0.028329849243164062, -0.0222320556640625, -0.016134262084960938, -0.010036468505859375, -0.0039386749267578125, 0.00215911865234375, 0.008256912231445312, 0.014354705810546875, 0.020452499389648438, 0.02655029296875, 0.03264808654785156, 0.038745880126953125, 0.04484367370605469, 0.05094146728515625, 0.05703926086425781, 0.06313705444335938, 0.06923484802246094, 0.0753326416015625, 0.08143043518066406, 0.08752822875976562, 0.09362602233886719, 0.09972381591796875, 0.10582160949707031, 0.11191940307617188, 0.11801719665527344, 0.124114990234375, 0.13021278381347656, 0.13631057739257812, 0.1424083709716797, 0.14850616455078125, 0.1546039581298828, 0.16070175170898438, 0.16679954528808594, 0.1728973388671875, 0.17899513244628906, 0.18509292602539062, 0.1911907196044922, 0.19728851318359375, 0.2033863067626953, 0.20948410034179688, 0.21558189392089844, 0.2216796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 8.0, 4.0, 4.0, 10.0, 7.0, 14.0, 19.0, 19.0, 32.0, 40.0, 50.0, 55.0, 93.0, 94.0, 103.0, 89.0, 98.0, 60.0, 50.0, 38.0, 35.0, 15.0, 18.0, 8.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1585693359375, -0.15322113037109375, -0.1478729248046875, -0.14252471923828125, -0.137176513671875, -0.13182830810546875, -0.1264801025390625, -0.12113189697265625, -0.11578369140625, -0.11043548583984375, -0.1050872802734375, -0.09973907470703125, -0.094390869140625, -0.08904266357421875, -0.0836944580078125, -0.07834625244140625, -0.072998046875, -0.06764984130859375, -0.0623016357421875, -0.05695343017578125, -0.051605224609375, -0.04625701904296875, -0.0409088134765625, -0.03556060791015625, -0.03021240234375, -0.02486419677734375, -0.0195159912109375, -0.01416778564453125, -0.008819580078125, -0.00347137451171875, 0.0018768310546875, 0.00722503662109375, 0.0125732421875, 0.01792144775390625, 0.0232696533203125, 0.02861785888671875, 0.033966064453125, 0.03931427001953125, 0.0446624755859375, 0.05001068115234375, 0.05535888671875, 0.06070709228515625, 0.0660552978515625, 0.07140350341796875, 0.076751708984375, 0.08209991455078125, 0.0874481201171875, 0.09279632568359375, 0.09814453125, 0.10349273681640625, 0.1088409423828125, 0.11418914794921875, 0.119537353515625, 0.12488555908203125, 0.1302337646484375, 0.13558197021484375, 0.14093017578125, 0.14627838134765625, 0.1516265869140625, 0.15697479248046875, 0.162322998046875, 0.16767120361328125, 0.1730194091796875, 0.17836761474609375, 0.1837158203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 27.0, 71.0, 151.0, 294.0, 225.0, 104.0, 43.0, 23.0, 13.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0270872116088867, -2.9053759574890137, -2.7836649417877197, -2.6619536876678467, -2.5402426719665527, -2.4185314178466797, -2.2968201637268066, -2.1751091480255127, -2.0533981323242188, -1.9316869974136353, -1.8099758625030518, -1.6882646083831787, -1.5665535926818848, -1.4448423385620117, -1.3231312036514282, -1.2014200687408447, -1.0797088146209717, -0.9579976797103882, -0.8362865447998047, -0.7145753502845764, -0.5928642153739929, -0.4711530804634094, -0.34944188594818115, -0.22773075103759766, -0.10601961612701416, 0.01569153368473053, 0.13740268349647522, 0.2591138482093811, 0.3808249831199646, 0.5025361180305481, 0.6242473125457764, 0.7459584474563599, 0.8676695823669434, 0.9893807172775269, 1.1110918521881104, 1.2328031063079834, 1.3545141220092773, 1.4762253761291504, 1.5979365110397339, 1.7196476459503174, 1.8413587808609009, 1.9630699157714844, 2.0847811698913574, 2.2064921855926514, 2.3282034397125244, 2.4499144554138184, 2.5716257095336914, 2.6933369636535645, 2.8150479793548584, 2.9367592334747314, 3.0584702491760254, 3.1801815032958984, 3.3018925189971924, 3.4236037731170654, 3.5453147888183594, 3.6670260429382324, 3.7887372970581055, 3.9104485511779785, 4.032159805297852, 4.153870582580566, 4.2755818367004395, 4.3972930908203125, 4.5190043449401855, 4.640715599060059, 4.762426376342773]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 4.0, 8.0, 7.0, 9.0, 9.0, 5.0, 11.0, 13.0, 19.0, 15.0, 23.0, 21.0, 23.0, 28.0, 33.0, 34.0, 34.0, 35.0, 47.0, 59.0, 53.0, 59.0, 57.0, 60.0, 41.0, 46.0, 31.0, 34.0, 27.0, 21.0, 22.0, 26.0, 11.0, 13.0, 18.0, 14.0, 10.0, 5.0, 2.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7909092903137207, -1.7334152460098267, -1.6759212017059326, -1.618427038192749, -1.560932993888855, -1.503438949584961, -1.445944905281067, -1.3884508609771729, -1.3309568166732788, -1.2734627723693848, -1.2159687280654907, -1.1584746837615967, -1.100980520248413, -1.043486475944519, -0.985992431640625, -0.928498387336731, -0.8710042834281921, -0.8135102391242981, -0.7560161352157593, -0.6985220909118652, -0.6410280466079712, -0.5835340023040771, -0.5260398983955383, -0.4685458540916443, -0.41105177998542786, -0.3535577058792114, -0.2960636615753174, -0.23856958746910095, -0.18107552826404572, -0.12358146905899048, -0.06608739495277405, -0.008593350648880005, 0.048900723457336426, 0.10639478266239166, 0.1638888418674469, 0.22138291597366333, 0.2788769602775574, 0.3363710343837738, 0.39386510848999023, 0.4513591527938843, 0.5088531970977783, 0.5663472414016724, 0.6238413453102112, 0.6813353896141052, 0.7388294339179993, 0.7963235378265381, 0.8538175821304321, 0.9113116264343262, 0.968805730342865, 1.0262998342514038, 1.0837938785552979, 1.141287922859192, 1.198781967163086, 1.25627601146698, 1.313770055770874, 1.3712642192840576, 1.4287582635879517, 1.4862523078918457, 1.5437463521957397, 1.6012403964996338, 1.6587345600128174, 1.7162286043167114, 1.7737226486206055, 1.8312166929244995, 1.8887107372283936]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 8.0, 11.0, 11.0, 14.0, 19.0, 9.0, 35.0, 54.0, 72.0, 113.0, 192.0, 254.0, 456.0, 878.0, 1771.0, 4164.0, 12936.0, 63940.0, 893825.0, 2970470.0, 205723.0, 26636.0, 7191.0, 2656.0, 1157.0, 677.0, 342.0, 223.0, 166.0, 81.0, 65.0, 35.0, 34.0, 17.0, 10.0, 6.0, 2.0, 5.0, 8.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.267578125, -0.25998878479003906, -0.2523994445800781, -0.2448101043701172, -0.23722076416015625, -0.2296314239501953, -0.22204208374023438, -0.21445274353027344, -0.2068634033203125, -0.19927406311035156, -0.19168472290039062, -0.1840953826904297, -0.17650604248046875, -0.1689167022705078, -0.16132736206054688, -0.15373802185058594, -0.146148681640625, -0.13855934143066406, -0.13097000122070312, -0.12338066101074219, -0.11579132080078125, -0.10820198059082031, -0.10061264038085938, -0.09302330017089844, -0.0854339599609375, -0.07784461975097656, -0.07025527954101562, -0.06266593933105469, -0.05507659912109375, -0.04748725891113281, -0.039897918701171875, -0.03230857849121094, -0.02471923828125, -0.017129898071289062, -0.009540557861328125, -0.0019512176513671875, 0.00563812255859375, 0.013227462768554688, 0.020816802978515625, 0.028406143188476562, 0.0359954833984375, 0.04358482360839844, 0.051174163818359375, 0.05876350402832031, 0.06635284423828125, 0.07394218444824219, 0.08153152465820312, 0.08912086486816406, 0.096710205078125, 0.10429954528808594, 0.11188888549804688, 0.11947822570800781, 0.12706756591796875, 0.1346569061279297, 0.14224624633789062, 0.14983558654785156, 0.1574249267578125, 0.16501426696777344, 0.17260360717773438, 0.1801929473876953, 0.18778228759765625, 0.1953716278076172, 0.20296096801757812, 0.21055030822753906, 0.2181396484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 13.0, 7.0, 15.0, 13.0, 16.0, 30.0, 31.0, 35.0, 43.0, 44.0, 47.0, 48.0, 57.0, 45.0, 58.0, 45.0, 57.0, 62.0, 45.0, 44.0, 29.0, 33.0, 25.0, 15.0, 30.0, 19.0, 16.0, 11.0, 10.0, 8.0, 6.0, 12.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11968994140625, -0.11590290069580078, -0.11211585998535156, -0.10832881927490234, -0.10454177856445312, -0.1007547378540039, -0.09696769714355469, -0.09318065643310547, -0.08939361572265625, -0.08560657501220703, -0.08181953430175781, -0.0780324935913086, -0.07424545288085938, -0.07045841217041016, -0.06667137145996094, -0.06288433074951172, -0.0590972900390625, -0.05531024932861328, -0.05152320861816406, -0.047736167907714844, -0.043949127197265625, -0.040162086486816406, -0.03637504577636719, -0.03258800506591797, -0.02880096435546875, -0.02501392364501953, -0.021226882934570312, -0.017439842224121094, -0.013652801513671875, -0.009865760803222656, -0.0060787200927734375, -0.0022916793823242188, 0.001495361328125, 0.005282402038574219, 0.009069442749023438, 0.012856483459472656, 0.016643524169921875, 0.020430564880371094, 0.024217605590820312, 0.02800464630126953, 0.03179168701171875, 0.03557872772216797, 0.03936576843261719, 0.043152809143066406, 0.046939849853515625, 0.050726890563964844, 0.05451393127441406, 0.05830097198486328, 0.0620880126953125, 0.06587505340576172, 0.06966209411621094, 0.07344913482666016, 0.07723617553710938, 0.0810232162475586, 0.08481025695800781, 0.08859729766845703, 0.09238433837890625, 0.09617137908935547, 0.09995841979980469, 0.1037454605102539, 0.10753250122070312, 0.11131954193115234, 0.11510658264160156, 0.11889362335205078, 0.1226806640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 13.0, 21.0, 34.0, 72.0, 113.0, 259.0, 551.0, 1311.0, 3740.0, 16206.0, 287536.0, 3784584.0, 85287.0, 9686.0, 2739.0, 1102.0, 497.0, 232.0, 127.0, 63.0, 34.0, 24.0, 14.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462158203125, -0.4463996887207031, -0.43064117431640625, -0.4148826599121094, -0.3991241455078125, -0.3833656311035156, -0.36760711669921875, -0.3518486022949219, -0.336090087890625, -0.3203315734863281, -0.30457305908203125, -0.2888145446777344, -0.2730560302734375, -0.2572975158691406, -0.24153900146484375, -0.22578048706054688, -0.21002197265625, -0.19426345825195312, -0.17850494384765625, -0.16274642944335938, -0.1469879150390625, -0.13122940063476562, -0.11547088623046875, -0.09971237182617188, -0.083953857421875, -0.06819534301757812, -0.05243682861328125, -0.036678314208984375, -0.0209197998046875, -0.005161285400390625, 0.01059722900390625, 0.026355743408203125, 0.0421142578125, 0.057872772216796875, 0.07363128662109375, 0.08938980102539062, 0.1051483154296875, 0.12090682983398438, 0.13666534423828125, 0.15242385864257812, 0.168182373046875, 0.18394088745117188, 0.19969940185546875, 0.21545791625976562, 0.2312164306640625, 0.24697494506835938, 0.26273345947265625, 0.2784919738769531, 0.29425048828125, 0.3100090026855469, 0.32576751708984375, 0.3415260314941406, 0.3572845458984375, 0.3730430603027344, 0.38880157470703125, 0.4045600891113281, 0.420318603515625, 0.4360771179199219, 0.45183563232421875, 0.4675941467285156, 0.4833526611328125, 0.4991111755371094, 0.5148696899414062, 0.5306282043457031, 0.54638671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 9.0, 18.0, 24.0, 37.0, 56.0, 113.0, 214.0, 428.0, 908.0, 1025.0, 570.0, 272.0, 142.0, 72.0, 59.0, 35.0, 18.0, 19.0, 6.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.39111328125, -0.3785438537597656, -0.36597442626953125, -0.3534049987792969, -0.3408355712890625, -0.3282661437988281, -0.31569671630859375, -0.3031272888183594, -0.290557861328125, -0.2779884338378906, -0.26541900634765625, -0.2528495788574219, -0.2402801513671875, -0.22771072387695312, -0.21514129638671875, -0.20257186889648438, -0.19000244140625, -0.17743301391601562, -0.16486358642578125, -0.15229415893554688, -0.1397247314453125, -0.12715530395507812, -0.11458587646484375, -0.10201644897460938, -0.089447021484375, -0.07687759399414062, -0.06430816650390625, -0.051738739013671875, -0.0391693115234375, -0.026599884033203125, -0.01403045654296875, -0.001461029052734375, 0.0111083984375, 0.023677825927734375, 0.03624725341796875, 0.048816680908203125, 0.0613861083984375, 0.07395553588867188, 0.08652496337890625, 0.09909439086914062, 0.111663818359375, 0.12423324584960938, 0.13680267333984375, 0.14937210083007812, 0.1619415283203125, 0.17451095581054688, 0.18708038330078125, 0.19964981079101562, 0.21221923828125, 0.22478866577148438, 0.23735809326171875, 0.24992752075195312, 0.2624969482421875, 0.2750663757324219, 0.28763580322265625, 0.3002052307128906, 0.312774658203125, 0.3253440856933594, 0.33791351318359375, 0.3504829406738281, 0.3630523681640625, 0.3756217956542969, 0.38819122314453125, 0.4007606506347656, 0.413330078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 16.0, 42.0, 125.0, 274.0, 297.0, 141.0, 44.0, 18.0, 17.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.382657527923584, -4.231736660003662, -4.080815315246582, -3.92989444732666, -3.7789735794067383, -3.6280524730682373, -3.4771313667297363, -3.3262104988098145, -3.1752893924713135, -3.0243682861328125, -2.8734474182128906, -2.7225263118743896, -2.5716052055358887, -2.420684337615967, -2.269763231277466, -2.118842124938965, -1.967921257019043, -1.8170002698898315, -1.6660792827606201, -1.5151581764221191, -1.3642371892929077, -1.2133162021636963, -1.0623950958251953, -0.9114741086959839, -0.7605531215667725, -0.609632134437561, -0.45871108770370483, -0.307790070772171, -0.1568690538406372, -0.005948066711425781, 0.14497298002243042, 0.2958940267562866, 0.44681549072265625, 0.5977364778518677, 0.7486575245857239, 0.8995785713195801, 1.0504995584487915, 1.201420545578003, 1.352341651916504, 1.5032626390457153, 1.6541836261749268, 1.8051046133041382, 1.9560256004333496, 2.1069467067718506, 2.2578678131103516, 2.4087886810302734, 2.5597097873687744, 2.7106308937072754, 2.8615517616271973, 3.0124728679656982, 3.16339373588562, 3.314314842224121, 3.465235710144043, 3.616156816482544, 3.767077922821045, 3.917998790740967, 4.068920135498047, 4.219841003417969, 4.370762348175049, 4.521683216094971, 4.672604084014893, 4.823525428771973, 4.9744462966918945, 5.125367164611816, 5.276288032531738]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 19.0, 15.0, 15.0, 25.0, 26.0, 19.0, 35.0, 26.0, 47.0, 57.0, 44.0, 57.0, 51.0, 53.0, 64.0, 45.0, 49.0, 46.0, 35.0, 39.0, 29.0, 36.0, 22.0, 13.0, 24.0, 17.0, 13.0, 10.0, 6.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5901000499725342, -1.5446165800094604, -1.4991331100463867, -1.4536497592926025, -1.4081662893295288, -1.362682819366455, -1.317199468612671, -1.2717159986495972, -1.2262325286865234, -1.1807490587234497, -1.135265588760376, -1.0897822380065918, -1.044298768043518, -0.9988152980804443, -0.9533318877220154, -0.9078484773635864, -0.8623650074005127, -0.816881537437439, -0.77139812707901, -0.725914716720581, -0.6804312467575073, -0.6349477767944336, -0.5894643664360046, -0.5439809560775757, -0.49849748611450195, -0.4530140459537506, -0.40753060579299927, -0.3620471656322479, -0.3165637254714966, -0.27108028531074524, -0.2255968451499939, -0.18011340498924255, -0.1346299648284912, -0.08914652466773987, -0.043663084506988525, 0.0018203556537628174, 0.04730379581451416, 0.0927872359752655, 0.13827067613601685, 0.1837541162967682, 0.22923755645751953, 0.2747209966182709, 0.3202044367790222, 0.36568787693977356, 0.4111713171005249, 0.45665475726127625, 0.5021381974220276, 0.5476216077804565, 0.5931050777435303, 0.638588547706604, 0.684071958065033, 0.7295553684234619, 0.7750388383865356, 0.8205223083496094, 0.8660057187080383, 0.9114891290664673, 0.956972599029541, 1.0024560689926147, 1.0479395389556885, 1.0934228897094727, 1.1389063596725464, 1.1843898296356201, 1.2298731803894043, 1.275356650352478, 1.3208401203155518]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 4.0, 7.0, 5.0, 4.0, 19.0, 18.0, 18.0, 30.0, 39.0, 66.0, 120.0, 212.0, 380.0, 708.0, 1383.0, 2908.0, 6960.0, 20831.0, 79619.0, 332895.0, 433655.0, 122291.0, 29530.0, 9313.0, 3850.0, 1771.0, 811.0, 464.0, 259.0, 141.0, 77.0, 49.0, 33.0, 25.0, 10.0, 15.0, 10.0, 12.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24932289123535156, -0.24278640747070312, -0.2362499237060547, -0.22971343994140625, -0.2231769561767578, -0.21664047241210938, -0.21010398864746094, -0.2035675048828125, -0.19703102111816406, -0.19049453735351562, -0.1839580535888672, -0.17742156982421875, -0.1708850860595703, -0.16434860229492188, -0.15781211853027344, -0.151275634765625, -0.14473915100097656, -0.13820266723632812, -0.1316661834716797, -0.12512969970703125, -0.11859321594238281, -0.11205673217773438, -0.10552024841308594, -0.0989837646484375, -0.09244728088378906, -0.08591079711914062, -0.07937431335449219, -0.07283782958984375, -0.06630134582519531, -0.059764862060546875, -0.05322837829589844, -0.04669189453125, -0.04015541076660156, -0.033618927001953125, -0.027082443237304688, -0.02054595947265625, -0.014009475708007812, -0.007472991943359375, -0.0009365081787109375, 0.0055999755859375, 0.012136459350585938, 0.018672943115234375, 0.025209426879882812, 0.03174591064453125, 0.03828239440917969, 0.044818878173828125, 0.05135536193847656, 0.057891845703125, 0.06442832946777344, 0.07096481323242188, 0.07750129699707031, 0.08403778076171875, 0.09057426452636719, 0.09711074829101562, 0.10364723205566406, 0.1101837158203125, 0.11672019958496094, 0.12325668334960938, 0.1297931671142578, 0.13632965087890625, 0.1428661346435547, 0.14940261840820312, 0.15593910217285156, 0.1624755859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 10.0, 6.0, 13.0, 21.0, 12.0, 29.0, 30.0, 42.0, 48.0, 63.0, 46.0, 41.0, 52.0, 57.0, 60.0, 53.0, 52.0, 50.0, 54.0, 46.0, 39.0, 32.0, 23.0, 23.0, 21.0, 23.0, 8.0, 15.0, 8.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12582969665527344, -0.12141036987304688, -0.11699104309082031, -0.11257171630859375, -0.10815238952636719, -0.10373306274414062, -0.09931373596191406, -0.0948944091796875, -0.09047508239746094, -0.08605575561523438, -0.08163642883300781, -0.07721710205078125, -0.07279777526855469, -0.06837844848632812, -0.06395912170410156, -0.059539794921875, -0.05512046813964844, -0.050701141357421875, -0.04628181457519531, -0.04186248779296875, -0.03744316101074219, -0.033023834228515625, -0.028604507446289062, -0.0241851806640625, -0.019765853881835938, -0.015346527099609375, -0.010927200317382812, -0.00650787353515625, -0.0020885467529296875, 0.002330780029296875, 0.0067501068115234375, 0.01116943359375, 0.015588760375976562, 0.020008087158203125, 0.024427413940429688, 0.02884674072265625, 0.03326606750488281, 0.037685394287109375, 0.04210472106933594, 0.0465240478515625, 0.05094337463378906, 0.055362701416015625, 0.05978202819824219, 0.06420135498046875, 0.06862068176269531, 0.07304000854492188, 0.07745933532714844, 0.081878662109375, 0.08629798889160156, 0.09071731567382812, 0.09513664245605469, 0.09955596923828125, 0.10397529602050781, 0.10839462280273438, 0.11281394958496094, 0.1172332763671875, 0.12165260314941406, 0.12607192993164062, 0.1304912567138672, 0.13491058349609375, 0.1393299102783203, 0.14374923706054688, 0.14816856384277344, 0.152587890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 16.0, 11.0, 13.0, 23.0, 28.0, 39.0, 64.0, 90.0, 136.0, 213.0, 400.0, 763.0, 1692.0, 4331.0, 15587.0, 100418.0, 707256.0, 182943.0, 24141.0, 6048.0, 2195.0, 942.0, 482.0, 268.0, 146.0, 84.0, 57.0, 39.0, 26.0, 19.0, 17.0, 13.0, 11.0, 10.0, 6.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3046875, -0.29589080810546875, -0.2870941162109375, -0.27829742431640625, -0.269500732421875, -0.26070404052734375, -0.2519073486328125, -0.24311065673828125, -0.23431396484375, -0.22551727294921875, -0.2167205810546875, -0.20792388916015625, -0.199127197265625, -0.19033050537109375, -0.1815338134765625, -0.17273712158203125, -0.1639404296875, -0.15514373779296875, -0.1463470458984375, -0.13755035400390625, -0.128753662109375, -0.11995697021484375, -0.1111602783203125, -0.10236358642578125, -0.09356689453125, -0.08477020263671875, -0.0759735107421875, -0.06717681884765625, -0.058380126953125, -0.04958343505859375, -0.0407867431640625, -0.03199005126953125, -0.023193359375, -0.01439666748046875, -0.0055999755859375, 0.00319671630859375, 0.011993408203125, 0.02079010009765625, 0.0295867919921875, 0.03838348388671875, 0.04718017578125, 0.05597686767578125, 0.0647735595703125, 0.07357025146484375, 0.082366943359375, 0.09116363525390625, 0.0999603271484375, 0.10875701904296875, 0.1175537109375, 0.12635040283203125, 0.1351470947265625, 0.14394378662109375, 0.152740478515625, 0.16153717041015625, 0.1703338623046875, 0.17913055419921875, 0.18792724609375, 0.19672393798828125, 0.2055206298828125, 0.21431732177734375, 0.223114013671875, 0.23191070556640625, 0.2407073974609375, 0.24950408935546875, 0.25830078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 5.0, 5.0, 13.0, 15.0, 18.0, 21.0, 18.0, 29.0, 35.0, 31.0, 39.0, 39.0, 49.0, 35.0, 45.0, 44.0, 30.0, 39.0, 46.0, 37.0, 42.0, 38.0, 50.0, 37.0, 39.0, 24.0, 31.0, 19.0, 15.0, 26.0, 15.0, 7.0, 7.0, 5.0, 6.0, 3.0, 10.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.384521484375, -0.3728790283203125, -0.361236572265625, -0.3495941162109375, -0.33795166015625, -0.3263092041015625, -0.314666748046875, -0.3030242919921875, -0.2913818359375, -0.2797393798828125, -0.268096923828125, -0.2564544677734375, -0.24481201171875, -0.2331695556640625, -0.221527099609375, -0.2098846435546875, -0.1982421875, -0.1865997314453125, -0.174957275390625, -0.1633148193359375, -0.15167236328125, -0.1400299072265625, -0.128387451171875, -0.1167449951171875, -0.1051025390625, -0.0934600830078125, -0.081817626953125, -0.0701751708984375, -0.05853271484375, -0.0468902587890625, -0.035247802734375, -0.0236053466796875, -0.011962890625, -0.0003204345703125, 0.011322021484375, 0.0229644775390625, 0.03460693359375, 0.0462493896484375, 0.057891845703125, 0.0695343017578125, 0.0811767578125, 0.0928192138671875, 0.104461669921875, 0.1161041259765625, 0.12774658203125, 0.1393890380859375, 0.151031494140625, 0.1626739501953125, 0.17431640625, 0.1859588623046875, 0.197601318359375, 0.2092437744140625, 0.22088623046875, 0.2325286865234375, 0.244171142578125, 0.2558135986328125, 0.2674560546875, 0.2790985107421875, 0.290740966796875, 0.3023834228515625, 0.31402587890625, 0.3256683349609375, 0.337310791015625, 0.3489532470703125, 0.360595703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 6.0, 19.0, 12.0, 22.0, 41.0, 63.0, 76.0, 121.0, 244.0, 396.0, 790.0, 1715.0, 3629.0, 9598.0, 29975.0, 125966.0, 653502.0, 165771.0, 36765.0, 11369.0, 4425.0, 1905.0, 939.0, 511.0, 242.0, 159.0, 97.0, 59.0, 34.0, 23.0, 26.0, 13.0, 8.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09576416015625, -0.09282493591308594, -0.08988571166992188, -0.08694648742675781, -0.08400726318359375, -0.08106803894042969, -0.07812881469726562, -0.07518959045410156, -0.0722503662109375, -0.06931114196777344, -0.06637191772460938, -0.06343269348144531, -0.06049346923828125, -0.05755424499511719, -0.054615020751953125, -0.05167579650878906, -0.048736572265625, -0.04579734802246094, -0.042858123779296875, -0.03991889953613281, -0.03697967529296875, -0.03404045104980469, -0.031101226806640625, -0.028162002563476562, -0.0252227783203125, -0.022283554077148438, -0.019344329833984375, -0.016405105590820312, -0.01346588134765625, -0.010526657104492188, -0.007587432861328125, -0.0046482086181640625, -0.001708984375, 0.0012302398681640625, 0.004169464111328125, 0.0071086883544921875, 0.01004791259765625, 0.012987136840820312, 0.015926361083984375, 0.018865585327148438, 0.0218048095703125, 0.024744033813476562, 0.027683258056640625, 0.030622482299804688, 0.03356170654296875, 0.03650093078613281, 0.039440155029296875, 0.04237937927246094, 0.045318603515625, 0.04825782775878906, 0.051197052001953125, 0.05413627624511719, 0.05707550048828125, 0.06001472473144531, 0.06295394897460938, 0.06589317321777344, 0.0688323974609375, 0.07177162170410156, 0.07471084594726562, 0.07765007019042969, 0.08058929443359375, 0.08352851867675781, 0.08646774291992188, 0.08940696716308594, 0.09234619140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 6.0, 17.0, 32.0, 36.0, 63.0, 77.0, 102.0, 107.0, 119.0, 102.0, 79.0, 70.0, 44.0, 32.0, 25.0, 14.0, 11.0, 4.0, 9.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9517879486083984e-05, -3.8292258977890015e-05, -3.7066638469696045e-05, -3.5841017961502075e-05, -3.4615397453308105e-05, -3.3389776945114136e-05, -3.2164156436920166e-05, -3.0938535928726196e-05, -2.9712915420532227e-05, -2.8487294912338257e-05, -2.7261674404144287e-05, -2.6036053895950317e-05, -2.4810433387756348e-05, -2.3584812879562378e-05, -2.2359192371368408e-05, -2.113357186317444e-05, -1.990795135498047e-05, -1.86823308467865e-05, -1.745671033859253e-05, -1.623108983039856e-05, -1.500546932220459e-05, -1.377984881401062e-05, -1.255422830581665e-05, -1.132860779762268e-05, -1.0102987289428711e-05, -8.877366781234741e-06, -7.651746273040771e-06, -6.426125764846802e-06, -5.200505256652832e-06, -3.974884748458862e-06, -2.7492642402648926e-06, -1.5236437320709229e-06, -2.980232238769531e-07, 9.275972843170166e-07, 2.1532177925109863e-06, 3.378838300704956e-06, 4.604458808898926e-06, 5.8300793170928955e-06, 7.055699825286865e-06, 8.281320333480835e-06, 9.506940841674805e-06, 1.0732561349868774e-05, 1.1958181858062744e-05, 1.3183802366256714e-05, 1.4409422874450684e-05, 1.5635043382644653e-05, 1.6860663890838623e-05, 1.8086284399032593e-05, 1.9311904907226562e-05, 2.0537525415420532e-05, 2.1763145923614502e-05, 2.298876643180847e-05, 2.421438694000244e-05, 2.544000744819641e-05, 2.666562795639038e-05, 2.789124846458435e-05, 2.911686897277832e-05, 3.034248948097229e-05, 3.156810998916626e-05, 3.279373049736023e-05, 3.40193510055542e-05, 3.524497151374817e-05, 3.647059202194214e-05, 3.769621253013611e-05, 3.892183303833008e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 0.0, 4.0, 4.0, 0.0, 7.0, 6.0, 3.0, 7.0, 12.0, 13.0, 25.0, 25.0, 37.0, 54.0, 78.0, 121.0, 200.0, 259.0, 507.0, 929.0, 1746.0, 3501.0, 7602.0, 18909.0, 58332.0, 234312.0, 566375.0, 103985.0, 30179.0, 11278.0, 4739.0, 2439.0, 1208.0, 638.0, 321.0, 236.0, 148.0, 77.0, 81.0, 48.0, 33.0, 22.0, 11.0, 14.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07565784454345703, -0.07306861877441406, -0.0704793930053711, -0.06789016723632812, -0.06530094146728516, -0.06271171569824219, -0.06012248992919922, -0.05753326416015625, -0.05494403839111328, -0.05235481262207031, -0.049765586853027344, -0.047176361083984375, -0.044587135314941406, -0.04199790954589844, -0.03940868377685547, -0.0368194580078125, -0.03423023223876953, -0.03164100646972656, -0.029051780700683594, -0.026462554931640625, -0.023873329162597656, -0.021284103393554688, -0.01869487762451172, -0.01610565185546875, -0.013516426086425781, -0.010927200317382812, -0.008337974548339844, -0.005748748779296875, -0.0031595230102539062, -0.0005702972412109375, 0.0020189285278320312, 0.004608154296875, 0.007197380065917969, 0.009786605834960938, 0.012375831604003906, 0.014965057373046875, 0.017554283142089844, 0.020143508911132812, 0.02273273468017578, 0.02532196044921875, 0.02791118621826172, 0.030500411987304688, 0.033089637756347656, 0.035678863525390625, 0.038268089294433594, 0.04085731506347656, 0.04344654083251953, 0.0460357666015625, 0.04862499237060547, 0.05121421813964844, 0.053803443908691406, 0.056392669677734375, 0.058981895446777344, 0.06157112121582031, 0.06416034698486328, 0.06674957275390625, 0.06933879852294922, 0.07192802429199219, 0.07451725006103516, 0.07710647583007812, 0.0796957015991211, 0.08228492736816406, 0.08487415313720703, 0.08746337890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 8.0, 17.0, 18.0, 11.0, 24.0, 47.0, 61.0, 77.0, 87.0, 95.0, 112.0, 101.0, 69.0, 61.0, 50.0, 37.0, 25.0, 22.0, 13.0, 12.0, 8.0, 4.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10345458984375, -0.09992790222167969, -0.09640121459960938, -0.09287452697753906, -0.08934783935546875, -0.08582115173339844, -0.08229446411132812, -0.07876777648925781, -0.0752410888671875, -0.07171440124511719, -0.06818771362304688, -0.06466102600097656, -0.06113433837890625, -0.05760765075683594, -0.054080963134765625, -0.05055427551269531, -0.047027587890625, -0.04350090026855469, -0.039974212646484375, -0.03644752502441406, -0.03292083740234375, -0.029394149780273438, -0.025867462158203125, -0.022340774536132812, -0.0188140869140625, -0.015287399291992188, -0.011760711669921875, -0.008234024047851562, -0.00470733642578125, -0.0011806488037109375, 0.002346038818359375, 0.0058727264404296875, 0.0093994140625, 0.012926101684570312, 0.016452789306640625, 0.019979476928710938, 0.02350616455078125, 0.027032852172851562, 0.030559539794921875, 0.03408622741699219, 0.0376129150390625, 0.04113960266113281, 0.044666290283203125, 0.04819297790527344, 0.05171966552734375, 0.05524635314941406, 0.058773040771484375, 0.06229972839355469, 0.065826416015625, 0.06935310363769531, 0.07287979125976562, 0.07640647888183594, 0.07993316650390625, 0.08345985412597656, 0.08698654174804688, 0.09051322937011719, 0.0940399169921875, 0.09756660461425781, 0.10109329223632812, 0.10461997985839844, 0.10814666748046875, 0.11167335510253906, 0.11520004272460938, 0.11872673034667969, 0.12225341796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 11.0, 25.0, 68.0, 193.0, 367.0, 208.0, 69.0, 19.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947725296020508, -3.829380989074707, -3.7110366821289062, -3.5926923751831055, -3.4743480682373047, -3.356003761291504, -3.237659454345703, -3.1193151473999023, -3.0009708404541016, -2.882626533508301, -2.7642822265625, -2.645937919616699, -2.5275936126708984, -2.4092493057250977, -2.290904998779297, -2.172560691833496, -2.0542163848876953, -1.9358720779418945, -1.8175277709960938, -1.699183464050293, -1.5808391571044922, -1.4624948501586914, -1.3441505432128906, -1.2258062362670898, -1.107461929321289, -0.9891176223754883, -0.8707733154296875, -0.7524290084838867, -0.6340847015380859, -0.5157403945922852, -0.3973960876464844, -0.2790517807006836, -0.16070771217346191, -0.04236340522766113, 0.07598090171813965, 0.19432520866394043, 0.3126695156097412, 0.431013822555542, 0.5493581295013428, 0.6677024364471436, 0.7860467433929443, 0.9043910503387451, 1.022735357284546, 1.1410796642303467, 1.2594239711761475, 1.3777682781219482, 1.496112585067749, 1.6144568920135498, 1.7328011989593506, 1.8511455059051514, 1.9694898128509521, 2.087834119796753, 2.2061784267425537, 2.3245227336883545, 2.4428670406341553, 2.561211347579956, 2.679555654525757, 2.7978999614715576, 2.9162442684173584, 3.034588575363159, 3.15293288230896, 3.2712771892547607, 3.3896214962005615, 3.5079658031463623, 3.626310110092163]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 0.0, 10.0, 10.0, 5.0, 10.0, 11.0, 13.0, 22.0, 17.0, 18.0, 24.0, 35.0, 35.0, 26.0, 41.0, 39.0, 45.0, 50.0, 70.0, 82.0, 54.0, 50.0, 52.0, 36.0, 26.0, 21.0, 26.0, 23.0, 23.0, 12.0, 14.0, 22.0, 9.0, 8.0, 11.0, 11.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.552065134048462, -1.5034654140472412, -1.4548656940460205, -1.4062659740447998, -1.357666254043579, -1.3090665340423584, -1.2604668140411377, -1.211867094039917, -1.1632673740386963, -1.1146676540374756, -1.0660679340362549, -1.0174682140350342, -0.9688684940338135, -0.9202687740325928, -0.8716691136360168, -0.8230693936347961, -0.7744697332382202, -0.7258700132369995, -0.6772702932357788, -0.6286705732345581, -0.5800708532333374, -0.5314711332321167, -0.48287147283554077, -0.43427175283432007, -0.38567203283309937, -0.33707231283187866, -0.28847259283065796, -0.23987290263175964, -0.19127318263053894, -0.14267346262931824, -0.09407377243041992, -0.04547405242919922, 0.0031256675720214844, 0.05172538012266159, 0.1003250926733017, 0.1489247977733612, 0.1975245177745819, 0.2461242377758026, 0.2947239279747009, 0.34332364797592163, 0.39192336797714233, 0.44052308797836304, 0.48912280797958374, 0.5377224683761597, 0.5863221883773804, 0.6349219083786011, 0.6835216283798218, 0.7321213483810425, 0.7807210683822632, 0.8293207883834839, 0.8779205083847046, 0.9265202283859253, 0.975119948387146, 1.0237196683883667, 1.0723192691802979, 1.1209189891815186, 1.1695187091827393, 1.21811842918396, 1.2667181491851807, 1.3153178691864014, 1.363917589187622, 1.4125173091888428, 1.4611170291900635, 1.5097167491912842, 1.5583164691925049]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 10.0, 18.0, 19.0, 25.0, 39.0, 62.0, 80.0, 137.0, 195.0, 313.0, 566.0, 1098.0, 2280.0, 5369.0, 15153.0, 58834.0, 452053.0, 2870700.0, 677648.0, 79456.0, 18643.0, 6355.0, 2521.0, 1204.0, 554.0, 322.0, 217.0, 137.0, 80.0, 46.0, 43.0, 28.0, 20.0, 14.0, 10.0, 8.0, 8.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16536903381347656, -0.15996170043945312, -0.1545543670654297, -0.14914703369140625, -0.1437397003173828, -0.13833236694335938, -0.13292503356933594, -0.1275177001953125, -0.12211036682128906, -0.11670303344726562, -0.11129570007324219, -0.10588836669921875, -0.10048103332519531, -0.09507369995117188, -0.08966636657714844, -0.084259033203125, -0.07885169982910156, -0.07344436645507812, -0.06803703308105469, -0.06262969970703125, -0.05722236633300781, -0.051815032958984375, -0.04640769958496094, -0.0410003662109375, -0.03559303283691406, -0.030185699462890625, -0.024778366088867188, -0.01937103271484375, -0.013963699340820312, -0.008556365966796875, -0.0031490325927734375, 0.00225830078125, 0.0076656341552734375, 0.013072967529296875, 0.018480300903320312, 0.02388763427734375, 0.029294967651367188, 0.034702301025390625, 0.04010963439941406, 0.0455169677734375, 0.05092430114746094, 0.056331634521484375, 0.06173896789550781, 0.06714630126953125, 0.07255363464355469, 0.07796096801757812, 0.08336830139160156, 0.088775634765625, 0.09418296813964844, 0.09959030151367188, 0.10499763488769531, 0.11040496826171875, 0.11581230163574219, 0.12121963500976562, 0.12662696838378906, 0.1320343017578125, 0.13744163513183594, 0.14284896850585938, 0.1482563018798828, 0.15366363525390625, 0.1590709686279297, 0.16447830200195312, 0.16988563537597656, 0.17529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 6.0, 9.0, 8.0, 9.0, 12.0, 17.0, 21.0, 24.0, 30.0, 42.0, 40.0, 61.0, 36.0, 36.0, 47.0, 66.0, 52.0, 53.0, 51.0, 44.0, 50.0, 46.0, 42.0, 29.0, 28.0, 34.0, 25.0, 13.0, 15.0, 15.0, 4.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12634944915771484, -0.12257194519042969, -0.11879444122314453, -0.11501693725585938, -0.11123943328857422, -0.10746192932128906, -0.1036844253540039, -0.09990692138671875, -0.0961294174194336, -0.09235191345214844, -0.08857440948486328, -0.08479690551757812, -0.08101940155029297, -0.07724189758300781, -0.07346439361572266, -0.0696868896484375, -0.06590938568115234, -0.06213188171386719, -0.05835437774658203, -0.054576873779296875, -0.05079936981201172, -0.04702186584472656, -0.043244361877441406, -0.03946685791015625, -0.035689353942871094, -0.03191184997558594, -0.02813434600830078, -0.024356842041015625, -0.02057933807373047, -0.016801834106445312, -0.013024330139160156, -0.009246826171875, -0.005469322204589844, -0.0016918182373046875, 0.0020856857299804688, 0.005863189697265625, 0.009640693664550781, 0.013418197631835938, 0.017195701599121094, 0.02097320556640625, 0.024750709533691406, 0.028528213500976562, 0.03230571746826172, 0.036083221435546875, 0.03986072540283203, 0.04363822937011719, 0.047415733337402344, 0.0511932373046875, 0.054970741271972656, 0.05874824523925781, 0.06252574920654297, 0.06630325317382812, 0.07008075714111328, 0.07385826110839844, 0.0776357650756836, 0.08141326904296875, 0.0851907730102539, 0.08896827697753906, 0.09274578094482422, 0.09652328491210938, 0.10030078887939453, 0.10407829284667969, 0.10785579681396484, 0.11163330078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 10.0, 10.0, 13.0, 20.0, 46.0, 98.0, 230.0, 608.0, 2167.0, 19947.0, 3296288.0, 860756.0, 11593.0, 1575.0, 492.0, 212.0, 97.0, 47.0, 32.0, 16.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.571441650390625, -0.55352783203125, -0.535614013671875, -0.5177001953125, -0.499786376953125, -0.48187255859375, -0.463958740234375, -0.446044921875, -0.428131103515625, -0.41021728515625, -0.392303466796875, -0.3743896484375, -0.356475830078125, -0.33856201171875, -0.320648193359375, -0.302734375, -0.284820556640625, -0.26690673828125, -0.248992919921875, -0.2310791015625, -0.213165283203125, -0.19525146484375, -0.177337646484375, -0.159423828125, -0.141510009765625, -0.12359619140625, -0.105682373046875, -0.0877685546875, -0.069854736328125, -0.05194091796875, -0.034027099609375, -0.01611328125, 0.001800537109375, 0.01971435546875, 0.037628173828125, 0.0555419921875, 0.073455810546875, 0.09136962890625, 0.109283447265625, 0.127197265625, 0.145111083984375, 0.16302490234375, 0.180938720703125, 0.1988525390625, 0.216766357421875, 0.23468017578125, 0.252593994140625, 0.2705078125, 0.288421630859375, 0.30633544921875, 0.324249267578125, 0.3421630859375, 0.360076904296875, 0.37799072265625, 0.395904541015625, 0.413818359375, 0.431732177734375, 0.44964599609375, 0.467559814453125, 0.4854736328125, 0.503387451171875, 0.52130126953125, 0.539215087890625, 0.55712890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 6.0, 10.0, 14.0, 10.0, 17.0, 30.0, 49.0, 79.0, 171.0, 321.0, 689.0, 1082.0, 734.0, 378.0, 178.0, 111.0, 57.0, 50.0, 30.0, 18.0, 11.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2510337829589844, -0.24083709716796875, -0.23064041137695312, -0.2204437255859375, -0.21024703979492188, -0.20005035400390625, -0.18985366821289062, -0.179656982421875, -0.16946029663085938, -0.15926361083984375, -0.14906692504882812, -0.1388702392578125, -0.12867355346679688, -0.11847686767578125, -0.10828018188476562, -0.09808349609375, -0.08788681030273438, -0.07769012451171875, -0.06749343872070312, -0.0572967529296875, -0.047100067138671875, -0.03690338134765625, -0.026706695556640625, -0.016510009765625, -0.006313323974609375, 0.00388336181640625, 0.014080047607421875, 0.0242767333984375, 0.034473419189453125, 0.04467010498046875, 0.054866790771484375, 0.0650634765625, 0.07526016235351562, 0.08545684814453125, 0.09565353393554688, 0.1058502197265625, 0.11604690551757812, 0.12624359130859375, 0.13644027709960938, 0.146636962890625, 0.15683364868164062, 0.16703033447265625, 0.17722702026367188, 0.1874237060546875, 0.19762039184570312, 0.20781707763671875, 0.21801376342773438, 0.22821044921875, 0.23840713500976562, 0.24860382080078125, 0.2588005065917969, 0.2689971923828125, 0.2791938781738281, 0.28939056396484375, 0.2995872497558594, 0.309783935546875, 0.3199806213378906, 0.33017730712890625, 0.3403739929199219, 0.3505706787109375, 0.3607673645019531, 0.37096405029296875, 0.3811607360839844, 0.391357421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 10.0, 9.0, 16.0, 33.0, 64.0, 89.0, 135.0, 159.0, 154.0, 125.0, 82.0, 43.0, 21.0, 16.0, 10.0, 19.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.300692319869995, -2.2412049770355225, -2.1817173957824707, -2.122230052947998, -2.0627427101135254, -2.0032551288604736, -1.943767786026001, -1.8842803239822388, -1.8247928619384766, -1.7653053998947144, -1.7058180570602417, -1.6463305950164795, -1.5868431329727173, -1.527355670928955, -1.4678683280944824, -1.4083808660507202, -1.348893404006958, -1.2894059419631958, -1.2299185991287231, -1.170431137084961, -1.1109436750411987, -1.0514562129974365, -0.9919688701629639, -0.9324814081192017, -0.872994065284729, -0.8135066628456116, -0.7540192008018494, -0.6945317983627319, -0.6350443363189697, -0.5755569338798523, -0.5160695314407349, -0.45658206939697266, -0.39709460735321045, -0.33760717511177063, -0.2781197428703308, -0.21863232553005219, -0.15914489328861237, -0.09965747594833374, -0.04017004370689392, 0.0193173885345459, 0.07880482077598572, 0.13829225301742554, 0.19777968525886536, 0.2572671175003052, 0.3167545199394226, 0.3762419521808624, 0.43572938442230225, 0.49521681666374207, 0.5547042489051819, 0.6141916513442993, 0.6736791133880615, 0.733166515827179, 0.7926539778709412, 0.8521413803100586, 0.9116288423538208, 0.9711162447929382, 1.0306036472320557, 1.0900911092758179, 1.1495784521102905, 1.2090659141540527, 1.268553376197815, 1.3280408382415771, 1.3875281810760498, 1.447015643119812, 1.5065031051635742]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 13.0, 13.0, 13.0, 13.0, 13.0, 17.0, 29.0, 26.0, 22.0, 35.0, 29.0, 43.0, 53.0, 27.0, 44.0, 43.0, 45.0, 42.0, 47.0, 39.0, 36.0, 37.0, 37.0, 39.0, 32.0, 37.0, 23.0, 17.0, 15.0, 20.0, 16.0, 6.0, 16.0, 10.0, 10.0, 6.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.9543792009353638, -0.9263274073600769, -0.89827561378479, -0.8702237606048584, -0.8421719670295715, -0.8141201734542847, -0.7860683798789978, -0.7580165863037109, -0.7299647331237793, -0.7019129395484924, -0.6738611459732056, -0.6458092927932739, -0.6177574992179871, -0.5897057056427002, -0.5616539120674133, -0.5336021184921265, -0.5055503249168396, -0.47749853134155273, -0.4494467079639435, -0.4213949143886566, -0.39334309101104736, -0.3652912974357605, -0.33723950386047363, -0.30918771028518677, -0.2811358869075775, -0.25308409333229065, -0.2250322699546814, -0.19698047637939453, -0.16892866790294647, -0.1408768594264984, -0.11282506585121155, -0.08477325737476349, -0.05672144889831543, -0.02866964414715767, -0.0006178393959999084, 0.027433961629867554, 0.05548577010631561, 0.08353757858276367, 0.11158937215805054, 0.1396411806344986, 0.16769298911094666, 0.19574479758739471, 0.22379660606384277, 0.25184839963912964, 0.2799001932144165, 0.30795201659202576, 0.3360038101673126, 0.3640556335449219, 0.39210742712020874, 0.4201592206954956, 0.44821104407310486, 0.4762628376483917, 0.504314661026001, 0.5323664546012878, 0.5604182481765747, 0.5884700417518616, 0.6165218353271484, 0.6445736289024353, 0.6726254224777222, 0.7006772756576538, 0.7287290692329407, 0.7567808628082275, 0.7848326563835144, 0.8128844499588013, 0.8409363031387329]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 7.0, 7.0, 17.0, 32.0, 34.0, 70.0, 118.0, 213.0, 341.0, 662.0, 1489.0, 3636.0, 10144.0, 34415.0, 150503.0, 528175.0, 243923.0, 51874.0, 14185.0, 4804.0, 1966.0, 892.0, 437.0, 221.0, 147.0, 88.0, 48.0, 28.0, 20.0, 14.0, 10.0, 10.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208740234375, -0.2023468017578125, -0.195953369140625, -0.1895599365234375, -0.18316650390625, -0.1767730712890625, -0.170379638671875, -0.1639862060546875, -0.1575927734375, -0.1511993408203125, -0.144805908203125, -0.1384124755859375, -0.13201904296875, -0.1256256103515625, -0.119232177734375, -0.1128387451171875, -0.1064453125, -0.1000518798828125, -0.093658447265625, -0.0872650146484375, -0.08087158203125, -0.0744781494140625, -0.068084716796875, -0.0616912841796875, -0.0552978515625, -0.0489044189453125, -0.042510986328125, -0.0361175537109375, -0.02972412109375, -0.0233306884765625, -0.016937255859375, -0.0105438232421875, -0.004150390625, 0.0022430419921875, 0.008636474609375, 0.0150299072265625, 0.02142333984375, 0.0278167724609375, 0.034210205078125, 0.0406036376953125, 0.0469970703125, 0.0533905029296875, 0.059783935546875, 0.0661773681640625, 0.07257080078125, 0.0789642333984375, 0.085357666015625, 0.0917510986328125, 0.09814453125, 0.1045379638671875, 0.110931396484375, 0.1173248291015625, 0.12371826171875, 0.1301116943359375, 0.136505126953125, 0.1428985595703125, 0.1492919921875, 0.1556854248046875, 0.162078857421875, 0.1684722900390625, 0.17486572265625, 0.1812591552734375, 0.187652587890625, 0.1940460205078125, 0.200439453125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 8.0, 11.0, 8.0, 12.0, 13.0, 19.0, 18.0, 36.0, 34.0, 42.0, 39.0, 54.0, 30.0, 56.0, 54.0, 47.0, 51.0, 41.0, 54.0, 56.0, 41.0, 44.0, 32.0, 45.0, 35.0, 25.0, 16.0, 19.0, 12.0, 12.0, 7.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14306640625, -0.1391124725341797, -0.13515853881835938, -0.13120460510253906, -0.12725067138671875, -0.12329673767089844, -0.11934280395507812, -0.11538887023925781, -0.1114349365234375, -0.10748100280761719, -0.10352706909179688, -0.09957313537597656, -0.09561920166015625, -0.09166526794433594, -0.08771133422851562, -0.08375740051269531, -0.079803466796875, -0.07584953308105469, -0.07189559936523438, -0.06794166564941406, -0.06398773193359375, -0.06003379821777344, -0.056079864501953125, -0.05212593078613281, -0.0481719970703125, -0.04421806335449219, -0.040264129638671875, -0.03631019592285156, -0.03235626220703125, -0.028402328491210938, -0.024448394775390625, -0.020494461059570312, -0.01654052734375, -0.012586593627929688, -0.008632659912109375, -0.0046787261962890625, -0.00072479248046875, 0.0032291412353515625, 0.007183074951171875, 0.011137008666992188, 0.0150909423828125, 0.019044876098632812, 0.022998809814453125, 0.026952743530273438, 0.03090667724609375, 0.03486061096191406, 0.038814544677734375, 0.04276847839355469, 0.046722412109375, 0.05067634582519531, 0.054630279541015625, 0.05858421325683594, 0.06253814697265625, 0.06649208068847656, 0.07044601440429688, 0.07439994812011719, 0.0783538818359375, 0.08230781555175781, 0.08626174926757812, 0.09021568298339844, 0.09416961669921875, 0.09812355041503906, 0.10207748413085938, 0.10603141784667969, 0.1099853515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 7.0, 3.0, 10.0, 20.0, 27.0, 23.0, 33.0, 65.0, 83.0, 130.0, 201.0, 411.0, 953.0, 3083.0, 19645.0, 369112.0, 627097.0, 22103.0, 3396.0, 1027.0, 461.0, 246.0, 137.0, 83.0, 51.0, 33.0, 30.0, 15.0, 22.0, 9.0, 8.0, 6.0, 7.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.411865234375, -0.3993949890136719, -0.38692474365234375, -0.3744544982910156, -0.3619842529296875, -0.3495140075683594, -0.33704376220703125, -0.3245735168457031, -0.312103271484375, -0.2996330261230469, -0.28716278076171875, -0.2746925354003906, -0.2622222900390625, -0.24975204467773438, -0.23728179931640625, -0.22481155395507812, -0.21234130859375, -0.19987106323242188, -0.18740081787109375, -0.17493057250976562, -0.1624603271484375, -0.14999008178710938, -0.13751983642578125, -0.12504959106445312, -0.112579345703125, -0.10010910034179688, -0.08763885498046875, -0.07516860961914062, -0.0626983642578125, -0.050228118896484375, -0.03775787353515625, -0.025287628173828125, -0.0128173828125, -0.000347137451171875, 0.01212310791015625, 0.024593353271484375, 0.0370635986328125, 0.049533843994140625, 0.06200408935546875, 0.07447433471679688, 0.086944580078125, 0.09941482543945312, 0.11188507080078125, 0.12435531616210938, 0.1368255615234375, 0.14929580688476562, 0.16176605224609375, 0.17423629760742188, 0.18670654296875, 0.19917678833007812, 0.21164703369140625, 0.22411727905273438, 0.2365875244140625, 0.24905776977539062, 0.26152801513671875, 0.2739982604980469, 0.286468505859375, 0.2989387512207031, 0.31140899658203125, 0.3238792419433594, 0.3363494873046875, 0.3488197326660156, 0.36128997802734375, 0.3737602233886719, 0.38623046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 3.0, 8.0, 9.0, 3.0, 10.0, 24.0, 18.0, 19.0, 25.0, 25.0, 35.0, 45.0, 44.0, 54.0, 57.0, 47.0, 57.0, 61.0, 55.0, 61.0, 43.0, 31.0, 40.0, 31.0, 40.0, 28.0, 22.0, 24.0, 20.0, 15.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.401123046875, -0.387664794921875, -0.37420654296875, -0.360748291015625, -0.3472900390625, -0.333831787109375, -0.32037353515625, -0.306915283203125, -0.29345703125, -0.279998779296875, -0.26654052734375, -0.253082275390625, -0.2396240234375, -0.226165771484375, -0.21270751953125, -0.199249267578125, -0.185791015625, -0.172332763671875, -0.15887451171875, -0.145416259765625, -0.1319580078125, -0.118499755859375, -0.10504150390625, -0.091583251953125, -0.078125, -0.064666748046875, -0.05120849609375, -0.037750244140625, -0.0242919921875, -0.010833740234375, 0.00262451171875, 0.016082763671875, 0.029541015625, 0.042999267578125, 0.05645751953125, 0.069915771484375, 0.0833740234375, 0.096832275390625, 0.11029052734375, 0.123748779296875, 0.13720703125, 0.150665283203125, 0.16412353515625, 0.177581787109375, 0.1910400390625, 0.204498291015625, 0.21795654296875, 0.231414794921875, 0.244873046875, 0.258331298828125, 0.27178955078125, 0.285247802734375, 0.2987060546875, 0.312164306640625, 0.32562255859375, 0.339080810546875, 0.3525390625, 0.365997314453125, 0.37945556640625, 0.392913818359375, 0.4063720703125, 0.419830322265625, 0.43328857421875, 0.446746826171875, 0.460205078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 18.0, 34.0, 58.0, 95.0, 177.0, 324.0, 703.0, 1753.0, 5255.0, 19002.0, 119375.0, 803538.0, 77063.0, 14285.0, 4045.0, 1495.0, 595.0, 303.0, 162.0, 74.0, 63.0, 24.0, 17.0, 16.0, 12.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096923828125, -0.0936269760131836, -0.09033012390136719, -0.08703327178955078, -0.08373641967773438, -0.08043956756591797, -0.07714271545410156, -0.07384586334228516, -0.07054901123046875, -0.06725215911865234, -0.06395530700683594, -0.06065845489501953, -0.057361602783203125, -0.05406475067138672, -0.05076789855957031, -0.047471046447753906, -0.0441741943359375, -0.040877342224121094, -0.03758049011230469, -0.03428363800048828, -0.030986785888671875, -0.02768993377685547, -0.024393081665039062, -0.021096229553222656, -0.01779937744140625, -0.014502525329589844, -0.011205673217773438, -0.007908821105957031, -0.004611968994140625, -0.0013151168823242188, 0.0019817352294921875, 0.005278587341308594, 0.008575439453125, 0.011872291564941406, 0.015169143676757812, 0.01846599578857422, 0.021762847900390625, 0.02505970001220703, 0.028356552124023438, 0.031653404235839844, 0.03495025634765625, 0.038247108459472656, 0.04154396057128906, 0.04484081268310547, 0.048137664794921875, 0.05143451690673828, 0.05473136901855469, 0.058028221130371094, 0.0613250732421875, 0.0646219253540039, 0.06791877746582031, 0.07121562957763672, 0.07451248168945312, 0.07780933380126953, 0.08110618591308594, 0.08440303802490234, 0.08769989013671875, 0.09099674224853516, 0.09429359436035156, 0.09759044647216797, 0.10088729858398438, 0.10418415069580078, 0.10748100280761719, 0.1107778549194336, 0.11407470703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 6.0, 10.0, 6.0, 5.0, 11.0, 19.0, 21.0, 16.0, 29.0, 34.0, 58.0, 70.0, 94.0, 92.0, 104.0, 93.0, 76.0, 54.0, 44.0, 32.0, 29.0, 21.0, 14.0, 8.0, 9.0, 6.0, 11.0, 5.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.081560134887695e-05, -2.982746809720993e-05, -2.8839334845542908e-05, -2.7851201593875885e-05, -2.6863068342208862e-05, -2.587493509054184e-05, -2.4886801838874817e-05, -2.3898668587207794e-05, -2.291053533554077e-05, -2.192240208387375e-05, -2.0934268832206726e-05, -1.9946135580539703e-05, -1.895800232887268e-05, -1.7969869077205658e-05, -1.6981735825538635e-05, -1.5993602573871613e-05, -1.500546932220459e-05, -1.4017336070537567e-05, -1.3029202818870544e-05, -1.2041069567203522e-05, -1.1052936315536499e-05, -1.0064803063869476e-05, -9.076669812202454e-06, -8.088536560535431e-06, -7.100403308868408e-06, -6.1122700572013855e-06, -5.124136805534363e-06, -4.13600355386734e-06, -3.1478703022003174e-06, -2.1597370505332947e-06, -1.171603798866272e-06, -1.8347054719924927e-07, 8.046627044677734e-07, 1.7927959561347961e-06, 2.780929207801819e-06, 3.7690624594688416e-06, 4.757195711135864e-06, 5.745328962802887e-06, 6.73346221446991e-06, 7.721595466136932e-06, 8.709728717803955e-06, 9.697861969470978e-06, 1.0685995221138e-05, 1.1674128472805023e-05, 1.2662261724472046e-05, 1.3650394976139069e-05, 1.4638528227806091e-05, 1.5626661479473114e-05, 1.6614794731140137e-05, 1.760292798280716e-05, 1.8591061234474182e-05, 1.9579194486141205e-05, 2.0567327737808228e-05, 2.155546098947525e-05, 2.2543594241142273e-05, 2.3531727492809296e-05, 2.451986074447632e-05, 2.550799399614334e-05, 2.6496127247810364e-05, 2.7484260499477386e-05, 2.847239375114441e-05, 2.9460527002811432e-05, 3.0448660254478455e-05, 3.143679350614548e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 0.0, 7.0, 10.0, 12.0, 23.0, 20.0, 19.0, 34.0, 45.0, 67.0, 98.0, 127.0, 197.0, 282.0, 480.0, 711.0, 1341.0, 2641.0, 5434.0, 12174.0, 30597.0, 92263.0, 579881.0, 223763.0, 59097.0, 21317.0, 8889.0, 4035.0, 2084.0, 1165.0, 581.0, 373.0, 216.0, 160.0, 85.0, 78.0, 55.0, 49.0, 41.0, 25.0, 14.0, 18.0, 11.0, 9.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.059783935546875, -0.05801582336425781, -0.056247711181640625, -0.05447959899902344, -0.05271148681640625, -0.05094337463378906, -0.049175262451171875, -0.04740715026855469, -0.0456390380859375, -0.04387092590332031, -0.042102813720703125, -0.04033470153808594, -0.03856658935546875, -0.03679847717285156, -0.035030364990234375, -0.03326225280761719, -0.031494140625, -0.029726028442382812, -0.027957916259765625, -0.026189804077148438, -0.02442169189453125, -0.022653579711914062, -0.020885467529296875, -0.019117355346679688, -0.0173492431640625, -0.015581130981445312, -0.013813018798828125, -0.012044906616210938, -0.01027679443359375, -0.008508682250976562, -0.006740570068359375, -0.0049724578857421875, -0.003204345703125, -0.0014362335205078125, 0.000331878662109375, 0.0020999908447265625, 0.00386810302734375, 0.0056362152099609375, 0.007404327392578125, 0.009172439575195312, 0.0109405517578125, 0.012708663940429688, 0.014476776123046875, 0.016244888305664062, 0.01801300048828125, 0.019781112670898438, 0.021549224853515625, 0.023317337036132812, 0.02508544921875, 0.026853561401367188, 0.028621673583984375, 0.030389785766601562, 0.03215789794921875, 0.03392601013183594, 0.035694122314453125, 0.03746223449707031, 0.0392303466796875, 0.04099845886230469, 0.042766571044921875, 0.04453468322753906, 0.04630279541015625, 0.04807090759277344, 0.049839019775390625, 0.05160713195800781, 0.053375244140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 11.0, 9.0, 12.0, 11.0, 15.0, 17.0, 28.0, 26.0, 41.0, 65.0, 89.0, 134.0, 123.0, 97.0, 65.0, 48.0, 40.0, 29.0, 32.0, 14.0, 13.0, 14.0, 8.0, 7.0, 3.0, 5.0, 5.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09338760375976562, -0.09040069580078125, -0.08741378784179688, -0.0844268798828125, -0.08143997192382812, -0.07845306396484375, -0.07546615600585938, -0.072479248046875, -0.06949234008789062, -0.06650543212890625, -0.06351852416992188, -0.0605316162109375, -0.057544708251953125, -0.05455780029296875, -0.051570892333984375, -0.048583984375, -0.045597076416015625, -0.04261016845703125, -0.039623260498046875, -0.0366363525390625, -0.033649444580078125, -0.03066253662109375, -0.027675628662109375, -0.024688720703125, -0.021701812744140625, -0.01871490478515625, -0.015727996826171875, -0.0127410888671875, -0.009754180908203125, -0.00676727294921875, -0.003780364990234375, -0.00079345703125, 0.002193450927734375, 0.00518035888671875, 0.008167266845703125, 0.0111541748046875, 0.014141082763671875, 0.01712799072265625, 0.020114898681640625, 0.023101806640625, 0.026088714599609375, 0.02907562255859375, 0.032062530517578125, 0.0350494384765625, 0.038036346435546875, 0.04102325439453125, 0.044010162353515625, 0.0469970703125, 0.049983978271484375, 0.05297088623046875, 0.055957794189453125, 0.0589447021484375, 0.061931610107421875, 0.06491851806640625, 0.06790542602539062, 0.070892333984375, 0.07387924194335938, 0.07686614990234375, 0.07985305786132812, 0.0828399658203125, 0.08582687377929688, 0.08881378173828125, 0.09180068969726562, 0.09478759765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 6.0, 10.0, 39.0, 126.0, 446.0, 257.0, 73.0, 22.0, 12.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3405585289001465, -2.2088189125061035, -2.0770790576934814, -1.9453394412994385, -1.813599705696106, -1.6818599700927734, -1.5501203536987305, -1.418380618095398, -1.2866408824920654, -1.154901146888733, -1.0231614112854004, -0.8914217948913574, -0.7596820592880249, -0.6279423236846924, -0.49620264768600464, -0.3644629716873169, -0.23272323608398438, -0.10098353028297424, 0.03075617551803589, 0.16249588131904602, 0.29423558712005615, 0.42597532272338867, 0.5577149987220764, 0.6894546747207642, 0.8211944103240967, 0.9529341459274292, 1.0846738815307617, 1.2164134979248047, 1.3481532335281372, 1.4798929691314697, 1.6116325855255127, 1.7433723211288452, 1.875112533569336, 2.006852149963379, 2.138592004776001, 2.270331621170044, 2.402071475982666, 2.533811092376709, 2.665550708770752, 2.797290325164795, 2.929030179977417, 3.06076979637146, 3.192509651184082, 3.324249267578125, 3.455988883972168, 3.58772873878479, 3.719468355178833, 3.851208209991455, 3.982947826385498, 4.114687442779541, 4.246427059173584, 4.378167152404785, 4.509906768798828, 4.641646385192871, 4.773386001586914, 4.905125617980957, 5.036865234375, 5.168604850769043, 5.300344467163086, 5.432084560394287, 5.56382417678833, 5.695563793182373, 5.827303409576416, 5.959043025970459, 6.09078311920166]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 4.0, 6.0, 5.0, 12.0, 8.0, 12.0, 16.0, 21.0, 23.0, 23.0, 12.0, 28.0, 34.0, 41.0, 51.0, 53.0, 75.0, 83.0, 92.0, 64.0, 40.0, 34.0, 24.0, 33.0, 39.0, 26.0, 17.0, 18.0, 15.0, 17.0, 13.0, 7.0, 11.0, 7.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.674190878868103, -1.6258039474487305, -1.5774171352386475, -1.529030203819275, -1.480643391609192, -1.4322564601898193, -1.3838696479797363, -1.3354827165603638, -1.2870957851409912, -1.2387088537216187, -1.1903220415115356, -1.141935110092163, -1.09354829788208, -1.0451613664627075, -0.9967744946479797, -0.948387622833252, -0.900000810623169, -0.8516139388084412, -0.8032270669937134, -0.7548401355743408, -0.7064533233642578, -0.6580663919448853, -0.6096795201301575, -0.5612926483154297, -0.5129057765007019, -0.4645189046859741, -0.41613203287124634, -0.36774513125419617, -0.3193582594394684, -0.2709713876247406, -0.22258448600769043, -0.17419761419296265, -0.12581086158752441, -0.07742398232221603, -0.029037103056907654, 0.019349783658981323, 0.0677366554737091, 0.11612352728843689, 0.16451042890548706, 0.21289730072021484, 0.2612841725349426, 0.3096710443496704, 0.3580579161643982, 0.40644481778144836, 0.45483168959617615, 0.5032185316085815, 0.5516054630279541, 0.5999923348426819, 0.6483792066574097, 0.6967660784721375, 0.7451529502868652, 0.7935398817062378, 0.8419266939163208, 0.8903136253356934, 0.9387004971504211, 0.9870873689651489, 1.0354743003845215, 1.083861231803894, 1.132248044013977, 1.1806349754333496, 1.2290217876434326, 1.2774087190628052, 1.3257956504821777, 1.3741824626922607, 1.4225692749023438]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 8.0, 19.0, 21.0, 26.0, 50.0, 76.0, 107.0, 170.0, 313.0, 593.0, 1208.0, 2795.0, 7244.0, 23427.0, 107034.0, 765472.0, 2582181.0, 582779.0, 88705.0, 20620.0, 6437.0, 2578.0, 1143.0, 527.0, 307.0, 149.0, 106.0, 57.0, 29.0, 19.0, 19.0, 7.0, 6.0, 14.0, 11.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.187255859375, -0.18250751495361328, -0.17775917053222656, -0.17301082611083984, -0.16826248168945312, -0.1635141372680664, -0.1587657928466797, -0.15401744842529297, -0.14926910400390625, -0.14452075958251953, -0.1397724151611328, -0.1350240707397461, -0.13027572631835938, -0.12552738189697266, -0.12077903747558594, -0.11603069305419922, -0.1112823486328125, -0.10653400421142578, -0.10178565979003906, -0.09703731536865234, -0.09228897094726562, -0.0875406265258789, -0.08279228210449219, -0.07804393768310547, -0.07329559326171875, -0.06854724884033203, -0.06379890441894531, -0.059050559997558594, -0.054302215576171875, -0.049553871154785156, -0.04480552673339844, -0.04005718231201172, -0.035308837890625, -0.03056049346923828, -0.025812149047851562, -0.021063804626464844, -0.016315460205078125, -0.011567115783691406, -0.0068187713623046875, -0.0020704269409179688, 0.00267791748046875, 0.007426261901855469, 0.012174606323242188, 0.016922950744628906, 0.021671295166015625, 0.026419639587402344, 0.031167984008789062, 0.03591632843017578, 0.0406646728515625, 0.04541301727294922, 0.05016136169433594, 0.054909706115722656, 0.059658050537109375, 0.0644063949584961, 0.06915473937988281, 0.07390308380126953, 0.07865142822265625, 0.08339977264404297, 0.08814811706542969, 0.0928964614868164, 0.09764480590820312, 0.10239315032958984, 0.10714149475097656, 0.11188983917236328, 0.11663818359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 13.0, 9.0, 13.0, 20.0, 9.0, 24.0, 31.0, 28.0, 33.0, 45.0, 48.0, 47.0, 44.0, 66.0, 51.0, 49.0, 53.0, 41.0, 47.0, 51.0, 42.0, 48.0, 32.0, 39.0, 24.0, 26.0, 16.0, 12.0, 5.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14306640625, -0.13909053802490234, -0.1351146697998047, -0.13113880157470703, -0.12716293334960938, -0.12318706512451172, -0.11921119689941406, -0.1152353286743164, -0.11125946044921875, -0.1072835922241211, -0.10330772399902344, -0.09933185577392578, -0.09535598754882812, -0.09138011932373047, -0.08740425109863281, -0.08342838287353516, -0.0794525146484375, -0.07547664642333984, -0.07150077819824219, -0.06752490997314453, -0.06354904174804688, -0.05957317352294922, -0.05559730529785156, -0.051621437072753906, -0.04764556884765625, -0.043669700622558594, -0.03969383239746094, -0.03571796417236328, -0.031742095947265625, -0.02776622772216797, -0.023790359497070312, -0.019814491271972656, -0.015838623046875, -0.011862754821777344, -0.007886886596679688, -0.003911018371582031, 6.4849853515625e-05, 0.004040718078613281, 0.008016586303710938, 0.011992454528808594, 0.01596832275390625, 0.019944190979003906, 0.023920059204101562, 0.02789592742919922, 0.031871795654296875, 0.03584766387939453, 0.03982353210449219, 0.043799400329589844, 0.0477752685546875, 0.051751136779785156, 0.05572700500488281, 0.05970287322998047, 0.06367874145507812, 0.06765460968017578, 0.07163047790527344, 0.0756063461303711, 0.07958221435546875, 0.0835580825805664, 0.08753395080566406, 0.09150981903076172, 0.09548568725585938, 0.09946155548095703, 0.10343742370605469, 0.10741329193115234, 0.11138916015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 16.0, 19.0, 44.0, 98.0, 198.0, 539.0, 3055.0, 73730.0, 4066467.0, 46763.0, 2471.0, 494.0, 172.0, 86.0, 59.0, 25.0, 17.0, 4.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5893630981445312, -0.5693511962890625, -0.5493392944335938, -0.529327392578125, -0.5093154907226562, -0.4893035888671875, -0.46929168701171875, -0.44927978515625, -0.42926788330078125, -0.4092559814453125, -0.38924407958984375, -0.369232177734375, -0.34922027587890625, -0.3292083740234375, -0.30919647216796875, -0.2891845703125, -0.26917266845703125, -0.2491607666015625, -0.22914886474609375, -0.209136962890625, -0.18912506103515625, -0.1691131591796875, -0.14910125732421875, -0.12908935546875, -0.10907745361328125, -0.0890655517578125, -0.06905364990234375, -0.049041748046875, -0.02902984619140625, -0.0090179443359375, 0.01099395751953125, 0.031005859375, 0.05101776123046875, 0.0710296630859375, 0.09104156494140625, 0.111053466796875, 0.13106536865234375, 0.1510772705078125, 0.17108917236328125, 0.19110107421875, 0.21111297607421875, 0.2311248779296875, 0.25113677978515625, 0.271148681640625, 0.29116058349609375, 0.3111724853515625, 0.33118438720703125, 0.3511962890625, 0.37120819091796875, 0.3912200927734375, 0.41123199462890625, 0.431243896484375, 0.45125579833984375, 0.4712677001953125, 0.49127960205078125, 0.51129150390625, 0.5313034057617188, 0.5513153076171875, 0.5713272094726562, 0.591339111328125, 0.6113510131835938, 0.6313629150390625, 0.6513748168945312, 0.67138671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 12.0, 22.0, 18.0, 27.0, 53.0, 101.0, 202.0, 374.0, 794.0, 1094.0, 681.0, 310.0, 148.0, 94.0, 47.0, 29.0, 15.0, 10.0, 12.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2598609924316406, -0.24872589111328125, -0.23759078979492188, -0.2264556884765625, -0.21532058715820312, -0.20418548583984375, -0.19305038452148438, -0.181915283203125, -0.17078018188476562, -0.15964508056640625, -0.14850997924804688, -0.1373748779296875, -0.12623977661132812, -0.11510467529296875, -0.10396957397460938, -0.09283447265625, -0.08169937133789062, -0.07056427001953125, -0.059429168701171875, -0.0482940673828125, -0.037158966064453125, -0.02602386474609375, -0.014888763427734375, -0.003753662109375, 0.007381439208984375, 0.01851654052734375, 0.029651641845703125, 0.0407867431640625, 0.051921844482421875, 0.06305694580078125, 0.07419204711914062, 0.0853271484375, 0.09646224975585938, 0.10759735107421875, 0.11873245239257812, 0.1298675537109375, 0.14100265502929688, 0.15213775634765625, 0.16327285766601562, 0.174407958984375, 0.18554306030273438, 0.19667816162109375, 0.20781326293945312, 0.2189483642578125, 0.23008346557617188, 0.24121856689453125, 0.2523536682128906, 0.26348876953125, 0.2746238708496094, 0.28575897216796875, 0.2968940734863281, 0.3080291748046875, 0.3191642761230469, 0.33029937744140625, 0.3414344787597656, 0.352569580078125, 0.3637046813964844, 0.37483978271484375, 0.3859748840332031, 0.3971099853515625, 0.4082450866699219, 0.41938018798828125, 0.4305152893066406, 0.441650390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 11.0, 24.0, 50.0, 136.0, 266.0, 270.0, 135.0, 47.0, 27.0, 14.0, 8.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6685028076171875, -4.567024230957031, -4.465545654296875, -4.364067077636719, -4.2625885009765625, -4.161109924316406, -4.059631824493408, -3.958153247833252, -3.8566746711730957, -3.7551960945129395, -3.653717517852783, -3.552239179611206, -3.45076060295105, -3.3492820262908936, -3.2478034496307373, -3.14632511138916, -3.044846534729004, -2.9433679580688477, -2.8418893814086914, -2.7404110431671143, -2.638932466506958, -2.5374538898468018, -2.4359753131866455, -2.3344969749450684, -2.233018159866333, -2.1315395832061768, -2.0300610065460205, -1.9285825490951538, -1.827104091644287, -1.7256255149841309, -1.6241469383239746, -1.522668480873108, -1.4211900234222412, -1.319711446762085, -1.2182329893112183, -1.116754412651062, -1.0152759552001953, -0.9137973785400391, -0.8123188614845276, -0.7108403444290161, -0.6093618273735046, -0.5078833103179932, -0.4064047932624817, -0.3049262464046478, -0.20344772934913635, -0.10196918249130249, -0.0004906654357910156, 0.10098785161972046, 0.20246636867523193, 0.3039448857307434, 0.4054234027862549, 0.5069019794464111, 0.6083804368972778, 0.7098590135574341, 0.8113375306129456, 0.912816047668457, 1.0142946243286133, 1.1157732009887695, 1.2172516584396362, 1.3187302350997925, 1.4202086925506592, 1.5216872692108154, 1.6231658458709717, 1.7246443033218384, 1.826122760772705]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 14.0, 9.0, 11.0, 16.0, 20.0, 18.0, 27.0, 29.0, 26.0, 35.0, 37.0, 52.0, 52.0, 58.0, 55.0, 70.0, 61.0, 45.0, 49.0, 39.0, 31.0, 27.0, 27.0, 24.0, 26.0, 26.0, 23.0, 11.0, 16.0, 16.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.176855444908142, -1.1407232284545898, -1.1045911312103271, -1.068458914756775, -1.0323268175125122, -0.99619460105896, -0.9600624442100525, -0.923930287361145, -0.8877981305122375, -0.8516659736633301, -0.8155338168144226, -0.7794016599655151, -0.7432694435119629, -0.7071373462677002, -0.671005129814148, -0.6348729729652405, -0.598740816116333, -0.5626086592674255, -0.5264765024185181, -0.4903443157672882, -0.45421215891838074, -0.41808000206947327, -0.3819478154182434, -0.34581565856933594, -0.30968350172042847, -0.273551344871521, -0.23741917312145233, -0.20128700137138367, -0.1651548445224762, -0.12902268767356873, -0.09289051592350006, -0.056758344173431396, -0.020626306533813477, 0.015505857765674591, 0.05163802206516266, 0.08777018636465073, 0.1239023506641388, 0.16003450751304626, 0.19616667926311493, 0.2322988510131836, 0.26843100786209106, 0.30456316471099854, 0.340695321559906, 0.37682750821113586, 0.41295966506004333, 0.4490918219089508, 0.48522400856018066, 0.5213561654090881, 0.5574883222579956, 0.5936204791069031, 0.6297526359558105, 0.665884792804718, 0.7020169496536255, 0.7381491661071777, 0.7742813229560852, 0.8104134798049927, 0.8465456366539001, 0.8826777935028076, 0.9188099503517151, 0.9549421072006226, 0.9910743236541748, 1.0272064208984375, 1.0633386373519897, 1.099470853805542, 1.1356029510498047]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 10.0, 7.0, 11.0, 18.0, 14.0, 31.0, 38.0, 56.0, 79.0, 149.0, 189.0, 392.0, 703.0, 1304.0, 2682.0, 6208.0, 15780.0, 46825.0, 175681.0, 514074.0, 202199.0, 51991.0, 17275.0, 6734.0, 2916.0, 1440.0, 690.0, 377.0, 240.0, 138.0, 91.0, 59.0, 51.0, 37.0, 19.0, 11.0, 13.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1837158203125, -0.17749786376953125, -0.1712799072265625, -0.16506195068359375, -0.158843994140625, -0.15262603759765625, -0.1464080810546875, -0.14019012451171875, -0.13397216796875, -0.12775421142578125, -0.1215362548828125, -0.11531829833984375, -0.109100341796875, -0.10288238525390625, -0.0966644287109375, -0.09044647216796875, -0.084228515625, -0.07801055908203125, -0.0717926025390625, -0.06557464599609375, -0.059356689453125, -0.05313873291015625, -0.0469207763671875, -0.04070281982421875, -0.03448486328125, -0.02826690673828125, -0.0220489501953125, -0.01583099365234375, -0.009613037109375, -0.00339508056640625, 0.0028228759765625, 0.00904083251953125, 0.0152587890625, 0.02147674560546875, 0.0276947021484375, 0.03391265869140625, 0.040130615234375, 0.04634857177734375, 0.0525665283203125, 0.05878448486328125, 0.06500244140625, 0.07122039794921875, 0.0774383544921875, 0.08365631103515625, 0.089874267578125, 0.09609222412109375, 0.1023101806640625, 0.10852813720703125, 0.11474609375, 0.12096405029296875, 0.1271820068359375, 0.13339996337890625, 0.139617919921875, 0.14583587646484375, 0.1520538330078125, 0.15827178955078125, 0.16448974609375, 0.17070770263671875, 0.1769256591796875, 0.18314361572265625, 0.189361572265625, 0.19557952880859375, 0.2017974853515625, 0.20801544189453125, 0.2142333984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 10.0, 9.0, 10.0, 16.0, 11.0, 15.0, 20.0, 23.0, 28.0, 36.0, 33.0, 39.0, 30.0, 36.0, 48.0, 68.0, 54.0, 47.0, 34.0, 46.0, 46.0, 36.0, 39.0, 51.0, 29.0, 32.0, 40.0, 25.0, 17.0, 21.0, 12.0, 9.0, 7.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1221923828125, -0.11844253540039062, -0.11469268798828125, -0.11094284057617188, -0.1071929931640625, -0.10344314575195312, -0.09969329833984375, -0.09594345092773438, -0.092193603515625, -0.08844375610351562, -0.08469390869140625, -0.08094406127929688, -0.0771942138671875, -0.07344436645507812, -0.06969451904296875, -0.06594467163085938, -0.06219482421875, -0.058444976806640625, -0.05469512939453125, -0.050945281982421875, -0.0471954345703125, -0.043445587158203125, -0.03969573974609375, -0.035945892333984375, -0.032196044921875, -0.028446197509765625, -0.02469635009765625, -0.020946502685546875, -0.0171966552734375, -0.013446807861328125, -0.00969696044921875, -0.005947113037109375, -0.002197265625, 0.001552581787109375, 0.00530242919921875, 0.009052276611328125, 0.0128021240234375, 0.016551971435546875, 0.02030181884765625, 0.024051666259765625, 0.027801513671875, 0.031551361083984375, 0.03530120849609375, 0.039051055908203125, 0.0428009033203125, 0.046550750732421875, 0.05030059814453125, 0.054050445556640625, 0.05780029296875, 0.061550140380859375, 0.06529998779296875, 0.06904983520507812, 0.0727996826171875, 0.07654953002929688, 0.08029937744140625, 0.08404922485351562, 0.087799072265625, 0.09154891967773438, 0.09529876708984375, 0.09904861450195312, 0.1027984619140625, 0.10654830932617188, 0.11029815673828125, 0.11404800415039062, 0.1177978515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 10.0, 16.0, 25.0, 23.0, 23.0, 58.0, 61.0, 103.0, 187.0, 237.0, 407.0, 874.0, 2191.0, 7424.0, 52422.0, 854657.0, 113042.0, 11497.0, 2871.0, 1157.0, 521.0, 246.0, 154.0, 95.0, 55.0, 50.0, 26.0, 25.0, 20.0, 17.0, 8.0, 14.0, 8.0, 7.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.399658203125, -0.38741302490234375, -0.3751678466796875, -0.36292266845703125, -0.350677490234375, -0.33843231201171875, -0.3261871337890625, -0.31394195556640625, -0.30169677734375, -0.28945159912109375, -0.2772064208984375, -0.26496124267578125, -0.252716064453125, -0.24047088623046875, -0.2282257080078125, -0.21598052978515625, -0.2037353515625, -0.19149017333984375, -0.1792449951171875, -0.16699981689453125, -0.154754638671875, -0.14250946044921875, -0.1302642822265625, -0.11801910400390625, -0.10577392578125, -0.09352874755859375, -0.0812835693359375, -0.06903839111328125, -0.056793212890625, -0.04454803466796875, -0.0323028564453125, -0.02005767822265625, -0.0078125, 0.00443267822265625, 0.0166778564453125, 0.02892303466796875, 0.041168212890625, 0.05341339111328125, 0.0656585693359375, 0.07790374755859375, 0.09014892578125, 0.10239410400390625, 0.1146392822265625, 0.12688446044921875, 0.139129638671875, 0.15137481689453125, 0.1636199951171875, 0.17586517333984375, 0.1881103515625, 0.20035552978515625, 0.2126007080078125, 0.22484588623046875, 0.237091064453125, 0.24933624267578125, 0.2615814208984375, 0.27382659912109375, 0.28607177734375, 0.29831695556640625, 0.3105621337890625, 0.32280731201171875, 0.335052490234375, 0.34729766845703125, 0.3595428466796875, 0.37178802490234375, 0.384033203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 9.0, 10.0, 13.0, 10.0, 11.0, 18.0, 14.0, 11.0, 19.0, 33.0, 28.0, 46.0, 37.0, 48.0, 45.0, 53.0, 39.0, 57.0, 55.0, 69.0, 51.0, 51.0, 38.0, 28.0, 36.0, 30.0, 22.0, 22.0, 23.0, 16.0, 10.0, 15.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.412109375, -0.3994636535644531, -0.38681793212890625, -0.3741722106933594, -0.3615264892578125, -0.3488807678222656, -0.33623504638671875, -0.3235893249511719, -0.310943603515625, -0.2982978820800781, -0.28565216064453125, -0.2730064392089844, -0.2603607177734375, -0.24771499633789062, -0.23506927490234375, -0.22242355346679688, -0.20977783203125, -0.19713211059570312, -0.18448638916015625, -0.17184066772460938, -0.1591949462890625, -0.14654922485351562, -0.13390350341796875, -0.12125778198242188, -0.108612060546875, -0.09596633911132812, -0.08332061767578125, -0.07067489624023438, -0.0580291748046875, -0.045383453369140625, -0.03273773193359375, -0.020092010498046875, -0.0074462890625, 0.005199432373046875, 0.01784515380859375, 0.030490875244140625, 0.0431365966796875, 0.055782318115234375, 0.06842803955078125, 0.08107376098632812, 0.093719482421875, 0.10636520385742188, 0.11901092529296875, 0.13165664672851562, 0.1443023681640625, 0.15694808959960938, 0.16959381103515625, 0.18223953247070312, 0.19488525390625, 0.20753097534179688, 0.22017669677734375, 0.23282241821289062, 0.2454681396484375, 0.2581138610839844, 0.27075958251953125, 0.2834053039550781, 0.296051025390625, 0.3086967468261719, 0.32134246826171875, 0.3339881896972656, 0.3466339111328125, 0.3592796325683594, 0.37192535400390625, 0.3845710754394531, 0.397216796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 7.0, 4.0, 5.0, 8.0, 12.0, 20.0, 20.0, 28.0, 34.0, 66.0, 138.0, 370.0, 1069.0, 4706.0, 58702.0, 953780.0, 25106.0, 3094.0, 774.0, 263.0, 123.0, 69.0, 41.0, 24.0, 21.0, 13.0, 14.0, 11.0, 5.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2020263671875, -0.1957855224609375, -0.189544677734375, -0.1833038330078125, -0.17706298828125, -0.1708221435546875, -0.164581298828125, -0.1583404541015625, -0.152099609375, -0.1458587646484375, -0.139617919921875, -0.1333770751953125, -0.12713623046875, -0.1208953857421875, -0.114654541015625, -0.1084136962890625, -0.1021728515625, -0.0959320068359375, -0.089691162109375, -0.0834503173828125, -0.07720947265625, -0.0709686279296875, -0.064727783203125, -0.0584869384765625, -0.05224609375, -0.0460052490234375, -0.039764404296875, -0.0335235595703125, -0.02728271484375, -0.0210418701171875, -0.014801025390625, -0.0085601806640625, -0.0023193359375, 0.0039215087890625, 0.010162353515625, 0.0164031982421875, 0.02264404296875, 0.0288848876953125, 0.035125732421875, 0.0413665771484375, 0.047607421875, 0.0538482666015625, 0.060089111328125, 0.0663299560546875, 0.07257080078125, 0.0788116455078125, 0.085052490234375, 0.0912933349609375, 0.0975341796875, 0.1037750244140625, 0.110015869140625, 0.1162567138671875, 0.12249755859375, 0.1287384033203125, 0.134979248046875, 0.1412200927734375, 0.1474609375, 0.1537017822265625, 0.159942626953125, 0.1661834716796875, 0.17242431640625, 0.1786651611328125, 0.184906005859375, 0.1911468505859375, 0.1973876953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 7.0, 5.0, 4.0, 3.0, 5.0, 13.0, 12.0, 6.0, 20.0, 15.0, 24.0, 33.0, 38.0, 53.0, 77.0, 114.0, 89.0, 113.0, 84.0, 64.0, 52.0, 36.0, 32.0, 26.0, 21.0, 10.0, 9.0, 6.0, 9.0, 5.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-05, -2.5212764739990234e-05, -2.4199485778808594e-05, -2.3186206817626953e-05, -2.2172927856445312e-05, -2.1159648895263672e-05, -2.014636993408203e-05, -1.913309097290039e-05, -1.811981201171875e-05, -1.710653305053711e-05, -1.609325408935547e-05, -1.5079975128173828e-05, -1.4066696166992188e-05, -1.3053417205810547e-05, -1.2040138244628906e-05, -1.1026859283447266e-05, -1.0013580322265625e-05, -9.000301361083984e-06, -7.987022399902344e-06, -6.973743438720703e-06, -5.9604644775390625e-06, -4.947185516357422e-06, -3.933906555175781e-06, -2.9206275939941406e-06, -1.9073486328125e-06, -8.940696716308594e-07, 1.1920928955078125e-07, 1.1324882507324219e-06, 2.1457672119140625e-06, 3.159046173095703e-06, 4.172325134277344e-06, 5.185604095458984e-06, 6.198883056640625e-06, 7.212162017822266e-06, 8.225440979003906e-06, 9.238719940185547e-06, 1.0251998901367188e-05, 1.1265277862548828e-05, 1.2278556823730469e-05, 1.329183578491211e-05, 1.430511474609375e-05, 1.531839370727539e-05, 1.633167266845703e-05, 1.7344951629638672e-05, 1.8358230590820312e-05, 1.9371509552001953e-05, 2.0384788513183594e-05, 2.1398067474365234e-05, 2.2411346435546875e-05, 2.3424625396728516e-05, 2.4437904357910156e-05, 2.5451183319091797e-05, 2.6464462280273438e-05, 2.7477741241455078e-05, 2.849102020263672e-05, 2.950429916381836e-05, 3.0517578125e-05, 3.153085708618164e-05, 3.254413604736328e-05, 3.355741500854492e-05, 3.457069396972656e-05, 3.55839729309082e-05, 3.6597251892089844e-05, 3.7610530853271484e-05, 3.8623809814453125e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 18.0, 23.0, 39.0, 52.0, 76.0, 104.0, 180.0, 323.0, 563.0, 1085.0, 2651.0, 8141.0, 37982.0, 322370.0, 618681.0, 41961.0, 8900.0, 2803.0, 1122.0, 563.0, 326.0, 189.0, 116.0, 77.0, 34.0, 35.0, 29.0, 18.0, 15.0, 8.0, 7.0, 8.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08905029296875, -0.08643341064453125, -0.0838165283203125, -0.08119964599609375, -0.078582763671875, -0.07596588134765625, -0.0733489990234375, -0.07073211669921875, -0.068115234375, -0.06549835205078125, -0.0628814697265625, -0.06026458740234375, -0.057647705078125, -0.05503082275390625, -0.0524139404296875, -0.04979705810546875, -0.04718017578125, -0.04456329345703125, -0.0419464111328125, -0.03932952880859375, -0.036712646484375, -0.03409576416015625, -0.0314788818359375, -0.02886199951171875, -0.0262451171875, -0.02362823486328125, -0.0210113525390625, -0.01839447021484375, -0.015777587890625, -0.01316070556640625, -0.0105438232421875, -0.00792694091796875, -0.00531005859375, -0.00269317626953125, -7.62939453125e-05, 0.00254058837890625, 0.005157470703125, 0.00777435302734375, 0.0103912353515625, 0.01300811767578125, 0.015625, 0.01824188232421875, 0.0208587646484375, 0.02347564697265625, 0.026092529296875, 0.02870941162109375, 0.0313262939453125, 0.03394317626953125, 0.03656005859375, 0.03917694091796875, 0.0417938232421875, 0.04441070556640625, 0.047027587890625, 0.04964447021484375, 0.0522613525390625, 0.05487823486328125, 0.0574951171875, 0.06011199951171875, 0.0627288818359375, 0.06534576416015625, 0.067962646484375, 0.07057952880859375, 0.0731964111328125, 0.07581329345703125, 0.07843017578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 7.0, 6.0, 12.0, 11.0, 18.0, 21.0, 29.0, 46.0, 40.0, 72.0, 68.0, 98.0, 125.0, 99.0, 82.0, 61.0, 42.0, 31.0, 22.0, 28.0, 17.0, 15.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.089111328125, -0.08651161193847656, -0.08391189575195312, -0.08131217956542969, -0.07871246337890625, -0.07611274719238281, -0.07351303100585938, -0.07091331481933594, -0.0683135986328125, -0.06571388244628906, -0.06311416625976562, -0.06051445007324219, -0.05791473388671875, -0.05531501770019531, -0.052715301513671875, -0.05011558532714844, -0.047515869140625, -0.04491615295410156, -0.042316436767578125, -0.03971672058105469, -0.03711700439453125, -0.03451728820800781, -0.031917572021484375, -0.029317855834960938, -0.0267181396484375, -0.024118423461914062, -0.021518707275390625, -0.018918991088867188, -0.01631927490234375, -0.013719558715820312, -0.011119842529296875, -0.008520126342773438, -0.00592041015625, -0.0033206939697265625, -0.000720977783203125, 0.0018787384033203125, 0.00447845458984375, 0.0070781707763671875, 0.009677886962890625, 0.012277603149414062, 0.0148773193359375, 0.017477035522460938, 0.020076751708984375, 0.022676467895507812, 0.02527618408203125, 0.027875900268554688, 0.030475616455078125, 0.03307533264160156, 0.035675048828125, 0.03827476501464844, 0.040874481201171875, 0.04347419738769531, 0.04607391357421875, 0.04867362976074219, 0.051273345947265625, 0.05387306213378906, 0.0564727783203125, 0.05907249450683594, 0.061672210693359375, 0.06427192687988281, 0.06687164306640625, 0.06947135925292969, 0.07207107543945312, 0.07467079162597656, 0.0772705078125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 7.0, 11.0, 49.0, 244.0, 492.0, 132.0, 34.0, 18.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8222055435180664, -3.676370143890381, -3.5305347442626953, -3.3846993446350098, -3.238863945007324, -3.0930285453796387, -2.947193145751953, -2.8013577461242676, -2.655522346496582, -2.5096869468688965, -2.363851547241211, -2.2180161476135254, -2.07218074798584, -1.9263453483581543, -1.7805100679397583, -1.6346746683120728, -1.4888393878936768, -1.3430039882659912, -1.1971685886383057, -1.0513331890106201, -0.9054978489875793, -0.7596624493598938, -0.613827109336853, -0.4679917097091675, -0.32215631008148193, -0.17632092535495758, -0.030485540628433228, 0.11534982919692993, 0.2611852288246155, 0.407020628452301, 0.5528559684753418, 0.6986913681030273, 0.8445267677307129, 0.9903621673583984, 1.136197566986084, 1.2820329666137695, 1.427868366241455, 1.5737037658691406, 1.7195390462875366, 1.8653744459152222, 2.0112099647521973, 2.157045364379883, 2.3028807640075684, 2.448716163635254, 2.5945515632629395, 2.740386962890625, 2.8862223625183105, 3.032057762145996, 3.1778929233551025, 3.323728322982788, 3.4695637226104736, 3.615399122238159, 3.7612345218658447, 3.9070699214935303, 4.052905082702637, 4.198740482330322, 4.344575881958008, 4.490411281585693, 4.636246681213379, 4.7820820808410645, 4.92791748046875, 5.0737528800964355, 5.219588279724121, 5.365423679351807, 5.511259078979492]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 5.0, 4.0, 5.0, 5.0, 8.0, 14.0, 7.0, 7.0, 13.0, 14.0, 16.0, 20.0, 15.0, 17.0, 34.0, 24.0, 29.0, 41.0, 47.0, 69.0, 84.0, 110.0, 70.0, 58.0, 36.0, 28.0, 29.0, 33.0, 31.0, 20.0, 15.0, 20.0, 11.0, 14.0, 9.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7603014707565308, -1.7141252756118774, -1.6679491996765137, -1.6217730045318604, -1.5755969285964966, -1.5294207334518433, -1.4832446575164795, -1.4370684623718262, -1.3908922672271729, -1.3447160720825195, -1.2985399961471558, -1.2523638010025024, -1.2061877250671387, -1.1600115299224854, -1.113835334777832, -1.0676592588424683, -1.0214831829071045, -0.975307047367096, -0.9291309118270874, -0.8829547166824341, -0.8367786407470703, -0.790602445602417, -0.7444263100624084, -0.6982501745223999, -0.6520740389823914, -0.6058979034423828, -0.5597217679023743, -0.5135456323623657, -0.4673694670200348, -0.42119333148002625, -0.3750171661376953, -0.32884103059768677, -0.2826648950576782, -0.23648875951766968, -0.19031260907649994, -0.1441364586353302, -0.09796032309532166, -0.05178418755531311, -0.005608022212982178, 0.04056811332702637, 0.08674424886703491, 0.13292038440704346, 0.1790965348482132, 0.22527268528938293, 0.2714488208293915, 0.3176249563694, 0.36380112171173096, 0.4099772572517395, 0.45615339279174805, 0.5023295283317566, 0.5485056638717651, 0.5946818590164185, 0.6408579349517822, 0.6870341300964355, 0.7332102656364441, 0.7793864011764526, 0.8255625367164612, 0.8717386722564697, 0.9179148077964783, 0.9640909433364868, 1.0102671384811401, 1.056443214416504, 1.1026194095611572, 1.1487956047058105, 1.1949716806411743]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 14.0, 13.0, 20.0, 24.0, 40.0, 37.0, 72.0, 111.0, 181.0, 268.0, 491.0, 826.0, 1431.0, 2854.0, 6257.0, 16180.0, 57424.0, 351118.0, 2164938.0, 1347141.0, 186568.0, 36590.0, 11748.0, 4723.0, 2267.0, 1230.0, 658.0, 370.0, 246.0, 146.0, 96.0, 55.0, 35.0, 33.0, 21.0, 18.0, 8.0, 7.0, 4.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.253173828125, -0.24590682983398438, -0.23863983154296875, -0.23137283325195312, -0.2241058349609375, -0.21683883666992188, -0.20957183837890625, -0.20230484008789062, -0.195037841796875, -0.18777084350585938, -0.18050384521484375, -0.17323684692382812, -0.1659698486328125, -0.15870285034179688, -0.15143585205078125, -0.14416885375976562, -0.13690185546875, -0.12963485717773438, -0.12236785888671875, -0.11510086059570312, -0.1078338623046875, -0.10056686401367188, -0.09329986572265625, -0.08603286743164062, -0.078765869140625, -0.07149887084960938, -0.06423187255859375, -0.056964874267578125, -0.0496978759765625, -0.042430877685546875, -0.03516387939453125, -0.027896881103515625, -0.0206298828125, -0.013362884521484375, -0.00609588623046875, 0.001171112060546875, 0.0084381103515625, 0.015705108642578125, 0.02297210693359375, 0.030239105224609375, 0.037506103515625, 0.044773101806640625, 0.05204010009765625, 0.059307098388671875, 0.0665740966796875, 0.07384109497070312, 0.08110809326171875, 0.08837509155273438, 0.09564208984375, 0.10290908813476562, 0.11017608642578125, 0.11744308471679688, 0.1247100830078125, 0.13197708129882812, 0.13924407958984375, 0.14651107788085938, 0.153778076171875, 0.16104507446289062, 0.16831207275390625, 0.17557907104492188, 0.1828460693359375, 0.19011306762695312, 0.19738006591796875, 0.20464706420898438, 0.2119140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 12.0, 8.0, 12.0, 7.0, 11.0, 17.0, 26.0, 19.0, 25.0, 32.0, 29.0, 37.0, 31.0, 40.0, 57.0, 53.0, 46.0, 47.0, 44.0, 58.0, 52.0, 34.0, 51.0, 32.0, 33.0, 32.0, 34.0, 20.0, 26.0, 13.0, 13.0, 5.0, 7.0, 17.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12127685546875, -0.11776256561279297, -0.11424827575683594, -0.1107339859008789, -0.10721969604492188, -0.10370540618896484, -0.10019111633300781, -0.09667682647705078, -0.09316253662109375, -0.08964824676513672, -0.08613395690917969, -0.08261966705322266, -0.07910537719726562, -0.0755910873413086, -0.07207679748535156, -0.06856250762939453, -0.0650482177734375, -0.06153392791748047, -0.05801963806152344, -0.054505348205566406, -0.050991058349609375, -0.047476768493652344, -0.04396247863769531, -0.04044818878173828, -0.03693389892578125, -0.03341960906982422, -0.029905319213867188, -0.026391029357910156, -0.022876739501953125, -0.019362449645996094, -0.015848159790039062, -0.012333869934082031, -0.008819580078125, -0.005305290222167969, -0.0017910003662109375, 0.0017232894897460938, 0.005237579345703125, 0.008751869201660156, 0.012266159057617188, 0.01578044891357422, 0.01929473876953125, 0.02280902862548828, 0.026323318481445312, 0.029837608337402344, 0.033351898193359375, 0.036866188049316406, 0.04038047790527344, 0.04389476776123047, 0.0474090576171875, 0.05092334747314453, 0.05443763732910156, 0.057951927185058594, 0.061466217041015625, 0.06498050689697266, 0.06849479675292969, 0.07200908660888672, 0.07552337646484375, 0.07903766632080078, 0.08255195617675781, 0.08606624603271484, 0.08958053588867188, 0.0930948257446289, 0.09660911560058594, 0.10012340545654297, 0.1036376953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 12.0, 24.0, 39.0, 54.0, 91.0, 168.0, 335.0, 882.0, 3064.0, 44994.0, 4101040.0, 38771.0, 3212.0, 868.0, 361.0, 153.0, 89.0, 40.0, 29.0, 18.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33984375, -1.3059005737304688, -1.2719573974609375, -1.2380142211914062, -1.204071044921875, -1.1701278686523438, -1.1361846923828125, -1.1022415161132812, -1.06829833984375, -1.0343551635742188, -1.0004119873046875, -0.9664688110351562, -0.932525634765625, -0.8985824584960938, -0.8646392822265625, -0.8306961059570312, -0.7967529296875, -0.7628097534179688, -0.7288665771484375, -0.6949234008789062, -0.660980224609375, -0.6270370483398438, -0.5930938720703125, -0.5591506958007812, -0.52520751953125, -0.49126434326171875, -0.4573211669921875, -0.42337799072265625, -0.389434814453125, -0.35549163818359375, -0.3215484619140625, -0.28760528564453125, -0.253662109375, -0.21971893310546875, -0.1857757568359375, -0.15183258056640625, -0.117889404296875, -0.08394622802734375, -0.0500030517578125, -0.01605987548828125, 0.01788330078125, 0.05182647705078125, 0.0857696533203125, 0.11971282958984375, 0.153656005859375, 0.18759918212890625, 0.2215423583984375, 0.25548553466796875, 0.2894287109375, 0.32337188720703125, 0.3573150634765625, 0.39125823974609375, 0.425201416015625, 0.45914459228515625, 0.4930877685546875, 0.5270309448242188, 0.56097412109375, 0.5949172973632812, 0.6288604736328125, 0.6628036499023438, 0.696746826171875, 0.7306900024414062, 0.7646331787109375, 0.7985763549804688, 0.83251953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 10.0, 24.0, 22.0, 42.0, 67.0, 117.0, 222.0, 367.0, 735.0, 929.0, 604.0, 328.0, 220.0, 143.0, 82.0, 50.0, 41.0, 20.0, 16.0, 13.0, 10.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3307380676269531, -0.31357574462890625, -0.2964134216308594, -0.2792510986328125, -0.2620887756347656, -0.24492645263671875, -0.22776412963867188, -0.210601806640625, -0.19343948364257812, -0.17627716064453125, -0.15911483764648438, -0.1419525146484375, -0.12479019165039062, -0.10762786865234375, -0.09046554565429688, -0.07330322265625, -0.056140899658203125, -0.03897857666015625, -0.021816253662109375, -0.0046539306640625, 0.012508392333984375, 0.02967071533203125, 0.046833038330078125, 0.063995361328125, 0.08115768432617188, 0.09832000732421875, 0.11548233032226562, 0.1326446533203125, 0.14980697631835938, 0.16696929931640625, 0.18413162231445312, 0.2012939453125, 0.21845626831054688, 0.23561859130859375, 0.2527809143066406, 0.2699432373046875, 0.2871055603027344, 0.30426788330078125, 0.3214302062988281, 0.338592529296875, 0.3557548522949219, 0.37291717529296875, 0.3900794982910156, 0.4072418212890625, 0.4244041442871094, 0.44156646728515625, 0.4587287902832031, 0.47589111328125, 0.4930534362792969, 0.5102157592773438, 0.5273780822753906, 0.5445404052734375, 0.5617027282714844, 0.5788650512695312, 0.5960273742675781, 0.613189697265625, 0.6303520202636719, 0.6475143432617188, 0.6646766662597656, 0.6818389892578125, 0.6990013122558594, 0.7161636352539062, 0.7333259582519531, 0.75048828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 9.0, 14.0, 37.0, 75.0, 158.0, 242.0, 197.0, 118.0, 65.0, 25.0, 23.0, 10.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.147567272186279, -3.963603973388672, -3.7796406745910645, -3.595677137374878, -3.4117138385772705, -3.227750539779663, -3.0437870025634766, -2.859823703765869, -2.6758604049682617, -2.4918971061706543, -2.307933807373047, -2.1239702701568604, -1.940006971359253, -1.7560436725616455, -1.5720802545547485, -1.3881168365478516, -1.2041535377502441, -1.0201902389526367, -0.8362268209457397, -0.6522634625434875, -0.46830010414123535, -0.28433674573898315, -0.10037338733673096, 0.08359003067016602, 0.26755332946777344, 0.45151668787002563, 0.6354800462722778, 0.81944340467453, 1.0034067630767822, 1.1873700618743896, 1.3713334798812866, 1.5552968978881836, 1.739260196685791, 1.9232234954833984, 2.107186794281006, 2.2911503314971924, 2.4751136302948, 2.6590769290924072, 2.8430404663085938, 3.027003765106201, 3.2109670639038086, 3.394930362701416, 3.5788936614990234, 3.76285719871521, 3.9468204975128174, 4.130784034729004, 4.314747333526611, 4.498710632324219, 4.682673931121826, 4.866637229919434, 5.050600528717041, 5.234563827514648, 5.418527603149414, 5.6024909019470215, 5.786454200744629, 5.970417499542236, 6.154380798339844, 6.338344097137451, 6.522307395935059, 6.706270694732666, 6.890233993530273, 7.074197769165039, 7.2581610679626465, 7.442124366760254, 7.626087665557861]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 9.0, 7.0, 18.0, 28.0, 26.0, 39.0, 44.0, 38.0, 50.0, 44.0, 65.0, 83.0, 89.0, 72.0, 59.0, 52.0, 56.0, 36.0, 44.0, 29.0, 22.0, 17.0, 14.0, 12.0, 9.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3122994899749756, -3.215684175491333, -3.1190686225891113, -3.0224533081054688, -2.925837993621826, -2.8292226791381836, -2.732607364654541, -2.6359918117523193, -2.5393764972686768, -2.442761182785034, -2.3461456298828125, -2.24953031539917, -2.1529150009155273, -2.0562996864318848, -1.9596842527389526, -1.8630688190460205, -1.766453504562378, -1.6698381900787354, -1.5732227563858032, -1.476607322692871, -1.3799920082092285, -1.283376693725586, -1.1867612600326538, -1.0901458263397217, -0.9935305118560791, -0.8969151377677917, -0.8002997636795044, -0.703684389591217, -0.6070690155029297, -0.5104536414146423, -0.413838267326355, -0.3172228932380676, -0.22060728073120117, -0.12399190664291382, -0.027376532554626465, 0.06923884153366089, 0.16585421562194824, 0.2624695897102356, 0.35908496379852295, 0.4557003378868103, 0.5523157119750977, 0.648931086063385, 0.7455464601516724, 0.8421618342399597, 0.9387772083282471, 1.0353925228118896, 1.1320079565048218, 1.228623390197754, 1.3252387046813965, 1.421854019165039, 1.5184694528579712, 1.6150848865509033, 1.711700201034546, 1.8083155155181885, 1.9049309492111206, 2.0015463829040527, 2.0981616973876953, 2.194777011871338, 2.2913923263549805, 2.388007879257202, 2.4846231937408447, 2.5812385082244873, 2.677854061126709, 2.7744693756103516, 2.871084690093994]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 12.0, 10.0, 17.0, 19.0, 30.0, 40.0, 62.0, 117.0, 178.0, 255.0, 457.0, 815.0, 1469.0, 3163.0, 7478.0, 20018.0, 73500.0, 533972.0, 324267.0, 54527.0, 16161.0, 6187.0, 2669.0, 1368.0, 701.0, 403.0, 220.0, 144.0, 102.0, 55.0, 35.0, 30.0, 15.0, 11.0, 14.0, 10.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2059326171875, -0.19967269897460938, -0.19341278076171875, -0.18715286254882812, -0.1808929443359375, -0.17463302612304688, -0.16837310791015625, -0.16211318969726562, -0.155853271484375, -0.14959335327148438, -0.14333343505859375, -0.13707351684570312, -0.1308135986328125, -0.12455368041992188, -0.11829376220703125, -0.11203384399414062, -0.10577392578125, -0.09951400756835938, -0.09325408935546875, -0.08699417114257812, -0.0807342529296875, -0.07447433471679688, -0.06821441650390625, -0.061954498291015625, -0.055694580078125, -0.049434661865234375, -0.04317474365234375, -0.036914825439453125, -0.0306549072265625, -0.024394989013671875, -0.01813507080078125, -0.011875152587890625, -0.005615234375, 0.000644683837890625, 0.00690460205078125, 0.013164520263671875, 0.0194244384765625, 0.025684356689453125, 0.03194427490234375, 0.038204193115234375, 0.044464111328125, 0.050724029541015625, 0.05698394775390625, 0.06324386596679688, 0.0695037841796875, 0.07576370239257812, 0.08202362060546875, 0.08828353881835938, 0.09454345703125, 0.10080337524414062, 0.10706329345703125, 0.11332321166992188, 0.1195831298828125, 0.12584304809570312, 0.13210296630859375, 0.13836288452148438, 0.144622802734375, 0.15088272094726562, 0.15714263916015625, 0.16340255737304688, 0.1696624755859375, 0.17592239379882812, 0.18218231201171875, 0.18844223022460938, 0.1947021484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 1.0, 5.0, 7.0, 9.0, 13.0, 13.0, 15.0, 37.0, 35.0, 44.0, 51.0, 38.0, 61.0, 66.0, 70.0, 55.0, 82.0, 64.0, 57.0, 50.0, 49.0, 45.0, 34.0, 19.0, 36.0, 16.0, 4.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2149658203125, -0.20870018005371094, -0.20243453979492188, -0.1961688995361328, -0.18990325927734375, -0.1836376190185547, -0.17737197875976562, -0.17110633850097656, -0.1648406982421875, -0.15857505798339844, -0.15230941772460938, -0.1460437774658203, -0.13977813720703125, -0.1335124969482422, -0.12724685668945312, -0.12098121643066406, -0.114715576171875, -0.10844993591308594, -0.10218429565429688, -0.09591865539550781, -0.08965301513671875, -0.08338737487792969, -0.07712173461914062, -0.07085609436035156, -0.0645904541015625, -0.05832481384277344, -0.052059173583984375, -0.04579353332519531, -0.03952789306640625, -0.03326225280761719, -0.026996612548828125, -0.020730972290039062, -0.01446533203125, -0.008199691772460938, -0.001934051513671875, 0.0043315887451171875, 0.01059722900390625, 0.016862869262695312, 0.023128509521484375, 0.029394149780273438, 0.0356597900390625, 0.04192543029785156, 0.048191070556640625, 0.05445671081542969, 0.06072235107421875, 0.06698799133300781, 0.07325363159179688, 0.07951927185058594, 0.085784912109375, 0.09205055236816406, 0.09831619262695312, 0.10458183288574219, 0.11084747314453125, 0.11711311340332031, 0.12337875366210938, 0.12964439392089844, 0.1359100341796875, 0.14217567443847656, 0.14844131469726562, 0.1547069549560547, 0.16097259521484375, 0.1672382354736328, 0.17350387573242188, 0.17976951599121094, 0.18603515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 8.0, 14.0, 28.0, 27.0, 50.0, 78.0, 97.0, 134.0, 212.0, 370.0, 698.0, 1545.0, 5510.0, 38457.0, 917863.0, 71573.0, 7878.0, 2014.0, 810.0, 401.0, 218.0, 138.0, 97.0, 77.0, 59.0, 38.0, 28.0, 25.0, 15.0, 10.0, 11.0, 9.0, 10.0, 6.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33642578125, -0.32611083984375, -0.3157958984375, -0.30548095703125, -0.295166015625, -0.28485107421875, -0.2745361328125, -0.26422119140625, -0.25390625, -0.24359130859375, -0.2332763671875, -0.22296142578125, -0.212646484375, -0.20233154296875, -0.1920166015625, -0.18170166015625, -0.17138671875, -0.16107177734375, -0.1507568359375, -0.14044189453125, -0.130126953125, -0.11981201171875, -0.1094970703125, -0.09918212890625, -0.0888671875, -0.07855224609375, -0.0682373046875, -0.05792236328125, -0.047607421875, -0.03729248046875, -0.0269775390625, -0.01666259765625, -0.00634765625, 0.00396728515625, 0.0142822265625, 0.02459716796875, 0.034912109375, 0.04522705078125, 0.0555419921875, 0.06585693359375, 0.076171875, 0.08648681640625, 0.0968017578125, 0.10711669921875, 0.117431640625, 0.12774658203125, 0.1380615234375, 0.14837646484375, 0.15869140625, 0.16900634765625, 0.1793212890625, 0.18963623046875, 0.199951171875, 0.21026611328125, 0.2205810546875, 0.23089599609375, 0.2412109375, 0.25152587890625, 0.2618408203125, 0.27215576171875, 0.282470703125, 0.29278564453125, 0.3031005859375, 0.31341552734375, 0.32373046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 8.0, 7.0, 15.0, 10.0, 17.0, 17.0, 20.0, 23.0, 34.0, 38.0, 37.0, 69.0, 65.0, 76.0, 84.0, 73.0, 60.0, 61.0, 41.0, 39.0, 35.0, 28.0, 26.0, 24.0, 16.0, 19.0, 9.0, 9.0, 7.0, 1.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5874176025390625, -0.566925048828125, -0.5464324951171875, -0.52593994140625, -0.5054473876953125, -0.484954833984375, -0.4644622802734375, -0.4439697265625, -0.4234771728515625, -0.402984619140625, -0.3824920654296875, -0.36199951171875, -0.3415069580078125, -0.321014404296875, -0.3005218505859375, -0.280029296875, -0.2595367431640625, -0.239044189453125, -0.2185516357421875, -0.19805908203125, -0.1775665283203125, -0.157073974609375, -0.1365814208984375, -0.1160888671875, -0.0955963134765625, -0.075103759765625, -0.0546112060546875, -0.03411865234375, -0.0136260986328125, 0.006866455078125, 0.0273590087890625, 0.0478515625, 0.0683441162109375, 0.088836669921875, 0.1093292236328125, 0.12982177734375, 0.1503143310546875, 0.170806884765625, 0.1912994384765625, 0.2117919921875, 0.2322845458984375, 0.252777099609375, 0.2732696533203125, 0.29376220703125, 0.3142547607421875, 0.334747314453125, 0.3552398681640625, 0.375732421875, 0.3962249755859375, 0.416717529296875, 0.4372100830078125, 0.45770263671875, 0.4781951904296875, 0.498687744140625, 0.5191802978515625, 0.5396728515625, 0.5601654052734375, 0.580657958984375, 0.6011505126953125, 0.62164306640625, 0.6421356201171875, 0.662628173828125, 0.6831207275390625, 0.70361328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 12.0, 17.0, 31.0, 31.0, 50.0, 88.0, 164.0, 260.0, 515.0, 1145.0, 2855.0, 9323.0, 53149.0, 892481.0, 71679.0, 11079.0, 3121.0, 1232.0, 537.0, 309.0, 147.0, 92.0, 58.0, 36.0, 33.0, 26.0, 18.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0518798828125, -0.05023622512817383, -0.048592567443847656, -0.046948909759521484, -0.04530525207519531, -0.04366159439086914, -0.04201793670654297, -0.0403742790222168, -0.038730621337890625, -0.03708696365356445, -0.03544330596923828, -0.03379964828491211, -0.03215599060058594, -0.030512332916259766, -0.028868675231933594, -0.027225017547607422, -0.02558135986328125, -0.023937702178955078, -0.022294044494628906, -0.020650386810302734, -0.019006729125976562, -0.01736307144165039, -0.01571941375732422, -0.014075756072998047, -0.012432098388671875, -0.010788440704345703, -0.009144783020019531, -0.007501125335693359, -0.0058574676513671875, -0.004213809967041016, -0.0025701522827148438, -0.0009264945983886719, 0.0007171630859375, 0.002360820770263672, 0.004004478454589844, 0.005648136138916016, 0.0072917938232421875, 0.00893545150756836, 0.010579109191894531, 0.012222766876220703, 0.013866424560546875, 0.015510082244873047, 0.01715373992919922, 0.01879739761352539, 0.020441055297851562, 0.022084712982177734, 0.023728370666503906, 0.025372028350830078, 0.02701568603515625, 0.028659343719482422, 0.030303001403808594, 0.031946659088134766, 0.03359031677246094, 0.03523397445678711, 0.03687763214111328, 0.03852128982543945, 0.040164947509765625, 0.0418086051940918, 0.04345226287841797, 0.04509592056274414, 0.04673957824707031, 0.048383235931396484, 0.050026893615722656, 0.05167055130004883, 0.053314208984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 7.0, 8.0, 19.0, 19.0, 23.0, 19.0, 30.0, 26.0, 34.0, 55.0, 62.0, 74.0, 83.0, 68.0, 71.0, 85.0, 56.0, 43.0, 35.0, 31.0, 17.0, 20.0, 9.0, 17.0, 14.0, 14.0, 11.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.409385681152344e-05, -3.31047922372818e-05, -3.211572766304016e-05, -3.112666308879852e-05, -3.0137598514556885e-05, -2.9148533940315247e-05, -2.815946936607361e-05, -2.717040479183197e-05, -2.6181340217590332e-05, -2.5192275643348694e-05, -2.4203211069107056e-05, -2.3214146494865417e-05, -2.222508192062378e-05, -2.123601734638214e-05, -2.0246952772140503e-05, -1.9257888197898865e-05, -1.8268823623657227e-05, -1.727975904941559e-05, -1.629069447517395e-05, -1.5301629900932312e-05, -1.4312565326690674e-05, -1.3323500752449036e-05, -1.2334436178207397e-05, -1.134537160396576e-05, -1.0356307029724121e-05, -9.367242455482483e-06, -8.378177881240845e-06, -7.3891133069992065e-06, -6.400048732757568e-06, -5.41098415851593e-06, -4.421919584274292e-06, -3.432855010032654e-06, -2.4437904357910156e-06, -1.4547258615493774e-06, -4.6566128730773926e-07, 5.234032869338989e-07, 1.5124678611755371e-06, 2.5015324354171753e-06, 3.4905970096588135e-06, 4.479661583900452e-06, 5.46872615814209e-06, 6.457790732383728e-06, 7.446855306625366e-06, 8.435919880867004e-06, 9.424984455108643e-06, 1.041404902935028e-05, 1.1403113603591919e-05, 1.2392178177833557e-05, 1.3381242752075195e-05, 1.4370307326316833e-05, 1.535937190055847e-05, 1.634843647480011e-05, 1.7337501049041748e-05, 1.8326565623283386e-05, 1.9315630197525024e-05, 2.0304694771766663e-05, 2.12937593460083e-05, 2.228282392024994e-05, 2.3271888494491577e-05, 2.4260953068733215e-05, 2.5250017642974854e-05, 2.6239082217216492e-05, 2.722814679145813e-05, 2.8217211365699768e-05, 2.9206275939941406e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 6.0, 12.0, 18.0, 23.0, 51.0, 67.0, 109.0, 170.0, 291.0, 523.0, 959.0, 1820.0, 4202.0, 10176.0, 32262.0, 184429.0, 743561.0, 46449.0, 13327.0, 5065.0, 2376.0, 1152.0, 591.0, 334.0, 200.0, 112.0, 79.0, 47.0, 36.0, 23.0, 13.0, 18.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 5.0], "bins": [-0.04205322265625, -0.04088926315307617, -0.039725303649902344, -0.038561344146728516, -0.03739738464355469, -0.03623342514038086, -0.03506946563720703, -0.0339055061340332, -0.032741546630859375, -0.03157758712768555, -0.03041362762451172, -0.02924966812133789, -0.028085708618164062, -0.026921749114990234, -0.025757789611816406, -0.024593830108642578, -0.02342987060546875, -0.022265911102294922, -0.021101951599121094, -0.019937992095947266, -0.018774032592773438, -0.01761007308959961, -0.01644611358642578, -0.015282154083251953, -0.014118194580078125, -0.012954235076904297, -0.011790275573730469, -0.01062631607055664, -0.009462356567382812, -0.008298397064208984, -0.007134437561035156, -0.005970478057861328, -0.0048065185546875, -0.003642559051513672, -0.0024785995483398438, -0.0013146400451660156, -0.0001506805419921875, 0.0010132789611816406, 0.0021772384643554688, 0.003341197967529297, 0.004505157470703125, 0.005669116973876953, 0.006833076477050781, 0.00799703598022461, 0.009160995483398438, 0.010324954986572266, 0.011488914489746094, 0.012652873992919922, 0.01381683349609375, 0.014980792999267578, 0.016144752502441406, 0.017308712005615234, 0.018472671508789062, 0.01963663101196289, 0.02080059051513672, 0.021964550018310547, 0.023128509521484375, 0.024292469024658203, 0.02545642852783203, 0.02662038803100586, 0.027784347534179688, 0.028948307037353516, 0.030112266540527344, 0.03127622604370117, 0.032440185546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 10.0, 25.0, 11.0, 19.0, 36.0, 40.0, 54.0, 75.0, 95.0, 114.0, 117.0, 111.0, 60.0, 36.0, 29.0, 22.0, 22.0, 12.0, 13.0, 8.0, 17.0, 7.0, 5.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05010986328125, -0.04842042922973633, -0.046730995178222656, -0.045041561126708984, -0.04335212707519531, -0.04166269302368164, -0.03997325897216797, -0.0382838249206543, -0.036594390869140625, -0.03490495681762695, -0.03321552276611328, -0.03152608871459961, -0.029836654663085938, -0.028147220611572266, -0.026457786560058594, -0.024768352508544922, -0.02307891845703125, -0.021389484405517578, -0.019700050354003906, -0.018010616302490234, -0.016321182250976562, -0.01463174819946289, -0.012942314147949219, -0.011252880096435547, -0.009563446044921875, -0.007874011993408203, -0.006184577941894531, -0.004495143890380859, -0.0028057098388671875, -0.0011162757873535156, 0.0005731582641601562, 0.002262592315673828, 0.0039520263671875, 0.005641460418701172, 0.007330894470214844, 0.009020328521728516, 0.010709762573242188, 0.01239919662475586, 0.014088630676269531, 0.015778064727783203, 0.017467498779296875, 0.019156932830810547, 0.02084636688232422, 0.02253580093383789, 0.024225234985351562, 0.025914669036865234, 0.027604103088378906, 0.029293537139892578, 0.03098297119140625, 0.03267240524291992, 0.034361839294433594, 0.036051273345947266, 0.03774070739746094, 0.03943014144897461, 0.04111957550048828, 0.04280900955200195, 0.044498443603515625, 0.0461878776550293, 0.04787731170654297, 0.04956674575805664, 0.05125617980957031, 0.052945613861083984, 0.054635047912597656, 0.05632448196411133, 0.058013916015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 16.0, 15.0, 35.0, 70.0, 325.0, 375.0, 85.0, 39.0, 19.0, 12.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.643389940261841, -3.5394234657287598, -3.435457229614258, -3.3314907550811768, -3.2275242805480957, -3.1235578060150146, -3.0195913314819336, -2.9156250953674316, -2.8116586208343506, -2.7076921463012695, -2.6037259101867676, -2.4997594356536865, -2.3957929611206055, -2.2918264865875244, -2.1878600120544434, -2.0838937759399414, -1.9799273014068604, -1.8759608268737793, -1.7719944715499878, -1.6680281162261963, -1.5640616416931152, -1.4600951671600342, -1.3561288118362427, -1.2521624565124512, -1.1481959819793701, -1.044229507446289, -0.9402631521224976, -0.8362967371940613, -0.732330322265625, -0.6283639073371887, -0.5243974924087524, -0.42043107748031616, -0.3164644241333008, -0.2124980092048645, -0.10853159427642822, -0.004565179347991943, 0.09940123558044434, 0.20336765050888062, 0.3073340654373169, 0.4113004803657532, 0.5152668952941895, 0.6192333102226257, 0.723199725151062, 0.8271661400794983, 0.9311325550079346, 1.0350990295410156, 1.1390653848648071, 1.2430317401885986, 1.3469982147216797, 1.4509646892547607, 1.5549310445785522, 1.6588973999023438, 1.7628638744354248, 1.8668303489685059, 1.9707967042922974, 2.074763059616089, 2.17872953414917, 2.282696008682251, 2.386662483215332, 2.490628719329834, 2.594595193862915, 2.698561668395996, 2.802527904510498, 2.906494379043579, 3.01046085357666]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 5.0, 14.0, 15.0, 16.0, 25.0, 21.0, 24.0, 39.0, 48.0, 115.0, 189.0, 172.0, 104.0, 33.0, 44.0, 23.0, 24.0, 26.0, 6.0, 9.0, 7.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.523043632507324, -2.44126558303833, -2.359487533569336, -2.277709722518921, -2.1959316730499268, -2.1141536235809326, -2.0323755741119385, -1.9505975246429443, -1.8688195943832397, -1.7870415449142456, -1.705263614654541, -1.6234855651855469, -1.5417075157165527, -1.4599295854568481, -1.378151535987854, -1.2963736057281494, -1.2145955562591553, -1.1328175067901611, -1.0510395765304565, -0.9692615270614624, -0.887483537197113, -0.8057055473327637, -0.7239274978637695, -0.6421495079994202, -0.5603715181350708, -0.47859352827072144, -0.3968155086040497, -0.31503748893737793, -0.23325949907302856, -0.1514815092086792, -0.06970348954200745, 0.012074530124664307, 0.09385228157043457, 0.17563028633594513, 0.2574082911014557, 0.33918631076812744, 0.4209643006324768, 0.5027422904968262, 0.5845203399658203, 0.6662983298301697, 0.748076319694519, 0.8298543095588684, 0.9116322994232178, 0.9934103488922119, 1.075188398361206, 1.1569663286209106, 1.2387443780899048, 1.3205223083496094, 1.4023003578186035, 1.4840784072875977, 1.5658563375473022, 1.6476343870162964, 1.729412317276001, 1.8111903667449951, 1.8929684162139893, 1.9747464656829834, 2.0565242767333984, 2.1383023262023926, 2.2200803756713867, 2.3018581867218018, 2.383636236190796, 2.46541428565979, 2.547192335128784, 2.6289703845977783, 2.7107484340667725]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 5.0, 4.0, 9.0, 7.0, 6.0, 9.0, 13.0, 17.0, 18.0, 13.0, 24.0, 24.0, 30.0, 32.0, 46.0, 81.0, 286.0, 92.0, 41.0, 31.0, 37.0, 39.0, 23.0, 18.0, 16.0, 12.0, 10.0, 12.0, 8.0, 10.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.16825294494628906, -0.16353225708007812, -0.1588115692138672, -0.15409088134765625, -0.1493701934814453, -0.14464950561523438, -0.13992881774902344, -0.1352081298828125, -0.13048744201660156, -0.12576675415039062, -0.12104606628417969, -0.11632537841796875, -0.11160469055175781, -0.10688400268554688, -0.10216331481933594, -0.097442626953125, -0.09272193908691406, -0.08800125122070312, -0.08328056335449219, -0.07855987548828125, -0.07383918762207031, -0.06911849975585938, -0.06439781188964844, -0.0596771240234375, -0.05495643615722656, -0.050235748291015625, -0.04551506042480469, -0.04079437255859375, -0.03607368469238281, -0.031352996826171875, -0.026632308959960938, -0.02191162109375, -0.017190933227539062, -0.012470245361328125, -0.0077495574951171875, -0.00302886962890625, 0.0016918182373046875, 0.006412506103515625, 0.011133193969726562, 0.0158538818359375, 0.020574569702148438, 0.025295257568359375, 0.030015945434570312, 0.03473663330078125, 0.03945732116699219, 0.044178009033203125, 0.04889869689941406, 0.053619384765625, 0.05834007263183594, 0.06306076049804688, 0.06778144836425781, 0.07250213623046875, 0.07722282409667969, 0.08194351196289062, 0.08666419982910156, 0.0913848876953125, 0.09610557556152344, 0.10082626342773438, 0.10554695129394531, 0.11026763916015625, 0.11498832702636719, 0.11970901489257812, 0.12442970275878906, 0.129150390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 10.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 12.0, 25.0, 24.0, 45.0, 55.0, 137.0, 202.0, 571.0, 1897.0, 9789.0, 8342751.0, 28047.0, 3287.0, 903.0, 303.0, 152.0, 105.0, 57.0, 45.0, 22.0, 25.0, 27.0, 7.0, 2.0, 6.0, 5.0, 5.0, 10.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 4.0], "bins": [-1.769706130027771, -1.7171709537506104, -1.6646357774734497, -1.612100601196289, -1.5595654249191284, -1.5070302486419678, -1.4544950723648071, -1.4019598960876465, -1.3494247198104858, -1.2968895435333252, -1.2443543672561646, -1.191819190979004, -1.1392840147018433, -1.0867488384246826, -1.034213662147522, -0.9816784858703613, -0.9291433095932007, -0.87660813331604, -0.8240729570388794, -0.7715377807617188, -0.7190026044845581, -0.6664674282073975, -0.6139322519302368, -0.5613970756530762, -0.5088618993759155, -0.4563267230987549, -0.40379154682159424, -0.3512563705444336, -0.29872119426727295, -0.2461860179901123, -0.19365084171295166, -0.14111566543579102, -0.08858060836791992, -0.03604543209075928, 0.016489744186401367, 0.06902492046356201, 0.12156009674072266, 0.1740952730178833, 0.22663044929504395, 0.2791656255722046, 0.33170080184936523, 0.3842359781265259, 0.4367711544036865, 0.48930633068084717, 0.5418415069580078, 0.5943766832351685, 0.6469118595123291, 0.6994470357894897, 0.7519822120666504, 0.804517388343811, 0.8570525646209717, 0.9095877408981323, 0.962122917175293, 1.0146580934524536, 1.0671932697296143, 1.119728446006775, 1.1722636222839355, 1.2247987985610962, 1.2773339748382568, 1.3298691511154175, 1.3824043273925781, 1.4349395036697388, 1.4874746799468994, 1.54000985622406, 1.5925450325012207]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.4350876808166504, -2.3660364151000977, -2.296984910964966, -2.227933645248413, -2.1588821411132812, -2.0898308753967285, -2.020779609680176, -1.951728105545044, -1.8826768398284912, -1.813625454902649, -1.7445740699768066, -1.675522804260254, -1.6064714193344116, -1.5374200344085693, -1.468368649482727, -1.3993172645568848, -1.3302658796310425, -1.2612144947052002, -1.192163109779358, -1.1231117248535156, -1.054060459136963, -0.9850090742111206, -0.9159576892852783, -0.846906304359436, -0.7778549790382385, -0.7088035941123962, -0.6397522687911987, -0.5707008838653564, -0.5016494989395142, -0.43259817361831665, -0.36354678869247437, -0.29449543356895447, -0.22544395923614502, -0.15639260411262512, -0.08734123408794403, -0.01828986406326294, 0.05076149106025696, 0.11981284618377686, 0.18886423110961914, 0.25791558623313904, 0.32696694135665894, 0.39601829648017883, 0.46506965160369873, 0.534121036529541, 0.6031724214553833, 0.6722237467765808, 0.7412751317024231, 0.8103264570236206, 0.8793778419494629, 0.9484292268753052, 1.0174806118011475, 1.0865318775177002, 1.1555832624435425, 1.2246346473693848, 1.293686032295227, 1.3627374172210693, 1.431788682937622, 1.5008400678634644, 1.5698914527893066, 1.6389427185058594, 1.7079941034317017, 1.777045488357544, 1.8460968732833862, 1.9151482582092285, 1.9841996431350708]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 4.0, 5.0, 9.0, 15.0, 15.0, 21.0, 34.0, 56.0, 58.0, 129.0, 156.0, 260.0, 497.0, 913.0, 1885.0, 4152.0, 10590.0, 28391.0, 78920.0, 180458.0, 137280.0, 50266.0, 17775.0, 6661.0, 2760.0, 1308.0, 615.0, 340.0, 212.0, 137.0, 96.0, 73.0, 36.0, 30.0, 26.0, 20.0, 12.0, 6.0, 6.0, 7.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.1181640625, -1.086029052734375, -1.05389404296875, -1.021759033203125, -0.9896240234375, -0.957489013671875, -0.92535400390625, -0.893218994140625, -0.861083984375, -0.828948974609375, -0.79681396484375, -0.764678955078125, -0.7325439453125, -0.700408935546875, -0.66827392578125, -0.636138916015625, -0.60400390625, -0.571868896484375, -0.53973388671875, -0.507598876953125, -0.4754638671875, -0.443328857421875, -0.41119384765625, -0.379058837890625, -0.346923828125, -0.314788818359375, -0.28265380859375, -0.250518798828125, -0.2183837890625, -0.186248779296875, -0.15411376953125, -0.121978759765625, -0.08984375, -0.057708740234375, -0.02557373046875, 0.006561279296875, 0.0386962890625, 0.070831298828125, 0.10296630859375, 0.135101318359375, 0.167236328125, 0.199371337890625, 0.23150634765625, 0.263641357421875, 0.2957763671875, 0.327911376953125, 0.36004638671875, 0.392181396484375, 0.42431640625, 0.456451416015625, 0.48858642578125, 0.520721435546875, 0.5528564453125, 0.584991455078125, 0.61712646484375, 0.649261474609375, 0.681396484375, 0.713531494140625, 0.74566650390625, 0.777801513671875, 0.8099365234375, 0.842071533203125, 0.87420654296875, 0.906341552734375, 0.9384765625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 12.0, 10.0, 8.0, 15.0, 11.0, 20.0, 20.0, 21.0, 30.0, 40.0, 51.0, 66.0, 68.0, 83.0, 62.0, 74.0, 77.0, 58.0, 53.0, 37.0, 38.0, 23.0, 27.0, 16.0, 16.0, 8.0, 6.0, 9.0, 11.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.1948089599609375, -0.189056396484375, -0.1833038330078125, -0.17755126953125, -0.1717987060546875, -0.166046142578125, -0.1602935791015625, -0.154541015625, -0.1487884521484375, -0.143035888671875, -0.1372833251953125, -0.13153076171875, -0.1257781982421875, -0.120025634765625, -0.1142730712890625, -0.1085205078125, -0.1027679443359375, -0.097015380859375, -0.0912628173828125, -0.08551025390625, -0.0797576904296875, -0.074005126953125, -0.0682525634765625, -0.0625, -0.0567474365234375, -0.050994873046875, -0.0452423095703125, -0.03948974609375, -0.0337371826171875, -0.027984619140625, -0.0222320556640625, -0.0164794921875, -0.0107269287109375, -0.004974365234375, 0.0007781982421875, 0.00653076171875, 0.0122833251953125, 0.018035888671875, 0.0237884521484375, 0.029541015625, 0.0352935791015625, 0.041046142578125, 0.0467987060546875, 0.05255126953125, 0.0583038330078125, 0.064056396484375, 0.0698089599609375, 0.0755615234375, 0.0813140869140625, 0.087066650390625, 0.0928192138671875, 0.09857177734375, 0.1043243408203125, 0.110076904296875, 0.1158294677734375, 0.12158203125, 0.1273345947265625, 0.133087158203125, 0.1388397216796875, 0.14459228515625, 0.1503448486328125, 0.156097412109375, 0.1618499755859375, 0.1676025390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 11.0, 12.0, 11.0, 18.0, 30.0, 35.0, 63.0, 86.0, 76.0, 52.0, 34.0, 23.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2628158330917358, -1.2193162441253662, -1.1758167743682861, -1.132317304611206, -1.0888177156448364, -1.0453181266784668, -1.0018186569213867, -0.9583191275596619, -0.914819598197937, -0.8713200688362122, -0.8278205394744873, -0.7843210101127625, -0.7408214807510376, -0.6973219513893127, -0.6538224220275879, -0.610322892665863, -0.5668233633041382, -0.5233238339424133, -0.4798243045806885, -0.4363247752189636, -0.39282524585723877, -0.3493257164955139, -0.30582618713378906, -0.2623266577720642, -0.21882712841033936, -0.1753275990486145, -0.13182806968688965, -0.0883285403251648, -0.04482901096343994, -0.0013294816017150879, 0.042170047760009766, 0.08566957712173462, 0.12916898727416992, 0.17266851663589478, 0.21616804599761963, 0.2596675753593445, 0.30316710472106934, 0.3466666340827942, 0.39016616344451904, 0.4336656928062439, 0.47716522216796875, 0.5206647515296936, 0.5641642808914185, 0.6076638102531433, 0.6511633396148682, 0.694662868976593, 0.7381623983383179, 0.7816619277000427, 0.8251614570617676, 0.8686609864234924, 0.9121605157852173, 0.9556600451469421, 0.999159574508667, 1.042659044265747, 1.0861586332321167, 1.1296582221984863, 1.1731576919555664, 1.2166571617126465, 1.2601567506790161, 1.3036563396453857, 1.3471558094024658, 1.390655279159546, 1.4341548681259155, 1.4776544570922852, 1.5211539268493652]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 9.0, 10.0, 16.0, 28.0, 32.0, 49.0, 55.0, 66.0, 80.0, 46.0, 30.0, 9.0, 11.0, 2.0, 7.0, 7.0, 4.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2756131887435913, -1.2461988925933838, -1.2167847156524658, -1.1873704195022583, -1.1579561233520508, -1.1285419464111328, -1.0991276502609253, -1.0697133541107178, -1.0402991771697998, -1.0108848810195923, -0.9814706444740295, -0.9520564079284668, -0.922642171382904, -0.8932279348373413, -0.8638136386871338, -0.834399402141571, -0.8049851655960083, -0.7755709290504456, -0.746156632900238, -0.7167423963546753, -0.6873281598091125, -0.6579139232635498, -0.6284996271133423, -0.5990853905677795, -0.569671094417572, -0.5402568578720093, -0.5108425617218018, -0.481428325176239, -0.45201408863067627, -0.42259982228279114, -0.393185555934906, -0.36377131938934326, -0.3343570828437805, -0.3049428164958954, -0.27552857995033264, -0.2461143136024475, -0.21670007705688477, -0.18728581070899963, -0.1578715592622757, -0.12845730781555176, -0.09904305636882782, -0.06962880492210388, -0.040214549750089645, -0.010800294578075409, 0.01861395686864853, 0.048028215765953064, 0.077442467212677, 0.10685671865940094, 0.13627097010612488, 0.16568522155284882, 0.19509947299957275, 0.22451373934745789, 0.25392797589302063, 0.28334224224090576, 0.3127564787864685, 0.34217074513435364, 0.37158501148223877, 0.4009992778301239, 0.43041351437568665, 0.4598277807235718, 0.4892420172691345, 0.5186562538146973, 0.5480705499649048, 0.5774847865104675, 0.6068990230560303]}, "eval/loss": 1.7490322589874268, "eval/wer": 1.068405394684649, "eval/runtime": 1265.4167, "eval/samples_per_second": 2.088, "eval/steps_per_second": 0.262} \ No newline at end of file +{"train/loss": 0.0093, "train/learning_rate": 3.1745843230403805e-05, "train/epoch": 14.01, "train/global_step": 12500, "_runtime": 79331, "_timestamp": 1647177101, "_step": 12504, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 17.0, 19.0, 50.0, 172.0, 401.0, 191.0, 82.0, 31.0, 14.0, 11.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.92704772949219, -50.708030700683594, -49.489017486572266, -48.27000045776367, -47.050987243652344, -45.83197021484375, -44.61295700073242, -43.39393997192383, -42.1749267578125, -40.955909729003906, -39.73689651489258, -38.517879486083984, -37.298866271972656, -36.07984924316406, -34.860836029052734, -33.64181900024414, -32.42280578613281, -31.20379066467285, -29.98477554321289, -28.76576042175293, -27.54674530029297, -26.327730178833008, -25.108715057373047, -23.889698028564453, -22.67068099975586, -21.4516658782959, -20.232650756835938, -19.013635635375977, -17.794620513916016, -16.575605392456055, -15.356589317321777, -14.137574195861816, -12.918561935424805, -11.699546813964844, -10.480531692504883, -9.261516571044922, -8.042501449584961, -6.823485851287842, -5.604470252990723, -4.385455131530762, -3.166440010070801, -1.9474247694015503, -0.7284095287322998, 0.49060583114624023, 1.7096209526062012, 2.928636074066162, 4.147651672363281, 5.366666793823242, 6.585681915283203, 7.804697036743164, 9.023712158203125, 10.242727279663086, 11.461742401123047, 12.680757522583008, 13.899773597717285, 15.118788719177246, 16.33780288696289, 17.55681800842285, 18.775833129882812, 19.994848251342773, 21.213863372802734, 22.432878494262695, 23.651893615722656, 24.87091064453125, 26.08992576599121]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 7.0, 10.0, 8.0, 16.0, 16.0, 19.0, 19.0, 36.0, 35.0, 28.0, 40.0, 60.0, 49.0, 41.0, 45.0, 61.0, 47.0, 42.0, 54.0, 56.0, 51.0, 35.0, 32.0, 39.0, 28.0, 20.0, 22.0, 16.0, 11.0, 14.0, 6.0, 6.0, 4.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.404919624328613, -10.10635757446289, -9.807794570922852, -9.509231567382812, -9.21066951751709, -8.912107467651367, -8.613544464111328, -8.314981460571289, -8.016419410705566, -7.7178568840026855, -7.419294357299805, -7.120731830596924, -6.822169303894043, -6.523606777191162, -6.225044250488281, -5.9264817237854, -5.6279191970825195, -5.329356670379639, -5.030794143676758, -4.732231616973877, -4.433669090270996, -4.135106563568115, -3.8365440368652344, -3.5379815101623535, -3.2394189834594727, -2.940856456756592, -2.642293930053711, -2.34373140335083, -2.045168876647949, -1.7466063499450684, -1.4480438232421875, -1.1494812965393066, -0.8509178161621094, -0.5523552894592285, -0.25379276275634766, 0.0447697639465332, 0.34333229064941406, 0.6418948173522949, 0.9404573440551758, 1.2390198707580566, 1.5375823974609375, 1.8361449241638184, 2.134707450866699, 2.43326997756958, 2.731832504272461, 3.030395030975342, 3.3289575576782227, 3.6275200843811035, 3.9260826110839844, 4.224645137786865, 4.523207664489746, 4.821770191192627, 5.120332717895508, 5.418895244598389, 5.7174577713012695, 6.01602029800415, 6.314582824707031, 6.613145351409912, 6.911707878112793, 7.210270404815674, 7.508832931518555, 7.8073954582214355, 8.105957984924316, 8.404520034790039, 8.703083038330078]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 11.0, 5.0, 11.0, 13.0, 21.0, 21.0, 22.0, 26.0, 36.0, 36.0, 44.0, 59.0, 51.0, 41.0, 46.0, 46.0, 51.0, 44.0, 63.0, 43.0, 50.0, 47.0, 32.0, 39.0, 27.0, 22.0, 17.0, 13.0, 18.0, 7.0, 5.0, 10.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.03570556640625, -1.0010986328125, -0.96649169921875, -0.931884765625, -0.89727783203125, -0.8626708984375, -0.82806396484375, -0.79345703125, -0.75885009765625, -0.7242431640625, -0.68963623046875, -0.655029296875, -0.62042236328125, -0.5858154296875, -0.55120849609375, -0.5166015625, -0.48199462890625, -0.4473876953125, -0.41278076171875, -0.378173828125, -0.34356689453125, -0.3089599609375, -0.27435302734375, -0.23974609375, -0.20513916015625, -0.1705322265625, -0.13592529296875, -0.101318359375, -0.06671142578125, -0.0321044921875, 0.00250244140625, 0.037109375, 0.07171630859375, 0.1063232421875, 0.14093017578125, 0.175537109375, 0.21014404296875, 0.2447509765625, 0.27935791015625, 0.31396484375, 0.34857177734375, 0.3831787109375, 0.41778564453125, 0.452392578125, 0.48699951171875, 0.5216064453125, 0.55621337890625, 0.5908203125, 0.62542724609375, 0.6600341796875, 0.69464111328125, 0.729248046875, 0.76385498046875, 0.7984619140625, 0.83306884765625, 0.86767578125, 0.90228271484375, 0.9368896484375, 0.97149658203125, 1.006103515625, 1.04071044921875, 1.0753173828125, 1.10992431640625, 1.14453125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 4.0, 13.0, 5.0, 8.0, 23.0, 22.0, 20.0, 51.0, 54.0, 85.0, 121.0, 161.0, 241.0, 398.0, 664.0, 1291.0, 2692.0, 6707.0, 21943.0, 319144.0, 3792736.0, 31912.0, 8928.0, 3355.0, 1503.0, 796.0, 462.0, 292.0, 183.0, 124.0, 100.0, 52.0, 48.0, 43.0, 19.0, 17.0, 20.0, 15.0, 5.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.2742919921875, -10.900146484375, -10.5260009765625, -10.15185546875, -9.7777099609375, -9.403564453125, -9.0294189453125, -8.6552734375, -8.2811279296875, -7.906982421875, -7.5328369140625, -7.15869140625, -6.7845458984375, -6.410400390625, -6.0362548828125, -5.662109375, -5.2879638671875, -4.913818359375, -4.5396728515625, -4.16552734375, -3.7913818359375, -3.417236328125, -3.0430908203125, -2.6689453125, -2.2947998046875, -1.920654296875, -1.5465087890625, -1.17236328125, -0.7982177734375, -0.424072265625, -0.0499267578125, 0.32421875, 0.6983642578125, 1.072509765625, 1.4466552734375, 1.82080078125, 2.1949462890625, 2.569091796875, 2.9432373046875, 3.3173828125, 3.6915283203125, 4.065673828125, 4.4398193359375, 4.81396484375, 5.1881103515625, 5.562255859375, 5.9364013671875, 6.310546875, 6.6846923828125, 7.058837890625, 7.4329833984375, 7.80712890625, 8.1812744140625, 8.555419921875, 8.9295654296875, 9.3037109375, 9.6778564453125, 10.052001953125, 10.4261474609375, 10.80029296875, 11.1744384765625, 11.548583984375, 11.9227294921875, 12.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 10.0, 4.0, 10.0, 12.0, 14.0, 16.0, 24.0, 21.0, 29.0, 27.0, 26.0, 34.0, 62.0, 88.0, 211.0, 773.0, 1767.0, 490.0, 176.0, 72.0, 34.0, 36.0, 19.0, 18.0, 17.0, 11.0, 7.0, 9.0, 9.0, 8.0, 5.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.65625, -3.5355224609375, -3.414794921875, -3.2940673828125, -3.17333984375, -3.0526123046875, -2.931884765625, -2.8111572265625, -2.6904296875, -2.5697021484375, -2.448974609375, -2.3282470703125, -2.20751953125, -2.0867919921875, -1.966064453125, -1.8453369140625, -1.724609375, -1.6038818359375, -1.483154296875, -1.3624267578125, -1.24169921875, -1.1209716796875, -1.000244140625, -0.8795166015625, -0.7587890625, -0.6380615234375, -0.517333984375, -0.3966064453125, -0.27587890625, -0.1551513671875, -0.034423828125, 0.0863037109375, 0.20703125, 0.3277587890625, 0.448486328125, 0.5692138671875, 0.68994140625, 0.8106689453125, 0.931396484375, 1.0521240234375, 1.1728515625, 1.2935791015625, 1.414306640625, 1.5350341796875, 1.65576171875, 1.7764892578125, 1.897216796875, 2.0179443359375, 2.138671875, 2.2593994140625, 2.380126953125, 2.5008544921875, 2.62158203125, 2.7423095703125, 2.863037109375, 2.9837646484375, 3.1044921875, 3.2252197265625, 3.345947265625, 3.4666748046875, 3.58740234375, 3.7081298828125, 3.828857421875, 3.9495849609375, 4.0703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 9.0, 7.0, 11.0, 5.0, 9.0, 21.0, 18.0, 26.0, 44.0, 48.0, 90.0, 135.0, 174.0, 290.0, 579.0, 1109.0, 2408.0, 5714.0, 15519.0, 47552.0, 478206.0, 3532548.0, 73667.0, 22025.0, 7941.0, 3138.0, 1434.0, 681.0, 330.0, 176.0, 94.0, 75.0, 44.0, 42.0, 27.0, 21.0, 18.0, 10.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.25, -10.876953125, -10.50390625, -10.130859375, -9.7578125, -9.384765625, -9.01171875, -8.638671875, -8.265625, -7.892578125, -7.51953125, -7.146484375, -6.7734375, -6.400390625, -6.02734375, -5.654296875, -5.28125, -4.908203125, -4.53515625, -4.162109375, -3.7890625, -3.416015625, -3.04296875, -2.669921875, -2.296875, -1.923828125, -1.55078125, -1.177734375, -0.8046875, -0.431640625, -0.05859375, 0.314453125, 0.6875, 1.060546875, 1.43359375, 1.806640625, 2.1796875, 2.552734375, 2.92578125, 3.298828125, 3.671875, 4.044921875, 4.41796875, 4.791015625, 5.1640625, 5.537109375, 5.91015625, 6.283203125, 6.65625, 7.029296875, 7.40234375, 7.775390625, 8.1484375, 8.521484375, 8.89453125, 9.267578125, 9.640625, 10.013671875, 10.38671875, 10.759765625, 11.1328125, 11.505859375, 11.87890625, 12.251953125, 12.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 28.0, 62.0, 151.0, 446.0, 199.0, 68.0, 32.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.036022186279297, -15.688886642456055, -14.341751098632812, -12.994616508483887, -11.647480964660645, -10.300345420837402, -8.953210830688477, -7.606075286865234, -6.258939743041992, -4.91180419921875, -3.564669132232666, -2.217534065246582, -0.8703985214233398, 0.47673702239990234, 1.8238716125488281, 3.1710071563720703, 4.5181427001953125, 5.865278244018555, 7.212413311004639, 8.559548377990723, 9.906683921813965, 11.253819465637207, 12.600954055786133, 13.948089599609375, 15.295225143432617, 16.64236068725586, 17.9894962310791, 19.336631774902344, 20.683765411376953, 22.030902862548828, 23.378036499023438, 24.72517204284668, 26.072303771972656, 27.4194393157959, 28.76657485961914, 30.11370849609375, 31.460845947265625, 32.807979583740234, 34.155113220214844, 35.50225067138672, 36.849388122558594, 38.1965217590332, 39.54365921020508, 40.89079284667969, 42.23793029785156, 43.58506393432617, 44.93219757080078, 46.279335021972656, 47.626468658447266, 48.973602294921875, 50.32073974609375, 51.66787338256836, 53.015010833740234, 54.362144470214844, 55.70928192138672, 57.05641555786133, 58.40354919433594, 59.75068283081055, 61.09782028198242, 62.44495391845703, 63.792091369628906, 65.13922882080078, 66.48635864257812, 67.83349609375, 69.18063354492188]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 7.0, 9.0, 9.0, 7.0, 16.0, 20.0, 28.0, 20.0, 21.0, 39.0, 35.0, 30.0, 48.0, 38.0, 46.0, 36.0, 41.0, 35.0, 51.0, 44.0, 37.0, 48.0, 32.0, 39.0, 30.0, 33.0, 24.0, 30.0, 32.0, 22.0, 17.0, 9.0, 16.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.524043083190918, -11.145256996154785, -10.766470909118652, -10.38768482208252, -10.008898735046387, -9.630112648010254, -9.251326560974121, -8.872540473937988, -8.493754386901855, -8.114968299865723, -7.73618221282959, -7.357396125793457, -6.978610038757324, -6.599823951721191, -6.221037864685059, -5.842251777648926, -5.463465690612793, -5.08467960357666, -4.705893516540527, -4.3271074295043945, -3.9483213424682617, -3.569535255432129, -3.190749168395996, -2.8119630813598633, -2.4331769943237305, -2.0543909072875977, -1.6756048202514648, -1.296818733215332, -0.9180326461791992, -0.5392465591430664, -0.1604604721069336, 0.21832561492919922, 0.597111701965332, 0.9758977890014648, 1.3546838760375977, 1.7334699630737305, 2.1122560501098633, 2.491042137145996, 2.869828224182129, 3.2486143112182617, 3.6274003982543945, 4.006186485290527, 4.38497257232666, 4.763758659362793, 5.142544746398926, 5.521330833435059, 5.900116920471191, 6.278903007507324, 6.657689094543457, 7.03647518157959, 7.415261268615723, 7.7940473556518555, 8.172833442687988, 8.551619529724121, 8.930405616760254, 9.309191703796387, 9.68797779083252, 10.066763877868652, 10.445549964904785, 10.824336051940918, 11.20312213897705, 11.581908226013184, 11.960694313049316, 12.33948040008545, 12.718266487121582]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 4.0, 2.0, 4.0, 10.0, 6.0, 8.0, 9.0, 9.0, 12.0, 23.0, 24.0, 25.0, 31.0, 28.0, 29.0, 46.0, 45.0, 41.0, 30.0, 49.0, 49.0, 43.0, 42.0, 37.0, 44.0, 42.0, 43.0, 37.0, 26.0, 25.0, 18.0, 29.0, 23.0, 20.0, 16.0, 10.0, 15.0, 9.0, 10.0, 5.0, 9.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0223617553710938, -0.9910125732421875, -0.9596633911132812, -0.928314208984375, -0.8969650268554688, -0.8656158447265625, -0.8342666625976562, -0.80291748046875, -0.7715682983398438, -0.7402191162109375, -0.7088699340820312, -0.677520751953125, -0.6461715698242188, -0.6148223876953125, -0.5834732055664062, -0.5521240234375, -0.5207748413085938, -0.4894256591796875, -0.45807647705078125, -0.426727294921875, -0.39537811279296875, -0.3640289306640625, -0.33267974853515625, -0.30133056640625, -0.26998138427734375, -0.2386322021484375, -0.20728302001953125, -0.175933837890625, -0.14458465576171875, -0.1132354736328125, -0.08188629150390625, -0.050537109375, -0.01918792724609375, 0.0121612548828125, 0.04351043701171875, 0.074859619140625, 0.10620880126953125, 0.1375579833984375, 0.16890716552734375, 0.20025634765625, 0.23160552978515625, 0.2629547119140625, 0.29430389404296875, 0.325653076171875, 0.35700225830078125, 0.3883514404296875, 0.41970062255859375, 0.4510498046875, 0.48239898681640625, 0.5137481689453125, 0.5450973510742188, 0.576446533203125, 0.6077957153320312, 0.6391448974609375, 0.6704940795898438, 0.70184326171875, 0.7331924438476562, 0.7645416259765625, 0.7958908081054688, 0.827239990234375, 0.8585891723632812, 0.8899383544921875, 0.9212875366210938, 0.95263671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 5.0, 10.0, 19.0, 30.0, 39.0, 61.0, 88.0, 130.0, 197.0, 300.0, 475.0, 634.0, 1062.0, 1661.0, 2477.0, 3965.0, 6382.0, 10441.0, 18062.0, 33193.0, 66443.0, 163062.0, 415897.0, 173067.0, 69574.0, 33883.0, 18386.0, 10725.0, 6728.0, 4069.0, 2661.0, 1662.0, 1069.0, 690.0, 458.0, 322.0, 228.0, 133.0, 88.0, 58.0, 38.0, 23.0, 23.0, 12.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.568359375, -1.5201416015625, -1.471923828125, -1.4237060546875, -1.37548828125, -1.3272705078125, -1.279052734375, -1.2308349609375, -1.1826171875, -1.1343994140625, -1.086181640625, -1.0379638671875, -0.98974609375, -0.9415283203125, -0.893310546875, -0.8450927734375, -0.796875, -0.7486572265625, -0.700439453125, -0.6522216796875, -0.60400390625, -0.5557861328125, -0.507568359375, -0.4593505859375, -0.4111328125, -0.3629150390625, -0.314697265625, -0.2664794921875, -0.21826171875, -0.1700439453125, -0.121826171875, -0.0736083984375, -0.025390625, 0.0228271484375, 0.071044921875, 0.1192626953125, 0.16748046875, 0.2156982421875, 0.263916015625, 0.3121337890625, 0.3603515625, 0.4085693359375, 0.456787109375, 0.5050048828125, 0.55322265625, 0.6014404296875, 0.649658203125, 0.6978759765625, 0.74609375, 0.7943115234375, 0.842529296875, 0.8907470703125, 0.93896484375, 0.9871826171875, 1.035400390625, 1.0836181640625, 1.1318359375, 1.1800537109375, 1.228271484375, 1.2764892578125, 1.32470703125, 1.3729248046875, 1.421142578125, 1.4693603515625, 1.517578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 5.0, 7.0, 3.0, 7.0, 12.0, 14.0, 21.0, 15.0, 21.0, 26.0, 28.0, 34.0, 27.0, 36.0, 39.0, 48.0, 57.0, 58.0, 1072.0, 46.0, 50.0, 52.0, 63.0, 40.0, 44.0, 44.0, 25.0, 29.0, 23.0, 25.0, 8.0, 10.0, 6.0, 14.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.619140625, -1.5726470947265625, -1.526153564453125, -1.4796600341796875, -1.43316650390625, -1.3866729736328125, -1.340179443359375, -1.2936859130859375, -1.2471923828125, -1.2006988525390625, -1.154205322265625, -1.1077117919921875, -1.06121826171875, -1.0147247314453125, -0.968231201171875, -0.9217376708984375, -0.875244140625, -0.8287506103515625, -0.782257080078125, -0.7357635498046875, -0.68927001953125, -0.6427764892578125, -0.596282958984375, -0.5497894287109375, -0.5032958984375, -0.4568023681640625, -0.410308837890625, -0.3638153076171875, -0.31732177734375, -0.2708282470703125, -0.224334716796875, -0.1778411865234375, -0.13134765625, -0.0848541259765625, -0.038360595703125, 0.0081329345703125, 0.05462646484375, 0.1011199951171875, 0.147613525390625, 0.1941070556640625, 0.2406005859375, 0.2870941162109375, 0.333587646484375, 0.3800811767578125, 0.42657470703125, 0.4730682373046875, 0.519561767578125, 0.5660552978515625, 0.612548828125, 0.6590423583984375, 0.705535888671875, 0.7520294189453125, 0.79852294921875, 0.8450164794921875, 0.891510009765625, 0.9380035400390625, 0.9844970703125, 1.0309906005859375, 1.077484130859375, 1.1239776611328125, 1.17047119140625, 1.2169647216796875, 1.263458251953125, 1.3099517822265625, 1.3564453125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 8.0, 15.0, 20.0, 19.0, 25.0, 26.0, 37.0, 54.0, 92.0, 137.0, 176.0, 259.0, 364.0, 484.0, 799.0, 1170.0, 1917.0, 3115.0, 5293.0, 10020.0, 20872.0, 70478.0, 1788839.0, 137115.0, 27594.0, 12089.0, 6380.0, 3602.0, 2130.0, 1367.0, 866.0, 569.0, 363.0, 254.0, 163.0, 108.0, 80.0, 70.0, 51.0, 34.0, 25.0, 13.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0], "bins": [-2.78515625, -2.70477294921875, -2.6243896484375, -2.54400634765625, -2.463623046875, -2.38323974609375, -2.3028564453125, -2.22247314453125, -2.14208984375, -2.06170654296875, -1.9813232421875, -1.90093994140625, -1.820556640625, -1.74017333984375, -1.6597900390625, -1.57940673828125, -1.4990234375, -1.41864013671875, -1.3382568359375, -1.25787353515625, -1.177490234375, -1.09710693359375, -1.0167236328125, -0.93634033203125, -0.85595703125, -0.77557373046875, -0.6951904296875, -0.61480712890625, -0.534423828125, -0.45404052734375, -0.3736572265625, -0.29327392578125, -0.212890625, -0.13250732421875, -0.0521240234375, 0.02825927734375, 0.108642578125, 0.18902587890625, 0.2694091796875, 0.34979248046875, 0.43017578125, 0.51055908203125, 0.5909423828125, 0.67132568359375, 0.751708984375, 0.83209228515625, 0.9124755859375, 0.99285888671875, 1.0732421875, 1.15362548828125, 1.2340087890625, 1.31439208984375, 1.394775390625, 1.47515869140625, 1.5555419921875, 1.63592529296875, 1.71630859375, 1.79669189453125, 1.8770751953125, 1.95745849609375, 2.037841796875, 2.11822509765625, 2.1986083984375, 2.27899169921875, 2.359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 12.0, 12.0, 25.0, 26.0, 21.0, 32.0, 46.0, 76.0, 130.0, 158.0, 140.0, 80.0, 52.0, 50.0, 22.0, 22.0, 17.0, 12.0, 6.0, 10.0, 5.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.27312469482421875, -0.2649993896484375, -0.25687408447265625, -0.248748779296875, -0.24062347412109375, -0.2324981689453125, -0.22437286376953125, -0.21624755859375, -0.20812225341796875, -0.1999969482421875, -0.19187164306640625, -0.183746337890625, -0.17562103271484375, -0.1674957275390625, -0.15937042236328125, -0.1512451171875, -0.14311981201171875, -0.1349945068359375, -0.12686920166015625, -0.118743896484375, -0.11061859130859375, -0.1024932861328125, -0.09436798095703125, -0.08624267578125, -0.07811737060546875, -0.0699920654296875, -0.06186676025390625, -0.053741455078125, -0.04561614990234375, -0.0374908447265625, -0.02936553955078125, -0.021240234375, -0.01311492919921875, -0.0049896240234375, 0.00313568115234375, 0.011260986328125, 0.01938629150390625, 0.0275115966796875, 0.03563690185546875, 0.04376220703125, 0.05188751220703125, 0.0600128173828125, 0.06813812255859375, 0.076263427734375, 0.08438873291015625, 0.0925140380859375, 0.10063934326171875, 0.1087646484375, 0.11688995361328125, 0.1250152587890625, 0.13314056396484375, 0.141265869140625, 0.14939117431640625, 0.1575164794921875, 0.16564178466796875, 0.17376708984375, 0.18189239501953125, 0.1900177001953125, 0.19814300537109375, 0.206268310546875, 0.21439361572265625, 0.2225189208984375, 0.23064422607421875, 0.23876953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 2.0, 3.0, 9.0, 8.0, 20.0, 17.0, 31.0, 32.0, 65.0, 79.0, 80.0, 139.0, 286.0, 1067.0, 13147.0, 1005169.0, 25952.0, 1523.0, 336.0, 197.0, 97.0, 71.0, 54.0, 31.0, 24.0, 25.0, 9.0, 12.0, 16.0, 6.0, 5.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.52734375, -4.396453857421875, -4.26556396484375, -4.134674072265625, -4.0037841796875, -3.872894287109375, -3.74200439453125, -3.611114501953125, -3.480224609375, -3.349334716796875, -3.21844482421875, -3.087554931640625, -2.9566650390625, -2.825775146484375, -2.69488525390625, -2.563995361328125, -2.43310546875, -2.302215576171875, -2.17132568359375, -2.040435791015625, -1.9095458984375, -1.778656005859375, -1.64776611328125, -1.516876220703125, -1.385986328125, -1.255096435546875, -1.12420654296875, -0.993316650390625, -0.8624267578125, -0.731536865234375, -0.60064697265625, -0.469757080078125, -0.3388671875, -0.207977294921875, -0.07708740234375, 0.053802490234375, 0.1846923828125, 0.315582275390625, 0.44647216796875, 0.577362060546875, 0.708251953125, 0.839141845703125, 0.97003173828125, 1.100921630859375, 1.2318115234375, 1.362701416015625, 1.49359130859375, 1.624481201171875, 1.75537109375, 1.886260986328125, 2.01715087890625, 2.148040771484375, 2.2789306640625, 2.409820556640625, 2.54071044921875, 2.671600341796875, 2.802490234375, 2.933380126953125, 3.06427001953125, 3.195159912109375, 3.3260498046875, 3.456939697265625, 3.58782958984375, 3.718719482421875, 3.849609375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 11.0, 17.0, 30.0, 51.0, 126.0, 328.0, 245.0, 95.0, 52.0, 27.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.483856201171875, -1.4514906406402588, -1.4191251993179321, -1.386759638786316, -1.3543940782546997, -1.3220285177230835, -1.2896630764007568, -1.2572975158691406, -1.2249319553375244, -1.1925663948059082, -1.1602009534835815, -1.1278353929519653, -1.0954698324203491, -1.063104271888733, -1.0307388305664062, -0.99837327003479, -0.9660077691078186, -0.9336422681808472, -0.901276707649231, -0.8689112067222595, -0.8365456461906433, -0.8041801452636719, -0.7718145847320557, -0.7394490838050842, -0.7070835828781128, -0.6747180819511414, -0.6423525214195251, -0.6099870204925537, -0.5776214599609375, -0.5452559590339661, -0.5128904581069946, -0.4805248975753784, -0.4481593370437622, -0.4157938063144684, -0.38342827558517456, -0.3510627746582031, -0.3186972141265869, -0.2863317131996155, -0.25396618247032166, -0.22160065174102783, -0.189235121011734, -0.15686959028244019, -0.12450406700372696, -0.09213854372501373, -0.05977301299571991, -0.027407482266426086, 0.004958033561706543, 0.037323564291000366, 0.06968909502029419, 0.10205462574958801, 0.13442015647888184, 0.16678567230701447, 0.1991512030363083, 0.2315167337656021, 0.26388224959373474, 0.29624778032302856, 0.3286133110523224, 0.3609788417816162, 0.39334437251091003, 0.42570990324020386, 0.4580754041671753, 0.4904409646987915, 0.5228064656257629, 0.5551719665527344, 0.5875375270843506]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 8.0, 9.0, 6.0, 17.0, 8.0, 15.0, 17.0, 29.0, 14.0, 25.0, 32.0, 38.0, 40.0, 51.0, 48.0, 47.0, 46.0, 42.0, 47.0, 45.0, 47.0, 51.0, 53.0, 60.0, 44.0, 27.0, 26.0, 28.0, 17.0, 18.0, 8.0, 9.0, 10.0, 6.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37790876626968384, -0.3633962571620941, -0.3488837480545044, -0.3343712091445923, -0.31985870003700256, -0.30534619092941284, -0.2908336818218231, -0.2763211727142334, -0.2618086636066437, -0.24729615449905396, -0.23278363049030304, -0.21827112138271332, -0.2037586122751236, -0.18924608826637268, -0.17473357915878296, -0.16022107005119324, -0.14570854604244232, -0.1311960369348526, -0.11668352037668228, -0.10217100381851196, -0.08765849471092224, -0.07314597815275192, -0.058633461594581604, -0.04412095248699188, -0.029608435928821564, -0.015095922164618969, -0.0005834084004163742, 0.013929106295108795, 0.028441619127988815, 0.042954131960868835, 0.057466648519039154, 0.07197915762662888, 0.0864916741847992, 0.10100419074296951, 0.11551669985055923, 0.13002921640872955, 0.14454172551631927, 0.1590542495250702, 0.1735667586326599, 0.18807926774024963, 0.20259177684783936, 0.21710428595542908, 0.23161680996418, 0.24612931907176971, 0.26064184308052063, 0.27515435218811035, 0.2896668612957001, 0.3041793704032898, 0.3186919093132019, 0.3332044184207916, 0.34771692752838135, 0.36222946643829346, 0.3767419755458832, 0.3912544846534729, 0.4057669937610626, 0.42027950286865234, 0.43479201197624207, 0.4493045210838318, 0.4638170301914215, 0.47832953929901123, 0.49284207820892334, 0.5073545575141907, 0.5218670964241028, 0.5363795757293701, 0.5508921146392822]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 11.0, 6.0, 5.0, 10.0, 11.0, 17.0, 19.0, 23.0, 30.0, 27.0, 33.0, 31.0, 43.0, 49.0, 34.0, 40.0, 54.0, 36.0, 52.0, 35.0, 46.0, 38.0, 46.0, 39.0, 39.0, 21.0, 23.0, 28.0, 19.0, 23.0, 20.0, 13.0, 8.0, 13.0, 13.0, 7.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.01446533203125, -0.9830322265625, -0.95159912109375, -0.920166015625, -0.88873291015625, -0.8572998046875, -0.82586669921875, -0.79443359375, -0.76300048828125, -0.7315673828125, -0.70013427734375, -0.668701171875, -0.63726806640625, -0.6058349609375, -0.57440185546875, -0.54296875, -0.51153564453125, -0.4801025390625, -0.44866943359375, -0.417236328125, -0.38580322265625, -0.3543701171875, -0.32293701171875, -0.29150390625, -0.26007080078125, -0.2286376953125, -0.19720458984375, -0.165771484375, -0.13433837890625, -0.1029052734375, -0.07147216796875, -0.0400390625, -0.00860595703125, 0.0228271484375, 0.05426025390625, 0.085693359375, 0.11712646484375, 0.1485595703125, 0.17999267578125, 0.21142578125, 0.24285888671875, 0.2742919921875, 0.30572509765625, 0.337158203125, 0.36859130859375, 0.4000244140625, 0.43145751953125, 0.462890625, 0.49432373046875, 0.5257568359375, 0.55718994140625, 0.588623046875, 0.62005615234375, 0.6514892578125, 0.68292236328125, 0.71435546875, 0.74578857421875, 0.7772216796875, 0.80865478515625, 0.840087890625, 0.87152099609375, 0.9029541015625, 0.93438720703125, 0.9658203125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 16.0, 29.0, 37.0, 49.0, 71.0, 83.0, 158.0, 185.0, 246.0, 350.0, 473.0, 677.0, 876.0, 1261.0, 1765.0, 2581.0, 3789.0, 5742.0, 8634.0, 14317.0, 25033.0, 47590.0, 105385.0, 340597.0, 288233.0, 94695.0, 43172.0, 23353.0, 13442.0, 8229.0, 5316.0, 3552.0, 2542.0, 1691.0, 1196.0, 892.0, 616.0, 448.0, 313.0, 237.0, 201.0, 127.0, 96.0, 66.0, 54.0, 42.0, 27.0, 17.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0], "bins": [-2.162109375, -2.096466064453125, -2.03082275390625, -1.965179443359375, -1.8995361328125, -1.833892822265625, -1.76824951171875, -1.702606201171875, -1.636962890625, -1.571319580078125, -1.50567626953125, -1.440032958984375, -1.3743896484375, -1.308746337890625, -1.24310302734375, -1.177459716796875, -1.11181640625, -1.046173095703125, -0.98052978515625, -0.914886474609375, -0.8492431640625, -0.783599853515625, -0.71795654296875, -0.652313232421875, -0.586669921875, -0.521026611328125, -0.45538330078125, -0.389739990234375, -0.3240966796875, -0.258453369140625, -0.19281005859375, -0.127166748046875, -0.0615234375, 0.004119873046875, 0.06976318359375, 0.135406494140625, 0.2010498046875, 0.266693115234375, 0.33233642578125, 0.397979736328125, 0.463623046875, 0.529266357421875, 0.59490966796875, 0.660552978515625, 0.7261962890625, 0.791839599609375, 0.85748291015625, 0.923126220703125, 0.98876953125, 1.054412841796875, 1.12005615234375, 1.185699462890625, 1.2513427734375, 1.316986083984375, 1.38262939453125, 1.448272705078125, 1.513916015625, 1.579559326171875, 1.64520263671875, 1.710845947265625, 1.7764892578125, 1.842132568359375, 1.90777587890625, 1.973419189453125, 2.0390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 8.0, 8.0, 12.0, 15.0, 10.0, 20.0, 34.0, 28.0, 35.0, 33.0, 47.0, 46.0, 54.0, 72.0, 107.0, 179.0, 1426.0, 250.0, 142.0, 95.0, 87.0, 54.0, 49.0, 42.0, 32.0, 24.0, 26.0, 18.0, 15.0, 15.0, 8.0, 9.0, 16.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.650390625, -3.5386962890625, -3.427001953125, -3.3153076171875, -3.20361328125, -3.0919189453125, -2.980224609375, -2.8685302734375, -2.7568359375, -2.6451416015625, -2.533447265625, -2.4217529296875, -2.31005859375, -2.1983642578125, -2.086669921875, -1.9749755859375, -1.86328125, -1.7515869140625, -1.639892578125, -1.5281982421875, -1.41650390625, -1.3048095703125, -1.193115234375, -1.0814208984375, -0.9697265625, -0.8580322265625, -0.746337890625, -0.6346435546875, -0.52294921875, -0.4112548828125, -0.299560546875, -0.1878662109375, -0.076171875, 0.0355224609375, 0.147216796875, 0.2589111328125, 0.37060546875, 0.4822998046875, 0.593994140625, 0.7056884765625, 0.8173828125, 0.9290771484375, 1.040771484375, 1.1524658203125, 1.26416015625, 1.3758544921875, 1.487548828125, 1.5992431640625, 1.7109375, 1.8226318359375, 1.934326171875, 2.0460205078125, 2.15771484375, 2.2694091796875, 2.381103515625, 2.4927978515625, 2.6044921875, 2.7161865234375, 2.827880859375, 2.9395751953125, 3.05126953125, 3.1629638671875, 3.274658203125, 3.3863525390625, 3.498046875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 8.0, 15.0, 15.0, 11.0, 15.0, 27.0, 28.0, 27.0, 45.0, 53.0, 131.0, 206.0, 578.0, 2564.0, 29571.0, 2889770.0, 213169.0, 7631.0, 1041.0, 313.0, 129.0, 82.0, 60.0, 39.0, 25.0, 27.0, 27.0, 18.0, 12.0, 13.0, 7.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.7109375, -14.2994384765625, -13.887939453125, -13.4764404296875, -13.06494140625, -12.6534423828125, -12.241943359375, -11.8304443359375, -11.4189453125, -11.0074462890625, -10.595947265625, -10.1844482421875, -9.77294921875, -9.3614501953125, -8.949951171875, -8.5384521484375, -8.126953125, -7.7154541015625, -7.303955078125, -6.8924560546875, -6.48095703125, -6.0694580078125, -5.657958984375, -5.2464599609375, -4.8349609375, -4.4234619140625, -4.011962890625, -3.6004638671875, -3.18896484375, -2.7774658203125, -2.365966796875, -1.9544677734375, -1.54296875, -1.1314697265625, -0.719970703125, -0.3084716796875, 0.10302734375, 0.5145263671875, 0.926025390625, 1.3375244140625, 1.7490234375, 2.1605224609375, 2.572021484375, 2.9835205078125, 3.39501953125, 3.8065185546875, 4.218017578125, 4.6295166015625, 5.041015625, 5.4525146484375, 5.864013671875, 6.2755126953125, 6.68701171875, 7.0985107421875, 7.510009765625, 7.9215087890625, 8.3330078125, 8.7445068359375, 9.156005859375, 9.5675048828125, 9.97900390625, 10.3905029296875, 10.802001953125, 11.2135009765625, 11.625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 29.0, 148.0, 456.0, 300.0, 61.0, 15.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.035027980804443, -6.120114326477051, -5.2052001953125, -4.290286064147949, -3.3753724098205566, -2.460458278656006, -1.5455446243286133, -0.6306309700012207, 0.2842831611633301, 1.1991970539093018, 2.1141109466552734, 3.029024839401245, 3.943938732147217, 4.858852863311768, 5.77376651763916, 6.688680171966553, 7.6035943031311035, 8.518507957458496, 9.433422088623047, 10.348336219787598, 11.263250350952148, 12.178163528442383, 13.093077659606934, 14.007991790771484, 14.922904968261719, 15.83781909942627, 16.75273323059082, 17.667646408081055, 18.582561492919922, 19.497474670410156, 20.41238784790039, 21.327301025390625, 22.242218017578125, 23.15713119506836, 24.072046279907227, 24.98695945739746, 25.901874542236328, 26.816787719726562, 27.731700897216797, 28.64661407470703, 29.5615291595459, 30.476442337036133, 31.391357421875, 32.306270599365234, 33.22118377685547, 34.13610076904297, 35.0510139465332, 35.96592712402344, 36.88084030151367, 37.795753479003906, 38.71066665649414, 39.62558364868164, 40.540496826171875, 41.45541000366211, 42.370323181152344, 43.28523635864258, 44.20014953613281, 45.11506271362305, 46.02997589111328, 46.94489288330078, 47.859806060791016, 48.77471923828125, 49.689632415771484, 50.60454559326172, 51.51946258544922]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 2.0, 10.0, 9.0, 17.0, 18.0, 17.0, 14.0, 21.0, 23.0, 27.0, 23.0, 36.0, 58.0, 47.0, 41.0, 49.0, 51.0, 41.0, 41.0, 49.0, 57.0, 35.0, 32.0, 29.0, 42.0, 31.0, 34.0, 28.0, 24.0, 9.0, 18.0, 12.0, 13.0, 4.0, 6.0, 1.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.891485214233398, -14.473793029785156, -14.056100845336914, -13.638407707214355, -13.220715522766113, -12.803023338317871, -12.385330200195312, -11.96763801574707, -11.549945831298828, -11.132253646850586, -10.714561462402344, -10.296868324279785, -9.879176139831543, -9.4614839553833, -9.043790817260742, -8.6260986328125, -8.208406448364258, -7.790714263916016, -7.373021602630615, -6.955328941345215, -6.537636756896973, -6.1199445724487305, -5.70225191116333, -5.28455924987793, -4.8668670654296875, -4.449174880981445, -4.031482219696045, -3.6137897968292236, -3.1960973739624023, -2.778404951095581, -2.3607125282287598, -1.9430201053619385, -1.5253276824951172, -1.107635259628296, -0.6899428367614746, -0.2722504138946533, 0.14544200897216797, 0.5631344318389893, 0.9808268547058105, 1.3985192775726318, 1.8162117004394531, 2.2339041233062744, 2.6515965461730957, 3.069288969039917, 3.4869813919067383, 3.9046738147735596, 4.322366237640381, 4.740058898925781, 5.157751083374023, 5.575443267822266, 5.993135929107666, 6.410828590393066, 6.828520774841309, 7.246212959289551, 7.663905620574951, 8.081598281860352, 8.499290466308594, 8.916982650756836, 9.334674835205078, 9.752367973327637, 10.170060157775879, 10.587752342224121, 11.00544548034668, 11.423137664794922, 11.840829849243164]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 5.0, 10.0, 10.0, 12.0, 12.0, 18.0, 16.0, 20.0, 34.0, 31.0, 43.0, 43.0, 38.0, 53.0, 47.0, 57.0, 37.0, 39.0, 51.0, 50.0, 42.0, 43.0, 41.0, 38.0, 28.0, 34.0, 18.0, 18.0, 21.0, 13.0, 13.0, 13.0, 11.0, 7.0, 8.0, 4.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.328125, -1.2894134521484375, -1.250701904296875, -1.2119903564453125, -1.17327880859375, -1.1345672607421875, -1.095855712890625, -1.0571441650390625, -1.0184326171875, -0.9797210693359375, -0.941009521484375, -0.9022979736328125, -0.86358642578125, -0.8248748779296875, -0.786163330078125, -0.7474517822265625, -0.708740234375, -0.6700286865234375, -0.631317138671875, -0.5926055908203125, -0.55389404296875, -0.5151824951171875, -0.476470947265625, -0.4377593994140625, -0.3990478515625, -0.3603363037109375, -0.321624755859375, -0.2829132080078125, -0.24420166015625, -0.2054901123046875, -0.166778564453125, -0.1280670166015625, -0.08935546875, -0.0506439208984375, -0.011932373046875, 0.0267791748046875, 0.06549072265625, 0.1042022705078125, 0.142913818359375, 0.1816253662109375, 0.2203369140625, 0.2590484619140625, 0.297760009765625, 0.3364715576171875, 0.37518310546875, 0.4138946533203125, 0.452606201171875, 0.4913177490234375, 0.530029296875, 0.5687408447265625, 0.607452392578125, 0.6461639404296875, 0.68487548828125, 0.7235870361328125, 0.762298583984375, 0.8010101318359375, 0.8397216796875, 0.8784332275390625, 0.917144775390625, 0.9558563232421875, 0.99456787109375, 1.0332794189453125, 1.071990966796875, 1.1107025146484375, 1.1494140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 7.0, 18.0, 22.0, 26.0, 45.0, 51.0, 86.0, 116.0, 173.0, 250.0, 364.0, 538.0, 828.0, 1268.0, 1915.0, 3090.0, 4973.0, 8155.0, 13819.0, 25504.0, 78028.0, 2340319.0, 1595453.0, 61821.0, 22855.0, 12547.0, 7606.0, 4825.0, 3134.0, 2067.0, 1394.0, 981.0, 598.0, 466.0, 284.0, 221.0, 139.0, 80.0, 81.0, 38.0, 33.0, 19.0, 16.0, 12.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.033843994140625, -3.91143798828125, -3.789031982421875, -3.6666259765625, -3.544219970703125, -3.42181396484375, -3.299407958984375, -3.177001953125, -3.054595947265625, -2.93218994140625, -2.809783935546875, -2.6873779296875, -2.564971923828125, -2.44256591796875, -2.320159912109375, -2.19775390625, -2.075347900390625, -1.95294189453125, -1.830535888671875, -1.7081298828125, -1.585723876953125, -1.46331787109375, -1.340911865234375, -1.218505859375, -1.096099853515625, -0.97369384765625, -0.851287841796875, -0.7288818359375, -0.606475830078125, -0.48406982421875, -0.361663818359375, -0.2392578125, -0.116851806640625, 0.00555419921875, 0.127960205078125, 0.2503662109375, 0.372772216796875, 0.49517822265625, 0.617584228515625, 0.739990234375, 0.862396240234375, 0.98480224609375, 1.107208251953125, 1.2296142578125, 1.352020263671875, 1.47442626953125, 1.596832275390625, 1.71923828125, 1.841644287109375, 1.96405029296875, 2.086456298828125, 2.2088623046875, 2.331268310546875, 2.45367431640625, 2.576080322265625, 2.698486328125, 2.820892333984375, 2.94329833984375, 3.065704345703125, 3.1881103515625, 3.310516357421875, 3.43292236328125, 3.555328369140625, 3.677734375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 16.0, 9.0, 9.0, 22.0, 29.0, 32.0, 50.0, 83.0, 157.0, 616.0, 1989.0, 673.0, 156.0, 62.0, 43.0, 28.0, 34.0, 19.0, 15.0, 8.0, 9.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -8.007080078125, -7.78759765625, -7.568115234375, -7.3486328125, -7.129150390625, -6.90966796875, -6.690185546875, -6.470703125, -6.251220703125, -6.03173828125, -5.812255859375, -5.5927734375, -5.373291015625, -5.15380859375, -4.934326171875, -4.71484375, -4.495361328125, -4.27587890625, -4.056396484375, -3.8369140625, -3.617431640625, -3.39794921875, -3.178466796875, -2.958984375, -2.739501953125, -2.52001953125, -2.300537109375, -2.0810546875, -1.861572265625, -1.64208984375, -1.422607421875, -1.203125, -0.983642578125, -0.76416015625, -0.544677734375, -0.3251953125, -0.105712890625, 0.11376953125, 0.333251953125, 0.552734375, 0.772216796875, 0.99169921875, 1.211181640625, 1.4306640625, 1.650146484375, 1.86962890625, 2.089111328125, 2.30859375, 2.528076171875, 2.74755859375, 2.967041015625, 3.1865234375, 3.406005859375, 3.62548828125, 3.844970703125, 4.064453125, 4.283935546875, 4.50341796875, 4.722900390625, 4.9423828125, 5.161865234375, 5.38134765625, 5.600830078125, 5.8203125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 10.0, 26.0, 41.0, 67.0, 78.0, 156.0, 238.0, 550.0, 1527.0, 5319.0, 23380.0, 203170.0, 3870287.0, 71522.0, 12763.0, 3207.0, 1000.0, 416.0, 216.0, 103.0, 64.0, 43.0, 35.0, 20.0, 14.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -17.0765380859375, -16.606201171875, -16.1358642578125, -15.66552734375, -15.1951904296875, -14.724853515625, -14.2545166015625, -13.7841796875, -13.3138427734375, -12.843505859375, -12.3731689453125, -11.90283203125, -11.4324951171875, -10.962158203125, -10.4918212890625, -10.021484375, -9.5511474609375, -9.080810546875, -8.6104736328125, -8.14013671875, -7.6697998046875, -7.199462890625, -6.7291259765625, -6.2587890625, -5.7884521484375, -5.318115234375, -4.8477783203125, -4.37744140625, -3.9071044921875, -3.436767578125, -2.9664306640625, -2.49609375, -2.0257568359375, -1.555419921875, -1.0850830078125, -0.61474609375, -0.1444091796875, 0.325927734375, 0.7962646484375, 1.2666015625, 1.7369384765625, 2.207275390625, 2.6776123046875, 3.14794921875, 3.6182861328125, 4.088623046875, 4.5589599609375, 5.029296875, 5.4996337890625, 5.969970703125, 6.4403076171875, 6.91064453125, 7.3809814453125, 7.851318359375, 8.3216552734375, 8.7919921875, 9.2623291015625, 9.732666015625, 10.2030029296875, 10.67333984375, 11.1436767578125, 11.614013671875, 12.0843505859375, 12.5546875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [5.0, 5.0, 18.0, 30.0, 90.0, 507.0, 303.0, 43.0, 13.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.678433418273926, -9.671285629272461, -7.6641387939453125, -5.656991481781006, -3.649844169616699, -1.6426973342895508, 0.36445045471191406, 2.371598243713379, 4.378745079040527, 6.385892391204834, 8.39303970336914, 10.400186538696289, 12.407334327697754, 14.414481163024902, 16.421628952026367, 18.428775787353516, 20.435924530029297, 22.443071365356445, 24.450218200683594, 26.457366943359375, 28.464513778686523, 30.471660614013672, 32.47880935668945, 34.48595428466797, 36.49310302734375, 38.50025177001953, 40.50739669799805, 42.51454544067383, 44.521690368652344, 46.528839111328125, 48.535987854003906, 50.54313659667969, 52.55028533935547, 54.55743408203125, 56.564579010009766, 58.57172775268555, 60.57887268066406, 62.586021423339844, 64.59317016601562, 66.6003189086914, 68.60746765136719, 70.61461639404297, 72.62176513671875, 74.62890625, 76.63605499267578, 78.64320373535156, 80.65035247802734, 82.65750122070312, 84.66464233398438, 86.67179107666016, 88.67893981933594, 90.68608093261719, 92.69322967529297, 94.70037841796875, 96.70752716064453, 98.71467590332031, 100.72181701660156, 102.72896575927734, 104.73611450195312, 106.74325561523438, 108.75040435791016, 110.75755310058594, 112.76470184326172, 114.7718505859375, 116.77899932861328]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 11.0, 10.0, 10.0, 21.0, 24.0, 10.0, 29.0, 33.0, 25.0, 28.0, 30.0, 29.0, 41.0, 36.0, 43.0, 46.0, 36.0, 42.0, 45.0, 35.0, 40.0, 35.0, 42.0, 34.0, 33.0, 30.0, 27.0, 26.0, 8.0, 18.0, 14.0, 17.0, 9.0, 9.0, 14.0, 6.0, 6.0, 6.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.847256660461426, -11.48775577545166, -11.128253936767578, -10.768753051757812, -10.409252166748047, -10.049750328063965, -9.6902494430542, -9.330747604370117, -8.971246719360352, -8.611745834350586, -8.252243995666504, -7.892743110656738, -7.5332417488098145, -7.173740386962891, -6.814239501953125, -6.454738140106201, -6.095236778259277, -5.7357354164123535, -5.37623405456543, -5.016733169555664, -4.65723180770874, -4.297730445861816, -3.9382293224334717, -3.578728199005127, -3.219226837158203, -2.8597254753112793, -2.5002243518829346, -2.14072322845459, -1.781221866607666, -1.4217206239700317, -1.0622193813323975, -0.7027182579040527, -0.3432159423828125, 0.016285300254821777, 0.37578654289245605, 0.7352877855300903, 1.0947890281677246, 1.4542902708053589, 1.8137915134429932, 2.173292636871338, 2.5327939987182617, 2.8922953605651855, 3.2517964839935303, 3.611297607421875, 3.970798969268799, 4.330300331115723, 4.689801216125488, 5.049302577972412, 5.408803939819336, 5.76830530166626, 6.127806663513184, 6.487307548522949, 6.846808910369873, 7.206310272216797, 7.5658111572265625, 7.925312519073486, 8.28481388092041, 8.644314765930176, 9.003816604614258, 9.363317489624023, 9.722818374633789, 10.082320213317871, 10.441821098327637, 10.801322937011719, 11.160823822021484]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 6.0, 4.0, 18.0, 12.0, 13.0, 17.0, 31.0, 29.0, 37.0, 26.0, 31.0, 51.0, 40.0, 43.0, 49.0, 45.0, 41.0, 41.0, 49.0, 54.0, 40.0, 43.0, 37.0, 35.0, 32.0, 22.0, 19.0, 19.0, 21.0, 22.0, 16.0, 12.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.31640625, -1.2775726318359375, -1.238739013671875, -1.1999053955078125, -1.16107177734375, -1.1222381591796875, -1.083404541015625, -1.0445709228515625, -1.0057373046875, -0.9669036865234375, -0.928070068359375, -0.8892364501953125, -0.85040283203125, -0.8115692138671875, -0.772735595703125, -0.7339019775390625, -0.695068359375, -0.6562347412109375, -0.617401123046875, -0.5785675048828125, -0.53973388671875, -0.5009002685546875, -0.462066650390625, -0.4232330322265625, -0.3843994140625, -0.3455657958984375, -0.306732177734375, -0.2678985595703125, -0.22906494140625, -0.1902313232421875, -0.151397705078125, -0.1125640869140625, -0.07373046875, -0.0348968505859375, 0.003936767578125, 0.0427703857421875, 0.08160400390625, 0.1204376220703125, 0.159271240234375, 0.1981048583984375, 0.2369384765625, 0.2757720947265625, 0.314605712890625, 0.3534393310546875, 0.39227294921875, 0.4311065673828125, 0.469940185546875, 0.5087738037109375, 0.547607421875, 0.5864410400390625, 0.625274658203125, 0.6641082763671875, 0.70294189453125, 0.7417755126953125, 0.780609130859375, 0.8194427490234375, 0.8582763671875, 0.8971099853515625, 0.935943603515625, 0.9747772216796875, 1.01361083984375, 1.0524444580078125, 1.091278076171875, 1.1301116943359375, 1.1689453125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 11.0, 28.0, 28.0, 37.0, 45.0, 73.0, 94.0, 162.0, 196.0, 291.0, 455.0, 615.0, 863.0, 1337.0, 1960.0, 2934.0, 4411.0, 6923.0, 10870.0, 17614.0, 28817.0, 49517.0, 90076.0, 192284.0, 300544.0, 152579.0, 75336.0, 42233.0, 25039.0, 15373.0, 9535.0, 6046.0, 4038.0, 2666.0, 1741.0, 1144.0, 783.0, 557.0, 356.0, 287.0, 179.0, 135.0, 97.0, 63.0, 43.0, 49.0, 28.0, 16.0, 10.0, 8.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0], "bins": [-1.408203125, -1.36468505859375, -1.3211669921875, -1.27764892578125, -1.234130859375, -1.19061279296875, -1.1470947265625, -1.10357666015625, -1.06005859375, -1.01654052734375, -0.9730224609375, -0.92950439453125, -0.885986328125, -0.84246826171875, -0.7989501953125, -0.75543212890625, -0.7119140625, -0.66839599609375, -0.6248779296875, -0.58135986328125, -0.537841796875, -0.49432373046875, -0.4508056640625, -0.40728759765625, -0.36376953125, -0.32025146484375, -0.2767333984375, -0.23321533203125, -0.189697265625, -0.14617919921875, -0.1026611328125, -0.05914306640625, -0.015625, 0.02789306640625, 0.0714111328125, 0.11492919921875, 0.158447265625, 0.20196533203125, 0.2454833984375, 0.28900146484375, 0.33251953125, 0.37603759765625, 0.4195556640625, 0.46307373046875, 0.506591796875, 0.55010986328125, 0.5936279296875, 0.63714599609375, 0.6806640625, 0.72418212890625, 0.7677001953125, 0.81121826171875, 0.854736328125, 0.89825439453125, 0.9417724609375, 0.98529052734375, 1.02880859375, 1.07232666015625, 1.1158447265625, 1.15936279296875, 1.202880859375, 1.24639892578125, 1.2899169921875, 1.33343505859375, 1.376953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 10.0, 6.0, 8.0, 13.0, 14.0, 13.0, 24.0, 19.0, 28.0, 21.0, 28.0, 39.0, 38.0, 39.0, 53.0, 57.0, 31.0, 48.0, 1092.0, 42.0, 52.0, 41.0, 32.0, 40.0, 33.0, 32.0, 15.0, 27.0, 29.0, 16.0, 13.0, 13.0, 8.0, 6.0, 4.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.5107421875, -1.4620208740234375, -1.413299560546875, -1.3645782470703125, -1.31585693359375, -1.2671356201171875, -1.218414306640625, -1.1696929931640625, -1.1209716796875, -1.0722503662109375, -1.023529052734375, -0.9748077392578125, -0.92608642578125, -0.8773651123046875, -0.828643798828125, -0.7799224853515625, -0.731201171875, -0.6824798583984375, -0.633758544921875, -0.5850372314453125, -0.53631591796875, -0.4875946044921875, -0.438873291015625, -0.3901519775390625, -0.3414306640625, -0.2927093505859375, -0.243988037109375, -0.1952667236328125, -0.14654541015625, -0.0978240966796875, -0.049102783203125, -0.0003814697265625, 0.04833984375, 0.0970611572265625, 0.145782470703125, 0.1945037841796875, 0.24322509765625, 0.2919464111328125, 0.340667724609375, 0.3893890380859375, 0.4381103515625, 0.4868316650390625, 0.535552978515625, 0.5842742919921875, 0.63299560546875, 0.6817169189453125, 0.730438232421875, 0.7791595458984375, 0.827880859375, 0.8766021728515625, 0.925323486328125, 0.9740447998046875, 1.02276611328125, 1.0714874267578125, 1.120208740234375, 1.1689300537109375, 1.2176513671875, 1.2663726806640625, 1.315093994140625, 1.3638153076171875, 1.41253662109375, 1.4612579345703125, 1.509979248046875, 1.5587005615234375, 1.607421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 12.0, 16.0, 18.0, 31.0, 37.0, 68.0, 88.0, 122.0, 158.0, 233.0, 335.0, 474.0, 683.0, 1045.0, 1655.0, 2539.0, 3944.0, 6546.0, 11775.0, 24556.0, 91897.0, 1782973.0, 110379.0, 26473.0, 12370.0, 6973.0, 4044.0, 2611.0, 1638.0, 1080.0, 723.0, 482.0, 326.0, 226.0, 149.0, 128.0, 99.0, 58.0, 44.0, 41.0, 21.0, 15.0, 12.0, 7.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.94921875, -2.861297607421875, -2.77337646484375, -2.685455322265625, -2.5975341796875, -2.509613037109375, -2.42169189453125, -2.333770751953125, -2.245849609375, -2.157928466796875, -2.07000732421875, -1.982086181640625, -1.8941650390625, -1.806243896484375, -1.71832275390625, -1.630401611328125, -1.54248046875, -1.454559326171875, -1.36663818359375, -1.278717041015625, -1.1907958984375, -1.102874755859375, -1.01495361328125, -0.927032470703125, -0.839111328125, -0.751190185546875, -0.66326904296875, -0.575347900390625, -0.4874267578125, -0.399505615234375, -0.31158447265625, -0.223663330078125, -0.1357421875, -0.047821044921875, 0.04010009765625, 0.128021240234375, 0.2159423828125, 0.303863525390625, 0.39178466796875, 0.479705810546875, 0.567626953125, 0.655548095703125, 0.74346923828125, 0.831390380859375, 0.9193115234375, 1.007232666015625, 1.09515380859375, 1.183074951171875, 1.27099609375, 1.358917236328125, 1.44683837890625, 1.534759521484375, 1.6226806640625, 1.710601806640625, 1.79852294921875, 1.886444091796875, 1.974365234375, 2.062286376953125, 2.15020751953125, 2.238128662109375, 2.3260498046875, 2.413970947265625, 2.50189208984375, 2.589813232421875, 2.677734375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 6.0, 8.0, 7.0, 13.0, 11.0, 17.0, 16.0, 19.0, 25.0, 45.0, 60.0, 101.0, 183.0, 146.0, 107.0, 76.0, 38.0, 25.0, 18.0, 20.0, 7.0, 5.0, 11.0, 13.0, 9.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.31659698486328125, -0.3048248291015625, -0.29305267333984375, -0.281280517578125, -0.26950836181640625, -0.2577362060546875, -0.24596405029296875, -0.23419189453125, -0.22241973876953125, -0.2106475830078125, -0.19887542724609375, -0.187103271484375, -0.17533111572265625, -0.1635589599609375, -0.15178680419921875, -0.1400146484375, -0.12824249267578125, -0.1164703369140625, -0.10469818115234375, -0.092926025390625, -0.08115386962890625, -0.0693817138671875, -0.05760955810546875, -0.04583740234375, -0.03406524658203125, -0.0222930908203125, -0.01052093505859375, 0.001251220703125, 0.01302337646484375, 0.0247955322265625, 0.03656768798828125, 0.04833984375, 0.06011199951171875, 0.0718841552734375, 0.08365631103515625, 0.095428466796875, 0.10720062255859375, 0.1189727783203125, 0.13074493408203125, 0.14251708984375, 0.15428924560546875, 0.1660614013671875, 0.17783355712890625, 0.189605712890625, 0.20137786865234375, 0.2131500244140625, 0.22492218017578125, 0.2366943359375, 0.24846649169921875, 0.2602386474609375, 0.27201080322265625, 0.283782958984375, 0.29555511474609375, 0.3073272705078125, 0.31909942626953125, 0.33087158203125, 0.34264373779296875, 0.3544158935546875, 0.36618804931640625, 0.377960205078125, 0.38973236083984375, 0.4015045166015625, 0.41327667236328125, 0.425048828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 10.0, 13.0, 18.0, 19.0, 16.0, 32.0, 44.0, 45.0, 63.0, 87.0, 126.0, 227.0, 513.0, 4363.0, 944302.0, 95913.0, 1768.0, 390.0, 170.0, 115.0, 90.0, 42.0, 35.0, 31.0, 41.0, 27.0, 14.0, 5.0, 7.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4921875, -5.30181884765625, -5.1114501953125, -4.92108154296875, -4.730712890625, -4.54034423828125, -4.3499755859375, -4.15960693359375, -3.96923828125, -3.77886962890625, -3.5885009765625, -3.39813232421875, -3.207763671875, -3.01739501953125, -2.8270263671875, -2.63665771484375, -2.4462890625, -2.25592041015625, -2.0655517578125, -1.87518310546875, -1.684814453125, -1.49444580078125, -1.3040771484375, -1.11370849609375, -0.92333984375, -0.73297119140625, -0.5426025390625, -0.35223388671875, -0.161865234375, 0.02850341796875, 0.2188720703125, 0.40924072265625, 0.599609375, 0.78997802734375, 0.9803466796875, 1.17071533203125, 1.361083984375, 1.55145263671875, 1.7418212890625, 1.93218994140625, 2.12255859375, 2.31292724609375, 2.5032958984375, 2.69366455078125, 2.884033203125, 3.07440185546875, 3.2647705078125, 3.45513916015625, 3.6455078125, 3.83587646484375, 4.0262451171875, 4.21661376953125, 4.406982421875, 4.59735107421875, 4.7877197265625, 4.97808837890625, 5.16845703125, 5.35882568359375, 5.5491943359375, 5.73956298828125, 5.929931640625, 6.12030029296875, 6.3106689453125, 6.50103759765625, 6.69140625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 21.0, 68.0, 112.0, 287.0, 283.0, 122.0, 60.0, 22.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.390726327896118, -2.344717502593994, -2.29870867729187, -2.252699851989746, -2.206691026687622, -2.160681962966919, -2.114673137664795, -2.068664312362671, -2.022655487060547, -1.9766466617584229, -1.9306378364562988, -1.8846288919448853, -1.8386200666427612, -1.7926112413406372, -1.7466024160385132, -1.7005934715270996, -1.6545846462249756, -1.6085758209228516, -1.5625669956207275, -1.516558051109314, -1.47054922580719, -1.424540400505066, -1.378531575202942, -1.3325226306915283, -1.2865139245986938, -1.2405050992965698, -1.1944962739944458, -1.1484873294830322, -1.1024785041809082, -1.0564696788787842, -1.0104608535766602, -0.9644519686698914, -0.9184430837631226, -0.8724342584609985, -0.8264253735542297, -0.7804165482521057, -0.7344076633453369, -0.6883988380432129, -0.6423900127410889, -0.5963811278343201, -0.5503722429275513, -0.5043634176254272, -0.45835453271865845, -0.4123457074165344, -0.3663368225097656, -0.3203279972076416, -0.2743191421031952, -0.22831028699874878, -0.18230146169662476, -0.13629260659217834, -0.09028375893831253, -0.044274911284446716, 0.0017339438199996948, 0.047742798924446106, 0.09375163912773132, 0.13976049423217773, 0.18576934933662415, 0.23177820444107056, 0.27778705954551697, 0.3237959146499634, 0.3698047399520874, 0.4158136248588562, 0.4618224501609802, 0.507831335067749, 0.553840160369873]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 11.0, 13.0, 13.0, 10.0, 20.0, 16.0, 31.0, 27.0, 38.0, 44.0, 55.0, 41.0, 53.0, 54.0, 47.0, 37.0, 35.0, 44.0, 51.0, 27.0, 46.0, 33.0, 40.0, 29.0, 31.0, 23.0, 20.0, 17.0, 14.0, 14.0, 16.0, 8.0, 7.0, 7.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5569312572479248, -0.5381261110305786, -0.5193209648132324, -0.5005158185958862, -0.48171064257621765, -0.46290549635887146, -0.4441003203392029, -0.4252951741218567, -0.4064900279045105, -0.3876848816871643, -0.3688797354698181, -0.35007455945014954, -0.33126941323280334, -0.31246426701545715, -0.2936590909957886, -0.2748539447784424, -0.2560487985610962, -0.23724365234375, -0.21843849122524261, -0.19963333010673523, -0.18082818388938904, -0.16202303767204285, -0.14321787655353546, -0.12441271543502808, -0.10560756921768188, -0.0868024155497551, -0.06799726188182831, -0.04919210821390152, -0.03038695454597473, -0.011581800878047943, 0.007223352789878845, 0.02602851390838623, 0.044833600521087646, 0.06363875418901443, 0.08244390785694122, 0.10124906152486801, 0.1200542151927948, 0.138859361410141, 0.15766452252864838, 0.17646968364715576, 0.19527482986450195, 0.21407997608184814, 0.23288513720035553, 0.2516902983188629, 0.2704954445362091, 0.2893005907535553, 0.3081057667732239, 0.32691091299057007, 0.34571605920791626, 0.36452120542526245, 0.38332635164260864, 0.4021315276622772, 0.4209366738796234, 0.4397418200969696, 0.4585469961166382, 0.4773521423339844, 0.49615728855133057, 0.5149624347686768, 0.533767580986023, 0.5525727272033691, 0.5713778734207153, 0.5901830792427063, 0.6089882254600525, 0.6277933716773987, 0.6465985178947449]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 6.0, 6.0, 2.0, 10.0, 14.0, 13.0, 16.0, 16.0, 33.0, 28.0, 34.0, 29.0, 41.0, 47.0, 40.0, 39.0, 48.0, 50.0, 37.0, 40.0, 50.0, 50.0, 50.0, 43.0, 28.0, 42.0, 24.0, 24.0, 18.0, 20.0, 21.0, 19.0, 16.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.2744903564453125, -1.235504150390625, -1.1965179443359375, -1.15753173828125, -1.1185455322265625, -1.079559326171875, -1.0405731201171875, -1.0015869140625, -0.9626007080078125, -0.923614501953125, -0.8846282958984375, -0.84564208984375, -0.8066558837890625, -0.767669677734375, -0.7286834716796875, -0.689697265625, -0.6507110595703125, -0.611724853515625, -0.5727386474609375, -0.53375244140625, -0.4947662353515625, -0.455780029296875, -0.4167938232421875, -0.3778076171875, -0.3388214111328125, -0.299835205078125, -0.2608489990234375, -0.22186279296875, -0.1828765869140625, -0.143890380859375, -0.1049041748046875, -0.06591796875, -0.0269317626953125, 0.012054443359375, 0.0510406494140625, 0.09002685546875, 0.1290130615234375, 0.167999267578125, 0.2069854736328125, 0.2459716796875, 0.2849578857421875, 0.323944091796875, 0.3629302978515625, 0.40191650390625, 0.4409027099609375, 0.479888916015625, 0.5188751220703125, 0.557861328125, 0.5968475341796875, 0.635833740234375, 0.6748199462890625, 0.71380615234375, 0.7527923583984375, 0.791778564453125, 0.8307647705078125, 0.8697509765625, 0.9087371826171875, 0.947723388671875, 0.9867095947265625, 1.02569580078125, 1.0646820068359375, 1.103668212890625, 1.1426544189453125, 1.181640625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 7.0, 16.0, 16.0, 14.0, 26.0, 48.0, 57.0, 63.0, 110.0, 162.0, 204.0, 308.0, 427.0, 638.0, 902.0, 1464.0, 2305.0, 3778.0, 6892.0, 13628.0, 35883.0, 205258.0, 646598.0, 83491.0, 22410.0, 9896.0, 5233.0, 3026.0, 1952.0, 1198.0, 755.0, 528.0, 359.0, 253.0, 169.0, 117.0, 101.0, 67.0, 54.0, 34.0, 26.0, 17.0, 16.0, 15.0, 11.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.685546875, -2.6048583984375, -2.524169921875, -2.4434814453125, -2.36279296875, -2.2821044921875, -2.201416015625, -2.1207275390625, -2.0400390625, -1.9593505859375, -1.878662109375, -1.7979736328125, -1.71728515625, -1.6365966796875, -1.555908203125, -1.4752197265625, -1.39453125, -1.3138427734375, -1.233154296875, -1.1524658203125, -1.07177734375, -0.9910888671875, -0.910400390625, -0.8297119140625, -0.7490234375, -0.6683349609375, -0.587646484375, -0.5069580078125, -0.42626953125, -0.3455810546875, -0.264892578125, -0.1842041015625, -0.103515625, -0.0228271484375, 0.057861328125, 0.1385498046875, 0.21923828125, 0.2999267578125, 0.380615234375, 0.4613037109375, 0.5419921875, 0.6226806640625, 0.703369140625, 0.7840576171875, 0.86474609375, 0.9454345703125, 1.026123046875, 1.1068115234375, 1.1875, 1.2681884765625, 1.348876953125, 1.4295654296875, 1.51025390625, 1.5909423828125, 1.671630859375, 1.7523193359375, 1.8330078125, 1.9136962890625, 1.994384765625, 2.0750732421875, 2.15576171875, 2.2364501953125, 2.317138671875, 2.3978271484375, 2.478515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 8.0, 7.0, 17.0, 21.0, 18.0, 22.0, 22.0, 56.0, 30.0, 50.0, 52.0, 74.0, 86.0, 258.0, 1525.0, 265.0, 99.0, 74.0, 63.0, 56.0, 38.0, 24.0, 28.0, 31.0, 32.0, 14.0, 16.0, 12.0, 10.0, 12.0, 1.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.95465087890625, -4.7921142578125, -4.62957763671875, -4.467041015625, -4.30450439453125, -4.1419677734375, -3.97943115234375, -3.81689453125, -3.65435791015625, -3.4918212890625, -3.32928466796875, -3.166748046875, -3.00421142578125, -2.8416748046875, -2.67913818359375, -2.5166015625, -2.35406494140625, -2.1915283203125, -2.02899169921875, -1.866455078125, -1.70391845703125, -1.5413818359375, -1.37884521484375, -1.21630859375, -1.05377197265625, -0.8912353515625, -0.72869873046875, -0.566162109375, -0.40362548828125, -0.2410888671875, -0.07855224609375, 0.083984375, 0.24652099609375, 0.4090576171875, 0.57159423828125, 0.734130859375, 0.89666748046875, 1.0592041015625, 1.22174072265625, 1.38427734375, 1.54681396484375, 1.7093505859375, 1.87188720703125, 2.034423828125, 2.19696044921875, 2.3594970703125, 2.52203369140625, 2.6845703125, 2.84710693359375, 3.0096435546875, 3.17218017578125, 3.334716796875, 3.49725341796875, 3.6597900390625, 3.82232666015625, 3.98486328125, 4.14739990234375, 4.3099365234375, 4.47247314453125, 4.635009765625, 4.79754638671875, 4.9600830078125, 5.12261962890625, 5.28515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 17.0, 20.0, 24.0, 36.0, 47.0, 77.0, 138.0, 251.0, 464.0, 1082.0, 2838.0, 10610.0, 74698.0, 2871802.0, 161874.0, 15447.0, 3701.0, 1273.0, 590.0, 276.0, 149.0, 86.0, 65.0, 20.0, 30.0, 23.0, 13.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6484375, -8.38330078125, -8.1181640625, -7.85302734375, -7.587890625, -7.32275390625, -7.0576171875, -6.79248046875, -6.52734375, -6.26220703125, -5.9970703125, -5.73193359375, -5.466796875, -5.20166015625, -4.9365234375, -4.67138671875, -4.40625, -4.14111328125, -3.8759765625, -3.61083984375, -3.345703125, -3.08056640625, -2.8154296875, -2.55029296875, -2.28515625, -2.02001953125, -1.7548828125, -1.48974609375, -1.224609375, -0.95947265625, -0.6943359375, -0.42919921875, -0.1640625, 0.10107421875, 0.3662109375, 0.63134765625, 0.896484375, 1.16162109375, 1.4267578125, 1.69189453125, 1.95703125, 2.22216796875, 2.4873046875, 2.75244140625, 3.017578125, 3.28271484375, 3.5478515625, 3.81298828125, 4.078125, 4.34326171875, 4.6083984375, 4.87353515625, 5.138671875, 5.40380859375, 5.6689453125, 5.93408203125, 6.19921875, 6.46435546875, 6.7294921875, 6.99462890625, 7.259765625, 7.52490234375, 7.7900390625, 8.05517578125, 8.3203125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 24.0, 51.0, 174.0, 342.0, 262.0, 89.0, 45.0, 13.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.9703369140625, -17.29708480834961, -16.62383460998535, -15.950582504272461, -15.27733039855957, -14.604079246520996, -13.930828094482422, -13.257575988769531, -12.584324836730957, -11.911073684692383, -11.237821578979492, -10.564570426940918, -9.891319274902344, -9.218067169189453, -8.544816017150879, -7.8715643882751465, -7.198312759399414, -6.525061130523682, -5.851809501647949, -5.178558349609375, -4.505306720733643, -3.83205509185791, -3.158803939819336, -2.4855523109436035, -1.812300682067871, -1.1390491724014282, -0.46579766273498535, 0.20745372772216797, 0.8807053565979004, 1.5539569854736328, 2.227208137512207, 2.9004597663879395, 3.573711395263672, 4.246963024139404, 4.920214653015137, 5.593465805053711, 6.266717433929443, 6.939969062805176, 7.61322021484375, 8.28647232055664, 8.959723472595215, 9.632974624633789, 10.30622673034668, 10.979477882385254, 11.652729034423828, 12.325981140136719, 12.999232292175293, 13.672483444213867, 14.345735549926758, 15.018986701965332, 15.692238807678223, 16.365489959716797, 17.038742065429688, 17.711994171142578, 18.385244369506836, 19.058496475219727, 19.731746673583984, 20.404998779296875, 21.078248977661133, 21.751501083374023, 22.424753189086914, 23.098003387451172, 23.771255493164062, 24.444507598876953, 25.117759704589844]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 18.0, 13.0, 17.0, 17.0, 20.0, 23.0, 26.0, 25.0, 28.0, 40.0, 31.0, 38.0, 39.0, 44.0, 52.0, 34.0, 32.0, 48.0, 29.0, 36.0, 40.0, 45.0, 33.0, 29.0, 27.0, 28.0, 21.0, 25.0, 13.0, 22.0, 17.0, 11.0, 14.0, 9.0, 4.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.096919059753418, -11.711995124816895, -11.327071189880371, -10.942146301269531, -10.557222366333008, -10.172298431396484, -9.787374496459961, -9.402450561523438, -9.017526626586914, -8.63260269165039, -8.247678756713867, -7.8627543449401855, -7.477829933166504, -7.0929059982299805, -6.707982063293457, -6.323058128356934, -5.938133239746094, -5.55320930480957, -5.168284893035889, -4.783360958099365, -4.398436546325684, -4.01351261138916, -3.6285886764526367, -3.243664503097534, -2.8587403297424316, -2.473816156387329, -2.0888919830322266, -1.7039680480957031, -1.3190438747406006, -0.934119701385498, -0.5491957664489746, -0.16427159309387207, 0.22065353393554688, 0.6055776476860046, 0.9905017614364624, 1.3754258155822754, 1.760349988937378, 2.1452741622924805, 2.530198097229004, 2.9151222705841064, 3.300046443939209, 3.6849706172943115, 4.069894790649414, 4.4548187255859375, 4.839742660522461, 5.224667072296143, 5.609591007232666, 5.994515419006348, 6.379439353942871, 6.7643632888793945, 7.149287700653076, 7.5342116355896, 7.919136047363281, 8.304059982299805, 8.688983917236328, 9.073907852172852, 9.458831787109375, 9.843755722045898, 10.228679656982422, 10.613603591918945, 10.998528480529785, 11.383452415466309, 11.768376350402832, 12.153300285339355, 12.538225173950195]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 6.0, 9.0, 12.0, 12.0, 12.0, 21.0, 24.0, 21.0, 40.0, 34.0, 31.0, 37.0, 43.0, 51.0, 44.0, 49.0, 46.0, 43.0, 50.0, 38.0, 46.0, 47.0, 42.0, 25.0, 25.0, 31.0, 26.0, 22.0, 17.0, 20.0, 15.0, 17.0, 5.0, 10.0, 3.0, 10.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.3031463623046875, -1.262542724609375, -1.2219390869140625, -1.18133544921875, -1.1407318115234375, -1.100128173828125, -1.0595245361328125, -1.0189208984375, -0.9783172607421875, -0.937713623046875, -0.8971099853515625, -0.85650634765625, -0.8159027099609375, -0.775299072265625, -0.7346954345703125, -0.694091796875, -0.6534881591796875, -0.612884521484375, -0.5722808837890625, -0.53167724609375, -0.4910736083984375, -0.450469970703125, -0.4098663330078125, -0.3692626953125, -0.3286590576171875, -0.288055419921875, -0.2474517822265625, -0.20684814453125, -0.1662445068359375, -0.125640869140625, -0.0850372314453125, -0.04443359375, -0.0038299560546875, 0.036773681640625, 0.0773773193359375, 0.11798095703125, 0.1585845947265625, 0.199188232421875, 0.2397918701171875, 0.2803955078125, 0.3209991455078125, 0.361602783203125, 0.4022064208984375, 0.44281005859375, 0.4834136962890625, 0.524017333984375, 0.5646209716796875, 0.605224609375, 0.6458282470703125, 0.686431884765625, 0.7270355224609375, 0.76763916015625, 0.8082427978515625, 0.848846435546875, 0.8894500732421875, 0.9300537109375, 0.9706573486328125, 1.011260986328125, 1.0518646240234375, 1.09246826171875, 1.1330718994140625, 1.173675537109375, 1.2142791748046875, 1.2548828125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 17.0, 15.0, 14.0, 34.0, 40.0, 48.0, 82.0, 142.0, 228.0, 386.0, 822.0, 1478.0, 3171.0, 7109.0, 18063.0, 70646.0, 3877735.0, 174202.0, 23461.0, 8620.0, 3850.0, 1915.0, 926.0, 556.0, 256.0, 129.0, 118.0, 54.0, 35.0, 31.0, 19.0, 18.0, 8.0, 12.0, 10.0, 8.0, 2.0, 0.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.48046875, -7.25799560546875, -7.0355224609375, -6.81304931640625, -6.590576171875, -6.36810302734375, -6.1456298828125, -5.92315673828125, -5.70068359375, -5.47821044921875, -5.2557373046875, -5.03326416015625, -4.810791015625, -4.58831787109375, -4.3658447265625, -4.14337158203125, -3.9208984375, -3.69842529296875, -3.4759521484375, -3.25347900390625, -3.031005859375, -2.80853271484375, -2.5860595703125, -2.36358642578125, -2.14111328125, -1.91864013671875, -1.6961669921875, -1.47369384765625, -1.251220703125, -1.02874755859375, -0.8062744140625, -0.58380126953125, -0.361328125, -0.13885498046875, 0.0836181640625, 0.30609130859375, 0.528564453125, 0.75103759765625, 0.9735107421875, 1.19598388671875, 1.41845703125, 1.64093017578125, 1.8634033203125, 2.08587646484375, 2.308349609375, 2.53082275390625, 2.7532958984375, 2.97576904296875, 3.1982421875, 3.42071533203125, 3.6431884765625, 3.86566162109375, 4.088134765625, 4.31060791015625, 4.5330810546875, 4.75555419921875, 4.97802734375, 5.20050048828125, 5.4229736328125, 5.64544677734375, 5.867919921875, 6.09039306640625, 6.3128662109375, 6.53533935546875, 6.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 5.0, 9.0, 10.0, 12.0, 15.0, 18.0, 22.0, 22.0, 26.0, 43.0, 63.0, 147.0, 432.0, 1266.0, 1181.0, 428.0, 130.0, 58.0, 35.0, 19.0, 27.0, 17.0, 14.0, 17.0, 10.0, 9.0, 2.0, 11.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.92578125, -3.7801513671875, -3.634521484375, -3.4888916015625, -3.34326171875, -3.1976318359375, -3.052001953125, -2.9063720703125, -2.7607421875, -2.6151123046875, -2.469482421875, -2.3238525390625, -2.17822265625, -2.0325927734375, -1.886962890625, -1.7413330078125, -1.595703125, -1.4500732421875, -1.304443359375, -1.1588134765625, -1.01318359375, -0.8675537109375, -0.721923828125, -0.5762939453125, -0.4306640625, -0.2850341796875, -0.139404296875, 0.0062255859375, 0.15185546875, 0.2974853515625, 0.443115234375, 0.5887451171875, 0.734375, 0.8800048828125, 1.025634765625, 1.1712646484375, 1.31689453125, 1.4625244140625, 1.608154296875, 1.7537841796875, 1.8994140625, 2.0450439453125, 2.190673828125, 2.3363037109375, 2.48193359375, 2.6275634765625, 2.773193359375, 2.9188232421875, 3.064453125, 3.2100830078125, 3.355712890625, 3.5013427734375, 3.64697265625, 3.7926025390625, 3.938232421875, 4.0838623046875, 4.2294921875, 4.3751220703125, 4.520751953125, 4.6663818359375, 4.81201171875, 4.9576416015625, 5.103271484375, 5.2489013671875, 5.39453125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 6.0, 16.0, 27.0, 43.0, 51.0, 88.0, 117.0, 164.0, 242.0, 401.0, 760.0, 1341.0, 2420.0, 5066.0, 11237.0, 26800.0, 86926.0, 3306587.0, 661423.0, 53493.0, 19790.0, 8540.0, 4110.0, 1990.0, 1033.0, 578.0, 383.0, 215.0, 155.0, 89.0, 50.0, 30.0, 32.0, 15.0, 17.0, 11.0, 9.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.9140625, -6.6563720703125, -6.398681640625, -6.1409912109375, -5.88330078125, -5.6256103515625, -5.367919921875, -5.1102294921875, -4.8525390625, -4.5948486328125, -4.337158203125, -4.0794677734375, -3.82177734375, -3.5640869140625, -3.306396484375, -3.0487060546875, -2.791015625, -2.5333251953125, -2.275634765625, -2.0179443359375, -1.76025390625, -1.5025634765625, -1.244873046875, -0.9871826171875, -0.7294921875, -0.4718017578125, -0.214111328125, 0.0435791015625, 0.30126953125, 0.5589599609375, 0.816650390625, 1.0743408203125, 1.33203125, 1.5897216796875, 1.847412109375, 2.1051025390625, 2.36279296875, 2.6204833984375, 2.878173828125, 3.1358642578125, 3.3935546875, 3.6512451171875, 3.908935546875, 4.1666259765625, 4.42431640625, 4.6820068359375, 4.939697265625, 5.1973876953125, 5.455078125, 5.7127685546875, 5.970458984375, 6.2281494140625, 6.48583984375, 6.7435302734375, 7.001220703125, 7.2589111328125, 7.5166015625, 7.7742919921875, 8.031982421875, 8.2896728515625, 8.54736328125, 8.8050537109375, 9.062744140625, 9.3204345703125, 9.578125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 17.0, 15.0, 25.0, 67.0, 101.0, 210.0, 285.0, 141.0, 58.0, 41.0, 22.0, 12.0, 7.0, 4.0, 1.0, 1.0, 2.0], "bins": [-48.79997253417969, -47.88185501098633, -46.963741302490234, -46.045623779296875, -45.127506256103516, -44.20939254760742, -43.29127502441406, -42.3731575012207, -41.45504379272461, -40.53692626953125, -39.618812561035156, -38.7006950378418, -37.78257751464844, -36.864463806152344, -35.946346282958984, -35.028228759765625, -34.110111236572266, -33.191993713378906, -32.27388000488281, -31.355762481689453, -30.437646865844727, -29.519529342651367, -28.60141372680664, -27.68329620361328, -26.765182495117188, -25.84706687927246, -24.9289493560791, -24.010833740234375, -23.09271812438965, -22.17460060119629, -21.256484985351562, -20.338367462158203, -19.42025375366211, -18.502138137817383, -17.584020614624023, -16.665904998779297, -15.747788429260254, -14.829671859741211, -13.911556243896484, -12.993439674377441, -12.075323104858398, -11.157206535339355, -10.239090919494629, -9.320974349975586, -8.402857780456543, -7.484741687774658, -6.566625595092773, -5.6485090255737305, -4.7303924560546875, -3.8122761249542236, -2.8941597938537598, -1.976043701171875, -1.0579273700714111, -0.13981103897094727, 0.7783050537109375, 1.6964216232299805, 2.6145377159118652, 3.532654047012329, 4.450770378112793, 5.368886470794678, 6.2870025634765625, 7.2051191329956055, 8.123235702514648, 9.041351318359375, 9.959467887878418]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 12.0, 9.0, 16.0, 12.0, 12.0, 15.0, 21.0, 36.0, 25.0, 26.0, 32.0, 34.0, 38.0, 35.0, 29.0, 44.0, 38.0, 38.0, 35.0, 25.0, 40.0, 36.0, 29.0, 35.0, 43.0, 30.0, 28.0, 34.0, 16.0, 17.0, 23.0, 15.0, 16.0, 15.0, 11.0, 12.0, 5.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.914299011230469, -8.620478630065918, -8.32665729522705, -8.0328369140625, -7.739016056060791, -7.445195198059082, -7.151374816894531, -6.857553958892822, -6.563733100891113, -6.269912242889404, -5.976091384887695, -5.6822710037231445, -5.3884501457214355, -5.094629287719727, -4.800808906555176, -4.506988048553467, -4.213167190551758, -3.919346332550049, -3.625525712966919, -3.331705093383789, -3.03788423538208, -2.744063377380371, -2.450242757797241, -2.1564221382141113, -1.8626012802124023, -1.568780541419983, -1.2749598026275635, -0.981139063835144, -0.6873183250427246, -0.3934975862503052, -0.09967684745788574, 0.19414377212524414, 0.4879646301269531, 0.7817853689193726, 1.075606107711792, 1.3694268465042114, 1.6632475852966309, 1.9570683240890503, 2.2508890628814697, 2.5447096824645996, 2.8385305404663086, 3.1323513984680176, 3.4261720180511475, 3.7199926376342773, 4.013813495635986, 4.307634353637695, 4.601454734802246, 4.895275592803955, 5.189096450805664, 5.482917308807373, 5.776738166809082, 6.070558547973633, 6.364379405975342, 6.658200263977051, 6.952020645141602, 7.2458415031433105, 7.5396623611450195, 7.8334832191467285, 8.127304077148438, 8.421124458312988, 8.714944839477539, 9.008766174316406, 9.302586555480957, 9.596406936645508, 9.890228271484375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 7.0, 6.0, 11.0, 9.0, 22.0, 22.0, 13.0, 24.0, 24.0, 27.0, 31.0, 38.0, 40.0, 47.0, 33.0, 47.0, 35.0, 46.0, 42.0, 41.0, 38.0, 35.0, 28.0, 34.0, 37.0, 36.0, 34.0, 20.0, 26.0, 24.0, 16.0, 12.0, 17.0, 13.0, 10.0, 7.0, 4.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.2861328125, -1.2493438720703125, -1.212554931640625, -1.1757659912109375, -1.13897705078125, -1.1021881103515625, -1.065399169921875, -1.0286102294921875, -0.9918212890625, -0.9550323486328125, -0.918243408203125, -0.8814544677734375, -0.84466552734375, -0.8078765869140625, -0.771087646484375, -0.7342987060546875, -0.697509765625, -0.6607208251953125, -0.623931884765625, -0.5871429443359375, -0.55035400390625, -0.5135650634765625, -0.476776123046875, -0.4399871826171875, -0.4031982421875, -0.3664093017578125, -0.329620361328125, -0.2928314208984375, -0.25604248046875, -0.2192535400390625, -0.182464599609375, -0.1456756591796875, -0.10888671875, -0.0720977783203125, -0.035308837890625, 0.0014801025390625, 0.03826904296875, 0.0750579833984375, 0.111846923828125, 0.1486358642578125, 0.1854248046875, 0.2222137451171875, 0.259002685546875, 0.2957916259765625, 0.33258056640625, 0.3693695068359375, 0.406158447265625, 0.4429473876953125, 0.479736328125, 0.5165252685546875, 0.553314208984375, 0.5901031494140625, 0.62689208984375, 0.6636810302734375, 0.700469970703125, 0.7372589111328125, 0.7740478515625, 0.8108367919921875, 0.847625732421875, 0.8844146728515625, 0.92120361328125, 0.9579925537109375, 0.994781494140625, 1.0315704345703125, 1.068359375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 11.0, 18.0, 27.0, 25.0, 45.0, 85.0, 90.0, 143.0, 235.0, 366.0, 548.0, 807.0, 1263.0, 1940.0, 2933.0, 4698.0, 7583.0, 11996.0, 19805.0, 33337.0, 58787.0, 111773.0, 257922.0, 270008.0, 115800.0, 60050.0, 34440.0, 20284.0, 12248.0, 7803.0, 4729.0, 3099.0, 1967.0, 1272.0, 783.0, 587.0, 353.0, 234.0, 167.0, 91.0, 57.0, 55.0, 37.0, 20.0, 12.0, 7.0, 6.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.6669921875, -1.6179962158203125, -1.569000244140625, -1.5200042724609375, -1.47100830078125, -1.4220123291015625, -1.373016357421875, -1.3240203857421875, -1.2750244140625, -1.2260284423828125, -1.177032470703125, -1.1280364990234375, -1.07904052734375, -1.0300445556640625, -0.981048583984375, -0.9320526123046875, -0.883056640625, -0.8340606689453125, -0.785064697265625, -0.7360687255859375, -0.68707275390625, -0.6380767822265625, -0.589080810546875, -0.5400848388671875, -0.4910888671875, -0.4420928955078125, -0.393096923828125, -0.3441009521484375, -0.29510498046875, -0.2461090087890625, -0.197113037109375, -0.1481170654296875, -0.09912109375, -0.0501251220703125, -0.001129150390625, 0.0478668212890625, 0.09686279296875, 0.1458587646484375, 0.194854736328125, 0.2438507080078125, 0.2928466796875, 0.3418426513671875, 0.390838623046875, 0.4398345947265625, 0.48883056640625, 0.5378265380859375, 0.586822509765625, 0.6358184814453125, 0.684814453125, 0.7338104248046875, 0.782806396484375, 0.8318023681640625, 0.88079833984375, 0.9297943115234375, 0.978790283203125, 1.0277862548828125, 1.0767822265625, 1.1257781982421875, 1.174774169921875, 1.2237701416015625, 1.27276611328125, 1.3217620849609375, 1.370758056640625, 1.4197540283203125, 1.46875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 4.0, 12.0, 8.0, 20.0, 10.0, 13.0, 14.0, 21.0, 25.0, 23.0, 23.0, 43.0, 45.0, 42.0, 44.0, 58.0, 65.0, 1073.0, 52.0, 46.0, 43.0, 46.0, 41.0, 43.0, 38.0, 32.0, 19.0, 15.0, 15.0, 20.0, 13.0, 14.0, 10.0, 8.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.76763916015625, -1.7110595703125, -1.65447998046875, -1.597900390625, -1.54132080078125, -1.4847412109375, -1.42816162109375, -1.37158203125, -1.31500244140625, -1.2584228515625, -1.20184326171875, -1.145263671875, -1.08868408203125, -1.0321044921875, -0.97552490234375, -0.9189453125, -0.86236572265625, -0.8057861328125, -0.74920654296875, -0.692626953125, -0.63604736328125, -0.5794677734375, -0.52288818359375, -0.46630859375, -0.40972900390625, -0.3531494140625, -0.29656982421875, -0.239990234375, -0.18341064453125, -0.1268310546875, -0.07025146484375, -0.013671875, 0.04290771484375, 0.0994873046875, 0.15606689453125, 0.212646484375, 0.26922607421875, 0.3258056640625, 0.38238525390625, 0.43896484375, 0.49554443359375, 0.5521240234375, 0.60870361328125, 0.665283203125, 0.72186279296875, 0.7784423828125, 0.83502197265625, 0.8916015625, 0.94818115234375, 1.0047607421875, 1.06134033203125, 1.117919921875, 1.17449951171875, 1.2310791015625, 1.28765869140625, 1.34423828125, 1.40081787109375, 1.4573974609375, 1.51397705078125, 1.570556640625, 1.62713623046875, 1.6837158203125, 1.74029541015625, 1.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 10.0, 15.0, 15.0, 26.0, 25.0, 37.0, 74.0, 70.0, 118.0, 163.0, 218.0, 320.0, 497.0, 719.0, 1089.0, 1546.0, 2375.0, 3647.0, 6074.0, 10920.0, 22075.0, 69020.0, 1691503.0, 213563.0, 35984.0, 15110.0, 8111.0, 4725.0, 2992.0, 1966.0, 1336.0, 912.0, 596.0, 393.0, 257.0, 188.0, 128.0, 103.0, 71.0, 40.0, 33.0, 23.0, 11.0, 15.0, 8.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.982421875, -2.891357421875, -2.80029296875, -2.709228515625, -2.6181640625, -2.527099609375, -2.43603515625, -2.344970703125, -2.25390625, -2.162841796875, -2.07177734375, -1.980712890625, -1.8896484375, -1.798583984375, -1.70751953125, -1.616455078125, -1.525390625, -1.434326171875, -1.34326171875, -1.252197265625, -1.1611328125, -1.070068359375, -0.97900390625, -0.887939453125, -0.796875, -0.705810546875, -0.61474609375, -0.523681640625, -0.4326171875, -0.341552734375, -0.25048828125, -0.159423828125, -0.068359375, 0.022705078125, 0.11376953125, 0.204833984375, 0.2958984375, 0.386962890625, 0.47802734375, 0.569091796875, 0.66015625, 0.751220703125, 0.84228515625, 0.933349609375, 1.0244140625, 1.115478515625, 1.20654296875, 1.297607421875, 1.388671875, 1.479736328125, 1.57080078125, 1.661865234375, 1.7529296875, 1.843994140625, 1.93505859375, 2.026123046875, 2.1171875, 2.208251953125, 2.29931640625, 2.390380859375, 2.4814453125, 2.572509765625, 2.66357421875, 2.754638671875, 2.845703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 10.0, 3.0, 13.0, 18.0, 23.0, 29.0, 67.0, 81.0, 127.0, 167.0, 136.0, 86.0, 77.0, 54.0, 34.0, 18.0, 12.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.418212890625, -0.4041404724121094, -0.39006805419921875, -0.3759956359863281, -0.3619232177734375, -0.3478507995605469, -0.33377838134765625, -0.3197059631347656, -0.305633544921875, -0.2915611267089844, -0.27748870849609375, -0.2634162902832031, -0.2493438720703125, -0.23527145385742188, -0.22119903564453125, -0.20712661743164062, -0.19305419921875, -0.17898178100585938, -0.16490936279296875, -0.15083694458007812, -0.1367645263671875, -0.12269210815429688, -0.10861968994140625, -0.09454727172851562, -0.080474853515625, -0.06640243530273438, -0.05233001708984375, -0.038257598876953125, -0.0241851806640625, -0.010112762451171875, 0.00395965576171875, 0.018032073974609375, 0.0321044921875, 0.046176910400390625, 0.06024932861328125, 0.07432174682617188, 0.0883941650390625, 0.10246658325195312, 0.11653900146484375, 0.13061141967773438, 0.144683837890625, 0.15875625610351562, 0.17282867431640625, 0.18690109252929688, 0.2009735107421875, 0.21504592895507812, 0.22911834716796875, 0.24319076538085938, 0.25726318359375, 0.2713356018066406, 0.28540802001953125, 0.2994804382324219, 0.3135528564453125, 0.3276252746582031, 0.34169769287109375, 0.3557701110839844, 0.369842529296875, 0.3839149475097656, 0.39798736572265625, 0.4120597839355469, 0.4261322021484375, 0.4402046203613281, 0.45427703857421875, 0.4683494567871094, 0.482421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 11.0, 5.0, 8.0, 5.0, 7.0, 14.0, 28.0, 24.0, 33.0, 66.0, 95.0, 218.0, 534.0, 1622.0, 7015.0, 614378.0, 415254.0, 6667.0, 1554.0, 494.0, 190.0, 110.0, 55.0, 31.0, 24.0, 12.0, 11.0, 10.0, 5.0, 7.0, 6.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.42578125, -5.24481201171875, -5.0638427734375, -4.88287353515625, -4.701904296875, -4.52093505859375, -4.3399658203125, -4.15899658203125, -3.97802734375, -3.79705810546875, -3.6160888671875, -3.43511962890625, -3.254150390625, -3.07318115234375, -2.8922119140625, -2.71124267578125, -2.5302734375, -2.34930419921875, -2.1683349609375, -1.98736572265625, -1.806396484375, -1.62542724609375, -1.4444580078125, -1.26348876953125, -1.08251953125, -0.90155029296875, -0.7205810546875, -0.53961181640625, -0.358642578125, -0.17767333984375, 0.0032958984375, 0.18426513671875, 0.365234375, 0.54620361328125, 0.7271728515625, 0.90814208984375, 1.089111328125, 1.27008056640625, 1.4510498046875, 1.63201904296875, 1.81298828125, 1.99395751953125, 2.1749267578125, 2.35589599609375, 2.536865234375, 2.71783447265625, 2.8988037109375, 3.07977294921875, 3.2607421875, 3.44171142578125, 3.6226806640625, 3.80364990234375, 3.984619140625, 4.16558837890625, 4.3465576171875, 4.52752685546875, 4.70849609375, 4.88946533203125, 5.0704345703125, 5.25140380859375, 5.432373046875, 5.61334228515625, 5.7943115234375, 5.97528076171875, 6.15625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 24.0, 34.0, 74.0, 250.0, 426.0, 119.0, 45.0, 18.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6664323806762695, -5.541020393371582, -5.4156084060668945, -5.290196418762207, -5.1647844314575195, -5.039371967315674, -4.913959980010986, -4.788547992706299, -4.663136005401611, -4.537724018096924, -4.412312030792236, -4.286900043487549, -4.161487579345703, -4.036075592041016, -3.910663604736328, -3.7852516174316406, -3.659839630126953, -3.5344276428222656, -3.409015655517578, -3.2836034297943115, -3.158191442489624, -3.0327794551849365, -2.90736722946167, -2.7819552421569824, -2.656543254852295, -2.5311312675476074, -2.40571928024292, -2.2803070545196533, -2.154895067214966, -2.0294830799102783, -1.9040709733963013, -1.7786588668823242, -1.653247356414795, -1.5278353691101074, -1.4024232625961304, -1.2770111560821533, -1.1515991687774658, -1.0261871814727783, -0.9007750749588013, -0.775363028049469, -0.6499509811401367, -0.5245389342308044, -0.39912688732147217, -0.2737148404121399, -0.14830279350280762, -0.022890746593475342, 0.10252130031585693, 0.2279333472251892, 0.3533453941345215, 0.47875744104385376, 0.604169487953186, 0.7295815348625183, 0.8549935817718506, 0.9804056286811829, 1.1058176755905151, 1.2312297821044922, 1.3566417694091797, 1.4820537567138672, 1.6074658632278442, 1.7328779697418213, 1.8582899570465088, 1.9837019443511963, 2.109114170074463, 2.2345261573791504, 2.359938144683838]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 9.0, 12.0, 10.0, 12.0, 19.0, 22.0, 21.0, 26.0, 24.0, 28.0, 32.0, 33.0, 61.0, 47.0, 46.0, 42.0, 36.0, 37.0, 42.0, 48.0, 29.0, 42.0, 37.0, 33.0, 37.0, 39.0, 27.0, 20.0, 20.0, 22.0, 20.0, 8.0, 11.0, 10.0, 7.0, 9.0, 4.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.168479323387146, -1.1367031335830688, -1.1049270629882812, -1.073150873184204, -1.0413748025894165, -1.0095986127853394, -0.9778225421905518, -0.9460463523864746, -0.914270281791687, -0.8824941515922546, -0.8507180213928223, -0.8189418911933899, -0.7871657609939575, -0.7553896307945251, -0.7236135005950928, -0.6918373107910156, -0.6600611805915833, -0.6282850503921509, -0.5965089201927185, -0.5647327899932861, -0.5329566597938538, -0.5011805295944214, -0.4694043695926666, -0.43762823939323425, -0.4058521091938019, -0.3740759789943695, -0.34229984879493713, -0.3105236887931824, -0.27874755859375, -0.24697144329547882, -0.21519529819488525, -0.18341916799545288, -0.15164297819137573, -0.11986684799194336, -0.08809071034193039, -0.05631457269191742, -0.024538442492485046, 0.007237687706947327, 0.039013832807540894, 0.07078996300697327, 0.10256609320640564, 0.134342223405838, 0.16611835360527039, 0.19789449870586395, 0.22967062890529633, 0.2614467740058899, 0.29322290420532227, 0.32499903440475464, 0.356775164604187, 0.3885512948036194, 0.42032742500305176, 0.45210355520248413, 0.4838796854019165, 0.5156558156013489, 0.5474319458007812, 0.5792081356048584, 0.610984206199646, 0.6427603363990784, 0.6745364665985107, 0.7063125967979431, 0.7380887269973755, 0.7698648571968079, 0.8016409873962402, 0.8334171772003174, 0.8651933073997498]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 15.0, 6.0, 9.0, 6.0, 12.0, 22.0, 15.0, 27.0, 13.0, 27.0, 32.0, 31.0, 37.0, 42.0, 42.0, 46.0, 35.0, 35.0, 44.0, 44.0, 41.0, 33.0, 35.0, 30.0, 44.0, 33.0, 32.0, 32.0, 22.0, 28.0, 19.0, 16.0, 15.0, 13.0, 10.0, 9.0, 6.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.2763671875, -1.239654541015625, -1.20294189453125, -1.166229248046875, -1.1295166015625, -1.092803955078125, -1.05609130859375, -1.019378662109375, -0.982666015625, -0.945953369140625, -0.90924072265625, -0.872528076171875, -0.8358154296875, -0.799102783203125, -0.76239013671875, -0.725677490234375, -0.68896484375, -0.652252197265625, -0.61553955078125, -0.578826904296875, -0.5421142578125, -0.505401611328125, -0.46868896484375, -0.431976318359375, -0.395263671875, -0.358551025390625, -0.32183837890625, -0.285125732421875, -0.2484130859375, -0.211700439453125, -0.17498779296875, -0.138275146484375, -0.1015625, -0.064849853515625, -0.02813720703125, 0.008575439453125, 0.0452880859375, 0.082000732421875, 0.11871337890625, 0.155426025390625, 0.192138671875, 0.228851318359375, 0.26556396484375, 0.302276611328125, 0.3389892578125, 0.375701904296875, 0.41241455078125, 0.449127197265625, 0.48583984375, 0.522552490234375, 0.55926513671875, 0.595977783203125, 0.6326904296875, 0.669403076171875, 0.70611572265625, 0.742828369140625, 0.779541015625, 0.816253662109375, 0.85296630859375, 0.889678955078125, 0.9263916015625, 0.963104248046875, 0.99981689453125, 1.036529541015625, 1.0732421875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 9.0, 17.0, 9.0, 24.0, 44.0, 61.0, 64.0, 102.0, 159.0, 207.0, 293.0, 433.0, 619.0, 970.0, 1485.0, 2333.0, 3918.0, 6952.0, 13080.0, 26952.0, 61309.0, 182212.0, 463409.0, 169688.0, 58824.0, 25598.0, 12548.0, 6736.0, 3794.0, 2283.0, 1454.0, 905.0, 635.0, 433.0, 274.0, 224.0, 135.0, 106.0, 78.0, 49.0, 33.0, 22.0, 24.0, 17.0, 7.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0], "bins": [-1.2119140625, -1.1767578125, -1.1416015625, -1.1064453125, -1.0712890625, -1.0361328125, -1.0009765625, -0.9658203125, -0.9306640625, -0.8955078125, -0.8603515625, -0.8251953125, -0.7900390625, -0.7548828125, -0.7197265625, -0.6845703125, -0.6494140625, -0.6142578125, -0.5791015625, -0.5439453125, -0.5087890625, -0.4736328125, -0.4384765625, -0.4033203125, -0.3681640625, -0.3330078125, -0.2978515625, -0.2626953125, -0.2275390625, -0.1923828125, -0.1572265625, -0.1220703125, -0.0869140625, -0.0517578125, -0.0166015625, 0.0185546875, 0.0537109375, 0.0888671875, 0.1240234375, 0.1591796875, 0.1943359375, 0.2294921875, 0.2646484375, 0.2998046875, 0.3349609375, 0.3701171875, 0.4052734375, 0.4404296875, 0.4755859375, 0.5107421875, 0.5458984375, 0.5810546875, 0.6162109375, 0.6513671875, 0.6865234375, 0.7216796875, 0.7568359375, 0.7919921875, 0.8271484375, 0.8623046875, 0.8974609375, 0.9326171875, 0.9677734375, 1.0029296875, 1.0380859375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 6.0, 11.0, 20.0, 26.0, 10.0, 20.0, 23.0, 33.0, 38.0, 45.0, 35.0, 48.0, 51.0, 70.0, 120.0, 376.0, 1488.0, 120.0, 79.0, 63.0, 49.0, 30.0, 30.0, 36.0, 19.0, 17.0, 27.0, 27.0, 16.0, 17.0, 18.0, 11.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.0491943359375, -3.918701171875, -3.7882080078125, -3.65771484375, -3.5272216796875, -3.396728515625, -3.2662353515625, -3.1357421875, -3.0052490234375, -2.874755859375, -2.7442626953125, -2.61376953125, -2.4832763671875, -2.352783203125, -2.2222900390625, -2.091796875, -1.9613037109375, -1.830810546875, -1.7003173828125, -1.56982421875, -1.4393310546875, -1.308837890625, -1.1783447265625, -1.0478515625, -0.9173583984375, -0.786865234375, -0.6563720703125, -0.52587890625, -0.3953857421875, -0.264892578125, -0.1343994140625, -0.00390625, 0.1265869140625, 0.257080078125, 0.3875732421875, 0.51806640625, 0.6485595703125, 0.779052734375, 0.9095458984375, 1.0400390625, 1.1705322265625, 1.301025390625, 1.4315185546875, 1.56201171875, 1.6925048828125, 1.822998046875, 1.9534912109375, 2.083984375, 2.2144775390625, 2.344970703125, 2.4754638671875, 2.60595703125, 2.7364501953125, 2.866943359375, 2.9974365234375, 3.1279296875, 3.2584228515625, 3.388916015625, 3.5194091796875, 3.64990234375, 3.7803955078125, 3.910888671875, 4.0413818359375, 4.171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 6.0, 10.0, 3.0, 12.0, 24.0, 14.0, 14.0, 32.0, 22.0, 40.0, 34.0, 80.0, 138.0, 239.0, 539.0, 1481.0, 5117.0, 28509.0, 419764.0, 2605435.0, 70213.0, 9793.0, 2404.0, 850.0, 374.0, 169.0, 120.0, 54.0, 43.0, 29.0, 22.0, 16.0, 23.0, 12.0, 15.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.51953125, -4.35931396484375, -4.1990966796875, -4.03887939453125, -3.878662109375, -3.71844482421875, -3.5582275390625, -3.39801025390625, -3.23779296875, -3.07757568359375, -2.9173583984375, -2.75714111328125, -2.596923828125, -2.43670654296875, -2.2764892578125, -2.11627197265625, -1.9560546875, -1.79583740234375, -1.6356201171875, -1.47540283203125, -1.315185546875, -1.15496826171875, -0.9947509765625, -0.83453369140625, -0.67431640625, -0.51409912109375, -0.3538818359375, -0.19366455078125, -0.033447265625, 0.12677001953125, 0.2869873046875, 0.44720458984375, 0.607421875, 0.76763916015625, 0.9278564453125, 1.08807373046875, 1.248291015625, 1.40850830078125, 1.5687255859375, 1.72894287109375, 1.88916015625, 2.04937744140625, 2.2095947265625, 2.36981201171875, 2.530029296875, 2.69024658203125, 2.8504638671875, 3.01068115234375, 3.1708984375, 3.33111572265625, 3.4913330078125, 3.65155029296875, 3.811767578125, 3.97198486328125, 4.1322021484375, 4.29241943359375, 4.45263671875, 4.61285400390625, 4.7730712890625, 4.93328857421875, 5.093505859375, 5.25372314453125, 5.4139404296875, 5.57415771484375, 5.734375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 20.0, 959.0, 40.0], "bins": [-216.15628051757812, -212.6983184814453, -209.2403564453125, -205.7823944091797, -202.32444763183594, -198.86648559570312, -195.4085235595703, -191.9505615234375, -188.4925994873047, -185.03463745117188, -181.57667541503906, -178.11871337890625, -174.6607666015625, -171.2028045654297, -167.74484252929688, -164.28688049316406, -160.82891845703125, -157.37095642089844, -153.91299438476562, -150.4550323486328, -146.99708557128906, -143.53912353515625, -140.08116149902344, -136.62319946289062, -133.1652374267578, -129.707275390625, -126.24932098388672, -122.7913589477539, -119.3333969116211, -115.87544250488281, -112.41748046875, -108.95951843261719, -105.5015640258789, -102.0436019897461, -98.58564758300781, -95.127685546875, -91.66972351074219, -88.21176147460938, -84.7538070678711, -81.29584503173828, -77.837890625, -74.37992858886719, -70.9219741821289, -67.4640121459961, -64.00605010986328, -60.548091888427734, -57.09013366699219, -53.632171630859375, -50.17420959472656, -46.716251373291016, -43.2582893371582, -39.800331115722656, -36.342369079589844, -32.8844108581543, -29.426450729370117, -25.968490600585938, -22.510528564453125, -19.052568435668945, -15.594608306884766, -12.136649131774902, -8.678689002990723, -5.220729827880859, -1.7627696990966797, 1.6951904296875, 5.15315055847168]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 14.0, 13.0, 23.0, 19.0, 28.0, 19.0, 26.0, 24.0, 27.0, 38.0, 21.0, 43.0, 34.0, 39.0, 39.0, 51.0, 26.0, 46.0, 44.0, 37.0, 41.0, 44.0, 31.0, 29.0, 23.0, 25.0, 18.0, 28.0, 29.0, 14.0, 16.0, 13.0, 9.0, 12.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.658852577209473, -15.231025695800781, -14.803197860717773, -14.375370979309082, -13.94754409790039, -13.519716262817383, -13.091889381408691, -12.6640625, -12.236234664916992, -11.8084077835083, -11.380579948425293, -10.952753067016602, -10.52492618560791, -10.097099304199219, -9.669271469116211, -9.24144458770752, -8.813617706298828, -8.385790824890137, -7.957963466644287, -7.5301361083984375, -7.102309226989746, -6.6744818687438965, -6.246654510498047, -5.8188276290893555, -5.391000270843506, -4.963172912597656, -4.535346031188965, -4.107518672943115, -3.6796915531158447, -3.251864433288574, -2.8240370750427246, -2.396209955215454, -1.9683818817138672, -1.5405547618865967, -1.1127275228500366, -0.6849002838134766, -0.25707316398620605, 0.17075395584106445, 0.5985813140869141, 1.0264084339141846, 1.454235553741455, 1.8820626735687256, 2.309889793395996, 2.7377171516418457, 3.165544271469116, 3.5933713912963867, 4.021198749542236, 4.449026107788086, 4.876852989196777, 5.304680347442627, 5.732507228851318, 6.160334587097168, 6.588161468505859, 7.015988826751709, 7.443816184997559, 7.87164306640625, 8.299470901489258, 8.72729778289795, 9.155125617980957, 9.582952499389648, 10.01077938079834, 10.438606262207031, 10.866434097290039, 11.29426097869873, 11.722087860107422]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 10.0, 6.0, 13.0, 13.0, 13.0, 18.0, 19.0, 14.0, 24.0, 34.0, 25.0, 41.0, 45.0, 40.0, 28.0, 42.0, 51.0, 41.0, 40.0, 33.0, 36.0, 33.0, 36.0, 32.0, 36.0, 36.0, 39.0, 29.0, 23.0, 24.0, 20.0, 10.0, 12.0, 8.0, 8.0, 10.0, 7.0, 4.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.3203125, -1.282806396484375, -1.24530029296875, -1.207794189453125, -1.1702880859375, -1.132781982421875, -1.09527587890625, -1.057769775390625, -1.020263671875, -0.982757568359375, -0.94525146484375, -0.907745361328125, -0.8702392578125, -0.832733154296875, -0.79522705078125, -0.757720947265625, -0.72021484375, -0.682708740234375, -0.64520263671875, -0.607696533203125, -0.5701904296875, -0.532684326171875, -0.49517822265625, -0.457672119140625, -0.420166015625, -0.382659912109375, -0.34515380859375, -0.307647705078125, -0.2701416015625, -0.232635498046875, -0.19512939453125, -0.157623291015625, -0.1201171875, -0.082611083984375, -0.04510498046875, -0.007598876953125, 0.0299072265625, 0.067413330078125, 0.10491943359375, 0.142425537109375, 0.179931640625, 0.217437744140625, 0.25494384765625, 0.292449951171875, 0.3299560546875, 0.367462158203125, 0.40496826171875, 0.442474365234375, 0.47998046875, 0.517486572265625, 0.55499267578125, 0.592498779296875, 0.6300048828125, 0.667510986328125, 0.70501708984375, 0.742523193359375, 0.780029296875, 0.817535400390625, 0.85504150390625, 0.892547607421875, 0.9300537109375, 0.967559814453125, 1.00506591796875, 1.042572021484375, 1.080078125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 13.0, 15.0, 14.0, 16.0, 25.0, 45.0, 56.0, 54.0, 81.0, 141.0, 176.0, 251.0, 415.0, 659.0, 1109.0, 1749.0, 3122.0, 5223.0, 9909.0, 21056.0, 132767.0, 3636932.0, 327528.0, 26263.0, 11609.0, 6208.0, 3461.0, 2021.0, 1216.0, 752.0, 443.0, 271.0, 184.0, 135.0, 79.0, 67.0, 41.0, 37.0, 34.0, 23.0, 15.0, 12.0, 12.0, 13.0, 7.0, 4.0, 0.0, 6.0, 1.0, 1.0], "bins": [-5.4453125, -5.29241943359375, -5.1395263671875, -4.98663330078125, -4.833740234375, -4.68084716796875, -4.5279541015625, -4.37506103515625, -4.22216796875, -4.06927490234375, -3.9163818359375, -3.76348876953125, -3.610595703125, -3.45770263671875, -3.3048095703125, -3.15191650390625, -2.9990234375, -2.84613037109375, -2.6932373046875, -2.54034423828125, -2.387451171875, -2.23455810546875, -2.0816650390625, -1.92877197265625, -1.77587890625, -1.62298583984375, -1.4700927734375, -1.31719970703125, -1.164306640625, -1.01141357421875, -0.8585205078125, -0.70562744140625, -0.552734375, -0.39984130859375, -0.2469482421875, -0.09405517578125, 0.058837890625, 0.21173095703125, 0.3646240234375, 0.51751708984375, 0.67041015625, 0.82330322265625, 0.9761962890625, 1.12908935546875, 1.281982421875, 1.43487548828125, 1.5877685546875, 1.74066162109375, 1.8935546875, 2.04644775390625, 2.1993408203125, 2.35223388671875, 2.505126953125, 2.65802001953125, 2.8109130859375, 2.96380615234375, 3.11669921875, 3.26959228515625, 3.4224853515625, 3.57537841796875, 3.728271484375, 3.88116455078125, 4.0340576171875, 4.18695068359375, 4.33984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 18.0, 17.0, 16.0, 32.0, 27.0, 55.0, 89.0, 303.0, 1085.0, 1569.0, 483.0, 133.0, 64.0, 39.0, 26.0, 16.0, 18.0, 20.0, 8.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.3673095703125, -3.191650390625, -3.0159912109375, -2.84033203125, -2.6646728515625, -2.489013671875, -2.3133544921875, -2.1376953125, -1.9620361328125, -1.786376953125, -1.6107177734375, -1.43505859375, -1.2593994140625, -1.083740234375, -0.9080810546875, -0.732421875, -0.5567626953125, -0.381103515625, -0.2054443359375, -0.02978515625, 0.1458740234375, 0.321533203125, 0.4971923828125, 0.6728515625, 0.8485107421875, 1.024169921875, 1.1998291015625, 1.37548828125, 1.5511474609375, 1.726806640625, 1.9024658203125, 2.078125, 2.2537841796875, 2.429443359375, 2.6051025390625, 2.78076171875, 2.9564208984375, 3.132080078125, 3.3077392578125, 3.4833984375, 3.6590576171875, 3.834716796875, 4.0103759765625, 4.18603515625, 4.3616943359375, 4.537353515625, 4.7130126953125, 4.888671875, 5.0643310546875, 5.239990234375, 5.4156494140625, 5.59130859375, 5.7669677734375, 5.942626953125, 6.1182861328125, 6.2939453125, 6.4696044921875, 6.645263671875, 6.8209228515625, 6.99658203125, 7.1722412109375, 7.347900390625, 7.5235595703125, 7.69921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 7.0, 14.0, 4.0, 13.0, 29.0, 32.0, 41.0, 75.0, 142.0, 256.0, 468.0, 1028.0, 2227.0, 5407.0, 14835.0, 54133.0, 2787917.0, 1259906.0, 45635.0, 13318.0, 4835.0, 2016.0, 944.0, 427.0, 236.0, 129.0, 79.0, 34.0, 33.0, 15.0, 15.0, 11.0, 9.0, 5.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.4503173828125, -8.111572265625, -7.7728271484375, -7.43408203125, -7.0953369140625, -6.756591796875, -6.4178466796875, -6.0791015625, -5.7403564453125, -5.401611328125, -5.0628662109375, -4.72412109375, -4.3853759765625, -4.046630859375, -3.7078857421875, -3.369140625, -3.0303955078125, -2.691650390625, -2.3529052734375, -2.01416015625, -1.6754150390625, -1.336669921875, -0.9979248046875, -0.6591796875, -0.3204345703125, 0.018310546875, 0.3570556640625, 0.69580078125, 1.0345458984375, 1.373291015625, 1.7120361328125, 2.05078125, 2.3895263671875, 2.728271484375, 3.0670166015625, 3.40576171875, 3.7445068359375, 4.083251953125, 4.4219970703125, 4.7607421875, 5.0994873046875, 5.438232421875, 5.7769775390625, 6.11572265625, 6.4544677734375, 6.793212890625, 7.1319580078125, 7.470703125, 7.8094482421875, 8.148193359375, 8.4869384765625, 8.82568359375, 9.1644287109375, 9.503173828125, 9.8419189453125, 10.1806640625, 10.5194091796875, 10.858154296875, 11.1968994140625, 11.53564453125, 11.8743896484375, 12.213134765625, 12.5518798828125, 12.890625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 15.0, 25.0, 48.0, 117.0, 246.0, 323.0, 128.0, 46.0, 30.0, 15.0, 4.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.677122116088867, -23.38429832458496, -22.091474533081055, -20.79865074157715, -19.505826950073242, -18.213003158569336, -16.920177459716797, -15.627354621887207, -14.3345308303833, -13.041707038879395, -11.748883247375488, -10.456058502197266, -9.16323471069336, -7.870411396026611, -6.577587127685547, -5.284763336181641, -3.9919395446777344, -2.699115753173828, -1.4062917232513428, -0.11346769332885742, 1.1793560981750488, 2.472179889678955, 3.7650041580200195, 5.057827949523926, 6.350651741027832, 7.643475532531738, 8.936299324035645, 10.229124069213867, 11.521947860717773, 12.81477165222168, 14.107595443725586, 15.400419235229492, 16.693241119384766, 17.986064910888672, 19.278888702392578, 20.571712493896484, 21.86453628540039, 23.157360076904297, 24.450183868408203, 25.74300765991211, 27.035831451416016, 28.328655242919922, 29.621479034423828, 30.914302825927734, 32.20712661743164, 33.49995040893555, 34.79277420043945, 36.08559799194336, 37.37842559814453, 38.67124938964844, 39.964073181152344, 41.25689697265625, 42.549720764160156, 43.84254455566406, 45.13536834716797, 46.428192138671875, 47.72101593017578, 49.01383972167969, 50.306663513183594, 51.5994873046875, 52.892311096191406, 54.18513488769531, 55.47795867919922, 56.770782470703125, 58.06360626220703]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 7.0, 7.0, 10.0, 15.0, 10.0, 9.0, 16.0, 15.0, 18.0, 23.0, 23.0, 20.0, 28.0, 17.0, 31.0, 27.0, 30.0, 38.0, 33.0, 34.0, 34.0, 39.0, 37.0, 36.0, 35.0, 23.0, 37.0, 36.0, 27.0, 25.0, 28.0, 36.0, 29.0, 21.0, 17.0, 26.0, 14.0, 12.0, 11.0, 9.0, 14.0, 5.0, 7.0, 4.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.41481876373291, -8.133217811584473, -7.851616859436035, -7.570015907287598, -7.28841495513916, -7.006814002990723, -6.725212574005127, -6.4436116218566895, -6.162010669708252, -5.8804097175598145, -5.598808765411377, -5.3172078132629395, -5.035606384277344, -4.754005432128906, -4.472404479980469, -4.190803527832031, -3.9092025756835938, -3.6276016235351562, -3.3460006713867188, -3.064399480819702, -2.7827985286712646, -2.501197576522827, -2.2195963859558105, -1.937995433807373, -1.6563944816589355, -1.374793529510498, -1.093192458152771, -0.8115914463996887, -0.5299904346466064, -0.24838948249816895, 0.033211588859558105, 0.31481266021728516, 0.5964136123657227, 0.8780146241188049, 1.1596156358718872, 1.4412167072296143, 1.7228176593780518, 2.0044186115264893, 2.286019802093506, 2.5676207542419434, 2.849221706390381, 3.1308226585388184, 3.412423610687256, 3.6940248012542725, 3.97562575340271, 4.257226943969727, 4.538827896118164, 4.820428848266602, 5.102029800415039, 5.383630752563477, 5.665231704711914, 5.946832656860352, 6.228433609008789, 6.510034561157227, 6.791635990142822, 7.07323694229126, 7.354837894439697, 7.636438846588135, 7.918039798736572, 8.199641227722168, 8.481242179870605, 8.762843132019043, 9.04444408416748, 9.326045036315918, 9.607645988464355]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 6.0, 10.0, 7.0, 13.0, 17.0, 17.0, 26.0, 24.0, 19.0, 29.0, 42.0, 24.0, 34.0, 41.0, 45.0, 40.0, 53.0, 42.0, 49.0, 37.0, 47.0, 50.0, 33.0, 40.0, 35.0, 33.0, 31.0, 25.0, 22.0, 16.0, 12.0, 16.0, 6.0, 9.0, 6.0, 9.0, 2.0, 7.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.55859375, -1.5160980224609375, -1.473602294921875, -1.4311065673828125, -1.38861083984375, -1.3461151123046875, -1.303619384765625, -1.2611236572265625, -1.2186279296875, -1.1761322021484375, -1.133636474609375, -1.0911407470703125, -1.04864501953125, -1.0061492919921875, -0.963653564453125, -0.9211578369140625, -0.878662109375, -0.8361663818359375, -0.793670654296875, -0.7511749267578125, -0.70867919921875, -0.6661834716796875, -0.623687744140625, -0.5811920166015625, -0.5386962890625, -0.4962005615234375, -0.453704833984375, -0.4112091064453125, -0.36871337890625, -0.3262176513671875, -0.283721923828125, -0.2412261962890625, -0.19873046875, -0.1562347412109375, -0.113739013671875, -0.0712432861328125, -0.02874755859375, 0.0137481689453125, 0.056243896484375, 0.0987396240234375, 0.1412353515625, 0.1837310791015625, 0.226226806640625, 0.2687225341796875, 0.31121826171875, 0.3537139892578125, 0.396209716796875, 0.4387054443359375, 0.481201171875, 0.5236968994140625, 0.566192626953125, 0.6086883544921875, 0.65118408203125, 0.6936798095703125, 0.736175537109375, 0.7786712646484375, 0.8211669921875, 0.8636627197265625, 0.906158447265625, 0.9486541748046875, 0.99114990234375, 1.0336456298828125, 1.076141357421875, 1.1186370849609375, 1.1611328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 5.0, 16.0, 18.0, 26.0, 43.0, 67.0, 126.0, 173.0, 250.0, 390.0, 644.0, 977.0, 1530.0, 2436.0, 3677.0, 5769.0, 9359.0, 15313.0, 25559.0, 44370.0, 81602.0, 174114.0, 303779.0, 180960.0, 84061.0, 45230.0, 26258.0, 15747.0, 9497.0, 5959.0, 3767.0, 2447.0, 1600.0, 998.0, 643.0, 410.0, 243.0, 188.0, 110.0, 71.0, 57.0, 22.0, 15.0, 12.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0], "bins": [-1.974609375, -1.9190216064453125, -1.863433837890625, -1.8078460693359375, -1.75225830078125, -1.6966705322265625, -1.641082763671875, -1.5854949951171875, -1.5299072265625, -1.4743194580078125, -1.418731689453125, -1.3631439208984375, -1.30755615234375, -1.2519683837890625, -1.196380615234375, -1.1407928466796875, -1.085205078125, -1.0296173095703125, -0.974029541015625, -0.9184417724609375, -0.86285400390625, -0.8072662353515625, -0.751678466796875, -0.6960906982421875, -0.6405029296875, -0.5849151611328125, -0.529327392578125, -0.4737396240234375, -0.41815185546875, -0.3625640869140625, -0.306976318359375, -0.2513885498046875, -0.19580078125, -0.1402130126953125, -0.084625244140625, -0.0290374755859375, 0.02655029296875, 0.0821380615234375, 0.137725830078125, 0.1933135986328125, 0.2489013671875, 0.3044891357421875, 0.360076904296875, 0.4156646728515625, 0.47125244140625, 0.5268402099609375, 0.582427978515625, 0.6380157470703125, 0.693603515625, 0.7491912841796875, 0.804779052734375, 0.8603668212890625, 0.91595458984375, 0.9715423583984375, 1.027130126953125, 1.0827178955078125, 1.1383056640625, 1.1938934326171875, 1.249481201171875, 1.3050689697265625, 1.36065673828125, 1.4162445068359375, 1.471832275390625, 1.5274200439453125, 1.5830078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 7.0, 8.0, 6.0, 8.0, 9.0, 21.0, 13.0, 18.0, 30.0, 16.0, 20.0, 45.0, 34.0, 38.0, 40.0, 36.0, 37.0, 39.0, 35.0, 1060.0, 40.0, 35.0, 38.0, 36.0, 24.0, 36.0, 24.0, 30.0, 34.0, 28.0, 20.0, 28.0, 15.0, 19.0, 10.0, 18.0, 7.0, 11.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.408203125, -1.3623504638671875, -1.316497802734375, -1.2706451416015625, -1.22479248046875, -1.1789398193359375, -1.133087158203125, -1.0872344970703125, -1.0413818359375, -0.9955291748046875, -0.949676513671875, -0.9038238525390625, -0.85797119140625, -0.8121185302734375, -0.766265869140625, -0.7204132080078125, -0.674560546875, -0.6287078857421875, -0.582855224609375, -0.5370025634765625, -0.49114990234375, -0.4452972412109375, -0.399444580078125, -0.3535919189453125, -0.3077392578125, -0.2618865966796875, -0.216033935546875, -0.1701812744140625, -0.12432861328125, -0.0784759521484375, -0.032623291015625, 0.0132293701171875, 0.05908203125, 0.1049346923828125, 0.150787353515625, 0.1966400146484375, 0.24249267578125, 0.2883453369140625, 0.334197998046875, 0.3800506591796875, 0.4259033203125, 0.4717559814453125, 0.517608642578125, 0.5634613037109375, 0.60931396484375, 0.6551666259765625, 0.701019287109375, 0.7468719482421875, 0.792724609375, 0.8385772705078125, 0.884429931640625, 0.9302825927734375, 0.97613525390625, 1.0219879150390625, 1.067840576171875, 1.1136932373046875, 1.1595458984375, 1.2053985595703125, 1.251251220703125, 1.2971038818359375, 1.34295654296875, 1.3888092041015625, 1.434661865234375, 1.4805145263671875, 1.5263671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 10.0, 14.0, 24.0, 36.0, 47.0, 78.0, 113.0, 160.0, 216.0, 302.0, 424.0, 610.0, 943.0, 1533.0, 2285.0, 3644.0, 6066.0, 10581.0, 20539.0, 52305.0, 1126225.0, 773995.0, 50567.0, 19766.0, 10334.0, 5951.0, 3572.0, 2263.0, 1480.0, 973.0, 592.0, 435.0, 301.0, 233.0, 159.0, 101.0, 67.0, 44.0, 36.0, 24.0, 22.0, 13.0, 17.0, 7.0, 6.0, 4.0, 5.0, 3.0], "bins": [-3.701171875, -3.601104736328125, -3.50103759765625, -3.400970458984375, -3.3009033203125, -3.200836181640625, -3.10076904296875, -3.000701904296875, -2.900634765625, -2.800567626953125, -2.70050048828125, -2.600433349609375, -2.5003662109375, -2.400299072265625, -2.30023193359375, -2.200164794921875, -2.10009765625, -2.000030517578125, -1.89996337890625, -1.799896240234375, -1.6998291015625, -1.599761962890625, -1.49969482421875, -1.399627685546875, -1.299560546875, -1.199493408203125, -1.09942626953125, -0.999359130859375, -0.8992919921875, -0.799224853515625, -0.69915771484375, -0.599090576171875, -0.4990234375, -0.398956298828125, -0.29888916015625, -0.198822021484375, -0.0987548828125, 0.001312255859375, 0.10137939453125, 0.201446533203125, 0.301513671875, 0.401580810546875, 0.50164794921875, 0.601715087890625, 0.7017822265625, 0.801849365234375, 0.90191650390625, 1.001983642578125, 1.10205078125, 1.202117919921875, 1.30218505859375, 1.402252197265625, 1.5023193359375, 1.602386474609375, 1.70245361328125, 1.802520751953125, 1.902587890625, 2.002655029296875, 2.10272216796875, 2.202789306640625, 2.3028564453125, 2.402923583984375, 2.50299072265625, 2.603057861328125, 2.703125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 8.0, 5.0, 11.0, 10.0, 8.0, 17.0, 27.0, 24.0, 28.0, 39.0, 41.0, 93.0, 154.0, 160.0, 120.0, 57.0, 42.0, 32.0, 24.0, 14.0, 8.0, 23.0, 21.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2959251403808594, -0.28545379638671875, -0.2749824523925781, -0.2645111083984375, -0.2540397644042969, -0.24356842041015625, -0.23309707641601562, -0.222625732421875, -0.21215438842773438, -0.20168304443359375, -0.19121170043945312, -0.1807403564453125, -0.17026901245117188, -0.15979766845703125, -0.14932632446289062, -0.13885498046875, -0.12838363647460938, -0.11791229248046875, -0.10744094848632812, -0.0969696044921875, -0.08649826049804688, -0.07602691650390625, -0.06555557250976562, -0.055084228515625, -0.044612884521484375, -0.03414154052734375, -0.023670196533203125, -0.0131988525390625, -0.002727508544921875, 0.00774383544921875, 0.018215179443359375, 0.0286865234375, 0.039157867431640625, 0.04962921142578125, 0.060100555419921875, 0.0705718994140625, 0.08104324340820312, 0.09151458740234375, 0.10198593139648438, 0.112457275390625, 0.12292861938476562, 0.13339996337890625, 0.14387130737304688, 0.1543426513671875, 0.16481399536132812, 0.17528533935546875, 0.18575668334960938, 0.19622802734375, 0.20669937133789062, 0.21717071533203125, 0.22764205932617188, 0.2381134033203125, 0.24858474731445312, 0.25905609130859375, 0.2695274353027344, 0.279998779296875, 0.2904701232910156, 0.30094146728515625, 0.3114128112792969, 0.3218841552734375, 0.3323554992675781, 0.34282684326171875, 0.3532981872558594, 0.36376953125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 4.0, 8.0, 10.0, 16.0, 21.0, 29.0, 41.0, 38.0, 73.0, 86.0, 116.0, 185.0, 339.0, 889.0, 4737.0, 56179.0, 942743.0, 37831.0, 3550.0, 786.0, 262.0, 159.0, 116.0, 81.0, 62.0, 47.0, 28.0, 25.0, 21.0, 14.0, 15.0, 8.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.6339111328125, -3.506103515625, -3.3782958984375, -3.25048828125, -3.1226806640625, -2.994873046875, -2.8670654296875, -2.7392578125, -2.6114501953125, -2.483642578125, -2.3558349609375, -2.22802734375, -2.1002197265625, -1.972412109375, -1.8446044921875, -1.716796875, -1.5889892578125, -1.461181640625, -1.3333740234375, -1.20556640625, -1.0777587890625, -0.949951171875, -0.8221435546875, -0.6943359375, -0.5665283203125, -0.438720703125, -0.3109130859375, -0.18310546875, -0.0552978515625, 0.072509765625, 0.2003173828125, 0.328125, 0.4559326171875, 0.583740234375, 0.7115478515625, 0.83935546875, 0.9671630859375, 1.094970703125, 1.2227783203125, 1.3505859375, 1.4783935546875, 1.606201171875, 1.7340087890625, 1.86181640625, 1.9896240234375, 2.117431640625, 2.2452392578125, 2.373046875, 2.5008544921875, 2.628662109375, 2.7564697265625, 2.88427734375, 3.0120849609375, 3.139892578125, 3.2677001953125, 3.3955078125, 3.5233154296875, 3.651123046875, 3.7789306640625, 3.90673828125, 4.0345458984375, 4.162353515625, 4.2901611328125, 4.41796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 21.0, 50.0, 168.0, 445.0, 218.0, 65.0, 26.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.938371181488037, -5.813541412353516, -5.688711643218994, -5.563881874084473, -5.439052104949951, -5.31422233581543, -5.189393043518066, -5.064563274383545, -4.939733505249023, -4.814903736114502, -4.6900739669799805, -4.565244197845459, -4.4404144287109375, -4.315585136413574, -4.1907548904418945, -4.065925598144531, -3.9410955905914307, -3.816265821456909, -3.6914360523223877, -3.5666065216064453, -3.441776752471924, -3.3169469833374023, -3.192117214202881, -3.0672874450683594, -2.942457675933838, -2.8176279067993164, -2.692798137664795, -2.5679683685302734, -2.443138837814331, -2.3183090686798096, -2.193479299545288, -2.0686495304107666, -1.9438199996948242, -1.8189902305603027, -1.6941605806350708, -1.5693308115005493, -1.4445011615753174, -1.319671392440796, -1.1948416233062744, -1.070011854171753, -0.945182204246521, -0.8203524947166443, -0.6955227851867676, -0.5706930160522461, -0.4458633065223694, -0.3210335969924927, -0.1962038278579712, -0.07137411832809448, 0.05345559120178223, 0.17828531563282013, 0.30311504006385803, 0.42794477939605713, 0.5527744889259338, 0.6776041984558105, 0.802433967590332, 0.9272636771202087, 1.0520933866500854, 1.176923155784607, 1.3017528057098389, 1.4265825748443604, 1.5514123439788818, 1.6762419939041138, 1.8010717630386353, 1.9259014129638672, 2.0507311820983887]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 4.0, 10.0, 7.0, 19.0, 9.0, 22.0, 12.0, 17.0, 26.0, 27.0, 28.0, 21.0, 35.0, 35.0, 34.0, 39.0, 37.0, 49.0, 26.0, 35.0, 43.0, 42.0, 33.0, 34.0, 40.0, 35.0, 36.0, 25.0, 22.0, 21.0, 22.0, 19.0, 17.0, 14.0, 18.0, 12.0, 15.0, 11.0, 4.0, 9.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.9533117413520813, -0.9275822639465332, -0.9018527269363403, -0.8761232495307922, -0.8503937721252441, -0.8246642351150513, -0.7989347577095032, -0.7732052803039551, -0.7474757432937622, -0.7217462658882141, -0.6960167288780212, -0.6702872514724731, -0.6445577144622803, -0.6188282370567322, -0.5930987596511841, -0.5673692226409912, -0.5416397452354431, -0.515910267829895, -0.49018073081970215, -0.46445125341415405, -0.43872174620628357, -0.4129922389984131, -0.387262761592865, -0.3615332543849945, -0.335803747177124, -0.31007423996925354, -0.28434473276138306, -0.25861525535583496, -0.23288574814796448, -0.207156240940094, -0.1814267486333847, -0.15569725632667542, -0.12996768951416016, -0.10423818975687027, -0.07850868999958038, -0.0527791902422905, -0.02704969048500061, -0.001320183277130127, 0.024409309029579163, 0.05013880133628845, 0.07586830854415894, 0.10159780830144882, 0.1273273080587387, 0.153056800365448, 0.17878630757331848, 0.20451581478118896, 0.23024530708789825, 0.25597479939460754, 0.281704306602478, 0.3074338138103485, 0.333163321018219, 0.3588927984237671, 0.3846223056316376, 0.41035181283950806, 0.43608129024505615, 0.46181079745292664, 0.4875403046607971, 0.5132697820663452, 0.5389993190765381, 0.5647287964820862, 0.5904582738876343, 0.6161878108978271, 0.6419172883033752, 0.6676467657089233, 0.6933763027191162]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 7.0, 7.0, 8.0, 9.0, 23.0, 10.0, 20.0, 26.0, 22.0, 25.0, 31.0, 30.0, 33.0, 42.0, 38.0, 48.0, 40.0, 43.0, 49.0, 41.0, 41.0, 47.0, 48.0, 32.0, 38.0, 40.0, 31.0, 33.0, 19.0, 21.0, 14.0, 13.0, 11.0, 8.0, 9.0, 8.0, 8.0, 4.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5556640625, -1.5128326416015625, -1.470001220703125, -1.4271697998046875, -1.38433837890625, -1.3415069580078125, -1.298675537109375, -1.2558441162109375, -1.2130126953125, -1.1701812744140625, -1.127349853515625, -1.0845184326171875, -1.04168701171875, -0.9988555908203125, -0.956024169921875, -0.9131927490234375, -0.870361328125, -0.8275299072265625, -0.784698486328125, -0.7418670654296875, -0.69903564453125, -0.6562042236328125, -0.613372802734375, -0.5705413818359375, -0.5277099609375, -0.4848785400390625, -0.442047119140625, -0.3992156982421875, -0.35638427734375, -0.3135528564453125, -0.270721435546875, -0.2278900146484375, -0.18505859375, -0.1422271728515625, -0.099395751953125, -0.0565643310546875, -0.01373291015625, 0.0290985107421875, 0.071929931640625, 0.1147613525390625, 0.1575927734375, 0.2004241943359375, 0.243255615234375, 0.2860870361328125, 0.32891845703125, 0.3717498779296875, 0.414581298828125, 0.4574127197265625, 0.500244140625, 0.5430755615234375, 0.585906982421875, 0.6287384033203125, 0.67156982421875, 0.7144012451171875, 0.757232666015625, 0.8000640869140625, 0.8428955078125, 0.8857269287109375, 0.928558349609375, 0.9713897705078125, 1.01422119140625, 1.0570526123046875, 1.099884033203125, 1.1427154541015625, 1.185546875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 15.0, 27.0, 32.0, 42.0, 60.0, 88.0, 137.0, 200.0, 304.0, 392.0, 563.0, 829.0, 1210.0, 1777.0, 2673.0, 4017.0, 6514.0, 11848.0, 30197.0, 143521.0, 648395.0, 135902.0, 29265.0, 11813.0, 6470.0, 4095.0, 2615.0, 1633.0, 1188.0, 830.0, 597.0, 415.0, 271.0, 195.0, 128.0, 89.0, 52.0, 51.0, 32.0, 23.0, 9.0, 9.0, 6.0, 6.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.65234375, -1.60443115234375, -1.5565185546875, -1.50860595703125, -1.460693359375, -1.41278076171875, -1.3648681640625, -1.31695556640625, -1.26904296875, -1.22113037109375, -1.1732177734375, -1.12530517578125, -1.077392578125, -1.02947998046875, -0.9815673828125, -0.93365478515625, -0.8857421875, -0.83782958984375, -0.7899169921875, -0.74200439453125, -0.694091796875, -0.64617919921875, -0.5982666015625, -0.55035400390625, -0.50244140625, -0.45452880859375, -0.4066162109375, -0.35870361328125, -0.310791015625, -0.26287841796875, -0.2149658203125, -0.16705322265625, -0.119140625, -0.07122802734375, -0.0233154296875, 0.02459716796875, 0.072509765625, 0.12042236328125, 0.1683349609375, 0.21624755859375, 0.26416015625, 0.31207275390625, 0.3599853515625, 0.40789794921875, 0.455810546875, 0.50372314453125, 0.5516357421875, 0.59954833984375, 0.6474609375, 0.69537353515625, 0.7432861328125, 0.79119873046875, 0.839111328125, 0.88702392578125, 0.9349365234375, 0.98284912109375, 1.03076171875, 1.07867431640625, 1.1265869140625, 1.17449951171875, 1.222412109375, 1.27032470703125, 1.3182373046875, 1.36614990234375, 1.4140625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 0.0, 3.0, 5.0, 7.0, 8.0, 6.0, 11.0, 8.0, 9.0, 17.0, 16.0, 27.0, 29.0, 23.0, 38.0, 37.0, 43.0, 36.0, 51.0, 69.0, 120.0, 434.0, 1487.0, 117.0, 56.0, 53.0, 43.0, 51.0, 39.0, 30.0, 27.0, 21.0, 18.0, 21.0, 18.0, 14.0, 8.0, 9.0, 12.0, 7.0, 10.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.9488525390625, -3.807861328125, -3.6668701171875, -3.52587890625, -3.3848876953125, -3.243896484375, -3.1029052734375, -2.9619140625, -2.8209228515625, -2.679931640625, -2.5389404296875, -2.39794921875, -2.2569580078125, -2.115966796875, -1.9749755859375, -1.833984375, -1.6929931640625, -1.552001953125, -1.4110107421875, -1.27001953125, -1.1290283203125, -0.988037109375, -0.8470458984375, -0.7060546875, -0.5650634765625, -0.424072265625, -0.2830810546875, -0.14208984375, -0.0010986328125, 0.139892578125, 0.2808837890625, 0.421875, 0.5628662109375, 0.703857421875, 0.8448486328125, 0.98583984375, 1.1268310546875, 1.267822265625, 1.4088134765625, 1.5498046875, 1.6907958984375, 1.831787109375, 1.9727783203125, 2.11376953125, 2.2547607421875, 2.395751953125, 2.5367431640625, 2.677734375, 2.8187255859375, 2.959716796875, 3.1007080078125, 3.24169921875, 3.3826904296875, 3.523681640625, 3.6646728515625, 3.8056640625, 3.9466552734375, 4.087646484375, 4.2286376953125, 4.36962890625, 4.5106201171875, 4.651611328125, 4.7926025390625, 4.93359375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 1.0, 5.0, 5.0, 11.0, 7.0, 10.0, 19.0, 17.0, 25.0, 24.0, 48.0, 62.0, 112.0, 159.0, 330.0, 713.0, 1712.0, 5037.0, 19396.0, 189612.0, 2824376.0, 84572.0, 13157.0, 3716.0, 1290.0, 546.0, 289.0, 131.0, 98.0, 49.0, 46.0, 28.0, 31.0, 14.0, 9.0, 16.0, 4.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.29296875, -5.13897705078125, -4.9849853515625, -4.83099365234375, -4.677001953125, -4.52301025390625, -4.3690185546875, -4.21502685546875, -4.06103515625, -3.90704345703125, -3.7530517578125, -3.59906005859375, -3.445068359375, -3.29107666015625, -3.1370849609375, -2.98309326171875, -2.8291015625, -2.67510986328125, -2.5211181640625, -2.36712646484375, -2.213134765625, -2.05914306640625, -1.9051513671875, -1.75115966796875, -1.59716796875, -1.44317626953125, -1.2891845703125, -1.13519287109375, -0.981201171875, -0.82720947265625, -0.6732177734375, -0.51922607421875, -0.365234375, -0.21124267578125, -0.0572509765625, 0.09674072265625, 0.250732421875, 0.40472412109375, 0.5587158203125, 0.71270751953125, 0.86669921875, 1.02069091796875, 1.1746826171875, 1.32867431640625, 1.482666015625, 1.63665771484375, 1.7906494140625, 1.94464111328125, 2.0986328125, 2.25262451171875, 2.4066162109375, 2.56060791015625, 2.714599609375, 2.86859130859375, 3.0225830078125, 3.17657470703125, 3.33056640625, 3.48455810546875, 3.6385498046875, 3.79254150390625, 3.946533203125, 4.10052490234375, 4.2545166015625, 4.40850830078125, 4.5625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 481.0, 519.0, 12.0, 0.0, 1.0], "bins": [-118.86695861816406, -116.8858642578125, -114.90476989746094, -112.9236831665039, -110.94258880615234, -108.96149444580078, -106.98040008544922, -104.99930572509766, -103.01821899414062, -101.03712463378906, -99.0560302734375, -97.07494354248047, -95.0938491821289, -93.11275482177734, -91.13166046142578, -89.15056610107422, -87.16947174072266, -85.1883773803711, -83.20728302001953, -81.2261962890625, -79.24510192871094, -77.26400756835938, -75.28291320800781, -73.30181884765625, -71.32073211669922, -69.33963775634766, -67.3585433959961, -65.37745666503906, -63.3963623046875, -61.41526794433594, -59.434173583984375, -57.45308303833008, -55.47199249267578, -53.49089813232422, -51.50980758666992, -49.52871322631836, -47.54762268066406, -45.5665283203125, -43.58543395996094, -41.60434341430664, -39.62324905395508, -37.642154693603516, -35.66106414794922, -33.679969787597656, -31.698877334594727, -29.717784881591797, -27.736692428588867, -25.755599975585938, -23.774505615234375, -21.793413162231445, -19.812320709228516, -17.831226348876953, -15.850133895874023, -13.869041442871094, -11.887948989868164, -9.906855583190918, -7.925763130187988, -5.9446702003479, -3.9635775089263916, -1.9824848175048828, -0.0013918876647949219, 1.979701042175293, 3.9607934951782227, 5.941886901855469, 7.922979354858398]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 11.0, 12.0, 5.0, 10.0, 9.0, 11.0, 14.0, 26.0, 23.0, 26.0, 37.0, 45.0, 21.0, 34.0, 39.0, 37.0, 47.0, 44.0, 43.0, 46.0, 31.0, 42.0, 48.0, 35.0, 33.0, 35.0, 38.0, 22.0, 26.0, 24.0, 17.0, 15.0, 16.0, 20.0, 13.0, 6.0, 5.0, 6.0, 4.0, 8.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.246219635009766, -12.810907363891602, -12.375594139099121, -11.940281867980957, -11.504968643188477, -11.069656372070312, -10.634344100952148, -10.199031829833984, -9.763718605041504, -9.32840633392334, -8.89309310913086, -8.457780838012695, -8.022468566894531, -7.587155342102051, -7.151843070983887, -6.7165303230285645, -6.281217575073242, -5.84590482711792, -5.410592079162598, -4.975279808044434, -4.539967060089111, -4.104654312133789, -3.669341802597046, -3.2340292930603027, -2.7987165451049805, -2.363403797149658, -1.928091287612915, -1.4927786588668823, -1.0574660301208496, -0.6221532821655273, -0.18684077262878418, 0.24847173690795898, 0.6837844848632812, 1.119097113609314, 1.5544097423553467, 1.9897223711013794, 2.425034999847412, 2.8603477478027344, 3.2956602573394775, 3.7309727668762207, 4.166285514831543, 4.601598262786865, 5.0369110107421875, 5.472223281860352, 5.907536029815674, 6.342848777770996, 6.77816104888916, 7.213473796844482, 7.648786544799805, 8.084098815917969, 8.51941204071045, 8.954724311828613, 9.390037536621094, 9.825349807739258, 10.260662078857422, 10.695974349975586, 11.131287574768066, 11.56659984588623, 12.001913070678711, 12.437225341796875, 12.872537612915039, 13.30785083770752, 13.743163108825684, 14.178476333618164, 14.613788604736328]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 5.0, 10.0, 9.0, 10.0, 15.0, 18.0, 23.0, 36.0, 15.0, 24.0, 40.0, 26.0, 29.0, 37.0, 42.0, 38.0, 53.0, 36.0, 53.0, 35.0, 52.0, 46.0, 36.0, 41.0, 40.0, 41.0, 24.0, 23.0, 28.0, 18.0, 11.0, 15.0, 10.0, 13.0, 10.0, 5.0, 3.0, 4.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.626953125, -1.583038330078125, -1.53912353515625, -1.495208740234375, -1.4512939453125, -1.407379150390625, -1.36346435546875, -1.319549560546875, -1.275634765625, -1.231719970703125, -1.18780517578125, -1.143890380859375, -1.0999755859375, -1.056060791015625, -1.01214599609375, -0.968231201171875, -0.92431640625, -0.880401611328125, -0.83648681640625, -0.792572021484375, -0.7486572265625, -0.704742431640625, -0.66082763671875, -0.616912841796875, -0.572998046875, -0.529083251953125, -0.48516845703125, -0.441253662109375, -0.3973388671875, -0.353424072265625, -0.30950927734375, -0.265594482421875, -0.2216796875, -0.177764892578125, -0.13385009765625, -0.089935302734375, -0.0460205078125, -0.002105712890625, 0.04180908203125, 0.085723876953125, 0.129638671875, 0.173553466796875, 0.21746826171875, 0.261383056640625, 0.3052978515625, 0.349212646484375, 0.39312744140625, 0.437042236328125, 0.48095703125, 0.524871826171875, 0.56878662109375, 0.612701416015625, 0.6566162109375, 0.700531005859375, 0.74444580078125, 0.788360595703125, 0.832275390625, 0.876190185546875, 0.92010498046875, 0.964019775390625, 1.0079345703125, 1.051849365234375, 1.09576416015625, 1.139678955078125, 1.18359375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 9.0, 14.0, 21.0, 26.0, 32.0, 44.0, 65.0, 102.0, 154.0, 251.0, 341.0, 522.0, 884.0, 1427.0, 2341.0, 4104.0, 7669.0, 16640.0, 91733.0, 2841945.0, 1149312.0, 48244.0, 13319.0, 6315.0, 3410.0, 2029.0, 1198.0, 780.0, 470.0, 295.0, 194.0, 123.0, 81.0, 46.0, 51.0, 31.0, 21.0, 12.0, 6.0, 7.0, 2.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.62896728515625, -4.4962158203125, -4.36346435546875, -4.230712890625, -4.09796142578125, -3.9652099609375, -3.83245849609375, -3.69970703125, -3.56695556640625, -3.4342041015625, -3.30145263671875, -3.168701171875, -3.03594970703125, -2.9031982421875, -2.77044677734375, -2.6376953125, -2.50494384765625, -2.3721923828125, -2.23944091796875, -2.106689453125, -1.97393798828125, -1.8411865234375, -1.70843505859375, -1.57568359375, -1.44293212890625, -1.3101806640625, -1.17742919921875, -1.044677734375, -0.91192626953125, -0.7791748046875, -0.64642333984375, -0.513671875, -0.38092041015625, -0.2481689453125, -0.11541748046875, 0.017333984375, 0.15008544921875, 0.2828369140625, 0.41558837890625, 0.54833984375, 0.68109130859375, 0.8138427734375, 0.94659423828125, 1.079345703125, 1.21209716796875, 1.3448486328125, 1.47760009765625, 1.6103515625, 1.74310302734375, 1.8758544921875, 2.00860595703125, 2.141357421875, 2.27410888671875, 2.4068603515625, 2.53961181640625, 2.67236328125, 2.80511474609375, 2.9378662109375, 3.07061767578125, 3.203369140625, 3.33612060546875, 3.4688720703125, 3.60162353515625, 3.734375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 7.0, 5.0, 6.0, 19.0, 22.0, 22.0, 23.0, 30.0, 57.0, 105.0, 270.0, 769.0, 1366.0, 725.0, 264.0, 103.0, 63.0, 43.0, 26.0, 22.0, 17.0, 14.0, 11.0, 14.0, 9.0, 13.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5546875, -4.41455078125, -4.2744140625, -4.13427734375, -3.994140625, -3.85400390625, -3.7138671875, -3.57373046875, -3.43359375, -3.29345703125, -3.1533203125, -3.01318359375, -2.873046875, -2.73291015625, -2.5927734375, -2.45263671875, -2.3125, -2.17236328125, -2.0322265625, -1.89208984375, -1.751953125, -1.61181640625, -1.4716796875, -1.33154296875, -1.19140625, -1.05126953125, -0.9111328125, -0.77099609375, -0.630859375, -0.49072265625, -0.3505859375, -0.21044921875, -0.0703125, 0.06982421875, 0.2099609375, 0.35009765625, 0.490234375, 0.63037109375, 0.7705078125, 0.91064453125, 1.05078125, 1.19091796875, 1.3310546875, 1.47119140625, 1.611328125, 1.75146484375, 1.8916015625, 2.03173828125, 2.171875, 2.31201171875, 2.4521484375, 2.59228515625, 2.732421875, 2.87255859375, 3.0126953125, 3.15283203125, 3.29296875, 3.43310546875, 3.5732421875, 3.71337890625, 3.853515625, 3.99365234375, 4.1337890625, 4.27392578125, 4.4140625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 11.0, 20.0, 26.0, 35.0, 57.0, 74.0, 124.0, 184.0, 311.0, 427.0, 788.0, 1285.0, 2128.0, 3762.0, 7185.0, 14369.0, 34141.0, 133984.0, 3358029.0, 537481.0, 56874.0, 21028.0, 9831.0, 5123.0, 2779.0, 1609.0, 936.0, 596.0, 369.0, 239.0, 151.0, 102.0, 64.0, 42.0, 34.0, 21.0, 17.0, 12.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5390625, -6.3330078125, -6.126953125, -5.9208984375, -5.71484375, -5.5087890625, -5.302734375, -5.0966796875, -4.890625, -4.6845703125, -4.478515625, -4.2724609375, -4.06640625, -3.8603515625, -3.654296875, -3.4482421875, -3.2421875, -3.0361328125, -2.830078125, -2.6240234375, -2.41796875, -2.2119140625, -2.005859375, -1.7998046875, -1.59375, -1.3876953125, -1.181640625, -0.9755859375, -0.76953125, -0.5634765625, -0.357421875, -0.1513671875, 0.0546875, 0.2607421875, 0.466796875, 0.6728515625, 0.87890625, 1.0849609375, 1.291015625, 1.4970703125, 1.703125, 1.9091796875, 2.115234375, 2.3212890625, 2.52734375, 2.7333984375, 2.939453125, 3.1455078125, 3.3515625, 3.5576171875, 3.763671875, 3.9697265625, 4.17578125, 4.3818359375, 4.587890625, 4.7939453125, 5.0, 5.2060546875, 5.412109375, 5.6181640625, 5.82421875, 6.0302734375, 6.236328125, 6.4423828125, 6.6484375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 32.0, 62.0, 208.0, 442.0, 176.0, 48.0, 17.0, 9.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.571571350097656, -21.94209098815918, -20.312610626220703, -18.683128356933594, -17.053647994995117, -15.42416763305664, -13.794686317443848, -12.165205001831055, -10.535724639892578, -8.906244277954102, -7.276762962341309, -5.647282123565674, -4.017801284790039, -2.3883209228515625, -0.7588396072387695, 0.8706417083740234, 2.5001220703125, 4.129602909088135, 5.7590837478637695, 7.388564586639404, 9.018045425415039, 10.647525787353516, 12.277007102966309, 13.906488418579102, 15.535968780517578, 17.165449142456055, 18.79492950439453, 20.42441177368164, 22.053892135620117, 23.683372497558594, 25.312854766845703, 26.94233512878418, 28.571815490722656, 30.201295852661133, 31.83077621459961, 33.46025848388672, 35.08973693847656, 36.71921920776367, 38.34870147705078, 39.978179931640625, 41.607662200927734, 43.237144470214844, 44.86662292480469, 46.4961051940918, 48.125587463378906, 49.75506591796875, 51.38454818725586, 53.01403045654297, 54.64350891113281, 56.27299118041992, 57.902469635009766, 59.531951904296875, 61.16143035888672, 62.79091262817383, 64.42039489746094, 66.04987335205078, 67.67935180664062, 69.30883026123047, 70.93831634521484, 72.56779479980469, 74.19727325439453, 75.82675170898438, 77.45623779296875, 79.0857162475586, 80.71520233154297]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 3.0, 4.0, 5.0, 4.0, 7.0, 13.0, 11.0, 19.0, 16.0, 18.0, 22.0, 26.0, 30.0, 31.0, 31.0, 39.0, 32.0, 47.0, 29.0, 39.0, 56.0, 26.0, 36.0, 46.0, 43.0, 42.0, 41.0, 36.0, 31.0, 33.0, 33.0, 22.0, 27.0, 19.0, 17.0, 15.0, 7.0, 8.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.876404762268066, -11.534066200256348, -11.191726684570312, -10.849388122558594, -10.507048606872559, -10.16471004486084, -9.822370529174805, -9.480031967163086, -9.13769245147705, -8.795353889465332, -8.453014373779297, -8.110675811767578, -7.768336296081543, -7.425997257232666, -7.083658218383789, -6.74131965637207, -6.398980617523193, -6.056641578674316, -5.7143025398254395, -5.3719635009765625, -5.0296244621276855, -4.687285423278809, -4.34494686126709, -4.002607345581055, -3.660268545150757, -3.31792950630188, -2.975590467453003, -2.633251667022705, -2.290912628173828, -1.9485734701156616, -1.6062345504760742, -1.2638955116271973, -0.9215564727783203, -0.5792174339294434, -0.23687845468521118, 0.105460524559021, 0.44779956340789795, 0.7901386022567749, 1.1324775218963623, 1.4748165607452393, 1.8171555995941162, 2.159494638442993, 2.50183367729187, 2.844172477722168, 3.186511516571045, 3.528850555419922, 3.871189594268799, 4.213528633117676, 4.555867671966553, 4.89820671081543, 5.240545749664307, 5.582884788513184, 5.9252238273620605, 6.2675628662109375, 6.609901428222656, 6.952240943908691, 7.29457950592041, 7.636918544769287, 7.979257583618164, 8.321596145629883, 8.663935661315918, 9.006274223327637, 9.348613739013672, 9.69095230102539, 10.033291816711426]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 5.0, 7.0, 11.0, 4.0, 8.0, 16.0, 18.0, 14.0, 21.0, 23.0, 23.0, 23.0, 27.0, 39.0, 37.0, 47.0, 31.0, 35.0, 38.0, 53.0, 55.0, 45.0, 35.0, 42.0, 49.0, 36.0, 32.0, 34.0, 35.0, 22.0, 19.0, 23.0, 12.0, 12.0, 14.0, 6.0, 8.0, 8.0, 6.0, 4.0, 6.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0], "bins": [-1.5927734375, -1.549530029296875, -1.50628662109375, -1.463043212890625, -1.4197998046875, -1.376556396484375, -1.33331298828125, -1.290069580078125, -1.246826171875, -1.203582763671875, -1.16033935546875, -1.117095947265625, -1.0738525390625, -1.030609130859375, -0.98736572265625, -0.944122314453125, -0.90087890625, -0.857635498046875, -0.81439208984375, -0.771148681640625, -0.7279052734375, -0.684661865234375, -0.64141845703125, -0.598175048828125, -0.554931640625, -0.511688232421875, -0.46844482421875, -0.425201416015625, -0.3819580078125, -0.338714599609375, -0.29547119140625, -0.252227783203125, -0.208984375, -0.165740966796875, -0.12249755859375, -0.079254150390625, -0.0360107421875, 0.007232666015625, 0.05047607421875, 0.093719482421875, 0.136962890625, 0.180206298828125, 0.22344970703125, 0.266693115234375, 0.3099365234375, 0.353179931640625, 0.39642333984375, 0.439666748046875, 0.48291015625, 0.526153564453125, 0.56939697265625, 0.612640380859375, 0.6558837890625, 0.699127197265625, 0.74237060546875, 0.785614013671875, 0.828857421875, 0.872100830078125, 0.91534423828125, 0.958587646484375, 1.0018310546875, 1.045074462890625, 1.08831787109375, 1.131561279296875, 1.1748046875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 11.0, 12.0, 11.0, 26.0, 20.0, 44.0, 64.0, 107.0, 152.0, 223.0, 299.0, 555.0, 781.0, 1230.0, 1832.0, 2963.0, 4437.0, 6912.0, 10614.0, 17103.0, 27816.0, 48418.0, 93794.0, 208370.0, 290211.0, 156610.0, 72518.0, 39900.0, 23143.0, 14424.0, 9228.0, 5803.0, 3814.0, 2556.0, 1538.0, 1049.0, 654.0, 458.0, 291.0, 181.0, 138.0, 74.0, 58.0, 47.0, 17.0, 15.0, 18.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.8330078125, -1.7811126708984375, -1.729217529296875, -1.6773223876953125, -1.62542724609375, -1.5735321044921875, -1.521636962890625, -1.4697418212890625, -1.4178466796875, -1.3659515380859375, -1.314056396484375, -1.2621612548828125, -1.21026611328125, -1.1583709716796875, -1.106475830078125, -1.0545806884765625, -1.002685546875, -0.9507904052734375, -0.898895263671875, -0.8470001220703125, -0.79510498046875, -0.7432098388671875, -0.691314697265625, -0.6394195556640625, -0.5875244140625, -0.5356292724609375, -0.483734130859375, -0.4318389892578125, -0.37994384765625, -0.3280487060546875, -0.276153564453125, -0.2242584228515625, -0.17236328125, -0.1204681396484375, -0.068572998046875, -0.0166778564453125, 0.03521728515625, 0.0871124267578125, 0.139007568359375, 0.1909027099609375, 0.2427978515625, 0.2946929931640625, 0.346588134765625, 0.3984832763671875, 0.45037841796875, 0.5022735595703125, 0.554168701171875, 0.6060638427734375, 0.657958984375, 0.7098541259765625, 0.761749267578125, 0.8136444091796875, 0.86553955078125, 0.9174346923828125, 0.969329833984375, 1.0212249755859375, 1.0731201171875, 1.1250152587890625, 1.176910400390625, 1.2288055419921875, 1.28070068359375, 1.3325958251953125, 1.384490966796875, 1.4363861083984375, 1.48828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 9.0, 12.0, 12.0, 7.0, 16.0, 31.0, 21.0, 34.0, 19.0, 40.0, 42.0, 33.0, 51.0, 43.0, 36.0, 1070.0, 49.0, 39.0, 46.0, 32.0, 45.0, 39.0, 28.0, 43.0, 31.0, 25.0, 28.0, 15.0, 18.0, 16.0, 17.0, 18.0, 10.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.58984375, -1.54156494140625, -1.4932861328125, -1.44500732421875, -1.396728515625, -1.34844970703125, -1.3001708984375, -1.25189208984375, -1.20361328125, -1.15533447265625, -1.1070556640625, -1.05877685546875, -1.010498046875, -0.96221923828125, -0.9139404296875, -0.86566162109375, -0.8173828125, -0.76910400390625, -0.7208251953125, -0.67254638671875, -0.624267578125, -0.57598876953125, -0.5277099609375, -0.47943115234375, -0.43115234375, -0.38287353515625, -0.3345947265625, -0.28631591796875, -0.238037109375, -0.18975830078125, -0.1414794921875, -0.09320068359375, -0.044921875, 0.00335693359375, 0.0516357421875, 0.09991455078125, 0.148193359375, 0.19647216796875, 0.2447509765625, 0.29302978515625, 0.34130859375, 0.38958740234375, 0.4378662109375, 0.48614501953125, 0.534423828125, 0.58270263671875, 0.6309814453125, 0.67926025390625, 0.7275390625, 0.77581787109375, 0.8240966796875, 0.87237548828125, 0.920654296875, 0.96893310546875, 1.0172119140625, 1.06549072265625, 1.11376953125, 1.16204833984375, 1.2103271484375, 1.25860595703125, 1.306884765625, 1.35516357421875, 1.4034423828125, 1.45172119140625, 1.5]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 12.0, 10.0, 20.0, 31.0, 46.0, 63.0, 79.0, 126.0, 202.0, 276.0, 405.0, 630.0, 1050.0, 1715.0, 2933.0, 5301.0, 10505.0, 23132.0, 96557.0, 1827495.0, 82153.0, 21568.0, 9865.0, 5149.0, 2870.0, 1726.0, 1077.0, 684.0, 440.0, 314.0, 223.0, 129.0, 81.0, 75.0, 63.0, 34.0, 24.0, 14.0, 11.0, 8.0, 10.0, 2.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.279296875, -3.18414306640625, -3.0889892578125, -2.99383544921875, -2.898681640625, -2.80352783203125, -2.7083740234375, -2.61322021484375, -2.51806640625, -2.42291259765625, -2.3277587890625, -2.23260498046875, -2.137451171875, -2.04229736328125, -1.9471435546875, -1.85198974609375, -1.7568359375, -1.66168212890625, -1.5665283203125, -1.47137451171875, -1.376220703125, -1.28106689453125, -1.1859130859375, -1.09075927734375, -0.99560546875, -0.90045166015625, -0.8052978515625, -0.71014404296875, -0.614990234375, -0.51983642578125, -0.4246826171875, -0.32952880859375, -0.234375, -0.13922119140625, -0.0440673828125, 0.05108642578125, 0.146240234375, 0.24139404296875, 0.3365478515625, 0.43170166015625, 0.52685546875, 0.62200927734375, 0.7171630859375, 0.81231689453125, 0.907470703125, 1.00262451171875, 1.0977783203125, 1.19293212890625, 1.2880859375, 1.38323974609375, 1.4783935546875, 1.57354736328125, 1.668701171875, 1.76385498046875, 1.8590087890625, 1.95416259765625, 2.04931640625, 2.14447021484375, 2.2396240234375, 2.33477783203125, 2.429931640625, 2.52508544921875, 2.6202392578125, 2.71539306640625, 2.810546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 22.0, 39.0, 38.0, 96.0, 139.0, 165.0, 153.0, 123.0, 66.0, 39.0, 28.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2169189453125, -0.21067428588867188, -0.20442962646484375, -0.19818496704101562, -0.1919403076171875, -0.18569564819335938, -0.17945098876953125, -0.17320632934570312, -0.166961669921875, -0.16071701049804688, -0.15447235107421875, -0.14822769165039062, -0.1419830322265625, -0.13573837280273438, -0.12949371337890625, -0.12324905395507812, -0.11700439453125, -0.11075973510742188, -0.10451507568359375, -0.09827041625976562, -0.0920257568359375, -0.08578109741210938, -0.07953643798828125, -0.07329177856445312, -0.067047119140625, -0.060802459716796875, -0.05455780029296875, -0.048313140869140625, -0.0420684814453125, -0.035823822021484375, -0.02957916259765625, -0.023334503173828125, -0.01708984375, -0.010845184326171875, -0.00460052490234375, 0.001644134521484375, 0.0078887939453125, 0.014133453369140625, 0.02037811279296875, 0.026622772216796875, 0.032867431640625, 0.039112091064453125, 0.04535675048828125, 0.051601409912109375, 0.0578460693359375, 0.06409072875976562, 0.07033538818359375, 0.07658004760742188, 0.08282470703125, 0.08906936645507812, 0.09531402587890625, 0.10155868530273438, 0.1078033447265625, 0.11404800415039062, 0.12029266357421875, 0.12653732299804688, 0.132781982421875, 0.13902664184570312, 0.14527130126953125, 0.15151596069335938, 0.1577606201171875, 0.16400527954101562, 0.17024993896484375, 0.17649459838867188, 0.1827392578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 4.0, 4.0, 7.0, 14.0, 16.0, 28.0, 33.0, 63.0, 72.0, 198.0, 494.0, 1788.0, 15226.0, 999935.0, 27313.0, 2310.0, 585.0, 200.0, 98.0, 50.0, 26.0, 21.0, 14.0, 4.0, 10.0, 6.0, 0.0, 7.0, 4.0, 0.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.96484375, -2.87908935546875, -2.7933349609375, -2.70758056640625, -2.621826171875, -2.53607177734375, -2.4503173828125, -2.36456298828125, -2.27880859375, -2.19305419921875, -2.1072998046875, -2.02154541015625, -1.935791015625, -1.85003662109375, -1.7642822265625, -1.67852783203125, -1.5927734375, -1.50701904296875, -1.4212646484375, -1.33551025390625, -1.249755859375, -1.16400146484375, -1.0782470703125, -0.99249267578125, -0.90673828125, -0.82098388671875, -0.7352294921875, -0.64947509765625, -0.563720703125, -0.47796630859375, -0.3922119140625, -0.30645751953125, -0.220703125, -0.13494873046875, -0.0491943359375, 0.03656005859375, 0.122314453125, 0.20806884765625, 0.2938232421875, 0.37957763671875, 0.46533203125, 0.55108642578125, 0.6368408203125, 0.72259521484375, 0.808349609375, 0.89410400390625, 0.9798583984375, 1.06561279296875, 1.1513671875, 1.23712158203125, 1.3228759765625, 1.40863037109375, 1.494384765625, 1.58013916015625, 1.6658935546875, 1.75164794921875, 1.83740234375, 1.92315673828125, 2.0089111328125, 2.09466552734375, 2.180419921875, 2.26617431640625, 2.3519287109375, 2.43768310546875, 2.5234375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 15.0, 20.0, 24.0, 40.0, 63.0, 87.0, 141.0, 147.0, 133.0, 89.0, 66.0, 46.0, 38.0, 23.0, 22.0, 13.0, 10.0, 8.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.632057249546051, -0.615587055683136, -0.5991168022155762, -0.5826466083526611, -0.5661764144897461, -0.549706220626831, -0.533236026763916, -0.5167657732963562, -0.5002955794334412, -0.4838253855705261, -0.4673551619052887, -0.45088493824005127, -0.43441474437713623, -0.4179445505142212, -0.40147432684898376, -0.38500410318374634, -0.3685339093208313, -0.35206371545791626, -0.33559349179267883, -0.3191232681274414, -0.30265307426452637, -0.28618288040161133, -0.2697126567363739, -0.2532424330711365, -0.23677223920822144, -0.2203020304441452, -0.20383182168006897, -0.18736161291599274, -0.1708914041519165, -0.15442119538784027, -0.13795098662376404, -0.1214807778596878, -0.1050105094909668, -0.08854030072689056, -0.07207009196281433, -0.0555998831987381, -0.039129674434661865, -0.022659465670585632, -0.006189256906509399, 0.010280951857566833, 0.026751160621643066, 0.0432213693857193, 0.05969157814979553, 0.07616178691387177, 0.092631995677948, 0.10910220444202423, 0.12557241320610046, 0.1420426219701767, 0.15851283073425293, 0.17498303949832916, 0.1914532482624054, 0.20792345702648163, 0.22439366579055786, 0.2408638745546341, 0.2573340833187103, 0.27380430698394775, 0.2902745008468628, 0.30674469470977783, 0.32321491837501526, 0.3396851420402527, 0.3561553359031677, 0.37262552976608276, 0.3890957534313202, 0.4055659770965576, 0.42203617095947266]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 8.0, 6.0, 10.0, 7.0, 5.0, 9.0, 21.0, 18.0, 25.0, 16.0, 21.0, 29.0, 29.0, 36.0, 33.0, 45.0, 35.0, 41.0, 30.0, 45.0, 46.0, 45.0, 34.0, 34.0, 35.0, 40.0, 24.0, 39.0, 37.0, 27.0, 17.0, 23.0, 19.0, 23.0, 17.0, 13.0, 17.0, 9.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22995620965957642, -0.22270561754703522, -0.21545502543449402, -0.20820441842079163, -0.20095382630825043, -0.19370323419570923, -0.18645264208316803, -0.17920204997062683, -0.17195144295692444, -0.16470085084438324, -0.15745025873184204, -0.15019965171813965, -0.14294905960559845, -0.13569846749305725, -0.12844787538051605, -0.12119728326797485, -0.11394669115543365, -0.10669609904289246, -0.09944549947977066, -0.09219490736722946, -0.08494430780410767, -0.07769371569156647, -0.07044312357902527, -0.06319253146648407, -0.055941931903362274, -0.04869133606553078, -0.04144074022769928, -0.03419014811515808, -0.026939552277326584, -0.019688956439495087, -0.012438364326953888, -0.005187768489122391, 0.0020628273487091064, 0.009313422255218029, 0.01656401716172695, 0.0238146111369133, 0.031065206974744797, 0.038315802812576294, 0.04556639492511749, 0.05281699076294899, 0.06006758660078049, 0.06731817871332169, 0.07456877827644348, 0.08181937038898468, 0.08906996250152588, 0.09632056206464767, 0.10357115417718887, 0.11082175374031067, 0.11807234585285187, 0.12532293796539307, 0.13257353007793427, 0.13982412219047546, 0.14707472920417786, 0.15432532131671906, 0.16157591342926025, 0.16882650554180145, 0.17607709765434265, 0.18332768976688385, 0.19057828187942505, 0.19782888889312744, 0.20507948100566864, 0.21233007311820984, 0.21958066523075104, 0.22683125734329224, 0.23408186435699463]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 9.0, 10.0, 3.0, 12.0, 16.0, 17.0, 16.0, 18.0, 22.0, 26.0, 24.0, 25.0, 39.0, 44.0, 41.0, 36.0, 29.0, 39.0, 59.0, 52.0, 42.0, 38.0, 45.0, 38.0, 45.0, 27.0, 36.0, 33.0, 24.0, 16.0, 23.0, 11.0, 12.0, 13.0, 6.0, 8.0, 10.0, 5.0, 4.0, 5.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0], "bins": [-1.587890625, -1.5446014404296875, -1.501312255859375, -1.4580230712890625, -1.41473388671875, -1.3714447021484375, -1.328155517578125, -1.2848663330078125, -1.2415771484375, -1.1982879638671875, -1.154998779296875, -1.1117095947265625, -1.06842041015625, -1.0251312255859375, -0.981842041015625, -0.9385528564453125, -0.895263671875, -0.8519744873046875, -0.808685302734375, -0.7653961181640625, -0.72210693359375, -0.6788177490234375, -0.635528564453125, -0.5922393798828125, -0.5489501953125, -0.5056610107421875, -0.462371826171875, -0.4190826416015625, -0.37579345703125, -0.3325042724609375, -0.289215087890625, -0.2459259033203125, -0.20263671875, -0.1593475341796875, -0.116058349609375, -0.0727691650390625, -0.02947998046875, 0.0138092041015625, 0.057098388671875, 0.1003875732421875, 0.1436767578125, 0.1869659423828125, 0.230255126953125, 0.2735443115234375, 0.31683349609375, 0.3601226806640625, 0.403411865234375, 0.4467010498046875, 0.489990234375, 0.5332794189453125, 0.576568603515625, 0.6198577880859375, 0.66314697265625, 0.7064361572265625, 0.749725341796875, 0.7930145263671875, 0.8363037109375, 0.8795928955078125, 0.922882080078125, 0.9661712646484375, 1.00946044921875, 1.0527496337890625, 1.096038818359375, 1.1393280029296875, 1.1826171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 11.0, 6.0, 16.0, 19.0, 28.0, 35.0, 51.0, 67.0, 116.0, 132.0, 213.0, 256.0, 388.0, 522.0, 794.0, 1190.0, 1829.0, 3071.0, 5908.0, 12855.0, 36536.0, 151796.0, 598315.0, 167032.0, 38854.0, 13536.0, 6007.0, 3105.0, 1914.0, 1212.0, 780.0, 590.0, 368.0, 291.0, 208.0, 140.0, 116.0, 71.0, 52.0, 34.0, 25.0, 24.0, 12.0, 9.0, 8.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.076812744140625, -1.04034423828125, -1.003875732421875, -0.9674072265625, -0.930938720703125, -0.89447021484375, -0.858001708984375, -0.821533203125, -0.785064697265625, -0.74859619140625, -0.712127685546875, -0.6756591796875, -0.639190673828125, -0.60272216796875, -0.566253662109375, -0.52978515625, -0.493316650390625, -0.45684814453125, -0.420379638671875, -0.3839111328125, -0.347442626953125, -0.31097412109375, -0.274505615234375, -0.238037109375, -0.201568603515625, -0.16510009765625, -0.128631591796875, -0.0921630859375, -0.055694580078125, -0.01922607421875, 0.017242431640625, 0.0537109375, 0.090179443359375, 0.12664794921875, 0.163116455078125, 0.1995849609375, 0.236053466796875, 0.27252197265625, 0.308990478515625, 0.345458984375, 0.381927490234375, 0.41839599609375, 0.454864501953125, 0.4913330078125, 0.527801513671875, 0.56427001953125, 0.600738525390625, 0.63720703125, 0.673675537109375, 0.71014404296875, 0.746612548828125, 0.7830810546875, 0.819549560546875, 0.85601806640625, 0.892486572265625, 0.928955078125, 0.965423583984375, 1.00189208984375, 1.038360595703125, 1.0748291015625, 1.111297607421875, 1.14776611328125, 1.184234619140625, 1.220703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 12.0, 12.0, 13.0, 15.0, 15.0, 18.0, 28.0, 17.0, 22.0, 30.0, 36.0, 32.0, 32.0, 28.0, 42.0, 77.0, 115.0, 1678.0, 239.0, 81.0, 56.0, 55.0, 42.0, 41.0, 38.0, 39.0, 22.0, 30.0, 24.0, 22.0, 16.0, 23.0, 13.0, 9.0, 9.0, 7.0, 2.0, 7.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.890625, -4.74578857421875, -4.6009521484375, -4.45611572265625, -4.311279296875, -4.16644287109375, -4.0216064453125, -3.87677001953125, -3.73193359375, -3.58709716796875, -3.4422607421875, -3.29742431640625, -3.152587890625, -3.00775146484375, -2.8629150390625, -2.71807861328125, -2.5732421875, -2.42840576171875, -2.2835693359375, -2.13873291015625, -1.993896484375, -1.84906005859375, -1.7042236328125, -1.55938720703125, -1.41455078125, -1.26971435546875, -1.1248779296875, -0.98004150390625, -0.835205078125, -0.69036865234375, -0.5455322265625, -0.40069580078125, -0.255859375, -0.11102294921875, 0.0338134765625, 0.17864990234375, 0.323486328125, 0.46832275390625, 0.6131591796875, 0.75799560546875, 0.90283203125, 1.04766845703125, 1.1925048828125, 1.33734130859375, 1.482177734375, 1.62701416015625, 1.7718505859375, 1.91668701171875, 2.0615234375, 2.20635986328125, 2.3511962890625, 2.49603271484375, 2.640869140625, 2.78570556640625, 2.9305419921875, 3.07537841796875, 3.22021484375, 3.36505126953125, 3.5098876953125, 3.65472412109375, 3.799560546875, 3.94439697265625, 4.0892333984375, 4.23406982421875, 4.37890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 5.0, 3.0, 8.0, 8.0, 12.0, 11.0, 19.0, 19.0, 34.0, 48.0, 52.0, 63.0, 90.0, 137.0, 276.0, 543.0, 1277.0, 3810.0, 19670.0, 569870.0, 2509561.0, 32179.0, 5032.0, 1468.0, 590.0, 305.0, 181.0, 107.0, 70.0, 42.0, 35.0, 44.0, 23.0, 16.0, 18.0, 12.0, 13.0, 9.0, 8.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.91876220703125, -4.7437744140625, -4.56878662109375, -4.393798828125, -4.21881103515625, -4.0438232421875, -3.86883544921875, -3.69384765625, -3.51885986328125, -3.3438720703125, -3.16888427734375, -2.993896484375, -2.81890869140625, -2.6439208984375, -2.46893310546875, -2.2939453125, -2.11895751953125, -1.9439697265625, -1.76898193359375, -1.593994140625, -1.41900634765625, -1.2440185546875, -1.06903076171875, -0.89404296875, -0.71905517578125, -0.5440673828125, -0.36907958984375, -0.194091796875, -0.01910400390625, 0.1558837890625, 0.33087158203125, 0.505859375, 0.68084716796875, 0.8558349609375, 1.03082275390625, 1.205810546875, 1.38079833984375, 1.5557861328125, 1.73077392578125, 1.90576171875, 2.08074951171875, 2.2557373046875, 2.43072509765625, 2.605712890625, 2.78070068359375, 2.9556884765625, 3.13067626953125, 3.3056640625, 3.48065185546875, 3.6556396484375, 3.83062744140625, 4.005615234375, 4.18060302734375, 4.3555908203125, 4.53057861328125, 4.70556640625, 4.88055419921875, 5.0555419921875, 5.23052978515625, 5.405517578125, 5.58050537109375, 5.7554931640625, 5.93048095703125, 6.10546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [9.0, 42.0, 279.0, 509.0, 153.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.614901304244995, -1.8275578022003174, -1.0402143001556396, -0.2528707981109619, 0.5344727039337158, 1.3218162059783936, 2.1091597080230713, 2.896503210067749, 3.6838467121124268, 4.471190452575684, 5.258533477783203, 6.045877456665039, 6.833220481872559, 7.6205644607543945, 8.407907485961914, 9.19525146484375, 9.98259449005127, 10.769937515258789, 11.557281494140625, 12.344625473022461, 13.13196849822998, 13.9193115234375, 14.706655502319336, 15.493999481201172, 16.281343460083008, 17.068687438964844, 17.856029510498047, 18.643373489379883, 19.43071746826172, 20.218061447143555, 21.00540542602539, 21.792747497558594, 22.580089569091797, 23.367433547973633, 24.15477752685547, 24.942119598388672, 25.729463577270508, 26.516807556152344, 27.304149627685547, 28.091493606567383, 28.87883758544922, 29.666181564331055, 30.45352554321289, 31.240867614746094, 32.02821350097656, 32.815555572509766, 33.60289764404297, 34.39024353027344, 35.17758560180664, 35.964927673339844, 36.75227355957031, 37.539615631103516, 38.32695770263672, 39.11430358886719, 39.90164566040039, 40.68899154663086, 41.47633361816406, 42.263675689697266, 43.051021575927734, 43.83836364746094, 44.625709533691406, 45.41305160522461, 46.20039367675781, 46.98773956298828, 47.775081634521484]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 16.0, 7.0, 9.0, 14.0, 22.0, 26.0, 19.0, 29.0, 32.0, 27.0, 34.0, 49.0, 37.0, 39.0, 48.0, 54.0, 49.0, 57.0, 38.0, 41.0, 48.0, 42.0, 34.0, 34.0, 32.0, 34.0, 23.0, 21.0, 15.0, 9.0, 14.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.526429176330566, -14.952455520629883, -14.378482818603516, -13.804509162902832, -13.230535507202148, -12.656561851501465, -12.082588195800781, -11.508615493774414, -10.93464183807373, -10.360668182373047, -9.78669548034668, -9.212721824645996, -8.638748168945312, -8.064774513244629, -7.4908013343811035, -6.916828155517578, -6.3428544998168945, -5.768880844116211, -5.1949076652526855, -4.62093448638916, -4.046960830688477, -3.472987413406372, -2.8990139961242676, -2.325040817260742, -1.7510671615600586, -1.177093744277954, -0.6031203269958496, -0.029146909713745117, 0.5448265075683594, 1.1187999248504639, 1.6927733421325684, 2.2667465209960938, 2.840719223022461, 3.4146926403045654, 3.98866605758667, 4.562639236450195, 5.136612892150879, 5.7105865478515625, 6.284559726715088, 6.858532905578613, 7.432506561279297, 8.00648021697998, 8.580453872680664, 9.154426574707031, 9.728400230407715, 10.302373886108398, 10.876346588134766, 11.45032024383545, 12.024293899536133, 12.598267555236816, 13.1722412109375, 13.746213912963867, 14.32018756866455, 14.894161224365234, 15.468133926391602, 16.04210662841797, 16.61608123779297, 17.190053939819336, 17.764028549194336, 18.338001251220703, 18.911975860595703, 19.48594856262207, 20.059921264648438, 20.633895874023438, 21.207868576049805]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 3.0, 9.0, 6.0, 11.0, 7.0, 14.0, 5.0, 11.0, 17.0, 26.0, 30.0, 22.0, 23.0, 27.0, 38.0, 40.0, 42.0, 40.0, 39.0, 41.0, 45.0, 45.0, 49.0, 48.0, 38.0, 33.0, 37.0, 43.0, 23.0, 32.0, 24.0, 21.0, 19.0, 17.0, 12.0, 6.0, 13.0, 11.0, 6.0, 5.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0], "bins": [-1.6171875, -1.5731201171875, -1.529052734375, -1.4849853515625, -1.44091796875, -1.3968505859375, -1.352783203125, -1.3087158203125, -1.2646484375, -1.2205810546875, -1.176513671875, -1.1324462890625, -1.08837890625, -1.0443115234375, -1.000244140625, -0.9561767578125, -0.912109375, -0.8680419921875, -0.823974609375, -0.7799072265625, -0.73583984375, -0.6917724609375, -0.647705078125, -0.6036376953125, -0.5595703125, -0.5155029296875, -0.471435546875, -0.4273681640625, -0.38330078125, -0.3392333984375, -0.295166015625, -0.2510986328125, -0.20703125, -0.1629638671875, -0.118896484375, -0.0748291015625, -0.03076171875, 0.0133056640625, 0.057373046875, 0.1014404296875, 0.1455078125, 0.1895751953125, 0.233642578125, 0.2777099609375, 0.32177734375, 0.3658447265625, 0.409912109375, 0.4539794921875, 0.498046875, 0.5421142578125, 0.586181640625, 0.6302490234375, 0.67431640625, 0.7183837890625, 0.762451171875, 0.8065185546875, 0.8505859375, 0.8946533203125, 0.938720703125, 0.9827880859375, 1.02685546875, 1.0709228515625, 1.114990234375, 1.1590576171875, 1.203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 13.0, 21.0, 38.0, 34.0, 55.0, 84.0, 116.0, 157.0, 238.0, 341.0, 498.0, 675.0, 1004.0, 1488.0, 2215.0, 3568.0, 6109.0, 11508.0, 28281.0, 401470.0, 3325951.0, 355355.0, 28503.0, 10999.0, 5821.0, 3359.0, 2063.0, 1345.0, 939.0, 626.0, 422.0, 287.0, 233.0, 141.0, 98.0, 66.0, 43.0, 32.0, 24.0, 14.0, 12.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.27734375, -4.156768798828125, -4.03619384765625, -3.915618896484375, -3.7950439453125, -3.674468994140625, -3.55389404296875, -3.433319091796875, -3.312744140625, -3.192169189453125, -3.07159423828125, -2.951019287109375, -2.8304443359375, -2.709869384765625, -2.58929443359375, -2.468719482421875, -2.34814453125, -2.227569580078125, -2.10699462890625, -1.986419677734375, -1.8658447265625, -1.745269775390625, -1.62469482421875, -1.504119873046875, -1.383544921875, -1.262969970703125, -1.14239501953125, -1.021820068359375, -0.9012451171875, -0.780670166015625, -0.66009521484375, -0.539520263671875, -0.4189453125, -0.298370361328125, -0.17779541015625, -0.057220458984375, 0.0633544921875, 0.183929443359375, 0.30450439453125, 0.425079345703125, 0.545654296875, 0.666229248046875, 0.78680419921875, 0.907379150390625, 1.0279541015625, 1.148529052734375, 1.26910400390625, 1.389678955078125, 1.51025390625, 1.630828857421875, 1.75140380859375, 1.871978759765625, 1.9925537109375, 2.113128662109375, 2.23370361328125, 2.354278564453125, 2.474853515625, 2.595428466796875, 2.71600341796875, 2.836578369140625, 2.9571533203125, 3.077728271484375, 3.19830322265625, 3.318878173828125, 3.439453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 5.0, 16.0, 19.0, 17.0, 19.0, 32.0, 29.0, 63.0, 141.0, 273.0, 743.0, 1282.0, 728.0, 319.0, 121.0, 60.0, 34.0, 33.0, 23.0, 16.0, 21.0, 12.0, 10.0, 4.0, 6.0, 4.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.88671875, -4.74493408203125, -4.6031494140625, -4.46136474609375, -4.319580078125, -4.17779541015625, -4.0360107421875, -3.89422607421875, -3.75244140625, -3.61065673828125, -3.4688720703125, -3.32708740234375, -3.185302734375, -3.04351806640625, -2.9017333984375, -2.75994873046875, -2.6181640625, -2.47637939453125, -2.3345947265625, -2.19281005859375, -2.051025390625, -1.90924072265625, -1.7674560546875, -1.62567138671875, -1.48388671875, -1.34210205078125, -1.2003173828125, -1.05853271484375, -0.916748046875, -0.77496337890625, -0.6331787109375, -0.49139404296875, -0.349609375, -0.20782470703125, -0.0660400390625, 0.07574462890625, 0.217529296875, 0.35931396484375, 0.5010986328125, 0.64288330078125, 0.78466796875, 0.92645263671875, 1.0682373046875, 1.21002197265625, 1.351806640625, 1.49359130859375, 1.6353759765625, 1.77716064453125, 1.9189453125, 2.06072998046875, 2.2025146484375, 2.34429931640625, 2.486083984375, 2.62786865234375, 2.7696533203125, 2.91143798828125, 3.05322265625, 3.19500732421875, 3.3367919921875, 3.47857666015625, 3.620361328125, 3.76214599609375, 3.9039306640625, 4.04571533203125, 4.1875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 5.0, 17.0, 23.0, 30.0, 56.0, 59.0, 87.0, 160.0, 195.0, 314.0, 502.0, 797.0, 1285.0, 2216.0, 4124.0, 7732.0, 16349.0, 39913.0, 186039.0, 3379126.0, 455660.0, 57013.0, 21195.0, 9690.0, 4822.0, 2762.0, 1515.0, 901.0, 598.0, 331.0, 269.0, 141.0, 105.0, 76.0, 50.0, 24.0, 28.0, 22.0, 16.0, 6.0, 11.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.42578125, -6.2403564453125, -6.054931640625, -5.8695068359375, -5.68408203125, -5.4986572265625, -5.313232421875, -5.1278076171875, -4.9423828125, -4.7569580078125, -4.571533203125, -4.3861083984375, -4.20068359375, -4.0152587890625, -3.829833984375, -3.6444091796875, -3.458984375, -3.2735595703125, -3.088134765625, -2.9027099609375, -2.71728515625, -2.5318603515625, -2.346435546875, -2.1610107421875, -1.9755859375, -1.7901611328125, -1.604736328125, -1.4193115234375, -1.23388671875, -1.0484619140625, -0.863037109375, -0.6776123046875, -0.4921875, -0.3067626953125, -0.121337890625, 0.0640869140625, 0.24951171875, 0.4349365234375, 0.620361328125, 0.8057861328125, 0.9912109375, 1.1766357421875, 1.362060546875, 1.5474853515625, 1.73291015625, 1.9183349609375, 2.103759765625, 2.2891845703125, 2.474609375, 2.6600341796875, 2.845458984375, 3.0308837890625, 3.21630859375, 3.4017333984375, 3.587158203125, 3.7725830078125, 3.9580078125, 4.1434326171875, 4.328857421875, 4.5142822265625, 4.69970703125, 4.8851318359375, 5.070556640625, 5.2559814453125, 5.44140625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 13.0, 24.0, 48.0, 60.0, 95.0, 184.0, 181.0, 152.0, 81.0, 54.0, 30.0, 24.0, 6.0, 9.0, 5.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.955810546875, -19.225208282470703, -18.49460792541504, -17.764005661010742, -17.033405303955078, -16.30280303955078, -15.5722017288208, -14.84160041809082, -14.11099910736084, -13.38039779663086, -12.649796485900879, -11.919195175170898, -11.188592910766602, -10.457992553710938, -9.72739028930664, -8.99678897857666, -8.26618766784668, -7.535586357116699, -6.804985046386719, -6.07438325881958, -5.3437819480896, -4.613180637359619, -3.8825788497924805, -3.1519775390625, -2.4213762283325195, -1.6907747983932495, -0.9601733684539795, -0.22957181930541992, 0.5010294914245605, 1.231630802154541, 1.9622325897216797, 2.69283390045166, 3.423433303833008, 4.154034614562988, 4.884635925292969, 5.615237712860107, 6.345839023590088, 7.076440334320068, 7.807042121887207, 8.537643432617188, 9.268244743347168, 9.998846054077148, 10.729447364807129, 11.46004867553711, 12.190650939941406, 12.92125129699707, 13.651853561401367, 14.382454872131348, 15.113056182861328, 15.843657493591309, 16.57425880432129, 17.304861068725586, 18.03546142578125, 18.766063690185547, 19.496665954589844, 20.227266311645508, 20.957866668701172, 21.68846893310547, 22.419069290161133, 23.14967155456543, 23.880271911621094, 24.61087417602539, 25.341476440429688, 26.07207679748535, 26.80267906188965]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 18.0, 12.0, 19.0, 18.0, 15.0, 21.0, 31.0, 21.0, 22.0, 39.0, 43.0, 41.0, 48.0, 39.0, 44.0, 47.0, 35.0, 33.0, 36.0, 33.0, 32.0, 45.0, 38.0, 34.0, 29.0, 29.0, 27.0, 18.0, 19.0, 17.0, 5.0, 17.0, 4.0, 12.0, 12.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.627976417541504, -10.29914379119873, -9.97031021118164, -9.641477584838867, -9.312644958496094, -8.98381233215332, -8.65497875213623, -8.326146125793457, -7.997313022613525, -7.668479919433594, -7.33964729309082, -7.010814189910889, -6.681981086730957, -6.353148460388184, -6.024315357208252, -5.69548225402832, -5.366649627685547, -5.037816524505615, -4.708983898162842, -4.38015079498291, -4.051318168640137, -3.722485065460205, -3.3936519622802734, -3.064819097518921, -2.7359862327575684, -2.407153367996216, -2.0783205032348633, -1.7494874000549316, -1.420654535293579, -1.0918216705322266, -0.7629886865615845, -0.4341557025909424, -0.10532283782958984, 0.22351008653640747, 0.5523430109024048, 0.8811759352684021, 1.2100088596343994, 1.538841724395752, 1.867674708366394, 2.196507692337036, 2.5253405570983887, 2.854173421859741, 3.1830062866210938, 3.5118393898010254, 3.840672254562378, 4.1695051193237305, 4.498338222503662, 4.827171325683594, 5.156003952026367, 5.484837055206299, 5.813669681549072, 6.142502784729004, 6.471335411071777, 6.800168514251709, 7.129001617431641, 7.457834243774414, 7.786667346954346, 8.115500450134277, 8.44433307647705, 8.773165702819824, 9.101999282836914, 9.430831909179688, 9.759664535522461, 10.08849811553955, 10.417330741882324]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 6.0, 3.0, 13.0, 8.0, 8.0, 13.0, 15.0, 26.0, 31.0, 27.0, 27.0, 34.0, 35.0, 43.0, 39.0, 46.0, 33.0, 51.0, 40.0, 47.0, 44.0, 42.0, 34.0, 36.0, 41.0, 36.0, 26.0, 31.0, 26.0, 27.0, 18.0, 12.0, 14.0, 12.0, 12.0, 9.0, 5.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.58306884765625, -1.5372314453125, -1.49139404296875, -1.445556640625, -1.39971923828125, -1.3538818359375, -1.30804443359375, -1.26220703125, -1.21636962890625, -1.1705322265625, -1.12469482421875, -1.078857421875, -1.03302001953125, -0.9871826171875, -0.94134521484375, -0.8955078125, -0.84967041015625, -0.8038330078125, -0.75799560546875, -0.712158203125, -0.66632080078125, -0.6204833984375, -0.57464599609375, -0.52880859375, -0.48297119140625, -0.4371337890625, -0.39129638671875, -0.345458984375, -0.29962158203125, -0.2537841796875, -0.20794677734375, -0.162109375, -0.11627197265625, -0.0704345703125, -0.02459716796875, 0.021240234375, 0.06707763671875, 0.1129150390625, 0.15875244140625, 0.20458984375, 0.25042724609375, 0.2962646484375, 0.34210205078125, 0.387939453125, 0.43377685546875, 0.4796142578125, 0.52545166015625, 0.5712890625, 0.61712646484375, 0.6629638671875, 0.70880126953125, 0.754638671875, 0.80047607421875, 0.8463134765625, 0.89215087890625, 0.93798828125, 0.98382568359375, 1.0296630859375, 1.07550048828125, 1.121337890625, 1.16717529296875, 1.2130126953125, 1.25885009765625, 1.3046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 10.0, 14.0, 21.0, 43.0, 47.0, 71.0, 102.0, 151.0, 222.0, 366.0, 539.0, 902.0, 1358.0, 2180.0, 3562.0, 5935.0, 9495.0, 16325.0, 28085.0, 50306.0, 96724.0, 202774.0, 281736.0, 165447.0, 79473.0, 42667.0, 24059.0, 14089.0, 8279.0, 5032.0, 3119.0, 1878.0, 1259.0, 786.0, 491.0, 327.0, 222.0, 151.0, 105.0, 60.0, 50.0, 32.0, 24.0, 7.0, 9.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7529296875, -1.698760986328125, -1.64459228515625, -1.590423583984375, -1.5362548828125, -1.482086181640625, -1.42791748046875, -1.373748779296875, -1.319580078125, -1.265411376953125, -1.21124267578125, -1.157073974609375, -1.1029052734375, -1.048736572265625, -0.99456787109375, -0.940399169921875, -0.88623046875, -0.832061767578125, -0.77789306640625, -0.723724365234375, -0.6695556640625, -0.615386962890625, -0.56121826171875, -0.507049560546875, -0.452880859375, -0.398712158203125, -0.34454345703125, -0.290374755859375, -0.2362060546875, -0.182037353515625, -0.12786865234375, -0.073699951171875, -0.01953125, 0.034637451171875, 0.08880615234375, 0.142974853515625, 0.1971435546875, 0.251312255859375, 0.30548095703125, 0.359649658203125, 0.413818359375, 0.467987060546875, 0.52215576171875, 0.576324462890625, 0.6304931640625, 0.684661865234375, 0.73883056640625, 0.792999267578125, 0.84716796875, 0.901336669921875, 0.95550537109375, 1.009674072265625, 1.0638427734375, 1.118011474609375, 1.17218017578125, 1.226348876953125, 1.280517578125, 1.334686279296875, 1.38885498046875, 1.443023681640625, 1.4971923828125, 1.551361083984375, 1.60552978515625, 1.659698486328125, 1.7138671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 12.0, 10.0, 11.0, 18.0, 16.0, 22.0, 25.0, 31.0, 35.0, 29.0, 44.0, 33.0, 41.0, 30.0, 48.0, 52.0, 1071.0, 35.0, 40.0, 41.0, 55.0, 28.0, 34.0, 32.0, 27.0, 30.0, 17.0, 22.0, 23.0, 18.0, 15.0, 10.0, 9.0, 2.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9072265625, -1.852264404296875, -1.79730224609375, -1.742340087890625, -1.6873779296875, -1.632415771484375, -1.57745361328125, -1.522491455078125, -1.467529296875, -1.412567138671875, -1.35760498046875, -1.302642822265625, -1.2476806640625, -1.192718505859375, -1.13775634765625, -1.082794189453125, -1.02783203125, -0.972869873046875, -0.91790771484375, -0.862945556640625, -0.8079833984375, -0.753021240234375, -0.69805908203125, -0.643096923828125, -0.588134765625, -0.533172607421875, -0.47821044921875, -0.423248291015625, -0.3682861328125, -0.313323974609375, -0.25836181640625, -0.203399658203125, -0.1484375, -0.093475341796875, -0.03851318359375, 0.016448974609375, 0.0714111328125, 0.126373291015625, 0.18133544921875, 0.236297607421875, 0.291259765625, 0.346221923828125, 0.40118408203125, 0.456146240234375, 0.5111083984375, 0.566070556640625, 0.62103271484375, 0.675994873046875, 0.73095703125, 0.785919189453125, 0.84088134765625, 0.895843505859375, 0.9508056640625, 1.005767822265625, 1.06072998046875, 1.115692138671875, 1.170654296875, 1.225616455078125, 1.28057861328125, 1.335540771484375, 1.3905029296875, 1.445465087890625, 1.50042724609375, 1.555389404296875, 1.6103515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 14.0, 10.0, 31.0, 31.0, 43.0, 60.0, 69.0, 113.0, 167.0, 226.0, 325.0, 480.0, 719.0, 1065.0, 1667.0, 2765.0, 4709.0, 8162.0, 16310.0, 40380.0, 363266.0, 1561490.0, 52591.0, 19140.0, 9479.0, 5157.0, 3115.0, 1842.0, 1191.0, 732.0, 504.0, 361.0, 243.0, 196.0, 133.0, 101.0, 59.0, 47.0, 28.0, 23.0, 17.0, 13.0, 16.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.47265625, -3.364501953125, -3.25634765625, -3.148193359375, -3.0400390625, -2.931884765625, -2.82373046875, -2.715576171875, -2.607421875, -2.499267578125, -2.39111328125, -2.282958984375, -2.1748046875, -2.066650390625, -1.95849609375, -1.850341796875, -1.7421875, -1.634033203125, -1.52587890625, -1.417724609375, -1.3095703125, -1.201416015625, -1.09326171875, -0.985107421875, -0.876953125, -0.768798828125, -0.66064453125, -0.552490234375, -0.4443359375, -0.336181640625, -0.22802734375, -0.119873046875, -0.01171875, 0.096435546875, 0.20458984375, 0.312744140625, 0.4208984375, 0.529052734375, 0.63720703125, 0.745361328125, 0.853515625, 0.961669921875, 1.06982421875, 1.177978515625, 1.2861328125, 1.394287109375, 1.50244140625, 1.610595703125, 1.71875, 1.826904296875, 1.93505859375, 2.043212890625, 2.1513671875, 2.259521484375, 2.36767578125, 2.475830078125, 2.583984375, 2.692138671875, 2.80029296875, 2.908447265625, 3.0166015625, 3.124755859375, 3.23291015625, 3.341064453125, 3.44921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 5.0, 1.0, 4.0, 5.0, 8.0, 10.0, 30.0, 24.0, 23.0, 42.0, 64.0, 116.0, 202.0, 172.0, 111.0, 38.0, 37.0, 28.0, 15.0, 9.0, 8.0, 9.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3427734375, -0.3323402404785156, -0.32190704345703125, -0.3114738464355469, -0.3010406494140625, -0.2906074523925781, -0.28017425537109375, -0.2697410583496094, -0.259307861328125, -0.24887466430664062, -0.23844146728515625, -0.22800827026367188, -0.2175750732421875, -0.20714187622070312, -0.19670867919921875, -0.18627548217773438, -0.17584228515625, -0.16540908813476562, -0.15497589111328125, -0.14454269409179688, -0.1341094970703125, -0.12367630004882812, -0.11324310302734375, -0.10280990600585938, -0.092376708984375, -0.08194351196289062, -0.07151031494140625, -0.061077117919921875, -0.0506439208984375, -0.040210723876953125, -0.02977752685546875, -0.019344329833984375, -0.0089111328125, 0.001522064208984375, 0.01195526123046875, 0.022388458251953125, 0.0328216552734375, 0.043254852294921875, 0.05368804931640625, 0.06412124633789062, 0.074554443359375, 0.08498764038085938, 0.09542083740234375, 0.10585403442382812, 0.1162872314453125, 0.12672042846679688, 0.13715362548828125, 0.14758682250976562, 0.15802001953125, 0.16845321655273438, 0.17888641357421875, 0.18931961059570312, 0.1997528076171875, 0.21018600463867188, 0.22061920166015625, 0.23105239868164062, 0.241485595703125, 0.2519187927246094, 0.26235198974609375, 0.2727851867675781, 0.2832183837890625, 0.2936515808105469, 0.30408477783203125, 0.3145179748535156, 0.324951171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 3.0, 7.0, 2.0, 15.0, 11.0, 8.0, 25.0, 33.0, 26.0, 47.0, 79.0, 148.0, 298.0, 774.0, 2805.0, 18716.0, 944120.0, 73619.0, 5629.0, 1253.0, 387.0, 167.0, 107.0, 59.0, 38.0, 30.0, 36.0, 19.0, 12.0, 15.0, 9.0, 8.0, 3.0, 3.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.09735107421875, -3.9681396484375, -3.83892822265625, -3.709716796875, -3.58050537109375, -3.4512939453125, -3.32208251953125, -3.19287109375, -3.06365966796875, -2.9344482421875, -2.80523681640625, -2.676025390625, -2.54681396484375, -2.4176025390625, -2.28839111328125, -2.1591796875, -2.02996826171875, -1.9007568359375, -1.77154541015625, -1.642333984375, -1.51312255859375, -1.3839111328125, -1.25469970703125, -1.12548828125, -0.99627685546875, -0.8670654296875, -0.73785400390625, -0.608642578125, -0.47943115234375, -0.3502197265625, -0.22100830078125, -0.091796875, 0.03741455078125, 0.1666259765625, 0.29583740234375, 0.425048828125, 0.55426025390625, 0.6834716796875, 0.81268310546875, 0.94189453125, 1.07110595703125, 1.2003173828125, 1.32952880859375, 1.458740234375, 1.58795166015625, 1.7171630859375, 1.84637451171875, 1.9755859375, 2.10479736328125, 2.2340087890625, 2.36322021484375, 2.492431640625, 2.62164306640625, 2.7508544921875, 2.88006591796875, 3.00927734375, 3.13848876953125, 3.2677001953125, 3.39691162109375, 3.526123046875, 3.65533447265625, 3.7845458984375, 3.91375732421875, 4.04296875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 10.0, 35.0, 31.0, 60.0, 112.0, 180.0, 204.0, 114.0, 76.0, 56.0, 27.0, 23.0, 15.0, 11.0, 14.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1236042976379395, -1.0850311517715454, -1.0464580059051514, -1.0078848600387573, -0.9693117141723633, -0.9307385683059692, -0.8921654224395752, -0.8535922765731812, -0.8150191307067871, -0.7764459848403931, -0.737872838973999, -0.699299693107605, -0.6607265472412109, -0.6221534013748169, -0.5835802555084229, -0.5450071096420288, -0.5064339637756348, -0.4678608179092407, -0.4292876720428467, -0.39071452617645264, -0.3521413803100586, -0.31356823444366455, -0.2749950885772705, -0.23642194271087646, -0.19784879684448242, -0.15927565097808838, -0.12070250511169434, -0.08212935924530029, -0.04355621337890625, -0.004983067512512207, 0.033590078353881836, 0.07216322422027588, 0.11073637008666992, 0.14930951595306396, 0.187882661819458, 0.22645580768585205, 0.2650289535522461, 0.30360209941864014, 0.3421752452850342, 0.3807483911514282, 0.41932153701782227, 0.4578946828842163, 0.49646782875061035, 0.5350409746170044, 0.5736141204833984, 0.6121872663497925, 0.6507604122161865, 0.6893335580825806, 0.7279067039489746, 0.7664798498153687, 0.8050529956817627, 0.8436261415481567, 0.8821992874145508, 0.9207724332809448, 0.9593455791473389, 0.9979187250137329, 1.036491870880127, 1.075065016746521, 1.113638162612915, 1.152211308479309, 1.1907844543457031, 1.2293576002120972, 1.2679307460784912, 1.3065038919448853, 1.3450770378112793]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 10.0, 10.0, 8.0, 11.0, 18.0, 13.0, 17.0, 21.0, 22.0, 21.0, 25.0, 28.0, 37.0, 33.0, 50.0, 36.0, 28.0, 34.0, 38.0, 44.0, 49.0, 29.0, 51.0, 29.0, 36.0, 47.0, 31.0, 31.0, 24.0, 29.0, 22.0, 15.0, 10.0, 10.0, 10.0, 9.0, 8.0, 9.0, 8.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.6140314936637878, -0.5966061353683472, -0.5791807770729065, -0.5617554187774658, -0.5443300604820251, -0.5269047021865845, -0.5094793438911438, -0.49205395579338074, -0.47462859749794006, -0.4572032392024994, -0.4397778809070587, -0.42235252261161804, -0.404927134513855, -0.3875017762184143, -0.37007641792297363, -0.35265105962753296, -0.3352257013320923, -0.3178003430366516, -0.30037498474121094, -0.28294962644577026, -0.2655242681503296, -0.24809889495372772, -0.23067352175712585, -0.21324816346168518, -0.1958228051662445, -0.17839744687080383, -0.16097208857536316, -0.1435467153787613, -0.12612135708332062, -0.10869599878787994, -0.09127063304185867, -0.0738452672958374, -0.056419968605041504, -0.03899460658431053, -0.02156924456357956, -0.004143882542848587, 0.013281479477882385, 0.03070683777332306, 0.04813220351934433, 0.0655575692653656, 0.08298292756080627, 0.10040828585624695, 0.11783365160226822, 0.1352590173482895, 0.15268437564373016, 0.17010973393917084, 0.1875351071357727, 0.20496046543121338, 0.22238582372665405, 0.23981118202209473, 0.2572365403175354, 0.2746618986129761, 0.29208725690841675, 0.3095126152038574, 0.3269380033016205, 0.34436336159706116, 0.36178871989250183, 0.3792140781879425, 0.3966394364833832, 0.41406479477882385, 0.4314901828765869, 0.4489155411720276, 0.46634089946746826, 0.48376625776290894, 0.5011916160583496]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 7.0, 7.0, 8.0, 9.0, 9.0, 12.0, 23.0, 34.0, 22.0, 26.0, 28.0, 41.0, 39.0, 45.0, 34.0, 46.0, 39.0, 43.0, 44.0, 48.0, 37.0, 41.0, 38.0, 50.0, 29.0, 31.0, 27.0, 37.0, 23.0, 23.0, 12.0, 13.0, 15.0, 11.0, 6.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.586273193359375, -1.53973388671875, -1.493194580078125, -1.4466552734375, -1.400115966796875, -1.35357666015625, -1.307037353515625, -1.260498046875, -1.213958740234375, -1.16741943359375, -1.120880126953125, -1.0743408203125, -1.027801513671875, -0.98126220703125, -0.934722900390625, -0.88818359375, -0.841644287109375, -0.79510498046875, -0.748565673828125, -0.7020263671875, -0.655487060546875, -0.60894775390625, -0.562408447265625, -0.515869140625, -0.469329833984375, -0.42279052734375, -0.376251220703125, -0.3297119140625, -0.283172607421875, -0.23663330078125, -0.190093994140625, -0.1435546875, -0.097015380859375, -0.05047607421875, -0.003936767578125, 0.0426025390625, 0.089141845703125, 0.13568115234375, 0.182220458984375, 0.228759765625, 0.275299072265625, 0.32183837890625, 0.368377685546875, 0.4149169921875, 0.461456298828125, 0.50799560546875, 0.554534912109375, 0.60107421875, 0.647613525390625, 0.69415283203125, 0.740692138671875, 0.7872314453125, 0.833770751953125, 0.88031005859375, 0.926849365234375, 0.973388671875, 1.019927978515625, 1.06646728515625, 1.113006591796875, 1.1595458984375, 1.206085205078125, 1.25262451171875, 1.299163818359375, 1.345703125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 7.0, 20.0, 25.0, 31.0, 38.0, 61.0, 98.0, 158.0, 240.0, 418.0, 605.0, 1169.0, 1827.0, 3163.0, 5396.0, 9199.0, 17110.0, 35991.0, 141296.0, 699298.0, 73612.0, 26333.0, 13675.0, 7749.0, 4515.0, 2560.0, 1581.0, 901.0, 579.0, 335.0, 204.0, 138.0, 73.0, 48.0, 22.0, 22.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.01654052734375, -2.9061279296875, -2.79571533203125, -2.685302734375, -2.57489013671875, -2.4644775390625, -2.35406494140625, -2.24365234375, -2.13323974609375, -2.0228271484375, -1.91241455078125, -1.802001953125, -1.69158935546875, -1.5811767578125, -1.47076416015625, -1.3603515625, -1.24993896484375, -1.1395263671875, -1.02911376953125, -0.918701171875, -0.80828857421875, -0.6978759765625, -0.58746337890625, -0.47705078125, -0.36663818359375, -0.2562255859375, -0.14581298828125, -0.035400390625, 0.07501220703125, 0.1854248046875, 0.29583740234375, 0.40625, 0.51666259765625, 0.6270751953125, 0.73748779296875, 0.847900390625, 0.95831298828125, 1.0687255859375, 1.17913818359375, 1.28955078125, 1.39996337890625, 1.5103759765625, 1.62078857421875, 1.731201171875, 1.84161376953125, 1.9520263671875, 2.06243896484375, 2.1728515625, 2.28326416015625, 2.3936767578125, 2.50408935546875, 2.614501953125, 2.72491455078125, 2.8353271484375, 2.94573974609375, 3.05615234375, 3.16656494140625, 3.2769775390625, 3.38739013671875, 3.497802734375, 3.60821533203125, 3.7186279296875, 3.82904052734375, 3.939453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 14.0, 10.0, 11.0, 13.0, 12.0, 17.0, 22.0, 26.0, 41.0, 29.0, 50.0, 43.0, 48.0, 70.0, 61.0, 82.0, 163.0, 1593.0, 177.0, 85.0, 67.0, 58.0, 55.0, 37.0, 38.0, 35.0, 34.0, 22.0, 18.0, 24.0, 13.0, 16.0, 9.0, 19.0, 3.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -5.01025390625, -4.8408203125, -4.67138671875, -4.501953125, -4.33251953125, -4.1630859375, -3.99365234375, -3.82421875, -3.65478515625, -3.4853515625, -3.31591796875, -3.146484375, -2.97705078125, -2.8076171875, -2.63818359375, -2.46875, -2.29931640625, -2.1298828125, -1.96044921875, -1.791015625, -1.62158203125, -1.4521484375, -1.28271484375, -1.11328125, -0.94384765625, -0.7744140625, -0.60498046875, -0.435546875, -0.26611328125, -0.0966796875, 0.07275390625, 0.2421875, 0.41162109375, 0.5810546875, 0.75048828125, 0.919921875, 1.08935546875, 1.2587890625, 1.42822265625, 1.59765625, 1.76708984375, 1.9365234375, 2.10595703125, 2.275390625, 2.44482421875, 2.6142578125, 2.78369140625, 2.953125, 3.12255859375, 3.2919921875, 3.46142578125, 3.630859375, 3.80029296875, 3.9697265625, 4.13916015625, 4.30859375, 4.47802734375, 4.6474609375, 4.81689453125, 4.986328125, 5.15576171875, 5.3251953125, 5.49462890625, 5.6640625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 12.0, 11.0, 27.0, 32.0, 55.0, 76.0, 109.0, 230.0, 419.0, 800.0, 1823.0, 5671.0, 25788.0, 539875.0, 2526376.0, 33449.0, 6801.0, 2193.0, 905.0, 446.0, 211.0, 131.0, 109.0, 47.0, 37.0, 20.0, 12.0, 12.0, 3.0, 6.0, 3.0, 2.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.265625, -17.7447509765625, -17.223876953125, -16.7030029296875, -16.18212890625, -15.6612548828125, -15.140380859375, -14.6195068359375, -14.0986328125, -13.5777587890625, -13.056884765625, -12.5360107421875, -12.01513671875, -11.4942626953125, -10.973388671875, -10.4525146484375, -9.931640625, -9.4107666015625, -8.889892578125, -8.3690185546875, -7.84814453125, -7.3272705078125, -6.806396484375, -6.2855224609375, -5.7646484375, -5.2437744140625, -4.722900390625, -4.2020263671875, -3.68115234375, -3.1602783203125, -2.639404296875, -2.1185302734375, -1.59765625, -1.0767822265625, -0.555908203125, -0.0350341796875, 0.48583984375, 1.0067138671875, 1.527587890625, 2.0484619140625, 2.5693359375, 3.0902099609375, 3.611083984375, 4.1319580078125, 4.65283203125, 5.1737060546875, 5.694580078125, 6.2154541015625, 6.736328125, 7.2572021484375, 7.778076171875, 8.2989501953125, 8.81982421875, 9.3406982421875, 9.861572265625, 10.3824462890625, 10.9033203125, 11.4241943359375, 11.945068359375, 12.4659423828125, 12.98681640625, 13.5076904296875, 14.028564453125, 14.5494384765625, 15.0703125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 123.0, 643.0, 210.0, 30.0], "bins": [-218.69415283203125, -215.146484375, -211.59881591796875, -208.05113220214844, -204.5034637451172, -200.95579528808594, -197.4081268310547, -193.86045837402344, -190.31277465820312, -186.76510620117188, -183.21743774414062, -179.6697540283203, -176.12208557128906, -172.5744171142578, -169.02674865722656, -165.4790802001953, -161.93141174316406, -158.3837432861328, -154.83607482910156, -151.28839111328125, -147.74072265625, -144.19305419921875, -140.6453857421875, -137.09771728515625, -133.550048828125, -130.00238037109375, -126.45470428466797, -122.90703582763672, -119.35935974121094, -115.81169128417969, -112.26402282714844, -108.71635437011719, -105.1686782836914, -101.62100982666016, -98.07333374023438, -94.52566528320312, -90.97799682617188, -87.4303207397461, -83.88265228271484, -80.33497619628906, -76.78730773925781, -73.23963928222656, -69.69196319580078, -66.14429473876953, -62.596622467041016, -59.0489501953125, -55.50128173828125, -51.953609466552734, -48.40593719482422, -44.8582649230957, -41.31059265136719, -37.76292419433594, -34.21525192260742, -30.667579650878906, -27.119909286499023, -23.57223892211914, -20.024566650390625, -16.47689437866211, -12.929224014282227, -9.381552696228027, -5.833881378173828, -2.2862091064453125, 1.2614612579345703, 4.809131622314453, 8.356804847717285]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 4.0, 7.0, 5.0, 6.0, 16.0, 14.0, 17.0, 14.0, 17.0, 19.0, 27.0, 30.0, 35.0, 36.0, 23.0, 33.0, 39.0, 42.0, 50.0, 45.0, 36.0, 30.0, 33.0, 31.0, 45.0, 38.0, 33.0, 42.0, 29.0, 29.0, 20.0, 24.0, 26.0, 11.0, 12.0, 13.0, 14.0, 7.0, 14.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.523218154907227, -16.022323608398438, -15.521428108215332, -15.020533561706543, -14.519638061523438, -14.018743515014648, -13.51784896850586, -13.01695442199707, -12.516058921813965, -12.015164375305176, -11.51426887512207, -11.013374328613281, -10.512479782104492, -10.011584281921387, -9.510689735412598, -9.009794235229492, -8.508899688720703, -8.008005142211914, -7.507109642028809, -7.0062150955200195, -6.505320072174072, -6.004425048828125, -5.503530502319336, -5.002635478973389, -4.501740455627441, -4.000845432281494, -3.499950647354126, -2.999055862426758, -2.4981608390808105, -1.9972658157348633, -1.4963710308074951, -0.995476245880127, -0.4945802688598633, 0.006314635276794434, 0.5072095394134521, 1.0081044435501099, 1.5089993476867676, 2.009894371032715, 2.510789155960083, 3.011683940887451, 3.5125789642333984, 4.013473987579346, 4.514369010925293, 5.015263557434082, 5.516158580780029, 6.017053604125977, 6.517948150634766, 7.018843173980713, 7.51973819732666, 8.02063274383545, 8.521528244018555, 9.022422790527344, 9.523317337036133, 10.024212837219238, 10.525107383728027, 11.026002883911133, 11.526897430419922, 12.027791976928711, 12.528687477111816, 13.029582023620605, 13.530477523803711, 14.0313720703125, 14.532266616821289, 15.033161163330078, 15.534056663513184]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 9.0, 10.0, 10.0, 6.0, 15.0, 23.0, 16.0, 24.0, 18.0, 27.0, 36.0, 24.0, 40.0, 48.0, 35.0, 39.0, 29.0, 41.0, 59.0, 40.0, 39.0, 37.0, 47.0, 37.0, 41.0, 36.0, 38.0, 26.0, 15.0, 27.0, 13.0, 17.0, 13.0, 7.0, 9.0, 7.0, 6.0, 7.0, 15.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.8486328125, -1.7990570068359375, -1.749481201171875, -1.6999053955078125, -1.65032958984375, -1.6007537841796875, -1.551177978515625, -1.5016021728515625, -1.4520263671875, -1.4024505615234375, -1.352874755859375, -1.3032989501953125, -1.25372314453125, -1.2041473388671875, -1.154571533203125, -1.1049957275390625, -1.055419921875, -1.0058441162109375, -0.956268310546875, -0.9066925048828125, -0.85711669921875, -0.8075408935546875, -0.757965087890625, -0.7083892822265625, -0.6588134765625, -0.6092376708984375, -0.559661865234375, -0.5100860595703125, -0.46051025390625, -0.4109344482421875, -0.361358642578125, -0.3117828369140625, -0.26220703125, -0.2126312255859375, -0.163055419921875, -0.1134796142578125, -0.06390380859375, -0.0143280029296875, 0.035247802734375, 0.0848236083984375, 0.1343994140625, 0.1839752197265625, 0.233551025390625, 0.2831268310546875, 0.33270263671875, 0.3822784423828125, 0.431854248046875, 0.4814300537109375, 0.531005859375, 0.5805816650390625, 0.630157470703125, 0.6797332763671875, 0.72930908203125, 0.7788848876953125, 0.828460693359375, 0.8780364990234375, 0.9276123046875, 0.9771881103515625, 1.026763916015625, 1.0763397216796875, 1.12591552734375, 1.1754913330078125, 1.225067138671875, 1.2746429443359375, 1.32421875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 5.0, 15.0, 15.0, 18.0, 22.0, 34.0, 54.0, 79.0, 109.0, 119.0, 182.0, 233.0, 389.0, 494.0, 709.0, 962.0, 1429.0, 2124.0, 3416.0, 5518.0, 10585.0, 21993.0, 82775.0, 733960.0, 2767891.0, 458799.0, 59528.0, 19407.0, 9230.0, 4989.0, 3004.0, 1948.0, 1304.0, 843.0, 565.0, 434.0, 297.0, 240.0, 154.0, 114.0, 95.0, 63.0, 46.0, 31.0, 20.0, 16.0, 10.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-3.623046875, -3.52349853515625, -3.4239501953125, -3.32440185546875, -3.224853515625, -3.12530517578125, -3.0257568359375, -2.92620849609375, -2.82666015625, -2.72711181640625, -2.6275634765625, -2.52801513671875, -2.428466796875, -2.32891845703125, -2.2293701171875, -2.12982177734375, -2.0302734375, -1.93072509765625, -1.8311767578125, -1.73162841796875, -1.632080078125, -1.53253173828125, -1.4329833984375, -1.33343505859375, -1.23388671875, -1.13433837890625, -1.0347900390625, -0.93524169921875, -0.835693359375, -0.73614501953125, -0.6365966796875, -0.53704833984375, -0.4375, -0.33795166015625, -0.2384033203125, -0.13885498046875, -0.039306640625, 0.06024169921875, 0.1597900390625, 0.25933837890625, 0.35888671875, 0.45843505859375, 0.5579833984375, 0.65753173828125, 0.757080078125, 0.85662841796875, 0.9561767578125, 1.05572509765625, 1.1552734375, 1.25482177734375, 1.3543701171875, 1.45391845703125, 1.553466796875, 1.65301513671875, 1.7525634765625, 1.85211181640625, 1.95166015625, 2.05120849609375, 2.1507568359375, 2.25030517578125, 2.349853515625, 2.44940185546875, 2.5489501953125, 2.64849853515625, 2.748046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 2.0, 2.0, 7.0, 7.0, 6.0, 10.0, 21.0, 21.0, 20.0, 33.0, 39.0, 64.0, 96.0, 158.0, 365.0, 722.0, 1039.0, 658.0, 310.0, 155.0, 86.0, 61.0, 38.0, 29.0, 22.0, 20.0, 9.0, 11.0, 12.0, 8.0, 6.0, 8.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.9765625, -4.8360595703125, -4.695556640625, -4.5550537109375, -4.41455078125, -4.2740478515625, -4.133544921875, -3.9930419921875, -3.8525390625, -3.7120361328125, -3.571533203125, -3.4310302734375, -3.29052734375, -3.1500244140625, -3.009521484375, -2.8690185546875, -2.728515625, -2.5880126953125, -2.447509765625, -2.3070068359375, -2.16650390625, -2.0260009765625, -1.885498046875, -1.7449951171875, -1.6044921875, -1.4639892578125, -1.323486328125, -1.1829833984375, -1.04248046875, -0.9019775390625, -0.761474609375, -0.6209716796875, -0.48046875, -0.3399658203125, -0.199462890625, -0.0589599609375, 0.08154296875, 0.2220458984375, 0.362548828125, 0.5030517578125, 0.6435546875, 0.7840576171875, 0.924560546875, 1.0650634765625, 1.20556640625, 1.3460693359375, 1.486572265625, 1.6270751953125, 1.767578125, 1.9080810546875, 2.048583984375, 2.1890869140625, 2.32958984375, 2.4700927734375, 2.610595703125, 2.7510986328125, 2.8916015625, 3.0321044921875, 3.172607421875, 3.3131103515625, 3.45361328125, 3.5941162109375, 3.734619140625, 3.8751220703125, 4.015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 17.0, 20.0, 32.0, 48.0, 63.0, 94.0, 136.0, 211.0, 315.0, 580.0, 779.0, 1332.0, 2079.0, 3322.0, 5926.0, 10974.0, 23282.0, 59895.0, 296680.0, 3176689.0, 480330.0, 75238.0, 27053.0, 12536.0, 6685.0, 3797.0, 2292.0, 1361.0, 849.0, 561.0, 344.0, 244.0, 169.0, 102.0, 58.0, 58.0, 22.0, 22.0, 18.0, 16.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.6114501953125, -5.433837890625, -5.2562255859375, -5.07861328125, -4.9010009765625, -4.723388671875, -4.5457763671875, -4.3681640625, -4.1905517578125, -4.012939453125, -3.8353271484375, -3.65771484375, -3.4801025390625, -3.302490234375, -3.1248779296875, -2.947265625, -2.7696533203125, -2.592041015625, -2.4144287109375, -2.23681640625, -2.0592041015625, -1.881591796875, -1.7039794921875, -1.5263671875, -1.3487548828125, -1.171142578125, -0.9935302734375, -0.81591796875, -0.6383056640625, -0.460693359375, -0.2830810546875, -0.10546875, 0.0721435546875, 0.249755859375, 0.4273681640625, 0.60498046875, 0.7825927734375, 0.960205078125, 1.1378173828125, 1.3154296875, 1.4930419921875, 1.670654296875, 1.8482666015625, 2.02587890625, 2.2034912109375, 2.381103515625, 2.5587158203125, 2.736328125, 2.9139404296875, 3.091552734375, 3.2691650390625, 3.44677734375, 3.6243896484375, 3.802001953125, 3.9796142578125, 4.1572265625, 4.3348388671875, 4.512451171875, 4.6900634765625, 4.86767578125, 5.0452880859375, 5.222900390625, 5.4005126953125, 5.578125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 7.0, 24.0, 17.0, 44.0, 45.0, 71.0, 102.0, 112.0, 160.0, 109.0, 87.0, 62.0, 45.0, 24.0, 21.0, 12.0, 18.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.038684844970703, -23.412660598754883, -22.786636352539062, -22.16061019897461, -21.53458595275879, -20.90856170654297, -20.28253746032715, -19.656513214111328, -19.030487060546875, -18.404462814331055, -17.778438568115234, -17.15241241455078, -16.52638816833496, -15.90036392211914, -15.27433967590332, -14.6483154296875, -14.02229118347168, -13.39626693725586, -12.770241737365723, -12.144217491149902, -11.518192291259766, -10.892168045043945, -10.266143798828125, -9.640119552612305, -9.014094352722168, -8.388070106506348, -7.762044906616211, -7.136020660400391, -6.509995937347412, -5.883971214294434, -5.257946968078613, -4.631922245025635, -4.005899429321289, -3.3798747062683105, -2.753850221633911, -2.1278257369995117, -1.5018010139465332, -0.8757762908935547, -0.24975180625915527, 0.37627267837524414, 1.0022974014282227, 1.6283220052719116, 2.2543466091156006, 2.88037109375, 3.5063958168029785, 4.132420539855957, 4.758444786071777, 5.384469509124756, 6.010494232177734, 6.636518955230713, 7.262543678283691, 7.888567924499512, 8.514593124389648, 9.140617370605469, 9.766641616821289, 10.39266586303711, 11.018691062927246, 11.644715309143066, 12.270740509033203, 12.896764755249023, 13.522789001464844, 14.14881420135498, 14.7748384475708, 15.400863647460938, 16.026887893676758]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 5.0, 11.0, 5.0, 13.0, 14.0, 17.0, 13.0, 25.0, 17.0, 25.0, 21.0, 25.0, 18.0, 31.0, 32.0, 33.0, 24.0, 28.0, 44.0, 40.0, 40.0, 42.0, 46.0, 35.0, 33.0, 25.0, 36.0, 27.0, 28.0, 28.0, 24.0, 27.0, 25.0, 13.0, 18.0, 18.0, 15.0, 8.0, 11.0, 13.0, 11.0, 9.0, 1.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.325490951538086, -10.000835418701172, -9.676180839538574, -9.35152530670166, -9.026870727539062, -8.702215194702148, -8.37756061553955, -8.052905082702637, -7.728250026702881, -7.403594970703125, -7.078939914703369, -6.754284858703613, -6.429629325866699, -6.104974746704102, -5.7803192138671875, -5.455664157867432, -5.131009101867676, -4.80635404586792, -4.481698989868164, -4.157043933868408, -3.8323886394500732, -3.5077335834503174, -3.1830782890319824, -2.8584232330322266, -2.5337681770324707, -2.209113121032715, -1.8844579458236694, -1.559802770614624, -1.2351477146148682, -0.9104926586151123, -0.5858374834060669, -0.2611823081970215, 0.06347179412841797, 0.3881269097328186, 0.7127820253372192, 1.0374372005462646, 1.3620922565460205, 1.6867473125457764, 2.0114026069641113, 2.336057662963867, 2.660712718963623, 2.985367774963379, 3.3100228309631348, 3.6346781253814697, 3.9593331813812256, 4.283987998962402, 4.608643531799316, 4.933298587799072, 5.257953643798828, 5.582608699798584, 5.90726375579834, 6.231918811798096, 6.556573867797852, 6.881229400634766, 7.2058844566345215, 7.530539512634277, 7.855194568634033, 8.179849624633789, 8.504505157470703, 8.8291597366333, 9.153815269470215, 9.478469848632812, 9.803125381469727, 10.12778091430664, 10.452435493469238]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 10.0, 8.0, 7.0, 8.0, 8.0, 12.0, 11.0, 15.0, 18.0, 18.0, 23.0, 34.0, 19.0, 35.0, 28.0, 31.0, 36.0, 37.0, 47.0, 48.0, 39.0, 35.0, 36.0, 40.0, 49.0, 46.0, 36.0, 43.0, 31.0, 30.0, 30.0, 21.0, 17.0, 16.0, 14.0, 7.0, 17.0, 8.0, 8.0, 7.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.8173828125, -1.76824951171875, -1.7191162109375, -1.66998291015625, -1.620849609375, -1.57171630859375, -1.5225830078125, -1.47344970703125, -1.42431640625, -1.37518310546875, -1.3260498046875, -1.27691650390625, -1.227783203125, -1.17864990234375, -1.1295166015625, -1.08038330078125, -1.03125, -0.98211669921875, -0.9329833984375, -0.88385009765625, -0.834716796875, -0.78558349609375, -0.7364501953125, -0.68731689453125, -0.63818359375, -0.58905029296875, -0.5399169921875, -0.49078369140625, -0.441650390625, -0.39251708984375, -0.3433837890625, -0.29425048828125, -0.2451171875, -0.19598388671875, -0.1468505859375, -0.09771728515625, -0.048583984375, 0.00054931640625, 0.0496826171875, 0.09881591796875, 0.14794921875, 0.19708251953125, 0.2462158203125, 0.29534912109375, 0.344482421875, 0.39361572265625, 0.4427490234375, 0.49188232421875, 0.541015625, 0.59014892578125, 0.6392822265625, 0.68841552734375, 0.737548828125, 0.78668212890625, 0.8358154296875, 0.88494873046875, 0.93408203125, 0.98321533203125, 1.0323486328125, 1.08148193359375, 1.130615234375, 1.17974853515625, 1.2288818359375, 1.27801513671875, 1.3271484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 10.0, 18.0, 45.0, 49.0, 103.0, 169.0, 244.0, 344.0, 457.0, 761.0, 1009.0, 1483.0, 2154.0, 3290.0, 4948.0, 7273.0, 11656.0, 18308.0, 29867.0, 50107.0, 90535.0, 172786.0, 248567.0, 177242.0, 92789.0, 50920.0, 30461.0, 18305.0, 11711.0, 7566.0, 5026.0, 3371.0, 2218.0, 1519.0, 1016.0, 731.0, 483.0, 338.0, 251.0, 175.0, 103.0, 51.0, 22.0, 23.0, 19.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.884765625, -1.8249664306640625, -1.765167236328125, -1.7053680419921875, -1.64556884765625, -1.5857696533203125, -1.525970458984375, -1.4661712646484375, -1.4063720703125, -1.3465728759765625, -1.286773681640625, -1.2269744873046875, -1.16717529296875, -1.1073760986328125, -1.047576904296875, -0.9877777099609375, -0.927978515625, -0.8681793212890625, -0.808380126953125, -0.7485809326171875, -0.68878173828125, -0.6289825439453125, -0.569183349609375, -0.5093841552734375, -0.4495849609375, -0.3897857666015625, -0.329986572265625, -0.2701873779296875, -0.21038818359375, -0.1505889892578125, -0.090789794921875, -0.0309906005859375, 0.02880859375, 0.0886077880859375, 0.148406982421875, 0.2082061767578125, 0.26800537109375, 0.3278045654296875, 0.387603759765625, 0.4474029541015625, 0.5072021484375, 0.5670013427734375, 0.626800537109375, 0.6865997314453125, 0.74639892578125, 0.8061981201171875, 0.865997314453125, 0.9257965087890625, 0.985595703125, 1.0453948974609375, 1.105194091796875, 1.1649932861328125, 1.22479248046875, 1.2845916748046875, 1.344390869140625, 1.4041900634765625, 1.4639892578125, 1.5237884521484375, 1.583587646484375, 1.6433868408203125, 1.70318603515625, 1.7629852294921875, 1.822784423828125, 1.8825836181640625, 1.9423828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 3.0, 13.0, 13.0, 17.0, 21.0, 20.0, 20.0, 23.0, 20.0, 40.0, 36.0, 39.0, 41.0, 57.0, 39.0, 48.0, 46.0, 1065.0, 45.0, 39.0, 43.0, 30.0, 30.0, 29.0, 36.0, 16.0, 31.0, 31.0, 24.0, 15.0, 14.0, 12.0, 12.0, 12.0, 8.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.853515625, -1.7980499267578125, -1.742584228515625, -1.6871185302734375, -1.63165283203125, -1.5761871337890625, -1.520721435546875, -1.4652557373046875, -1.4097900390625, -1.3543243408203125, -1.298858642578125, -1.2433929443359375, -1.18792724609375, -1.1324615478515625, -1.076995849609375, -1.0215301513671875, -0.966064453125, -0.9105987548828125, -0.855133056640625, -0.7996673583984375, -0.74420166015625, -0.6887359619140625, -0.633270263671875, -0.5778045654296875, -0.5223388671875, -0.4668731689453125, -0.411407470703125, -0.3559417724609375, -0.30047607421875, -0.2450103759765625, -0.189544677734375, -0.1340789794921875, -0.07861328125, -0.0231475830078125, 0.032318115234375, 0.0877838134765625, 0.14324951171875, 0.1987152099609375, 0.254180908203125, 0.3096466064453125, 0.3651123046875, 0.4205780029296875, 0.476043701171875, 0.5315093994140625, 0.58697509765625, 0.6424407958984375, 0.697906494140625, 0.7533721923828125, 0.808837890625, 0.8643035888671875, 0.919769287109375, 0.9752349853515625, 1.03070068359375, 1.0861663818359375, 1.141632080078125, 1.1970977783203125, 1.2525634765625, 1.3080291748046875, 1.363494873046875, 1.4189605712890625, 1.47442626953125, 1.5298919677734375, 1.585357666015625, 1.6408233642578125, 1.6962890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 12.0, 13.0, 19.0, 17.0, 26.0, 42.0, 65.0, 101.0, 164.0, 245.0, 322.0, 542.0, 761.0, 1170.0, 1957.0, 3352.0, 5719.0, 10186.0, 19726.0, 48300.0, 664439.0, 1242055.0, 52137.0, 20470.0, 10464.0, 5777.0, 3343.0, 2045.0, 1227.0, 825.0, 514.0, 332.0, 235.0, 168.0, 111.0, 79.0, 39.0, 51.0, 19.0, 24.0, 8.0, 10.0, 11.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.060546875, -2.9619140625, -2.86328125, -2.7646484375, -2.666015625, -2.5673828125, -2.46875, -2.3701171875, -2.271484375, -2.1728515625, -2.07421875, -1.9755859375, -1.876953125, -1.7783203125, -1.6796875, -1.5810546875, -1.482421875, -1.3837890625, -1.28515625, -1.1865234375, -1.087890625, -0.9892578125, -0.890625, -0.7919921875, -0.693359375, -0.5947265625, -0.49609375, -0.3974609375, -0.298828125, -0.2001953125, -0.1015625, -0.0029296875, 0.095703125, 0.1943359375, 0.29296875, 0.3916015625, 0.490234375, 0.5888671875, 0.6875, 0.7861328125, 0.884765625, 0.9833984375, 1.08203125, 1.1806640625, 1.279296875, 1.3779296875, 1.4765625, 1.5751953125, 1.673828125, 1.7724609375, 1.87109375, 1.9697265625, 2.068359375, 2.1669921875, 2.265625, 2.3642578125, 2.462890625, 2.5615234375, 2.66015625, 2.7587890625, 2.857421875, 2.9560546875, 3.0546875, 3.1533203125, 3.251953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 8.0, 8.0, 11.0, 17.0, 16.0, 9.0, 27.0, 42.0, 52.0, 85.0, 106.0, 118.0, 111.0, 78.0, 62.0, 48.0, 35.0, 35.0, 24.0, 15.0, 9.0, 12.0, 6.0, 7.0, 9.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.18894577026367188, -0.18257904052734375, -0.17621231079101562, -0.1698455810546875, -0.16347885131835938, -0.15711212158203125, -0.15074539184570312, -0.144378662109375, -0.13801193237304688, -0.13164520263671875, -0.12527847290039062, -0.1189117431640625, -0.11254501342773438, -0.10617828369140625, -0.09981155395507812, -0.09344482421875, -0.08707809448242188, -0.08071136474609375, -0.07434463500976562, -0.0679779052734375, -0.061611175537109375, -0.05524444580078125, -0.048877716064453125, -0.042510986328125, -0.036144256591796875, -0.02977752685546875, -0.023410797119140625, -0.0170440673828125, -0.010677337646484375, -0.00431060791015625, 0.002056121826171875, 0.0084228515625, 0.014789581298828125, 0.02115631103515625, 0.027523040771484375, 0.0338897705078125, 0.040256500244140625, 0.04662322998046875, 0.052989959716796875, 0.059356689453125, 0.06572341918945312, 0.07209014892578125, 0.07845687866210938, 0.0848236083984375, 0.09119033813476562, 0.09755706787109375, 0.10392379760742188, 0.11029052734375, 0.11665725708007812, 0.12302398681640625, 0.12939071655273438, 0.1357574462890625, 0.14212417602539062, 0.14849090576171875, 0.15485763549804688, 0.161224365234375, 0.16759109497070312, 0.17395782470703125, 0.18032455444335938, 0.1866912841796875, 0.19305801391601562, 0.19942474365234375, 0.20579147338867188, 0.212158203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 4.0, 5.0, 9.0, 11.0, 11.0, 14.0, 17.0, 26.0, 38.0, 41.0, 62.0, 72.0, 103.0, 162.0, 326.0, 786.0, 3294.0, 20213.0, 705443.0, 299735.0, 14071.0, 2548.0, 716.0, 265.0, 159.0, 90.0, 81.0, 51.0, 33.0, 39.0, 23.0, 16.0, 23.0, 15.0, 13.0, 7.0, 3.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.341644287109375, -2.26336669921875, -2.185089111328125, -2.1068115234375, -2.028533935546875, -1.95025634765625, -1.871978759765625, -1.793701171875, -1.715423583984375, -1.63714599609375, -1.558868408203125, -1.4805908203125, -1.402313232421875, -1.32403564453125, -1.245758056640625, -1.16748046875, -1.089202880859375, -1.01092529296875, -0.932647705078125, -0.8543701171875, -0.776092529296875, -0.69781494140625, -0.619537353515625, -0.541259765625, -0.462982177734375, -0.38470458984375, -0.306427001953125, -0.2281494140625, -0.149871826171875, -0.07159423828125, 0.006683349609375, 0.0849609375, 0.163238525390625, 0.24151611328125, 0.319793701171875, 0.3980712890625, 0.476348876953125, 0.55462646484375, 0.632904052734375, 0.711181640625, 0.789459228515625, 0.86773681640625, 0.946014404296875, 1.0242919921875, 1.102569580078125, 1.18084716796875, 1.259124755859375, 1.33740234375, 1.415679931640625, 1.49395751953125, 1.572235107421875, 1.6505126953125, 1.728790283203125, 1.80706787109375, 1.885345458984375, 1.963623046875, 2.041900634765625, 2.12017822265625, 2.198455810546875, 2.2767333984375, 2.355010986328125, 2.43328857421875, 2.511566162109375, 2.58984375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 10.0, 10.0, 14.0, 19.0, 31.0, 41.0, 68.0, 115.0, 160.0, 165.0, 107.0, 77.0, 46.0, 35.0, 27.0, 24.0, 10.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546922087669373, -0.5271629095077515, -0.4996336102485657, -0.4721042811870575, -0.4445749819278717, -0.4170456826686859, -0.38951635360717773, -0.36198705434799194, -0.33445775508880615, -0.30692845582962036, -0.27939915657043457, -0.2518698275089264, -0.2243405282497406, -0.1968112289905548, -0.16928191483020782, -0.14175260066986084, -0.11422330141067505, -0.08669399470090866, -0.05916468799114227, -0.031635381281375885, -0.004106074571609497, 0.023423224687576294, 0.05095253884792328, 0.07848185300827026, 0.10601115226745605, 0.13354045152664185, 0.16106976568698883, 0.18859907984733582, 0.2161283791065216, 0.2436576783657074, 0.2711870074272156, 0.29871630668640137, 0.3262455463409424, 0.3537748456001282, 0.38130414485931396, 0.40883347392082214, 0.43636277318000793, 0.4638920724391937, 0.4914214015007019, 0.5189507007598877, 0.5464800000190735, 0.5740092992782593, 0.6015385985374451, 0.6290678977966309, 0.6565972566604614, 0.6841264963150024, 0.711655855178833, 0.7391851544380188, 0.7667144536972046, 0.7942437529563904, 0.8217730522155762, 0.849302351474762, 0.8768316507339478, 0.9043610095977783, 0.9318903088569641, 0.9594196081161499, 0.9869489073753357, 1.0144782066345215, 1.042007565498352, 1.069536805152893, 1.0970661640167236, 1.1245954036712646, 1.1521247625350952, 1.1796541213989258, 1.2071833610534668]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 13.0, 8.0, 13.0, 17.0, 14.0, 19.0, 19.0, 15.0, 25.0, 23.0, 26.0, 24.0, 26.0, 43.0, 31.0, 25.0, 37.0, 27.0, 29.0, 41.0, 42.0, 46.0, 40.0, 34.0, 43.0, 37.0, 32.0, 32.0, 23.0, 30.0, 23.0, 21.0, 14.0, 17.0, 12.0, 13.0, 10.0, 6.0, 3.0, 4.0, 6.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4520917534828186, -0.4378017783164978, -0.423511803150177, -0.4092218577861786, -0.3949318826198578, -0.380641907453537, -0.3663519620895386, -0.3520619869232178, -0.337772011756897, -0.32348203659057617, -0.30919206142425537, -0.29490211606025696, -0.28061214089393616, -0.26632216572761536, -0.25203222036361694, -0.23774224519729614, -0.22345227003097534, -0.20916229486465454, -0.19487233459949493, -0.18058237433433533, -0.16629239916801453, -0.15200242400169373, -0.13771246373653412, -0.12342249602079391, -0.10913252830505371, -0.09484256058931351, -0.0805525928735733, -0.0662626251578331, -0.051972657442092896, -0.03768268972635269, -0.023392722010612488, -0.009102754294872284, 0.00518721342086792, 0.019477181136608124, 0.03376714885234833, 0.04805711656808853, 0.062347084283828735, 0.07663705199956894, 0.09092701971530914, 0.10521698743104935, 0.11950695514678955, 0.13379693031311035, 0.14808689057826996, 0.16237685084342957, 0.17666682600975037, 0.19095680117607117, 0.20524676144123077, 0.21953672170639038, 0.23382669687271118, 0.24811667203903198, 0.2624066472053528, 0.2766965925693512, 0.290986567735672, 0.3052765429019928, 0.3195664882659912, 0.333856463432312, 0.3481464385986328, 0.3624364137649536, 0.3767263889312744, 0.3910163342952728, 0.40530630946159363, 0.41959628462791443, 0.43388622999191284, 0.44817620515823364, 0.46246618032455444]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 10.0, 8.0, 8.0, 9.0, 11.0, 12.0, 16.0, 17.0, 23.0, 25.0, 29.0, 25.0, 35.0, 25.0, 38.0, 37.0, 34.0, 45.0, 50.0, 36.0, 38.0, 44.0, 31.0, 41.0, 54.0, 33.0, 43.0, 24.0, 40.0, 27.0, 19.0, 16.0, 13.0, 14.0, 11.0, 14.0, 7.0, 8.0, 6.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7697906494140625, -1.720245361328125, -1.6707000732421875, -1.62115478515625, -1.5716094970703125, -1.522064208984375, -1.4725189208984375, -1.4229736328125, -1.3734283447265625, -1.323883056640625, -1.2743377685546875, -1.22479248046875, -1.1752471923828125, -1.125701904296875, -1.0761566162109375, -1.026611328125, -0.9770660400390625, -0.927520751953125, -0.8779754638671875, -0.82843017578125, -0.7788848876953125, -0.729339599609375, -0.6797943115234375, -0.6302490234375, -0.5807037353515625, -0.531158447265625, -0.4816131591796875, -0.43206787109375, -0.3825225830078125, -0.332977294921875, -0.2834320068359375, -0.23388671875, -0.1843414306640625, -0.134796142578125, -0.0852508544921875, -0.03570556640625, 0.0138397216796875, 0.063385009765625, 0.1129302978515625, 0.1624755859375, 0.2120208740234375, 0.261566162109375, 0.3111114501953125, 0.36065673828125, 0.4102020263671875, 0.459747314453125, 0.5092926025390625, 0.558837890625, 0.6083831787109375, 0.657928466796875, 0.7074737548828125, 0.75701904296875, 0.8065643310546875, 0.856109619140625, 0.9056549072265625, 0.9552001953125, 1.0047454833984375, 1.054290771484375, 1.1038360595703125, 1.15338134765625, 1.2029266357421875, 1.252471923828125, 1.3020172119140625, 1.3515625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 8.0, 9.0, 8.0, 15.0, 13.0, 35.0, 37.0, 64.0, 94.0, 136.0, 185.0, 328.0, 548.0, 969.0, 1771.0, 3436.0, 8061.0, 23836.0, 136423.0, 737197.0, 100889.0, 20196.0, 7148.0, 3214.0, 1621.0, 892.0, 509.0, 284.0, 198.0, 141.0, 70.0, 71.0, 33.0, 24.0, 20.0, 20.0, 7.0, 6.0, 4.0, 4.0, 11.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.37164306640625, -3.2764892578125, -3.18133544921875, -3.086181640625, -2.99102783203125, -2.8958740234375, -2.80072021484375, -2.70556640625, -2.61041259765625, -2.5152587890625, -2.42010498046875, -2.324951171875, -2.22979736328125, -2.1346435546875, -2.03948974609375, -1.9443359375, -1.84918212890625, -1.7540283203125, -1.65887451171875, -1.563720703125, -1.46856689453125, -1.3734130859375, -1.27825927734375, -1.18310546875, -1.08795166015625, -0.9927978515625, -0.89764404296875, -0.802490234375, -0.70733642578125, -0.6121826171875, -0.51702880859375, -0.421875, -0.32672119140625, -0.2315673828125, -0.13641357421875, -0.041259765625, 0.05389404296875, 0.1490478515625, 0.24420166015625, 0.33935546875, 0.43450927734375, 0.5296630859375, 0.62481689453125, 0.719970703125, 0.81512451171875, 0.9102783203125, 1.00543212890625, 1.1005859375, 1.19573974609375, 1.2908935546875, 1.38604736328125, 1.481201171875, 1.57635498046875, 1.6715087890625, 1.76666259765625, 1.86181640625, 1.95697021484375, 2.0521240234375, 2.14727783203125, 2.242431640625, 2.33758544921875, 2.4327392578125, 2.52789306640625, 2.623046875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 3.0, 6.0, 7.0, 13.0, 11.0, 18.0, 19.0, 29.0, 22.0, 31.0, 25.0, 37.0, 51.0, 47.0, 56.0, 65.0, 59.0, 126.0, 1506.0, 340.0, 93.0, 73.0, 46.0, 46.0, 48.0, 37.0, 37.0, 33.0, 21.0, 20.0, 21.0, 15.0, 16.0, 11.0, 13.0, 7.0, 6.0, 5.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.625, -5.44842529296875, -5.2718505859375, -5.09527587890625, -4.918701171875, -4.74212646484375, -4.5655517578125, -4.38897705078125, -4.21240234375, -4.03582763671875, -3.8592529296875, -3.68267822265625, -3.506103515625, -3.32952880859375, -3.1529541015625, -2.97637939453125, -2.7998046875, -2.62322998046875, -2.4466552734375, -2.27008056640625, -2.093505859375, -1.91693115234375, -1.7403564453125, -1.56378173828125, -1.38720703125, -1.21063232421875, -1.0340576171875, -0.85748291015625, -0.680908203125, -0.50433349609375, -0.3277587890625, -0.15118408203125, 0.025390625, 0.20196533203125, 0.3785400390625, 0.55511474609375, 0.731689453125, 0.90826416015625, 1.0848388671875, 1.26141357421875, 1.43798828125, 1.61456298828125, 1.7911376953125, 1.96771240234375, 2.144287109375, 2.32086181640625, 2.4974365234375, 2.67401123046875, 2.8505859375, 3.02716064453125, 3.2037353515625, 3.38031005859375, 3.556884765625, 3.73345947265625, 3.9100341796875, 4.08660888671875, 4.26318359375, 4.43975830078125, 4.6163330078125, 4.79290771484375, 4.969482421875, 5.14605712890625, 5.3226318359375, 5.49920654296875, 5.67578125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 14.0, 27.0, 20.0, 36.0, 47.0, 93.0, 113.0, 218.0, 376.0, 874.0, 2635.0, 11218.0, 97378.0, 2947159.0, 71873.0, 9476.0, 2360.0, 826.0, 378.0, 197.0, 116.0, 77.0, 47.0, 36.0, 33.0, 7.0, 10.0, 7.0, 12.0, 5.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3570556640625, -11.964111328125, -11.5711669921875, -11.17822265625, -10.7852783203125, -10.392333984375, -9.9993896484375, -9.6064453125, -9.2135009765625, -8.820556640625, -8.4276123046875, -8.03466796875, -7.6417236328125, -7.248779296875, -6.8558349609375, -6.462890625, -6.0699462890625, -5.677001953125, -5.2840576171875, -4.89111328125, -4.4981689453125, -4.105224609375, -3.7122802734375, -3.3193359375, -2.9263916015625, -2.533447265625, -2.1405029296875, -1.74755859375, -1.3546142578125, -0.961669921875, -0.5687255859375, -0.17578125, 0.2171630859375, 0.610107421875, 1.0030517578125, 1.39599609375, 1.7889404296875, 2.181884765625, 2.5748291015625, 2.9677734375, 3.3607177734375, 3.753662109375, 4.1466064453125, 4.53955078125, 4.9324951171875, 5.325439453125, 5.7183837890625, 6.111328125, 6.5042724609375, 6.897216796875, 7.2901611328125, 7.68310546875, 8.0760498046875, 8.468994140625, 8.8619384765625, 9.2548828125, 9.6478271484375, 10.040771484375, 10.4337158203125, 10.82666015625, 11.2196044921875, 11.612548828125, 12.0054931640625, 12.3984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 5.0, 18.0, 51.0, 96.0, 145.0, 262.0, 200.0, 109.0, 51.0, 36.0, 20.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.257352828979492, -10.545281410217285, -9.833209991455078, -9.121138572692871, -8.409067153930664, -7.696995735168457, -6.98492431640625, -6.272852897644043, -5.560781478881836, -4.848710060119629, -4.136638641357422, -3.424567222595215, -2.712495803833008, -2.000424385070801, -1.2883529663085938, -0.5762815475463867, 0.1357898712158203, 0.8478612899780273, 1.5599327087402344, 2.2720041275024414, 2.9840755462646484, 3.6961469650268555, 4.4082183837890625, 5.1202898025512695, 5.832361221313477, 6.544432640075684, 7.256504058837891, 7.968575477600098, 8.680646896362305, 9.392718315124512, 10.104789733886719, 10.816861152648926, 11.528934478759766, 12.241005897521973, 12.95307731628418, 13.665148735046387, 14.377220153808594, 15.0892915725708, 15.801362991333008, 16.51343536376953, 17.225505828857422, 17.937576293945312, 18.649648666381836, 19.36172103881836, 20.07379150390625, 20.78586196899414, 21.497934341430664, 22.210006713867188, 22.922077178955078, 23.63414764404297, 24.346220016479492, 25.058292388916016, 25.770362854003906, 26.482433319091797, 27.19450569152832, 27.906578063964844, 28.618648529052734, 29.330718994140625, 30.04279136657715, 30.754863739013672, 31.466934204101562, 32.17900466918945, 32.891075134277344, 33.6031494140625, 34.31521987915039]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 9.0, 3.0, 5.0, 6.0, 7.0, 5.0, 21.0, 20.0, 19.0, 22.0, 7.0, 24.0, 18.0, 29.0, 26.0, 33.0, 28.0, 45.0, 40.0, 35.0, 54.0, 36.0, 42.0, 39.0, 31.0, 43.0, 34.0, 38.0, 39.0, 21.0, 31.0, 29.0, 23.0, 21.0, 16.0, 13.0, 13.0, 11.0, 13.0, 11.0, 9.0, 6.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.666755676269531, -13.220799446105957, -12.774843215942383, -12.328887939453125, -11.88293170928955, -11.436975479125977, -10.991019248962402, -10.545063018798828, -10.09910774230957, -9.653151512145996, -9.207195281982422, -8.761240005493164, -8.31528377532959, -7.869327545166016, -7.423371315002441, -6.977415084838867, -6.531458854675293, -6.085502624511719, -5.639546871185303, -5.1935906410217285, -4.7476348876953125, -4.301678657531738, -3.855722427368164, -3.409766435623169, -2.963810443878174, -2.5178544521331787, -2.0718984603881836, -1.6259422302246094, -1.1799862384796143, -0.7340302467346191, -0.2880740165710449, 0.1578819751739502, 0.6038379669189453, 1.0497939586639404, 1.495750069618225, 1.9417061805725098, 2.387662172317505, 2.8336181640625, 3.279574394226074, 3.7255303859710693, 4.1714863777160645, 4.617442607879639, 5.063398361206055, 5.509354591369629, 5.955310821533203, 6.401266574859619, 6.847222805023193, 7.293178558349609, 7.739134788513184, 8.185091018676758, 8.631047248840332, 9.077003479003906, 9.522958755493164, 9.968914985656738, 10.414871215820312, 10.860827445983887, 11.306783676147461, 11.752739906311035, 12.19869613647461, 12.644651412963867, 13.090607643127441, 13.536563873291016, 13.98252010345459, 14.428476333618164, 14.874431610107422]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 8.0, 7.0, 13.0, 7.0, 6.0, 15.0, 12.0, 15.0, 21.0, 28.0, 22.0, 24.0, 29.0, 35.0, 30.0, 45.0, 39.0, 40.0, 49.0, 50.0, 49.0, 45.0, 37.0, 49.0, 43.0, 39.0, 31.0, 42.0, 24.0, 21.0, 24.0, 23.0, 16.0, 12.0, 13.0, 10.0, 10.0, 7.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.060546875, -2.0076751708984375, -1.954803466796875, -1.9019317626953125, -1.84906005859375, -1.7961883544921875, -1.743316650390625, -1.6904449462890625, -1.6375732421875, -1.5847015380859375, -1.531829833984375, -1.4789581298828125, -1.42608642578125, -1.3732147216796875, -1.320343017578125, -1.2674713134765625, -1.214599609375, -1.1617279052734375, -1.108856201171875, -1.0559844970703125, -1.00311279296875, -0.9502410888671875, -0.897369384765625, -0.8444976806640625, -0.7916259765625, -0.7387542724609375, -0.685882568359375, -0.6330108642578125, -0.58013916015625, -0.5272674560546875, -0.474395751953125, -0.4215240478515625, -0.36865234375, -0.3157806396484375, -0.262908935546875, -0.2100372314453125, -0.15716552734375, -0.1042938232421875, -0.051422119140625, 0.0014495849609375, 0.0543212890625, 0.1071929931640625, 0.160064697265625, 0.2129364013671875, 0.26580810546875, 0.3186798095703125, 0.371551513671875, 0.4244232177734375, 0.477294921875, 0.5301666259765625, 0.583038330078125, 0.6359100341796875, 0.68878173828125, 0.7416534423828125, 0.794525146484375, 0.8473968505859375, 0.9002685546875, 0.9531402587890625, 1.006011962890625, 1.0588836669921875, 1.11175537109375, 1.1646270751953125, 1.217498779296875, 1.2703704833984375, 1.3232421875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 10.0, 12.0, 12.0, 27.0, 31.0, 41.0, 70.0, 111.0, 187.0, 310.0, 491.0, 857.0, 1623.0, 2894.0, 5667.0, 11583.0, 28297.0, 206245.0, 3386751.0, 483154.0, 38283.0, 13903.0, 6455.0, 3161.0, 1747.0, 981.0, 548.0, 322.0, 187.0, 109.0, 65.0, 38.0, 27.0, 19.0, 11.0, 9.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.19329833984375, -6.0194091796875, -5.84552001953125, -5.671630859375, -5.49774169921875, -5.3238525390625, -5.14996337890625, -4.97607421875, -4.80218505859375, -4.6282958984375, -4.45440673828125, -4.280517578125, -4.10662841796875, -3.9327392578125, -3.75885009765625, -3.5849609375, -3.41107177734375, -3.2371826171875, -3.06329345703125, -2.889404296875, -2.71551513671875, -2.5416259765625, -2.36773681640625, -2.19384765625, -2.01995849609375, -1.8460693359375, -1.67218017578125, -1.498291015625, -1.32440185546875, -1.1505126953125, -0.97662353515625, -0.802734375, -0.62884521484375, -0.4549560546875, -0.28106689453125, -0.107177734375, 0.06671142578125, 0.2406005859375, 0.41448974609375, 0.58837890625, 0.76226806640625, 0.9361572265625, 1.11004638671875, 1.283935546875, 1.45782470703125, 1.6317138671875, 1.80560302734375, 1.9794921875, 2.15338134765625, 2.3272705078125, 2.50115966796875, 2.675048828125, 2.84893798828125, 3.0228271484375, 3.19671630859375, 3.37060546875, 3.54449462890625, 3.7183837890625, 3.89227294921875, 4.066162109375, 4.24005126953125, 4.4139404296875, 4.58782958984375, 4.76171875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 11.0, 9.0, 20.0, 22.0, 31.0, 34.0, 67.0, 131.0, 349.0, 1092.0, 1371.0, 512.0, 170.0, 93.0, 61.0, 31.0, 17.0, 15.0, 11.0, 8.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.80267333984375, -5.5623779296875, -5.32208251953125, -5.081787109375, -4.84149169921875, -4.6011962890625, -4.36090087890625, -4.12060546875, -3.88031005859375, -3.6400146484375, -3.39971923828125, -3.159423828125, -2.91912841796875, -2.6788330078125, -2.43853759765625, -2.1982421875, -1.95794677734375, -1.7176513671875, -1.47735595703125, -1.237060546875, -0.99676513671875, -0.7564697265625, -0.51617431640625, -0.27587890625, -0.03558349609375, 0.2047119140625, 0.44500732421875, 0.685302734375, 0.92559814453125, 1.1658935546875, 1.40618896484375, 1.646484375, 1.88677978515625, 2.1270751953125, 2.36737060546875, 2.607666015625, 2.84796142578125, 3.0882568359375, 3.32855224609375, 3.56884765625, 3.80914306640625, 4.0494384765625, 4.28973388671875, 4.530029296875, 4.77032470703125, 5.0106201171875, 5.25091552734375, 5.4912109375, 5.73150634765625, 5.9718017578125, 6.21209716796875, 6.452392578125, 6.69268798828125, 6.9329833984375, 7.17327880859375, 7.41357421875, 7.65386962890625, 7.8941650390625, 8.13446044921875, 8.374755859375, 8.61505126953125, 8.8553466796875, 9.09564208984375, 9.3359375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 17.0, 30.0, 39.0, 80.0, 99.0, 215.0, 372.0, 844.0, 2059.0, 6410.0, 23075.0, 155346.0, 3807341.0, 164487.0, 23405.0, 6572.0, 2116.0, 845.0, 407.0, 196.0, 111.0, 72.0, 37.0, 34.0, 27.0, 12.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.8671875, -15.465576171875, -15.06396484375, -14.662353515625, -14.2607421875, -13.859130859375, -13.45751953125, -13.055908203125, -12.654296875, -12.252685546875, -11.85107421875, -11.449462890625, -11.0478515625, -10.646240234375, -10.24462890625, -9.843017578125, -9.44140625, -9.039794921875, -8.63818359375, -8.236572265625, -7.8349609375, -7.433349609375, -7.03173828125, -6.630126953125, -6.228515625, -5.826904296875, -5.42529296875, -5.023681640625, -4.6220703125, -4.220458984375, -3.81884765625, -3.417236328125, -3.015625, -2.614013671875, -2.21240234375, -1.810791015625, -1.4091796875, -1.007568359375, -0.60595703125, -0.204345703125, 0.197265625, 0.598876953125, 1.00048828125, 1.402099609375, 1.8037109375, 2.205322265625, 2.60693359375, 3.008544921875, 3.41015625, 3.811767578125, 4.21337890625, 4.614990234375, 5.0166015625, 5.418212890625, 5.81982421875, 6.221435546875, 6.623046875, 7.024658203125, 7.42626953125, 7.827880859375, 8.2294921875, 8.631103515625, 9.03271484375, 9.434326171875, 9.8359375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 11.0, 18.0, 35.0, 103.0, 196.0, 281.0, 180.0, 86.0, 49.0, 18.0, 14.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.337921142578125, -32.02690505981445, -30.71588706970215, -29.404869079589844, -28.093852996826172, -26.7828369140625, -25.471818923950195, -24.16080093383789, -22.84978485107422, -21.538768768310547, -20.227750778198242, -18.916732788085938, -17.605716705322266, -16.294700622558594, -14.983682632446289, -13.6726655960083, -12.361648559570312, -11.050631523132324, -9.739614486694336, -8.428597450256348, -7.117580413818359, -5.806563377380371, -4.495546340942383, -3.1845293045043945, -1.8735122680664062, -0.562495231628418, 0.7485218048095703, 2.0595388412475586, 3.370555877685547, 4.681572914123535, 5.992589950561523, 7.303606986999512, 8.6146240234375, 9.925641059875488, 11.236658096313477, 12.547675132751465, 13.858692169189453, 15.169709205627441, 16.48072624206543, 17.791744232177734, 19.102760314941406, 20.413776397705078, 21.724794387817383, 23.035812377929688, 24.34682846069336, 25.65784454345703, 26.968862533569336, 28.27988052368164, 29.590896606445312, 30.901912689208984, 32.212928771972656, 33.523948669433594, 34.834964752197266, 36.14598083496094, 37.457000732421875, 38.76801681518555, 40.07903289794922, 41.39004898071289, 42.70106506347656, 44.0120849609375, 45.32310104370117, 46.634117126464844, 47.94513702392578, 49.25615310668945, 50.567169189453125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 5.0, 13.0, 13.0, 15.0, 13.0, 13.0, 18.0, 28.0, 22.0, 34.0, 24.0, 31.0, 45.0, 31.0, 30.0, 37.0, 40.0, 32.0, 43.0, 37.0, 47.0, 37.0, 42.0, 44.0, 32.0, 24.0, 28.0, 22.0, 24.0, 19.0, 18.0, 29.0, 17.0, 18.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.921573638916016, -11.559412002563477, -11.197250366210938, -10.835089683532715, -10.472928047180176, -10.110766410827637, -9.748605728149414, -9.386444091796875, -9.024282455444336, -8.662120819091797, -8.299959182739258, -7.937798500061035, -7.575636863708496, -7.213475227355957, -6.851314067840576, -6.489152908325195, -6.126991271972656, -5.764829635620117, -5.402668476104736, -5.0405073165893555, -4.678345680236816, -4.316184043884277, -3.9540228843688965, -3.5918614864349365, -3.2297000885009766, -2.8675386905670166, -2.5053772926330566, -2.1432158946990967, -1.7810544967651367, -1.4188930988311768, -1.0567317008972168, -0.6945703029632568, -0.33240795135498047, 0.029753446578979492, 0.39191484451293945, 0.7540762424468994, 1.1162376403808594, 1.4783990383148193, 1.8405604362487793, 2.2027218341827393, 2.564883232116699, 2.927044630050659, 3.289206027984619, 3.651367425918579, 4.013528823852539, 4.375690460205078, 4.737851619720459, 5.10001277923584, 5.462174415588379, 5.824336051940918, 6.186497211456299, 6.54865837097168, 6.910820007324219, 7.272981643676758, 7.635142803192139, 7.9973039627075195, 8.359465599060059, 8.721627235412598, 9.08378791809082, 9.44594955444336, 9.808111190795898, 10.170272827148438, 10.532434463500977, 10.8945951461792, 11.256756782531738]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 4.0, 11.0, 12.0, 9.0, 8.0, 15.0, 19.0, 16.0, 20.0, 22.0, 25.0, 22.0, 25.0, 32.0, 46.0, 32.0, 45.0, 29.0, 43.0, 46.0, 51.0, 37.0, 48.0, 44.0, 33.0, 41.0, 26.0, 30.0, 24.0, 29.0, 31.0, 13.0, 20.0, 23.0, 12.0, 8.0, 15.0, 5.0, 10.0, 4.0, 4.0, 10.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8037109375, -1.75494384765625, -1.7061767578125, -1.65740966796875, -1.608642578125, -1.55987548828125, -1.5111083984375, -1.46234130859375, -1.41357421875, -1.36480712890625, -1.3160400390625, -1.26727294921875, -1.218505859375, -1.16973876953125, -1.1209716796875, -1.07220458984375, -1.0234375, -0.97467041015625, -0.9259033203125, -0.87713623046875, -0.828369140625, -0.77960205078125, -0.7308349609375, -0.68206787109375, -0.63330078125, -0.58453369140625, -0.5357666015625, -0.48699951171875, -0.438232421875, -0.38946533203125, -0.3406982421875, -0.29193115234375, -0.2431640625, -0.19439697265625, -0.1456298828125, -0.09686279296875, -0.048095703125, 0.00067138671875, 0.0494384765625, 0.09820556640625, 0.14697265625, 0.19573974609375, 0.2445068359375, 0.29327392578125, 0.342041015625, 0.39080810546875, 0.4395751953125, 0.48834228515625, 0.537109375, 0.58587646484375, 0.6346435546875, 0.68341064453125, 0.732177734375, 0.78094482421875, 0.8297119140625, 0.87847900390625, 0.92724609375, 0.97601318359375, 1.0247802734375, 1.07354736328125, 1.122314453125, 1.17108154296875, 1.2198486328125, 1.26861572265625, 1.3173828125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 9.0, 15.0, 24.0, 28.0, 39.0, 47.0, 73.0, 153.0, 201.0, 313.0, 436.0, 696.0, 1058.0, 1682.0, 2688.0, 4133.0, 6644.0, 10496.0, 17971.0, 32165.0, 64191.0, 157747.0, 486594.0, 132086.0, 57043.0, 29026.0, 16423.0, 9855.0, 5848.0, 3856.0, 2398.0, 1577.0, 1021.0, 652.0, 407.0, 318.0, 199.0, 123.0, 99.0, 59.0, 42.0, 35.0, 23.0, 18.0, 6.0, 8.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8896484375, -1.83135986328125, -1.7730712890625, -1.71478271484375, -1.656494140625, -1.59820556640625, -1.5399169921875, -1.48162841796875, -1.42333984375, -1.36505126953125, -1.3067626953125, -1.24847412109375, -1.190185546875, -1.13189697265625, -1.0736083984375, -1.01531982421875, -0.95703125, -0.89874267578125, -0.8404541015625, -0.78216552734375, -0.723876953125, -0.66558837890625, -0.6072998046875, -0.54901123046875, -0.49072265625, -0.43243408203125, -0.3741455078125, -0.31585693359375, -0.257568359375, -0.19927978515625, -0.1409912109375, -0.08270263671875, -0.0244140625, 0.03387451171875, 0.0921630859375, 0.15045166015625, 0.208740234375, 0.26702880859375, 0.3253173828125, 0.38360595703125, 0.44189453125, 0.50018310546875, 0.5584716796875, 0.61676025390625, 0.675048828125, 0.73333740234375, 0.7916259765625, 0.84991455078125, 0.908203125, 0.96649169921875, 1.0247802734375, 1.08306884765625, 1.141357421875, 1.19964599609375, 1.2579345703125, 1.31622314453125, 1.37451171875, 1.43280029296875, 1.4910888671875, 1.54937744140625, 1.607666015625, 1.66595458984375, 1.7242431640625, 1.78253173828125, 1.8408203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 4.0, 10.0, 11.0, 18.0, 19.0, 10.0, 16.0, 23.0, 28.0, 28.0, 34.0, 43.0, 27.0, 30.0, 43.0, 35.0, 44.0, 41.0, 1057.0, 42.0, 41.0, 37.0, 43.0, 27.0, 28.0, 27.0, 29.0, 27.0, 24.0, 20.0, 34.0, 10.0, 20.0, 12.0, 16.0, 14.0, 7.0, 3.0, 11.0, 7.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.315765380859375, -1.27313232421875, -1.230499267578125, -1.1878662109375, -1.145233154296875, -1.10260009765625, -1.059967041015625, -1.017333984375, -0.974700927734375, -0.93206787109375, -0.889434814453125, -0.8468017578125, -0.804168701171875, -0.76153564453125, -0.718902587890625, -0.67626953125, -0.633636474609375, -0.59100341796875, -0.548370361328125, -0.5057373046875, -0.463104248046875, -0.42047119140625, -0.377838134765625, -0.335205078125, -0.292572021484375, -0.24993896484375, -0.207305908203125, -0.1646728515625, -0.122039794921875, -0.07940673828125, -0.036773681640625, 0.005859375, 0.048492431640625, 0.09112548828125, 0.133758544921875, 0.1763916015625, 0.219024658203125, 0.26165771484375, 0.304290771484375, 0.346923828125, 0.389556884765625, 0.43218994140625, 0.474822998046875, 0.5174560546875, 0.560089111328125, 0.60272216796875, 0.645355224609375, 0.68798828125, 0.730621337890625, 0.77325439453125, 0.815887451171875, 0.8585205078125, 0.901153564453125, 0.94378662109375, 0.986419677734375, 1.029052734375, 1.071685791015625, 1.11431884765625, 1.156951904296875, 1.1995849609375, 1.242218017578125, 1.28485107421875, 1.327484130859375, 1.3701171875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 10.0, 16.0, 13.0, 16.0, 26.0, 37.0, 61.0, 71.0, 99.0, 108.0, 193.0, 244.0, 346.0, 502.0, 790.0, 1200.0, 1850.0, 2903.0, 4987.0, 9643.0, 22940.0, 135221.0, 1831454.0, 50868.0, 15191.0, 7371.0, 3973.0, 2292.0, 1474.0, 959.0, 630.0, 450.0, 290.0, 231.0, 133.0, 136.0, 111.0, 71.0, 46.0, 42.0, 26.0, 31.0, 19.0, 16.0, 13.0, 4.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.05859375, -1.988311767578125, -1.91802978515625, -1.847747802734375, -1.7774658203125, -1.707183837890625, -1.63690185546875, -1.566619873046875, -1.496337890625, -1.426055908203125, -1.35577392578125, -1.285491943359375, -1.2152099609375, -1.144927978515625, -1.07464599609375, -1.004364013671875, -0.93408203125, -0.863800048828125, -0.79351806640625, -0.723236083984375, -0.6529541015625, -0.582672119140625, -0.51239013671875, -0.442108154296875, -0.371826171875, -0.301544189453125, -0.23126220703125, -0.160980224609375, -0.0906982421875, -0.020416259765625, 0.04986572265625, 0.120147705078125, 0.1904296875, 0.260711669921875, 0.33099365234375, 0.401275634765625, 0.4715576171875, 0.541839599609375, 0.61212158203125, 0.682403564453125, 0.752685546875, 0.822967529296875, 0.89324951171875, 0.963531494140625, 1.0338134765625, 1.104095458984375, 1.17437744140625, 1.244659423828125, 1.31494140625, 1.385223388671875, 1.45550537109375, 1.525787353515625, 1.5960693359375, 1.666351318359375, 1.73663330078125, 1.806915283203125, 1.877197265625, 1.947479248046875, 2.01776123046875, 2.088043212890625, 2.1583251953125, 2.228607177734375, 2.29888916015625, 2.369171142578125, 2.439453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 23.0, 18.0, 28.0, 24.0, 55.0, 55.0, 84.0, 147.0, 150.0, 112.0, 90.0, 47.0, 41.0, 21.0, 23.0, 14.0, 8.0, 6.0, 6.0, 4.0, 1.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.098388671875, -0.0954446792602539, -0.09250068664550781, -0.08955669403076172, -0.08661270141601562, -0.08366870880126953, -0.08072471618652344, -0.07778072357177734, -0.07483673095703125, -0.07189273834228516, -0.06894874572753906, -0.06600475311279297, -0.06306076049804688, -0.06011676788330078, -0.05717277526855469, -0.054228782653808594, -0.0512847900390625, -0.048340797424316406, -0.04539680480957031, -0.04245281219482422, -0.039508819580078125, -0.03656482696533203, -0.03362083435058594, -0.030676841735839844, -0.02773284912109375, -0.024788856506347656, -0.021844863891601562, -0.01890087127685547, -0.015956878662109375, -0.013012886047363281, -0.010068893432617188, -0.007124900817871094, -0.004180908203125, -0.0012369155883789062, 0.0017070770263671875, 0.004651069641113281, 0.007595062255859375, 0.010539054870605469, 0.013483047485351562, 0.016427040100097656, 0.01937103271484375, 0.022315025329589844, 0.025259017944335938, 0.02820301055908203, 0.031147003173828125, 0.03409099578857422, 0.03703498840332031, 0.039978981018066406, 0.0429229736328125, 0.045866966247558594, 0.04881095886230469, 0.05175495147705078, 0.054698944091796875, 0.05764293670654297, 0.06058692932128906, 0.06353092193603516, 0.06647491455078125, 0.06941890716552734, 0.07236289978027344, 0.07530689239501953, 0.07825088500976562, 0.08119487762451172, 0.08413887023925781, 0.0870828628540039, 0.09002685546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 15.0, 8.0, 6.0, 9.0, 18.0, 18.0, 22.0, 25.0, 50.0, 67.0, 113.0, 166.0, 338.0, 908.0, 3971.0, 35312.0, 865772.0, 131030.0, 8086.0, 1526.0, 467.0, 222.0, 122.0, 70.0, 51.0, 40.0, 16.0, 16.0, 16.0, 18.0, 11.0, 4.0, 13.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.910736083984375, -0.88006591796875, -0.849395751953125, -0.8187255859375, -0.788055419921875, -0.75738525390625, -0.726715087890625, -0.696044921875, -0.665374755859375, -0.63470458984375, -0.604034423828125, -0.5733642578125, -0.542694091796875, -0.51202392578125, -0.481353759765625, -0.45068359375, -0.420013427734375, -0.38934326171875, -0.358673095703125, -0.3280029296875, -0.297332763671875, -0.26666259765625, -0.235992431640625, -0.205322265625, -0.174652099609375, -0.14398193359375, -0.113311767578125, -0.0826416015625, -0.051971435546875, -0.02130126953125, 0.009368896484375, 0.0400390625, 0.070709228515625, 0.10137939453125, 0.132049560546875, 0.1627197265625, 0.193389892578125, 0.22406005859375, 0.254730224609375, 0.285400390625, 0.316070556640625, 0.34674072265625, 0.377410888671875, 0.4080810546875, 0.438751220703125, 0.46942138671875, 0.500091552734375, 0.53076171875, 0.561431884765625, 0.59210205078125, 0.622772216796875, 0.6534423828125, 0.684112548828125, 0.71478271484375, 0.745452880859375, 0.776123046875, 0.806793212890625, 0.83746337890625, 0.868133544921875, 0.8988037109375, 0.929473876953125, 0.96014404296875, 0.990814208984375, 1.021484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 23.0, 27.0, 81.0, 96.0, 161.0, 179.0, 154.0, 95.0, 68.0, 35.0, 25.0, 16.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2787837088108063, -0.2682065963745117, -0.25762948393821716, -0.2470523715019226, -0.23647525906562805, -0.2258981466293335, -0.21532101929187775, -0.2047439068555832, -0.19416679441928864, -0.18358968198299408, -0.17301256954669952, -0.16243544220924377, -0.15185832977294922, -0.14128121733665466, -0.1307041049003601, -0.12012699246406555, -0.109549880027771, -0.09897276759147644, -0.08839565515518188, -0.07781853526830673, -0.06724142283201218, -0.05666431039571762, -0.04608719050884247, -0.03551007807254791, -0.024932965636253357, -0.014355851337313652, -0.003778737038373947, 0.006798379123210907, 0.017375491559505463, 0.02795260399580002, 0.03852972388267517, 0.04910683631896973, 0.059683918952941895, 0.07026103138923645, 0.080838143825531, 0.09141526371240616, 0.10199237614870071, 0.11256948858499527, 0.12314660847187042, 0.13372372090816498, 0.14430083334445953, 0.1548779457807541, 0.16545505821704865, 0.1760321855545044, 0.18660929799079895, 0.1971864104270935, 0.20776352286338806, 0.21834063529968262, 0.22891774773597717, 0.23949486017227173, 0.2500719726085663, 0.26064908504486084, 0.2712261974811554, 0.28180330991744995, 0.2923804521560669, 0.30295753479003906, 0.313534677028656, 0.32411178946495056, 0.3346889019012451, 0.3452660143375397, 0.35584312677383423, 0.3664202392101288, 0.37699735164642334, 0.3875744938850403, 0.39815157651901245]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 3.0, 6.0, 10.0, 14.0, 17.0, 9.0, 18.0, 25.0, 28.0, 30.0, 28.0, 36.0, 33.0, 44.0, 45.0, 25.0, 43.0, 43.0, 44.0, 43.0, 41.0, 36.0, 48.0, 31.0, 36.0, 44.0, 26.0, 30.0, 27.0, 21.0, 23.0, 14.0, 16.0, 10.0, 7.0, 10.0, 8.0, 8.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.13014668226242065, -0.12589511275291443, -0.1216435357928276, -0.11739195883274078, -0.11314038932323456, -0.10888881981372833, -0.10463724285364151, -0.10038566589355469, -0.09613409638404846, -0.09188252687454224, -0.08763094991445541, -0.08337937295436859, -0.07912780344486237, -0.07487623393535614, -0.07062465697526932, -0.0663730800151825, -0.06212151050567627, -0.057869937270879745, -0.05361836403608322, -0.0493667908012867, -0.04511521756649017, -0.04086364433169365, -0.036612071096897125, -0.0323604978621006, -0.028108924627304077, -0.023857351392507553, -0.01960577815771103, -0.015354204922914505, -0.011102631688117981, -0.006851058453321457, -0.002599485218524933, 0.0016520880162715912, 0.005903661251068115, 0.01015523448586464, 0.014406807720661163, 0.018658380955457687, 0.02290995419025421, 0.027161527425050735, 0.03141310065984726, 0.035664673894643784, 0.03991624712944031, 0.04416782036423683, 0.048419393599033356, 0.05267096683382988, 0.056922540068626404, 0.06117411330342293, 0.06542568653821945, 0.06967726349830627, 0.0739288330078125, 0.07818040251731873, 0.08243197947740555, 0.08668355643749237, 0.0909351259469986, 0.09518669545650482, 0.09943827241659164, 0.10368984937667847, 0.10794141888618469, 0.11219298839569092, 0.11644456535577774, 0.12069614231586456, 0.12494771182537079, 0.12919928133487701, 0.13345086574554443, 0.13770243525505066, 0.14195400476455688]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 13.0, 12.0, 9.0, 7.0, 15.0, 21.0, 13.0, 20.0, 20.0, 31.0, 20.0, 27.0, 29.0, 47.0, 30.0, 45.0, 33.0, 42.0, 42.0, 55.0, 35.0, 48.0, 44.0, 35.0, 43.0, 23.0, 30.0, 25.0, 29.0, 30.0, 13.0, 20.0, 24.0, 12.0, 8.0, 14.0, 5.0, 10.0, 5.0, 5.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.810546875, -1.7615966796875, -1.712646484375, -1.6636962890625, -1.61474609375, -1.5657958984375, -1.516845703125, -1.4678955078125, -1.4189453125, -1.3699951171875, -1.321044921875, -1.2720947265625, -1.22314453125, -1.1741943359375, -1.125244140625, -1.0762939453125, -1.02734375, -0.9783935546875, -0.929443359375, -0.8804931640625, -0.83154296875, -0.7825927734375, -0.733642578125, -0.6846923828125, -0.6357421875, -0.5867919921875, -0.537841796875, -0.4888916015625, -0.43994140625, -0.3909912109375, -0.342041015625, -0.2930908203125, -0.244140625, -0.1951904296875, -0.146240234375, -0.0972900390625, -0.04833984375, 0.0006103515625, 0.049560546875, 0.0985107421875, 0.1474609375, 0.1964111328125, 0.245361328125, 0.2943115234375, 0.34326171875, 0.3922119140625, 0.441162109375, 0.4901123046875, 0.5390625, 0.5880126953125, 0.636962890625, 0.6859130859375, 0.73486328125, 0.7838134765625, 0.832763671875, 0.8817138671875, 0.9306640625, 0.9796142578125, 1.028564453125, 1.0775146484375, 1.12646484375, 1.1754150390625, 1.224365234375, 1.2733154296875, 1.322265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 6.0, 23.0, 21.0, 30.0, 48.0, 67.0, 103.0, 152.0, 231.0, 358.0, 614.0, 1027.0, 1768.0, 2968.0, 5125.0, 9462.0, 19870.0, 55546.0, 285600.0, 523753.0, 87667.0, 27120.0, 11911.0, 6209.0, 3508.0, 2034.0, 1221.0, 763.0, 441.0, 282.0, 219.0, 114.0, 80.0, 55.0, 35.0, 29.0, 14.0, 17.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.216796875, -2.14996337890625, -2.0831298828125, -2.01629638671875, -1.949462890625, -1.88262939453125, -1.8157958984375, -1.74896240234375, -1.68212890625, -1.61529541015625, -1.5484619140625, -1.48162841796875, -1.414794921875, -1.34796142578125, -1.2811279296875, -1.21429443359375, -1.1474609375, -1.08062744140625, -1.0137939453125, -0.94696044921875, -0.880126953125, -0.81329345703125, -0.7464599609375, -0.67962646484375, -0.61279296875, -0.54595947265625, -0.4791259765625, -0.41229248046875, -0.345458984375, -0.27862548828125, -0.2117919921875, -0.14495849609375, -0.078125, -0.01129150390625, 0.0555419921875, 0.12237548828125, 0.189208984375, 0.25604248046875, 0.3228759765625, 0.38970947265625, 0.45654296875, 0.52337646484375, 0.5902099609375, 0.65704345703125, 0.723876953125, 0.79071044921875, 0.8575439453125, 0.92437744140625, 0.9912109375, 1.05804443359375, 1.1248779296875, 1.19171142578125, 1.258544921875, 1.32537841796875, 1.3922119140625, 1.45904541015625, 1.52587890625, 1.59271240234375, 1.6595458984375, 1.72637939453125, 1.793212890625, 1.86004638671875, 1.9268798828125, 1.99371337890625, 2.060546875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 6.0, 15.0, 7.0, 6.0, 17.0, 18.0, 9.0, 15.0, 33.0, 25.0, 41.0, 28.0, 47.0, 39.0, 59.0, 59.0, 77.0, 156.0, 1521.0, 267.0, 100.0, 60.0, 52.0, 52.0, 41.0, 35.0, 36.0, 35.0, 29.0, 19.0, 18.0, 17.0, 14.0, 17.0, 15.0, 11.0, 9.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.87152099609375, -4.7078857421875, -4.54425048828125, -4.380615234375, -4.21697998046875, -4.0533447265625, -3.88970947265625, -3.72607421875, -3.56243896484375, -3.3988037109375, -3.23516845703125, -3.071533203125, -2.90789794921875, -2.7442626953125, -2.58062744140625, -2.4169921875, -2.25335693359375, -2.0897216796875, -1.92608642578125, -1.762451171875, -1.59881591796875, -1.4351806640625, -1.27154541015625, -1.10791015625, -0.94427490234375, -0.7806396484375, -0.61700439453125, -0.453369140625, -0.28973388671875, -0.1260986328125, 0.03753662109375, 0.201171875, 0.36480712890625, 0.5284423828125, 0.69207763671875, 0.855712890625, 1.01934814453125, 1.1829833984375, 1.34661865234375, 1.51025390625, 1.67388916015625, 1.8375244140625, 2.00115966796875, 2.164794921875, 2.32843017578125, 2.4920654296875, 2.65570068359375, 2.8193359375, 2.98297119140625, 3.1466064453125, 3.31024169921875, 3.473876953125, 3.63751220703125, 3.8011474609375, 3.96478271484375, 4.12841796875, 4.29205322265625, 4.4556884765625, 4.61932373046875, 4.782958984375, 4.94659423828125, 5.1102294921875, 5.27386474609375, 5.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 14.0, 24.0, 34.0, 73.0, 116.0, 250.0, 612.0, 2049.0, 19298.0, 3021488.0, 96034.0, 4129.0, 869.0, 330.0, 154.0, 81.0, 53.0, 22.0, 17.0, 14.0, 8.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -14.771240234375, -14.12060546875, -13.469970703125, -12.8193359375, -12.168701171875, -11.51806640625, -10.867431640625, -10.216796875, -9.566162109375, -8.91552734375, -8.264892578125, -7.6142578125, -6.963623046875, -6.31298828125, -5.662353515625, -5.01171875, -4.361083984375, -3.71044921875, -3.059814453125, -2.4091796875, -1.758544921875, -1.10791015625, -0.457275390625, 0.193359375, 0.843994140625, 1.49462890625, 2.145263671875, 2.7958984375, 3.446533203125, 4.09716796875, 4.747802734375, 5.3984375, 6.049072265625, 6.69970703125, 7.350341796875, 8.0009765625, 8.651611328125, 9.30224609375, 9.952880859375, 10.603515625, 11.254150390625, 11.90478515625, 12.555419921875, 13.2060546875, 13.856689453125, 14.50732421875, 15.157958984375, 15.80859375, 16.459228515625, 17.10986328125, 17.760498046875, 18.4111328125, 19.061767578125, 19.71240234375, 20.363037109375, 21.013671875, 21.664306640625, 22.31494140625, 22.965576171875, 23.6162109375, 24.266845703125, 24.91748046875, 25.568115234375, 26.21875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 38.0, 474.0, 444.0, 60.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.03237915039062, -136.45553588867188, -133.87867736816406, -131.3018341064453, -128.72499084472656, -126.14813995361328, -123.5712890625, -120.99444580078125, -118.41759490966797, -115.84074401855469, -113.26390075683594, -110.68704986572266, -108.11019897460938, -105.53335571289062, -102.95650482177734, -100.37965393066406, -97.80281066894531, -95.22595977783203, -92.64911651611328, -90.072265625, -87.49541473388672, -84.91857147216797, -82.34172058105469, -79.76487731933594, -77.18801879882812, -74.61116790771484, -72.0343246459961, -69.45747375488281, -66.88062286376953, -64.30377960205078, -61.7269287109375, -59.150081634521484, -56.57323455810547, -53.99638748168945, -51.41953659057617, -48.842689514160156, -46.26584243774414, -43.688995361328125, -41.112144470214844, -38.53529739379883, -35.95845031738281, -33.3816032409668, -30.80475425720215, -28.2279052734375, -25.651058197021484, -23.074209213256836, -20.497360229492188, -17.920513153076172, -15.34366226196289, -12.766814231872559, -10.189966201782227, -7.613117218017578, -5.036269187927246, -2.459421157836914, 0.11742782592773438, 2.69427490234375, 5.271123886108398, 7.8479719161987305, 10.424819946289062, 13.001668930053711, 15.578516960144043, 18.155364990234375, 20.732213973999023, 23.30906105041504, 25.885910034179688]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 2.0, 5.0, 9.0, 12.0, 15.0, 10.0, 19.0, 15.0, 15.0, 30.0, 25.0, 30.0, 42.0, 31.0, 42.0, 40.0, 56.0, 33.0, 44.0, 39.0, 42.0, 44.0, 41.0, 39.0, 27.0, 42.0, 29.0, 24.0, 18.0, 22.0, 25.0, 18.0, 24.0, 16.0, 11.0, 8.0, 12.0, 8.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.162546157836914, -15.656578063964844, -15.150609970092773, -14.644641876220703, -14.138673782348633, -13.632705688476562, -13.126737594604492, -12.620769500732422, -12.114801406860352, -11.608833312988281, -11.102865219116211, -10.59689712524414, -10.09092903137207, -9.5849609375, -9.07899284362793, -8.57302474975586, -8.067056655883789, -7.561088562011719, -7.055120468139648, -6.549152374267578, -6.043184280395508, -5.5372161865234375, -5.031248092651367, -4.525279998779297, -4.019311904907227, -3.5133438110351562, -3.007375717163086, -2.5014076232910156, -1.9954395294189453, -1.489471435546875, -0.9835033416748047, -0.4775352478027344, 0.02843475341796875, 0.5344028472900391, 1.0403709411621094, 1.5463390350341797, 2.05230712890625, 2.5582752227783203, 3.0642433166503906, 3.570211410522461, 4.076179504394531, 4.582147598266602, 5.088115692138672, 5.594083786010742, 6.1000518798828125, 6.606019973754883, 7.111988067626953, 7.617956161499023, 8.123924255371094, 8.629892349243164, 9.135860443115234, 9.641828536987305, 10.147796630859375, 10.653764724731445, 11.159732818603516, 11.665700912475586, 12.171669006347656, 12.677637100219727, 13.183605194091797, 13.689573287963867, 14.195541381835938, 14.701509475708008, 15.207477569580078, 15.713445663452148, 16.21941375732422]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 12.0, 17.0, 16.0, 16.0, 19.0, 19.0, 15.0, 23.0, 23.0, 21.0, 20.0, 29.0, 42.0, 36.0, 36.0, 38.0, 37.0, 43.0, 48.0, 45.0, 45.0, 36.0, 46.0, 38.0, 29.0, 29.0, 24.0, 22.0, 37.0, 18.0, 21.0, 19.0, 17.0, 18.0, 9.0, 8.0, 10.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8427734375, -1.79205322265625, -1.7413330078125, -1.69061279296875, -1.639892578125, -1.58917236328125, -1.5384521484375, -1.48773193359375, -1.43701171875, -1.38629150390625, -1.3355712890625, -1.28485107421875, -1.234130859375, -1.18341064453125, -1.1326904296875, -1.08197021484375, -1.03125, -0.98052978515625, -0.9298095703125, -0.87908935546875, -0.828369140625, -0.77764892578125, -0.7269287109375, -0.67620849609375, -0.62548828125, -0.57476806640625, -0.5240478515625, -0.47332763671875, -0.422607421875, -0.37188720703125, -0.3211669921875, -0.27044677734375, -0.2197265625, -0.16900634765625, -0.1182861328125, -0.06756591796875, -0.016845703125, 0.03387451171875, 0.0845947265625, 0.13531494140625, 0.18603515625, 0.23675537109375, 0.2874755859375, 0.33819580078125, 0.388916015625, 0.43963623046875, 0.4903564453125, 0.54107666015625, 0.591796875, 0.64251708984375, 0.6932373046875, 0.74395751953125, 0.794677734375, 0.84539794921875, 0.8961181640625, 0.94683837890625, 0.99755859375, 1.04827880859375, 1.0989990234375, 1.14971923828125, 1.200439453125, 1.25115966796875, 1.3018798828125, 1.35260009765625, 1.4033203125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 9.0, 8.0, 19.0, 12.0, 21.0, 31.0, 39.0, 45.0, 60.0, 95.0, 116.0, 146.0, 235.0, 329.0, 429.0, 580.0, 841.0, 1290.0, 1917.0, 2777.0, 4176.0, 6542.0, 10864.0, 20136.0, 50688.0, 293503.0, 2192353.0, 1349367.0, 175479.0, 38027.0, 16730.0, 9642.0, 5891.0, 3945.0, 2491.0, 1607.0, 1144.0, 822.0, 591.0, 357.0, 255.0, 178.0, 128.0, 92.0, 68.0, 59.0, 45.0, 30.0, 22.0, 21.0, 8.0, 9.0, 8.0, 3.0, 3.0, 3.0, 2.0], "bins": [-3.52734375, -3.423187255859375, -3.31903076171875, -3.214874267578125, -3.1107177734375, -3.006561279296875, -2.90240478515625, -2.798248291015625, -2.694091796875, -2.589935302734375, -2.48577880859375, -2.381622314453125, -2.2774658203125, -2.173309326171875, -2.06915283203125, -1.964996337890625, -1.86083984375, -1.756683349609375, -1.65252685546875, -1.548370361328125, -1.4442138671875, -1.340057373046875, -1.23590087890625, -1.131744384765625, -1.027587890625, -0.923431396484375, -0.81927490234375, -0.715118408203125, -0.6109619140625, -0.506805419921875, -0.40264892578125, -0.298492431640625, -0.1943359375, -0.090179443359375, 0.01397705078125, 0.118133544921875, 0.2222900390625, 0.326446533203125, 0.43060302734375, 0.534759521484375, 0.638916015625, 0.743072509765625, 0.84722900390625, 0.951385498046875, 1.0555419921875, 1.159698486328125, 1.26385498046875, 1.368011474609375, 1.47216796875, 1.576324462890625, 1.68048095703125, 1.784637451171875, 1.8887939453125, 1.992950439453125, 2.09710693359375, 2.201263427734375, 2.305419921875, 2.409576416015625, 2.51373291015625, 2.617889404296875, 2.7220458984375, 2.826202392578125, 2.93035888671875, 3.034515380859375, 3.138671875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 8.0, 3.0, 2.0, 2.0, 7.0, 13.0, 16.0, 14.0, 21.0, 26.0, 29.0, 46.0, 70.0, 87.0, 143.0, 242.0, 457.0, 787.0, 853.0, 462.0, 295.0, 164.0, 91.0, 47.0, 29.0, 32.0, 27.0, 16.0, 9.0, 16.0, 15.0, 6.0, 9.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.734375, -4.59930419921875, -4.4642333984375, -4.32916259765625, -4.194091796875, -4.05902099609375, -3.9239501953125, -3.78887939453125, -3.65380859375, -3.51873779296875, -3.3836669921875, -3.24859619140625, -3.113525390625, -2.97845458984375, -2.8433837890625, -2.70831298828125, -2.5732421875, -2.43817138671875, -2.3031005859375, -2.16802978515625, -2.032958984375, -1.89788818359375, -1.7628173828125, -1.62774658203125, -1.49267578125, -1.35760498046875, -1.2225341796875, -1.08746337890625, -0.952392578125, -0.81732177734375, -0.6822509765625, -0.54718017578125, -0.412109375, -0.27703857421875, -0.1419677734375, -0.00689697265625, 0.128173828125, 0.26324462890625, 0.3983154296875, 0.53338623046875, 0.66845703125, 0.80352783203125, 0.9385986328125, 1.07366943359375, 1.208740234375, 1.34381103515625, 1.4788818359375, 1.61395263671875, 1.7490234375, 1.88409423828125, 2.0191650390625, 2.15423583984375, 2.289306640625, 2.42437744140625, 2.5594482421875, 2.69451904296875, 2.82958984375, 2.96466064453125, 3.0997314453125, 3.23480224609375, 3.369873046875, 3.50494384765625, 3.6400146484375, 3.77508544921875, 3.91015625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 8.0, 5.0, 29.0, 25.0, 42.0, 80.0, 149.0, 211.0, 400.0, 755.0, 1376.0, 2562.0, 5470.0, 11850.0, 31250.0, 125215.0, 2813569.0, 1079898.0, 79246.0, 23557.0, 9385.0, 4423.0, 2119.0, 1188.0, 610.0, 340.0, 199.0, 119.0, 76.0, 41.0, 32.0, 12.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.890625, -7.64300537109375, -7.3953857421875, -7.14776611328125, -6.900146484375, -6.65252685546875, -6.4049072265625, -6.15728759765625, -5.90966796875, -5.66204833984375, -5.4144287109375, -5.16680908203125, -4.919189453125, -4.67156982421875, -4.4239501953125, -4.17633056640625, -3.9287109375, -3.68109130859375, -3.4334716796875, -3.18585205078125, -2.938232421875, -2.69061279296875, -2.4429931640625, -2.19537353515625, -1.94775390625, -1.70013427734375, -1.4525146484375, -1.20489501953125, -0.957275390625, -0.70965576171875, -0.4620361328125, -0.21441650390625, 0.033203125, 0.28082275390625, 0.5284423828125, 0.77606201171875, 1.023681640625, 1.27130126953125, 1.5189208984375, 1.76654052734375, 2.01416015625, 2.26177978515625, 2.5093994140625, 2.75701904296875, 3.004638671875, 3.25225830078125, 3.4998779296875, 3.74749755859375, 3.9951171875, 4.24273681640625, 4.4903564453125, 4.73797607421875, 4.985595703125, 5.23321533203125, 5.4808349609375, 5.72845458984375, 5.97607421875, 6.22369384765625, 6.4713134765625, 6.71893310546875, 6.966552734375, 7.21417236328125, 7.4617919921875, 7.70941162109375, 7.95703125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 7.0, 10.0, 21.0, 46.0, 63.0, 162.0, 219.0, 200.0, 146.0, 50.0, 33.0, 20.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.51634979248047, -47.32965850830078, -46.14296340942383, -44.95627212524414, -43.76957702636719, -42.5828857421875, -41.39619445800781, -40.209503173828125, -39.02280807495117, -37.836116790771484, -36.64942169189453, -35.462730407714844, -34.276039123535156, -33.0893440246582, -31.902652740478516, -30.715959548950195, -29.529266357421875, -28.342573165893555, -27.155879974365234, -25.969188690185547, -24.782495498657227, -23.595802307128906, -22.40911102294922, -21.2224178314209, -20.035724639892578, -18.849031448364258, -17.662338256835938, -16.47564697265625, -15.28895378112793, -14.10226058959961, -12.915568351745605, -11.728876113891602, -10.542179107666016, -9.355485916137695, -8.168793678283691, -6.982100963592529, -5.795408248901367, -4.608715534210205, -3.422022819519043, -2.235330581665039, -1.0486373901367188, 0.13805532455444336, 1.3247480392456055, 2.5114407539367676, 3.6981334686279297, 4.884826183319092, 6.071518898010254, 7.258211135864258, 8.444904327392578, 9.631597518920898, 10.818289756774902, 12.004981994628906, 13.191675186157227, 14.378368377685547, 15.56506061553955, 16.751752853393555, 17.938446044921875, 19.125139236450195, 20.311832427978516, 21.498523712158203, 22.685216903686523, 23.871910095214844, 25.05860137939453, 26.24529457092285, 27.431987762451172]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 11.0, 13.0, 12.0, 17.0, 21.0, 31.0, 26.0, 25.0, 28.0, 42.0, 39.0, 28.0, 37.0, 42.0, 47.0, 48.0, 38.0, 45.0, 61.0, 39.0, 38.0, 38.0, 32.0, 29.0, 31.0, 20.0, 20.0, 17.0, 16.0, 16.0, 15.0, 3.0, 8.0, 10.0, 5.0, 4.0, 1.0, 13.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.840534210205078, -12.437233924865723, -12.033934593200684, -11.630634307861328, -11.227334976196289, -10.824034690856934, -10.420734405517578, -10.017435073852539, -9.6141357421875, -9.210835456848145, -8.807536125183105, -8.40423583984375, -8.000936508178711, -7.5976362228393555, -7.194336414337158, -6.791036605834961, -6.3877363204956055, -5.984436511993408, -5.581136703491211, -5.1778364181518555, -4.774537086486816, -4.371236801147461, -3.9679369926452637, -3.5646371841430664, -3.161337375640869, -2.758037567138672, -2.3547377586364746, -1.9514377117156982, -1.548137903213501, -1.1448380947113037, -0.7415380477905273, -0.3382382392883301, 0.06506156921386719, 0.46836143732070923, 0.8716613054275513, 1.274961233139038, 1.6782610416412354, 2.0815608501434326, 2.484860897064209, 2.8881607055664062, 3.2914605140686035, 3.694760322570801, 4.098060131072998, 4.501359939575195, 4.904660224914551, 5.30795955657959, 5.711259841918945, 6.114559650421143, 6.51785945892334, 6.921159267425537, 7.324459075927734, 7.72775936126709, 8.131058692932129, 8.534358978271484, 8.937658309936523, 9.340958595275879, 9.744258880615234, 10.14755916595459, 10.550858497619629, 10.954158782958984, 11.357458114624023, 11.760758399963379, 12.164058685302734, 12.567358016967773, 12.970657348632812]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 11.0, 14.0, 16.0, 14.0, 14.0, 23.0, 15.0, 22.0, 17.0, 28.0, 43.0, 36.0, 36.0, 25.0, 33.0, 32.0, 37.0, 41.0, 60.0, 36.0, 40.0, 37.0, 49.0, 27.0, 36.0, 37.0, 30.0, 23.0, 31.0, 19.0, 18.0, 19.0, 11.0, 17.0, 18.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.77734375, -1.72821044921875, -1.6790771484375, -1.62994384765625, -1.580810546875, -1.53167724609375, -1.4825439453125, -1.43341064453125, -1.38427734375, -1.33514404296875, -1.2860107421875, -1.23687744140625, -1.187744140625, -1.13861083984375, -1.0894775390625, -1.04034423828125, -0.9912109375, -0.94207763671875, -0.8929443359375, -0.84381103515625, -0.794677734375, -0.74554443359375, -0.6964111328125, -0.64727783203125, -0.59814453125, -0.54901123046875, -0.4998779296875, -0.45074462890625, -0.401611328125, -0.35247802734375, -0.3033447265625, -0.25421142578125, -0.205078125, -0.15594482421875, -0.1068115234375, -0.05767822265625, -0.008544921875, 0.04058837890625, 0.0897216796875, 0.13885498046875, 0.18798828125, 0.23712158203125, 0.2862548828125, 0.33538818359375, 0.384521484375, 0.43365478515625, 0.4827880859375, 0.53192138671875, 0.5810546875, 0.63018798828125, 0.6793212890625, 0.72845458984375, 0.777587890625, 0.82672119140625, 0.8758544921875, 0.92498779296875, 0.97412109375, 1.02325439453125, 1.0723876953125, 1.12152099609375, 1.170654296875, 1.21978759765625, 1.2689208984375, 1.31805419921875, 1.3671875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 17.0, 21.0, 47.0, 76.0, 95.0, 98.0, 182.0, 227.0, 362.0, 544.0, 893.0, 1273.0, 1813.0, 2911.0, 4335.0, 6523.0, 10436.0, 16339.0, 26465.0, 44677.0, 79163.0, 149037.0, 238822.0, 200795.0, 110377.0, 60038.0, 34449.0, 20809.0, 13258.0, 8488.0, 5411.0, 3473.0, 2340.0, 1601.0, 1050.0, 656.0, 427.0, 301.0, 226.0, 121.0, 103.0, 85.0, 52.0, 38.0, 26.0, 22.0, 12.0, 10.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.43359375, -1.386993408203125, -1.34039306640625, -1.293792724609375, -1.2471923828125, -1.200592041015625, -1.15399169921875, -1.107391357421875, -1.060791015625, -1.014190673828125, -0.96759033203125, -0.920989990234375, -0.8743896484375, -0.827789306640625, -0.78118896484375, -0.734588623046875, -0.68798828125, -0.641387939453125, -0.59478759765625, -0.548187255859375, -0.5015869140625, -0.454986572265625, -0.40838623046875, -0.361785888671875, -0.315185546875, -0.268585205078125, -0.22198486328125, -0.175384521484375, -0.1287841796875, -0.082183837890625, -0.03558349609375, 0.011016845703125, 0.0576171875, 0.104217529296875, 0.15081787109375, 0.197418212890625, 0.2440185546875, 0.290618896484375, 0.33721923828125, 0.383819580078125, 0.430419921875, 0.477020263671875, 0.52362060546875, 0.570220947265625, 0.6168212890625, 0.663421630859375, 0.71002197265625, 0.756622314453125, 0.80322265625, 0.849822998046875, 0.89642333984375, 0.943023681640625, 0.9896240234375, 1.036224365234375, 1.08282470703125, 1.129425048828125, 1.176025390625, 1.222625732421875, 1.26922607421875, 1.315826416015625, 1.3624267578125, 1.409027099609375, 1.45562744140625, 1.502227783203125, 1.548828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 7.0, 5.0, 13.0, 15.0, 9.0, 18.0, 17.0, 19.0, 24.0, 32.0, 40.0, 41.0, 34.0, 44.0, 33.0, 41.0, 53.0, 41.0, 1071.0, 33.0, 40.0, 53.0, 37.0, 37.0, 40.0, 39.0, 31.0, 24.0, 20.0, 23.0, 16.0, 13.0, 11.0, 7.0, 4.0, 7.0, 9.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.60546875, -1.5599517822265625, -1.514434814453125, -1.4689178466796875, -1.42340087890625, -1.3778839111328125, -1.332366943359375, -1.2868499755859375, -1.2413330078125, -1.1958160400390625, -1.150299072265625, -1.1047821044921875, -1.05926513671875, -1.0137481689453125, -0.968231201171875, -0.9227142333984375, -0.877197265625, -0.8316802978515625, -0.786163330078125, -0.7406463623046875, -0.69512939453125, -0.6496124267578125, -0.604095458984375, -0.5585784912109375, -0.5130615234375, -0.4675445556640625, -0.422027587890625, -0.3765106201171875, -0.33099365234375, -0.2854766845703125, -0.239959716796875, -0.1944427490234375, -0.14892578125, -0.1034088134765625, -0.057891845703125, -0.0123748779296875, 0.03314208984375, 0.0786590576171875, 0.124176025390625, 0.1696929931640625, 0.2152099609375, 0.2607269287109375, 0.306243896484375, 0.3517608642578125, 0.39727783203125, 0.4427947998046875, 0.488311767578125, 0.5338287353515625, 0.579345703125, 0.6248626708984375, 0.670379638671875, 0.7158966064453125, 0.76141357421875, 0.8069305419921875, 0.852447509765625, 0.8979644775390625, 0.9434814453125, 0.9889984130859375, 1.034515380859375, 1.0800323486328125, 1.12554931640625, 1.1710662841796875, 1.216583251953125, 1.2621002197265625, 1.3076171875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 10.0, 9.0, 10.0, 10.0, 17.0, 25.0, 28.0, 38.0, 61.0, 90.0, 108.0, 165.0, 214.0, 292.0, 469.0, 739.0, 1018.0, 1644.0, 2675.0, 4676.0, 8148.0, 16383.0, 40716.0, 757415.0, 1183137.0, 41968.0, 16377.0, 8422.0, 4618.0, 2686.0, 1679.0, 1117.0, 666.0, 469.0, 317.0, 203.0, 141.0, 112.0, 68.0, 48.0, 45.0, 40.0, 18.0, 12.0, 15.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0], "bins": [-2.505859375, -2.4381561279296875, -2.370452880859375, -2.3027496337890625, -2.23504638671875, -2.1673431396484375, -2.099639892578125, -2.0319366455078125, -1.9642333984375, -1.8965301513671875, -1.828826904296875, -1.7611236572265625, -1.69342041015625, -1.6257171630859375, -1.558013916015625, -1.4903106689453125, -1.422607421875, -1.3549041748046875, -1.287200927734375, -1.2194976806640625, -1.15179443359375, -1.0840911865234375, -1.016387939453125, -0.9486846923828125, -0.8809814453125, -0.8132781982421875, -0.745574951171875, -0.6778717041015625, -0.61016845703125, -0.5424652099609375, -0.474761962890625, -0.4070587158203125, -0.33935546875, -0.2716522216796875, -0.203948974609375, -0.1362457275390625, -0.06854248046875, -0.0008392333984375, 0.066864013671875, 0.1345672607421875, 0.2022705078125, 0.2699737548828125, 0.337677001953125, 0.4053802490234375, 0.47308349609375, 0.5407867431640625, 0.608489990234375, 0.6761932373046875, 0.743896484375, 0.8115997314453125, 0.879302978515625, 0.9470062255859375, 1.01470947265625, 1.0824127197265625, 1.150115966796875, 1.2178192138671875, 1.2855224609375, 1.3532257080078125, 1.420928955078125, 1.4886322021484375, 1.55633544921875, 1.6240386962890625, 1.691741943359375, 1.7594451904296875, 1.8271484375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 10.0, 9.0, 12.0, 19.0, 21.0, 34.0, 54.0, 74.0, 92.0, 97.0, 116.0, 103.0, 88.0, 69.0, 64.0, 35.0, 36.0, 16.0, 16.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0816650390625, -0.078704833984375, -0.07574462890625, -0.072784423828125, -0.06982421875, -0.066864013671875, -0.06390380859375, -0.060943603515625, -0.0579833984375, -0.055023193359375, -0.05206298828125, -0.049102783203125, -0.046142578125, -0.043182373046875, -0.04022216796875, -0.037261962890625, -0.0343017578125, -0.031341552734375, -0.02838134765625, -0.025421142578125, -0.0224609375, -0.019500732421875, -0.01654052734375, -0.013580322265625, -0.0106201171875, -0.007659912109375, -0.00469970703125, -0.001739501953125, 0.001220703125, 0.004180908203125, 0.00714111328125, 0.010101318359375, 0.0130615234375, 0.016021728515625, 0.01898193359375, 0.021942138671875, 0.02490234375, 0.027862548828125, 0.03082275390625, 0.033782958984375, 0.0367431640625, 0.039703369140625, 0.04266357421875, 0.045623779296875, 0.048583984375, 0.051544189453125, 0.05450439453125, 0.057464599609375, 0.0604248046875, 0.063385009765625, 0.06634521484375, 0.069305419921875, 0.072265625, 0.075225830078125, 0.07818603515625, 0.081146240234375, 0.0841064453125, 0.087066650390625, 0.09002685546875, 0.092987060546875, 0.095947265625, 0.098907470703125, 0.10186767578125, 0.104827880859375, 0.1077880859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 16.0, 23.0, 29.0, 44.0, 77.0, 124.0, 205.0, 461.0, 1612.0, 14702.0, 782000.0, 240740.0, 6602.0, 1084.0, 333.0, 187.0, 99.0, 55.0, 41.0, 29.0, 21.0, 15.0, 4.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3369140625, -1.29962158203125, -1.2623291015625, -1.22503662109375, -1.187744140625, -1.15045166015625, -1.1131591796875, -1.07586669921875, -1.03857421875, -1.00128173828125, -0.9639892578125, -0.92669677734375, -0.889404296875, -0.85211181640625, -0.8148193359375, -0.77752685546875, -0.740234375, -0.70294189453125, -0.6656494140625, -0.62835693359375, -0.591064453125, -0.55377197265625, -0.5164794921875, -0.47918701171875, -0.44189453125, -0.40460205078125, -0.3673095703125, -0.33001708984375, -0.292724609375, -0.25543212890625, -0.2181396484375, -0.18084716796875, -0.1435546875, -0.10626220703125, -0.0689697265625, -0.03167724609375, 0.005615234375, 0.04290771484375, 0.0802001953125, 0.11749267578125, 0.15478515625, 0.19207763671875, 0.2293701171875, 0.26666259765625, 0.303955078125, 0.34124755859375, 0.3785400390625, 0.41583251953125, 0.453125, 0.49041748046875, 0.5277099609375, 0.56500244140625, 0.602294921875, 0.63958740234375, 0.6768798828125, 0.71417236328125, 0.75146484375, 0.78875732421875, 0.8260498046875, 0.86334228515625, 0.900634765625, 0.93792724609375, 0.9752197265625, 1.01251220703125, 1.0498046875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 18.0, 64.0, 161.0, 285.0, 239.0, 132.0, 50.0, 32.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405505895614624, -0.3891640901565552, -0.3728223145008087, -0.35648050904273987, -0.3401387333869934, -0.32379692792892456, -0.3074551224708557, -0.29111331701278687, -0.2747715413570404, -0.25842973589897156, -0.2420879602432251, -0.22574615478515625, -0.2094043642282486, -0.19306257367134094, -0.1767207682132721, -0.16037897765636444, -0.1440371870994568, -0.12769539654254913, -0.11135359853506088, -0.09501180052757263, -0.07867000997066498, -0.062328219413757324, -0.045986421406269073, -0.029644623398780823, -0.013302832841873169, 0.0030389614403247833, 0.019380755722522736, 0.03572255000472069, 0.05206434428691864, 0.0684061348438263, 0.08474793285131454, 0.1010897308588028, 0.11743158102035522, 0.13377337157726288, 0.15011516213417053, 0.16645696759223938, 0.18279875814914703, 0.1991405487060547, 0.21548235416412354, 0.2318241447210312, 0.24816593527793884, 0.2645077407360077, 0.28084951639175415, 0.297191321849823, 0.31353312730789185, 0.3298749029636383, 0.34621670842170715, 0.3625584840774536, 0.37890028953552246, 0.3952420949935913, 0.41158387064933777, 0.4279256761074066, 0.4442674517631531, 0.4606092572212219, 0.47695106267929077, 0.4932928681373596, 0.5096346139907837, 0.5259764194488525, 0.5423182249069214, 0.5586599707603455, 0.5750017762184143, 0.5913435816764832, 0.607685387134552, 0.6240271925926208, 0.6403689980506897]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 6.0, 8.0, 9.0, 12.0, 20.0, 17.0, 19.0, 26.0, 11.0, 29.0, 39.0, 34.0, 33.0, 39.0, 39.0, 40.0, 39.0, 45.0, 38.0, 41.0, 49.0, 36.0, 38.0, 35.0, 46.0, 31.0, 30.0, 32.0, 19.0, 17.0, 22.0, 10.0, 19.0, 11.0, 9.0, 15.0, 9.0, 2.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11792051792144775, -0.11418847739696503, -0.1104564368724823, -0.10672439634799957, -0.10299235582351685, -0.09926031529903412, -0.09552828222513199, -0.09179624170064926, -0.08806420117616653, -0.08433216065168381, -0.08060012012720108, -0.07686807960271835, -0.07313604652881622, -0.0694040060043335, -0.06567196547985077, -0.06193992495536804, -0.058207884430885315, -0.05447584390640259, -0.05074380338191986, -0.04701176658272743, -0.043279726058244705, -0.03954768553376198, -0.03581564873456955, -0.03208360821008682, -0.028351567685604095, -0.02461952716112137, -0.02088748849928379, -0.017155449837446213, -0.013423409312963486, -0.009691368788480759, -0.005959330126643181, -0.002227291464805603, 0.001504749059677124, 0.0052367886528372765, 0.008968828245997429, 0.012700867839157581, 0.016432907432317734, 0.02016494795680046, 0.02389698661863804, 0.027629025280475616, 0.031361065804958344, 0.03509310632944107, 0.0388251468539238, 0.042557183653116226, 0.04628922417759895, 0.05002126470208168, 0.05375330150127411, 0.057485342025756836, 0.06121738255023956, 0.06494942307472229, 0.06868146359920502, 0.07241350412368774, 0.07614554464817047, 0.0798775851726532, 0.08360961824655533, 0.08734165877103806, 0.09107369929552078, 0.09480573982000351, 0.09853778034448624, 0.10226982086896896, 0.1060018539428711, 0.10973389446735382, 0.11346593499183655, 0.11719797551631927, 0.120930016040802]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 17.0, 13.0, 16.0, 20.0, 15.0, 22.0, 20.0, 27.0, 45.0, 31.0, 38.0, 27.0, 33.0, 35.0, 34.0, 43.0, 56.0, 36.0, 38.0, 39.0, 49.0, 29.0, 36.0, 34.0, 32.0, 22.0, 32.0, 19.0, 23.0, 15.0, 9.0, 17.0, 17.0, 9.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.77734375, -1.7281646728515625, -1.678985595703125, -1.6298065185546875, -1.58062744140625, -1.5314483642578125, -1.482269287109375, -1.4330902099609375, -1.3839111328125, -1.3347320556640625, -1.285552978515625, -1.2363739013671875, -1.18719482421875, -1.1380157470703125, -1.088836669921875, -1.0396575927734375, -0.990478515625, -0.9412994384765625, -0.892120361328125, -0.8429412841796875, -0.79376220703125, -0.7445831298828125, -0.695404052734375, -0.6462249755859375, -0.5970458984375, -0.5478668212890625, -0.498687744140625, -0.4495086669921875, -0.40032958984375, -0.3511505126953125, -0.301971435546875, -0.2527923583984375, -0.20361328125, -0.1544342041015625, -0.105255126953125, -0.0560760498046875, -0.00689697265625, 0.0422821044921875, 0.091461181640625, 0.1406402587890625, 0.1898193359375, 0.2389984130859375, 0.288177490234375, 0.3373565673828125, 0.38653564453125, 0.4357147216796875, 0.484893798828125, 0.5340728759765625, 0.583251953125, 0.6324310302734375, 0.681610107421875, 0.7307891845703125, 0.77996826171875, 0.8291473388671875, 0.878326416015625, 0.9275054931640625, 0.9766845703125, 1.0258636474609375, 1.075042724609375, 1.1242218017578125, 1.17340087890625, 1.2225799560546875, 1.271759033203125, 1.3209381103515625, 1.3701171875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 15.0, 20.0, 26.0, 36.0, 42.0, 64.0, 80.0, 126.0, 166.0, 227.0, 357.0, 546.0, 797.0, 1249.0, 1919.0, 3117.0, 5303.0, 9887.0, 20934.0, 61465.0, 298427.0, 488994.0, 97049.0, 28748.0, 12281.0, 6431.0, 3636.0, 2224.0, 1484.0, 930.0, 589.0, 435.0, 268.0, 182.0, 153.0, 100.0, 61.0, 45.0, 34.0, 26.0, 25.0, 17.0, 12.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.328369140625, -2.24853515625, -2.168701171875, -2.0888671875, -2.009033203125, -1.92919921875, -1.849365234375, -1.76953125, -1.689697265625, -1.60986328125, -1.530029296875, -1.4501953125, -1.370361328125, -1.29052734375, -1.210693359375, -1.130859375, -1.051025390625, -0.97119140625, -0.891357421875, -0.8115234375, -0.731689453125, -0.65185546875, -0.572021484375, -0.4921875, -0.412353515625, -0.33251953125, -0.252685546875, -0.1728515625, -0.093017578125, -0.01318359375, 0.066650390625, 0.146484375, 0.226318359375, 0.30615234375, 0.385986328125, 0.4658203125, 0.545654296875, 0.62548828125, 0.705322265625, 0.78515625, 0.864990234375, 0.94482421875, 1.024658203125, 1.1044921875, 1.184326171875, 1.26416015625, 1.343994140625, 1.423828125, 1.503662109375, 1.58349609375, 1.663330078125, 1.7431640625, 1.822998046875, 1.90283203125, 1.982666015625, 2.0625, 2.142333984375, 2.22216796875, 2.302001953125, 2.3818359375, 2.461669921875, 2.54150390625, 2.621337890625, 2.701171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 1.0, 12.0, 14.0, 11.0, 9.0, 23.0, 13.0, 17.0, 25.0, 31.0, 33.0, 40.0, 38.0, 53.0, 63.0, 74.0, 90.0, 166.0, 1381.0, 324.0, 131.0, 81.0, 55.0, 44.0, 45.0, 37.0, 33.0, 35.0, 26.0, 21.0, 26.0, 23.0, 13.0, 17.0, 6.0, 10.0, 3.0, 5.0, 6.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.039794921875, -4.87646484375, -4.713134765625, -4.5498046875, -4.386474609375, -4.22314453125, -4.059814453125, -3.896484375, -3.733154296875, -3.56982421875, -3.406494140625, -3.2431640625, -3.079833984375, -2.91650390625, -2.753173828125, -2.58984375, -2.426513671875, -2.26318359375, -2.099853515625, -1.9365234375, -1.773193359375, -1.60986328125, -1.446533203125, -1.283203125, -1.119873046875, -0.95654296875, -0.793212890625, -0.6298828125, -0.466552734375, -0.30322265625, -0.139892578125, 0.0234375, 0.186767578125, 0.35009765625, 0.513427734375, 0.6767578125, 0.840087890625, 1.00341796875, 1.166748046875, 1.330078125, 1.493408203125, 1.65673828125, 1.820068359375, 1.9833984375, 2.146728515625, 2.31005859375, 2.473388671875, 2.63671875, 2.800048828125, 2.96337890625, 3.126708984375, 3.2900390625, 3.453369140625, 3.61669921875, 3.780029296875, 3.943359375, 4.106689453125, 4.27001953125, 4.433349609375, 4.5966796875, 4.760009765625, 4.92333984375, 5.086669921875, 5.25]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 6.0, 13.0, 20.0, 34.0, 43.0, 76.0, 136.0, 207.0, 407.0, 993.0, 3206.0, 26608.0, 2840743.0, 260301.0, 9606.0, 1868.0, 663.0, 319.0, 170.0, 94.0, 61.0, 48.0, 24.0, 13.0, 10.0, 9.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.3521728515625, -14.884033203125, -14.4158935546875, -13.94775390625, -13.4796142578125, -13.011474609375, -12.5433349609375, -12.0751953125, -11.6070556640625, -11.138916015625, -10.6707763671875, -10.20263671875, -9.7344970703125, -9.266357421875, -8.7982177734375, -8.330078125, -7.8619384765625, -7.393798828125, -6.9256591796875, -6.45751953125, -5.9893798828125, -5.521240234375, -5.0531005859375, -4.5849609375, -4.1168212890625, -3.648681640625, -3.1805419921875, -2.71240234375, -2.2442626953125, -1.776123046875, -1.3079833984375, -0.83984375, -0.3717041015625, 0.096435546875, 0.5645751953125, 1.03271484375, 1.5008544921875, 1.968994140625, 2.4371337890625, 2.9052734375, 3.3734130859375, 3.841552734375, 4.3096923828125, 4.77783203125, 5.2459716796875, 5.714111328125, 6.1822509765625, 6.650390625, 7.1185302734375, 7.586669921875, 8.0548095703125, 8.52294921875, 8.9910888671875, 9.459228515625, 9.9273681640625, 10.3955078125, 10.8636474609375, 11.331787109375, 11.7999267578125, 12.26806640625, 12.7362060546875, 13.204345703125, 13.6724853515625, 14.140625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 41.0, 779.0, 186.0, 9.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.293222427368164, -15.20516586303711, -11.117109298706055, -7.029052734375, -2.9409961700439453, 1.1470603942871094, 5.235116958618164, 9.323173522949219, 13.411230087280273, 17.499286651611328, 21.587343215942383, 25.675399780273438, 29.763456344604492, 33.85151290893555, 37.93956756591797, 42.027626037597656, 46.115684509277344, 50.20374298095703, 54.29179763793945, 58.379852294921875, 62.46791076660156, 66.55596923828125, 70.64402770996094, 74.7320785522461, 78.82013702392578, 82.90819549560547, 86.99624633789062, 91.08430480957031, 95.17236328125, 99.26042175292969, 103.34848022460938, 107.43653106689453, 111.52459716796875, 115.61265563964844, 119.70071411132812, 123.78876495361328, 127.87682342529297, 131.96487426757812, 136.0529327392578, 140.1409912109375, 144.2290496826172, 148.31710815429688, 152.40516662597656, 156.49322509765625, 160.58126831054688, 164.66932678222656, 168.75738525390625, 172.84544372558594, 176.93350219726562, 181.0215606689453, 185.109619140625, 189.1976776123047, 193.28573608398438, 197.373779296875, 201.4618377685547, 205.54989624023438, 209.63795471191406, 213.72601318359375, 217.81407165527344, 221.90213012695312, 225.99017333984375, 230.07823181152344, 234.16629028320312, 238.2543487548828, 242.3424072265625]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 10.0, 16.0, 14.0, 15.0, 20.0, 19.0, 24.0, 27.0, 22.0, 37.0, 30.0, 34.0, 44.0, 42.0, 36.0, 41.0, 47.0, 43.0, 44.0, 36.0, 40.0, 34.0, 41.0, 46.0, 32.0, 24.0, 15.0, 27.0, 22.0, 16.0, 24.0, 14.0, 10.0, 9.0, 5.0, 8.0, 11.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.917949676513672, -13.493365287780762, -13.068781852722168, -12.644197463989258, -12.219614028930664, -11.795029640197754, -11.370445251464844, -10.94586181640625, -10.52127742767334, -10.09669303894043, -9.672109603881836, -9.247525215148926, -8.822940826416016, -8.398357391357422, -7.973773002624512, -7.54918909072876, -7.124605178833008, -6.700021266937256, -6.275437355041504, -5.850852966308594, -5.426269054412842, -5.00168514251709, -4.57710075378418, -4.152516841888428, -3.727932929992676, -3.303349018096924, -2.8787648677825928, -2.4541807174682617, -2.0295968055725098, -1.6050128936767578, -1.1804287433624268, -0.7558445930480957, -0.33126068115234375, 0.09332334995269775, 0.5179073810577393, 0.9424914121627808, 1.3670754432678223, 1.7916593551635742, 2.2162435054779053, 2.6408276557922363, 3.0654115676879883, 3.4899954795837402, 3.9145796298980713, 4.339163780212402, 4.763747692108154, 5.188331604003906, 5.612915992736816, 6.037499904632568, 6.46208381652832, 6.886667728424072, 7.311251640319824, 7.735836029052734, 8.160419464111328, 8.585003852844238, 9.009588241577148, 9.434171676635742, 9.858756065368652, 10.283340454101562, 10.707923889160156, 11.132508277893066, 11.557092666625977, 11.98167610168457, 12.40626049041748, 12.83084487915039, 13.255428314208984]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 6.0, 13.0, 16.0, 15.0, 6.0, 12.0, 23.0, 18.0, 25.0, 22.0, 27.0, 37.0, 46.0, 37.0, 34.0, 29.0, 27.0, 33.0, 47.0, 34.0, 44.0, 42.0, 36.0, 47.0, 39.0, 39.0, 32.0, 24.0, 26.0, 25.0, 24.0, 16.0, 11.0, 14.0, 13.0, 12.0, 12.0, 4.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-1.85546875, -1.80633544921875, -1.7572021484375, -1.70806884765625, -1.658935546875, -1.60980224609375, -1.5606689453125, -1.51153564453125, -1.46240234375, -1.41326904296875, -1.3641357421875, -1.31500244140625, -1.265869140625, -1.21673583984375, -1.1676025390625, -1.11846923828125, -1.0693359375, -1.02020263671875, -0.9710693359375, -0.92193603515625, -0.872802734375, -0.82366943359375, -0.7745361328125, -0.72540283203125, -0.67626953125, -0.62713623046875, -0.5780029296875, -0.52886962890625, -0.479736328125, -0.43060302734375, -0.3814697265625, -0.33233642578125, -0.283203125, -0.23406982421875, -0.1849365234375, -0.13580322265625, -0.086669921875, -0.03753662109375, 0.0115966796875, 0.06072998046875, 0.10986328125, 0.15899658203125, 0.2081298828125, 0.25726318359375, 0.306396484375, 0.35552978515625, 0.4046630859375, 0.45379638671875, 0.5029296875, 0.55206298828125, 0.6011962890625, 0.65032958984375, 0.699462890625, 0.74859619140625, 0.7977294921875, 0.84686279296875, 0.89599609375, 0.94512939453125, 0.9942626953125, 1.04339599609375, 1.092529296875, 1.14166259765625, 1.1907958984375, 1.23992919921875, 1.2890625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 11.0, 18.0, 15.0, 19.0, 29.0, 50.0, 64.0, 95.0, 119.0, 199.0, 245.0, 361.0, 575.0, 776.0, 1332.0, 2062.0, 3672.0, 6837.0, 13867.0, 35453.0, 301234.0, 3121070.0, 618109.0, 53189.0, 17163.0, 7872.0, 4014.0, 2242.0, 1290.0, 790.0, 531.0, 332.0, 196.0, 150.0, 103.0, 70.0, 39.0, 27.0, 20.0, 14.0, 11.0, 7.0, 3.0, 4.0], "bins": [-6.5546875, -6.397186279296875, -6.23968505859375, -6.082183837890625, -5.9246826171875, -5.767181396484375, -5.60968017578125, -5.452178955078125, -5.294677734375, -5.137176513671875, -4.97967529296875, -4.822174072265625, -4.6646728515625, -4.507171630859375, -4.34967041015625, -4.192169189453125, -4.03466796875, -3.877166748046875, -3.71966552734375, -3.562164306640625, -3.4046630859375, -3.247161865234375, -3.08966064453125, -2.932159423828125, -2.774658203125, -2.617156982421875, -2.45965576171875, -2.302154541015625, -2.1446533203125, -1.987152099609375, -1.82965087890625, -1.672149658203125, -1.5146484375, -1.357147216796875, -1.19964599609375, -1.042144775390625, -0.8846435546875, -0.727142333984375, -0.56964111328125, -0.412139892578125, -0.254638671875, -0.097137451171875, 0.06036376953125, 0.217864990234375, 0.3753662109375, 0.532867431640625, 0.69036865234375, 0.847869873046875, 1.00537109375, 1.162872314453125, 1.32037353515625, 1.477874755859375, 1.6353759765625, 1.792877197265625, 1.95037841796875, 2.107879638671875, 2.265380859375, 2.422882080078125, 2.58038330078125, 2.737884521484375, 2.8953857421875, 3.052886962890625, 3.21038818359375, 3.367889404296875, 3.525390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 3.0, 10.0, 13.0, 17.0, 11.0, 14.0, 26.0, 36.0, 59.0, 82.0, 146.0, 244.0, 478.0, 723.0, 816.0, 547.0, 296.0, 153.0, 97.0, 77.0, 47.0, 35.0, 23.0, 33.0, 15.0, 17.0, 10.0, 12.0, 4.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.53521728515625, -4.4024658203125, -4.26971435546875, -4.136962890625, -4.00421142578125, -3.8714599609375, -3.73870849609375, -3.60595703125, -3.47320556640625, -3.3404541015625, -3.20770263671875, -3.074951171875, -2.94219970703125, -2.8094482421875, -2.67669677734375, -2.5439453125, -2.41119384765625, -2.2784423828125, -2.14569091796875, -2.012939453125, -1.88018798828125, -1.7474365234375, -1.61468505859375, -1.48193359375, -1.34918212890625, -1.2164306640625, -1.08367919921875, -0.950927734375, -0.81817626953125, -0.6854248046875, -0.55267333984375, -0.419921875, -0.28717041015625, -0.1544189453125, -0.02166748046875, 0.111083984375, 0.24383544921875, 0.3765869140625, 0.50933837890625, 0.64208984375, 0.77484130859375, 0.9075927734375, 1.04034423828125, 1.173095703125, 1.30584716796875, 1.4385986328125, 1.57135009765625, 1.7041015625, 1.83685302734375, 1.9696044921875, 2.10235595703125, 2.235107421875, 2.36785888671875, 2.5006103515625, 2.63336181640625, 2.76611328125, 2.89886474609375, 3.0316162109375, 3.16436767578125, 3.297119140625, 3.42987060546875, 3.5626220703125, 3.69537353515625, 3.828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 7.0, 12.0, 31.0, 34.0, 70.0, 99.0, 173.0, 356.0, 661.0, 1324.0, 2911.0, 7064.0, 20078.0, 80049.0, 1517574.0, 2427715.0, 98564.0, 23271.0, 8038.0, 3252.0, 1489.0, 686.0, 361.0, 182.0, 99.0, 62.0, 46.0, 24.0, 15.0, 4.0, 12.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8482666015625, -7.587158203125, -7.3260498046875, -7.06494140625, -6.8038330078125, -6.542724609375, -6.2816162109375, -6.0205078125, -5.7593994140625, -5.498291015625, -5.2371826171875, -4.97607421875, -4.7149658203125, -4.453857421875, -4.1927490234375, -3.931640625, -3.6705322265625, -3.409423828125, -3.1483154296875, -2.88720703125, -2.6260986328125, -2.364990234375, -2.1038818359375, -1.8427734375, -1.5816650390625, -1.320556640625, -1.0594482421875, -0.79833984375, -0.5372314453125, -0.276123046875, -0.0150146484375, 0.24609375, 0.5072021484375, 0.768310546875, 1.0294189453125, 1.29052734375, 1.5516357421875, 1.812744140625, 2.0738525390625, 2.3349609375, 2.5960693359375, 2.857177734375, 3.1182861328125, 3.37939453125, 3.6405029296875, 3.901611328125, 4.1627197265625, 4.423828125, 4.6849365234375, 4.946044921875, 5.2071533203125, 5.46826171875, 5.7293701171875, 5.990478515625, 6.2515869140625, 6.5126953125, 6.7738037109375, 7.034912109375, 7.2960205078125, 7.55712890625, 7.8182373046875, 8.079345703125, 8.3404541015625, 8.6015625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 24.0, 52.0, 98.0, 192.0, 270.0, 162.0, 104.0, 47.0, 19.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.03641128540039, -53.8255500793457, -52.61469268798828, -51.403831481933594, -50.19297409057617, -48.982112884521484, -47.77125549316406, -46.560394287109375, -45.34953308105469, -44.138671875, -42.92781448364258, -41.71695327758789, -40.50609588623047, -39.29523468017578, -38.08437728881836, -36.87351608276367, -35.66265869140625, -34.45179748535156, -33.24094009399414, -32.03007888793945, -30.81922149658203, -29.608360290527344, -28.39750099182129, -27.186641693115234, -25.97578239440918, -24.764923095703125, -23.55406379699707, -22.343204498291016, -21.132343292236328, -19.921485900878906, -18.71062469482422, -17.499765396118164, -16.288904190063477, -15.078044891357422, -13.867185592651367, -12.656325340270996, -11.445466041564941, -10.234606742858887, -9.023746490478516, -7.812887191772461, -6.602027893066406, -5.391168594360352, -4.180308818817139, -2.969449281692505, -1.758589744567871, -0.5477304458618164, 0.6631293296813965, 1.8739891052246094, 3.084848403930664, 4.295707702636719, 5.506567478179932, 6.7174272537231445, 7.928286552429199, 9.139145851135254, 10.350006103515625, 11.56086540222168, 12.771724700927734, 13.982583999633789, 15.193443298339844, 16.4043025970459, 17.615161895751953, 18.82602310180664, 20.036882400512695, 21.24774169921875, 22.458600997924805]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 10.0, 12.0, 9.0, 12.0, 21.0, 12.0, 18.0, 24.0, 36.0, 20.0, 26.0, 23.0, 21.0, 38.0, 37.0, 35.0, 46.0, 28.0, 29.0, 38.0, 45.0, 39.0, 28.0, 44.0, 44.0, 26.0, 35.0, 17.0, 31.0, 22.0, 14.0, 30.0, 19.0, 16.0, 22.0, 13.0, 8.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.21301555633545, -8.891881942749023, -8.570747375488281, -8.249613761901855, -7.9284796714782715, -7.6073455810546875, -7.2862114906311035, -6.9650774002075195, -6.643943786621094, -6.32280969619751, -6.001675605773926, -5.6805419921875, -5.359407901763916, -5.038273811340332, -4.717139720916748, -4.396005630493164, -4.07487154006958, -3.753737449645996, -3.432603597640991, -3.1114695072174072, -2.7903356552124023, -2.4692015647888184, -2.1480674743652344, -1.8269336223602295, -1.5057995319366455, -1.184665560722351, -0.8635315299034119, -0.5423974990844727, -0.22126352787017822, 0.09987044334411621, 0.4210045337677002, 0.7421383857727051, 1.063272476196289, 1.3844064474105835, 1.705540418624878, 2.026674509048462, 2.347808361053467, 2.668942451477051, 2.9900765419006348, 3.3112103939056396, 3.6323444843292236, 3.9534785747528076, 4.2746124267578125, 4.5957465171813965, 4.9168806076049805, 5.238014221191406, 5.559148788452148, 5.880282402038574, 6.201416492462158, 6.522550582885742, 6.843684673309326, 7.16481876373291, 7.485952377319336, 7.80708646774292, 8.128220558166504, 8.44935417175293, 8.770488739013672, 9.091622352600098, 9.41275691986084, 9.733890533447266, 10.055025100708008, 10.376158714294434, 10.69729232788086, 11.018426895141602, 11.339560508728027]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 4.0, 15.0, 19.0, 8.0, 28.0, 18.0, 26.0, 31.0, 30.0, 30.0, 35.0, 43.0, 38.0, 44.0, 39.0, 21.0, 45.0, 37.0, 43.0, 39.0, 45.0, 24.0, 41.0, 20.0, 39.0, 39.0, 29.0, 32.0, 29.0, 16.0, 11.0, 17.0, 9.0, 9.0, 6.0, 9.0, 2.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5888671875, -1.5391082763671875, -1.489349365234375, -1.4395904541015625, -1.38983154296875, -1.3400726318359375, -1.290313720703125, -1.2405548095703125, -1.1907958984375, -1.1410369873046875, -1.091278076171875, -1.0415191650390625, -0.99176025390625, -0.9420013427734375, -0.892242431640625, -0.8424835205078125, -0.792724609375, -0.7429656982421875, -0.693206787109375, -0.6434478759765625, -0.59368896484375, -0.5439300537109375, -0.494171142578125, -0.4444122314453125, -0.3946533203125, -0.3448944091796875, -0.295135498046875, -0.2453765869140625, -0.19561767578125, -0.1458587646484375, -0.096099853515625, -0.0463409423828125, 0.00341796875, 0.0531768798828125, 0.102935791015625, 0.1526947021484375, 0.20245361328125, 0.2522125244140625, 0.301971435546875, 0.3517303466796875, 0.4014892578125, 0.4512481689453125, 0.501007080078125, 0.5507659912109375, 0.60052490234375, 0.6502838134765625, 0.700042724609375, 0.7498016357421875, 0.799560546875, 0.8493194580078125, 0.899078369140625, 0.9488372802734375, 0.99859619140625, 1.0483551025390625, 1.098114013671875, 1.1478729248046875, 1.1976318359375, 1.2473907470703125, 1.297149658203125, 1.3469085693359375, 1.39666748046875, 1.4464263916015625, 1.496185302734375, 1.5459442138671875, 1.595703125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 10.0, 7.0, 16.0, 21.0, 24.0, 56.0, 79.0, 103.0, 175.0, 284.0, 511.0, 899.0, 1892.0, 3918.0, 8852.0, 21616.0, 56710.0, 177576.0, 523143.0, 163174.0, 53271.0, 20229.0, 8325.0, 3738.0, 1758.0, 889.0, 479.0, 278.0, 148.0, 122.0, 70.0, 49.0, 33.0, 20.0, 20.0, 16.0, 11.0, 6.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0721588134765625, -1.030059814453125, -0.9879608154296875, -0.94586181640625, -0.9037628173828125, -0.861663818359375, -0.8195648193359375, -0.7774658203125, -0.7353668212890625, -0.693267822265625, -0.6511688232421875, -0.60906982421875, -0.5669708251953125, -0.524871826171875, -0.4827728271484375, -0.440673828125, -0.3985748291015625, -0.356475830078125, -0.3143768310546875, -0.27227783203125, -0.2301788330078125, -0.188079833984375, -0.1459808349609375, -0.1038818359375, -0.0617828369140625, -0.019683837890625, 0.0224151611328125, 0.06451416015625, 0.1066131591796875, 0.148712158203125, 0.1908111572265625, 0.23291015625, 0.2750091552734375, 0.317108154296875, 0.3592071533203125, 0.40130615234375, 0.4434051513671875, 0.485504150390625, 0.5276031494140625, 0.5697021484375, 0.6118011474609375, 0.653900146484375, 0.6959991455078125, 0.73809814453125, 0.7801971435546875, 0.822296142578125, 0.8643951416015625, 0.906494140625, 0.9485931396484375, 0.990692138671875, 1.0327911376953125, 1.07489013671875, 1.1169891357421875, 1.159088134765625, 1.2011871337890625, 1.2432861328125, 1.2853851318359375, 1.327484130859375, 1.3695831298828125, 1.41168212890625, 1.4537811279296875, 1.495880126953125, 1.5379791259765625, 1.580078125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 8.0, 13.0, 21.0, 12.0, 15.0, 25.0, 23.0, 19.0, 27.0, 26.0, 35.0, 44.0, 20.0, 28.0, 39.0, 44.0, 43.0, 41.0, 1061.0, 44.0, 40.0, 32.0, 40.0, 39.0, 39.0, 27.0, 29.0, 17.0, 23.0, 22.0, 19.0, 12.0, 15.0, 10.0, 16.0, 11.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.2257232666015625, -1.187774658203125, -1.1498260498046875, -1.11187744140625, -1.0739288330078125, -1.035980224609375, -0.9980316162109375, -0.9600830078125, -0.9221343994140625, -0.884185791015625, -0.8462371826171875, -0.80828857421875, -0.7703399658203125, -0.732391357421875, -0.6944427490234375, -0.656494140625, -0.6185455322265625, -0.580596923828125, -0.5426483154296875, -0.50469970703125, -0.4667510986328125, -0.428802490234375, -0.3908538818359375, -0.3529052734375, -0.3149566650390625, -0.277008056640625, -0.2390594482421875, -0.20111083984375, -0.1631622314453125, -0.125213623046875, -0.0872650146484375, -0.04931640625, -0.0113677978515625, 0.026580810546875, 0.0645294189453125, 0.10247802734375, 0.1404266357421875, 0.178375244140625, 0.2163238525390625, 0.2542724609375, 0.2922210693359375, 0.330169677734375, 0.3681182861328125, 0.40606689453125, 0.4440155029296875, 0.481964111328125, 0.5199127197265625, 0.557861328125, 0.5958099365234375, 0.633758544921875, 0.6717071533203125, 0.70965576171875, 0.7476043701171875, 0.785552978515625, 0.8235015869140625, 0.8614501953125, 0.8993988037109375, 0.937347412109375, 0.9752960205078125, 1.01324462890625, 1.0511932373046875, 1.089141845703125, 1.1270904541015625, 1.1650390625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 17.0, 12.0, 24.0, 26.0, 40.0, 68.0, 73.0, 123.0, 151.0, 213.0, 340.0, 544.0, 803.0, 1236.0, 2170.0, 3776.0, 7004.0, 14834.0, 52843.0, 1858270.0, 114249.0, 20373.0, 8665.0, 4417.0, 2632.0, 1489.0, 927.0, 577.0, 355.0, 271.0, 174.0, 104.0, 92.0, 62.0, 49.0, 39.0, 20.0, 20.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.54296875, -1.494232177734375, -1.44549560546875, -1.396759033203125, -1.3480224609375, -1.299285888671875, -1.25054931640625, -1.201812744140625, -1.153076171875, -1.104339599609375, -1.05560302734375, -1.006866455078125, -0.9581298828125, -0.909393310546875, -0.86065673828125, -0.811920166015625, -0.76318359375, -0.714447021484375, -0.66571044921875, -0.616973876953125, -0.5682373046875, -0.519500732421875, -0.47076416015625, -0.422027587890625, -0.373291015625, -0.324554443359375, -0.27581787109375, -0.227081298828125, -0.1783447265625, -0.129608154296875, -0.08087158203125, -0.032135009765625, 0.0166015625, 0.065338134765625, 0.11407470703125, 0.162811279296875, 0.2115478515625, 0.260284423828125, 0.30902099609375, 0.357757568359375, 0.406494140625, 0.455230712890625, 0.50396728515625, 0.552703857421875, 0.6014404296875, 0.650177001953125, 0.69891357421875, 0.747650146484375, 0.79638671875, 0.845123291015625, 0.89385986328125, 0.942596435546875, 0.9913330078125, 1.040069580078125, 1.08880615234375, 1.137542724609375, 1.186279296875, 1.235015869140625, 1.28375244140625, 1.332489013671875, 1.3812255859375, 1.429962158203125, 1.47869873046875, 1.527435302734375, 1.576171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 14.0, 12.0, 16.0, 15.0, 28.0, 34.0, 63.0, 80.0, 83.0, 110.0, 101.0, 111.0, 85.0, 52.0, 50.0, 33.0, 29.0, 13.0, 20.0, 5.0, 10.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057464599609375, -0.05543851852416992, -0.053412437438964844, -0.051386356353759766, -0.04936027526855469, -0.04733419418334961, -0.04530811309814453, -0.04328203201293945, -0.041255950927734375, -0.0392298698425293, -0.03720378875732422, -0.03517770767211914, -0.03315162658691406, -0.031125545501708984, -0.029099464416503906, -0.027073383331298828, -0.02504730224609375, -0.023021221160888672, -0.020995140075683594, -0.018969058990478516, -0.016942977905273438, -0.01491689682006836, -0.012890815734863281, -0.010864734649658203, -0.008838653564453125, -0.006812572479248047, -0.004786491394042969, -0.0027604103088378906, -0.0007343292236328125, 0.0012917518615722656, 0.0033178329467773438, 0.005343914031982422, 0.0073699951171875, 0.009396076202392578, 0.011422157287597656, 0.013448238372802734, 0.015474319458007812, 0.01750040054321289, 0.01952648162841797, 0.021552562713623047, 0.023578643798828125, 0.025604724884033203, 0.02763080596923828, 0.02965688705444336, 0.03168296813964844, 0.033709049224853516, 0.035735130310058594, 0.03776121139526367, 0.03978729248046875, 0.04181337356567383, 0.043839454650878906, 0.045865535736083984, 0.04789161682128906, 0.04991769790649414, 0.05194377899169922, 0.0539698600769043, 0.055995941162109375, 0.05802202224731445, 0.06004810333251953, 0.06207418441772461, 0.06410026550292969, 0.06612634658813477, 0.06815242767333984, 0.07017850875854492, 0.07220458984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 7.0, 7.0, 12.0, 14.0, 18.0, 24.0, 34.0, 66.0, 90.0, 135.0, 227.0, 573.0, 2335.0, 26468.0, 902349.0, 109589.0, 4976.0, 828.0, 307.0, 172.0, 79.0, 74.0, 46.0, 33.0, 16.0, 12.0, 17.0, 14.0, 4.0, 5.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.85107421875, -0.8265380859375, -0.802001953125, -0.7774658203125, -0.7529296875, -0.7283935546875, -0.703857421875, -0.6793212890625, -0.65478515625, -0.6302490234375, -0.605712890625, -0.5811767578125, -0.556640625, -0.5321044921875, -0.507568359375, -0.4830322265625, -0.45849609375, -0.4339599609375, -0.409423828125, -0.3848876953125, -0.3603515625, -0.3358154296875, -0.311279296875, -0.2867431640625, -0.26220703125, -0.2376708984375, -0.213134765625, -0.1885986328125, -0.1640625, -0.1395263671875, -0.114990234375, -0.0904541015625, -0.06591796875, -0.0413818359375, -0.016845703125, 0.0076904296875, 0.0322265625, 0.0567626953125, 0.081298828125, 0.1058349609375, 0.13037109375, 0.1549072265625, 0.179443359375, 0.2039794921875, 0.228515625, 0.2530517578125, 0.277587890625, 0.3021240234375, 0.32666015625, 0.3511962890625, 0.375732421875, 0.4002685546875, 0.4248046875, 0.4493408203125, 0.473876953125, 0.4984130859375, 0.52294921875, 0.5474853515625, 0.572021484375, 0.5965576171875, 0.62109375, 0.6456298828125, 0.670166015625, 0.6947021484375, 0.71923828125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 12.0, 14.0, 36.0, 42.0, 58.0, 71.0, 119.0, 137.0, 150.0, 132.0, 76.0, 44.0, 39.0, 27.0, 17.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07822079956531525, -0.07326024770736694, -0.06829970329999924, -0.06333915144205093, -0.05837860330939293, -0.053418055176734924, -0.04845750331878662, -0.043496955186128616, -0.03853640705347061, -0.03357585892081261, -0.028615308925509453, -0.0236547589302063, -0.018694210797548294, -0.01373366266489029, -0.008773112669587135, -0.0038125626742839813, 0.0011479854583740234, 0.006108534522354603, 0.011069083586335182, 0.016029633581638336, 0.02099018171429634, 0.025950729846954346, 0.0309112798422575, 0.035871829837560654, 0.04083237797021866, 0.04579292610287666, 0.05075347423553467, 0.05571402609348297, 0.060674574226140976, 0.06563512235879898, 0.07059567421674728, 0.07555621862411499, 0.08051678538322449, 0.08547733724117279, 0.0904378816485405, 0.0953984335064888, 0.1003589779138565, 0.10531952977180481, 0.11028008162975311, 0.11524063348770142, 0.12020117789506912, 0.12516172230243683, 0.13012227416038513, 0.13508282601833344, 0.14004337787628174, 0.14500391483306885, 0.14996446669101715, 0.15492501854896545, 0.15988557040691376, 0.16484612226486206, 0.16980667412281036, 0.17476721107959747, 0.17972776293754578, 0.18468831479549408, 0.18964886665344238, 0.19460941851139069, 0.199569970369339, 0.2045305222272873, 0.2094910740852356, 0.2144516110420227, 0.219412162899971, 0.2243727147579193, 0.22933326661586761, 0.23429381847381592, 0.23925435543060303]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 11.0, 13.0, 14.0, 13.0, 20.0, 15.0, 19.0, 25.0, 19.0, 22.0, 36.0, 26.0, 26.0, 36.0, 29.0, 41.0, 39.0, 43.0, 48.0, 50.0, 47.0, 40.0, 36.0, 29.0, 39.0, 32.0, 28.0, 24.0, 21.0, 26.0, 27.0, 14.0, 17.0, 15.0, 12.0, 12.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07231849431991577, -0.07020852714776993, -0.06809855997562408, -0.06598858535289764, -0.0638786181807518, -0.06176865100860596, -0.059658680111169815, -0.05754870921373367, -0.05543874204158783, -0.053328774869441986, -0.051218803972005844, -0.0491088330745697, -0.04699886590242386, -0.044888898730278015, -0.04277892783284187, -0.04066895693540573, -0.03855898976325989, -0.036449022591114044, -0.0343390516936779, -0.03222908079624176, -0.030119113624095917, -0.028009144589304924, -0.02589917555451393, -0.02378920651972294, -0.021679237484931946, -0.019569268450140953, -0.01745929941534996, -0.015349330380558968, -0.013239361345767975, -0.011129392310976982, -0.00901942327618599, -0.006909454241394997, -0.004799485206604004, -0.002689516171813011, -0.0005795471370220184, 0.0015304218977689743, 0.003640390932559967, 0.00575035996735096, 0.007860329002141953, 0.009970298036932945, 0.012080267071723938, 0.01419023610651493, 0.016300205141305923, 0.018410174176096916, 0.02052014321088791, 0.0226301122456789, 0.024740081280469894, 0.026850050315260887, 0.02896001935005188, 0.031069988384842873, 0.033179957419633865, 0.03528992831707001, 0.03739989548921585, 0.039509862661361694, 0.041619833558797836, 0.04372980445623398, 0.04583977162837982, 0.047949738800525665, 0.05005970969796181, 0.05216968059539795, 0.05427964776754379, 0.056389614939689636, 0.05849958583712578, 0.06060955673456192, 0.06271952390670776]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 7.0, 5.0, 14.0, 20.0, 9.0, 24.0, 22.0, 26.0, 29.0, 34.0, 27.0, 36.0, 43.0, 37.0, 45.0, 40.0, 22.0, 44.0, 36.0, 43.0, 38.0, 46.0, 24.0, 42.0, 18.0, 42.0, 39.0, 28.0, 34.0, 25.0, 17.0, 12.0, 16.0, 8.0, 9.0, 7.0, 9.0, 1.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5418701171875, -1.491943359375, -1.4420166015625, -1.39208984375, -1.3421630859375, -1.292236328125, -1.2423095703125, -1.1923828125, -1.1424560546875, -1.092529296875, -1.0426025390625, -0.99267578125, -0.9427490234375, -0.892822265625, -0.8428955078125, -0.79296875, -0.7430419921875, -0.693115234375, -0.6431884765625, -0.59326171875, -0.5433349609375, -0.493408203125, -0.4434814453125, -0.3935546875, -0.3436279296875, -0.293701171875, -0.2437744140625, -0.19384765625, -0.1439208984375, -0.093994140625, -0.0440673828125, 0.005859375, 0.0557861328125, 0.105712890625, 0.1556396484375, 0.20556640625, 0.2554931640625, 0.305419921875, 0.3553466796875, 0.4052734375, 0.4552001953125, 0.505126953125, 0.5550537109375, 0.60498046875, 0.6549072265625, 0.704833984375, 0.7547607421875, 0.8046875, 0.8546142578125, 0.904541015625, 0.9544677734375, 1.00439453125, 1.0543212890625, 1.104248046875, 1.1541748046875, 1.2041015625, 1.2540283203125, 1.303955078125, 1.3538818359375, 1.40380859375, 1.4537353515625, 1.503662109375, 1.5535888671875, 1.603515625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 9.0, 20.0, 19.0, 25.0, 36.0, 60.0, 75.0, 125.0, 176.0, 241.0, 392.0, 585.0, 936.0, 1579.0, 2663.0, 4871.0, 10560.0, 31264.0, 140101.0, 579320.0, 206780.0, 42015.0, 12963.0, 5783.0, 3031.0, 1796.0, 1086.0, 666.0, 421.0, 288.0, 202.0, 133.0, 93.0, 62.0, 40.0, 40.0, 19.0, 15.0, 13.0, 7.0, 9.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.787109375, -2.6929931640625, -2.598876953125, -2.5047607421875, -2.41064453125, -2.3165283203125, -2.222412109375, -2.1282958984375, -2.0341796875, -1.9400634765625, -1.845947265625, -1.7518310546875, -1.65771484375, -1.5635986328125, -1.469482421875, -1.3753662109375, -1.28125, -1.1871337890625, -1.093017578125, -0.9989013671875, -0.90478515625, -0.8106689453125, -0.716552734375, -0.6224365234375, -0.5283203125, -0.4342041015625, -0.340087890625, -0.2459716796875, -0.15185546875, -0.0577392578125, 0.036376953125, 0.1304931640625, 0.224609375, 0.3187255859375, 0.412841796875, 0.5069580078125, 0.60107421875, 0.6951904296875, 0.789306640625, 0.8834228515625, 0.9775390625, 1.0716552734375, 1.165771484375, 1.2598876953125, 1.35400390625, 1.4481201171875, 1.542236328125, 1.6363525390625, 1.73046875, 1.8245849609375, 1.918701171875, 2.0128173828125, 2.10693359375, 2.2010498046875, 2.295166015625, 2.3892822265625, 2.4833984375, 2.5775146484375, 2.671630859375, 2.7657470703125, 2.85986328125, 2.9539794921875, 3.048095703125, 3.1422119140625, 3.236328125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 8.0, 6.0, 16.0, 7.0, 11.0, 8.0, 23.0, 24.0, 18.0, 26.0, 31.0, 37.0, 31.0, 48.0, 47.0, 57.0, 80.0, 139.0, 248.0, 1453.0, 169.0, 108.0, 87.0, 45.0, 43.0, 35.0, 37.0, 26.0, 26.0, 20.0, 21.0, 17.0, 16.0, 11.0, 15.0, 9.0, 7.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-4.47265625, -4.33428955078125, -4.1959228515625, -4.05755615234375, -3.919189453125, -3.78082275390625, -3.6424560546875, -3.50408935546875, -3.36572265625, -3.22735595703125, -3.0889892578125, -2.95062255859375, -2.812255859375, -2.67388916015625, -2.5355224609375, -2.39715576171875, -2.2587890625, -2.12042236328125, -1.9820556640625, -1.84368896484375, -1.705322265625, -1.56695556640625, -1.4285888671875, -1.29022216796875, -1.15185546875, -1.01348876953125, -0.8751220703125, -0.73675537109375, -0.598388671875, -0.46002197265625, -0.3216552734375, -0.18328857421875, -0.044921875, 0.09344482421875, 0.2318115234375, 0.37017822265625, 0.508544921875, 0.64691162109375, 0.7852783203125, 0.92364501953125, 1.06201171875, 1.20037841796875, 1.3387451171875, 1.47711181640625, 1.615478515625, 1.75384521484375, 1.8922119140625, 2.03057861328125, 2.1689453125, 2.30731201171875, 2.4456787109375, 2.58404541015625, 2.722412109375, 2.86077880859375, 2.9991455078125, 3.13751220703125, 3.27587890625, 3.41424560546875, 3.5526123046875, 3.69097900390625, 3.829345703125, 3.96771240234375, 4.1060791015625, 4.24444580078125, 4.3828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 4.0, 9.0, 16.0, 15.0, 19.0, 26.0, 31.0, 41.0, 43.0, 60.0, 75.0, 126.0, 189.0, 309.0, 587.0, 1471.0, 5483.0, 39702.0, 2106416.0, 956378.0, 27643.0, 4292.0, 1259.0, 554.0, 266.0, 180.0, 114.0, 80.0, 69.0, 48.0, 39.0, 26.0, 28.0, 19.0, 16.0, 14.0, 15.0, 9.0, 6.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-8.40625, -8.158447265625, -7.91064453125, -7.662841796875, -7.4150390625, -7.167236328125, -6.91943359375, -6.671630859375, -6.423828125, -6.176025390625, -5.92822265625, -5.680419921875, -5.4326171875, -5.184814453125, -4.93701171875, -4.689208984375, -4.44140625, -4.193603515625, -3.94580078125, -3.697998046875, -3.4501953125, -3.202392578125, -2.95458984375, -2.706787109375, -2.458984375, -2.211181640625, -1.96337890625, -1.715576171875, -1.4677734375, -1.219970703125, -0.97216796875, -0.724365234375, -0.4765625, -0.228759765625, 0.01904296875, 0.266845703125, 0.5146484375, 0.762451171875, 1.01025390625, 1.258056640625, 1.505859375, 1.753662109375, 2.00146484375, 2.249267578125, 2.4970703125, 2.744873046875, 2.99267578125, 3.240478515625, 3.48828125, 3.736083984375, 3.98388671875, 4.231689453125, 4.4794921875, 4.727294921875, 4.97509765625, 5.222900390625, 5.470703125, 5.718505859375, 5.96630859375, 6.214111328125, 6.4619140625, 6.709716796875, 6.95751953125, 7.205322265625, 7.453125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 30.0, 69.0, 245.0, 374.0, 221.0, 55.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.673301696777344, -51.70579147338867, -50.73828125, -49.77077102661133, -48.803260803222656, -47.835750579833984, -46.86824035644531, -45.90073013305664, -44.93321990966797, -43.9657096862793, -42.998199462890625, -42.03068923950195, -41.06317901611328, -40.09566879272461, -39.12815856933594, -38.160648345947266, -37.19314193725586, -36.22563171386719, -35.258121490478516, -34.290611267089844, -33.32310104370117, -32.3555908203125, -31.388080596923828, -30.42057228088379, -29.453060150146484, -28.485549926757812, -27.51803970336914, -26.55052947998047, -25.583019256591797, -24.615509033203125, -23.647998809814453, -22.680490493774414, -21.71297836303711, -20.745468139648438, -19.777957916259766, -18.810447692871094, -17.842937469482422, -16.87542724609375, -15.907917976379395, -14.940408706665039, -13.972898483276367, -13.005388259887695, -12.037878036499023, -11.070367813110352, -10.102858543395996, -9.135348320007324, -8.167838096618652, -7.200328350067139, -6.232818603515625, -5.265308380126953, -4.2977986335754395, -3.3302884101867676, -2.362778425216675, -1.395268440246582, -0.42775821685791016, 0.5397515296936035, 1.5072617530822754, 2.474771738052368, 3.442281723022461, 4.409791946411133, 5.377302169799805, 6.344811916351318, 7.31232213973999, 8.279831886291504, 9.247342109680176]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 12.0, 5.0, 8.0, 11.0, 17.0, 10.0, 15.0, 20.0, 21.0, 31.0, 24.0, 30.0, 28.0, 29.0, 27.0, 40.0, 46.0, 31.0, 45.0, 30.0, 38.0, 40.0, 37.0, 47.0, 33.0, 42.0, 28.0, 32.0, 24.0, 27.0, 25.0, 19.0, 18.0, 20.0, 18.0, 9.0, 18.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.996842384338379, -12.593564987182617, -12.190286636352539, -11.787009239196777, -11.383731842041016, -10.980453491210938, -10.577176094055176, -10.173898696899414, -9.770620346069336, -9.367342948913574, -8.964064598083496, -8.560787200927734, -8.157509803771973, -7.754231929779053, -7.350954055786133, -6.947676658630371, -6.544399261474609, -6.1411213874816895, -5.737843990325928, -5.334566116333008, -4.931288719177246, -4.528010845184326, -4.124732971191406, -3.7214553356170654, -3.3181777000427246, -2.914900064468384, -2.511622428894043, -2.108344554901123, -1.7050669193267822, -1.3017892837524414, -0.8985114097595215, -0.49523377418518066, -0.09195613861083984, 0.31132155656814575, 0.7145992517471313, 1.1178770065307617, 1.5211546421051025, 1.9244322776794434, 2.3277101516723633, 2.730987787246704, 3.134265422821045, 3.5375430583953857, 3.9408206939697266, 4.3440985679626465, 4.747376441955566, 5.150653839111328, 5.553931713104248, 5.957209587097168, 6.36048698425293, 6.76376485824585, 7.167042255401611, 7.570320129394531, 7.973597526550293, 8.376874923706055, 8.780153274536133, 9.183430671691895, 9.586708068847656, 9.989985466003418, 10.393263816833496, 10.796541213989258, 11.19981861114502, 11.603096008300781, 12.00637435913086, 12.409651756286621, 12.8129301071167]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 15.0, 16.0, 17.0, 17.0, 28.0, 20.0, 20.0, 30.0, 31.0, 37.0, 41.0, 42.0, 29.0, 45.0, 38.0, 39.0, 41.0, 42.0, 38.0, 34.0, 41.0, 27.0, 44.0, 39.0, 32.0, 35.0, 29.0, 23.0, 15.0, 14.0, 12.0, 17.0, 12.0, 13.0, 0.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62109375, -1.567718505859375, -1.51434326171875, -1.460968017578125, -1.4075927734375, -1.354217529296875, -1.30084228515625, -1.247467041015625, -1.194091796875, -1.140716552734375, -1.08734130859375, -1.033966064453125, -0.9805908203125, -0.927215576171875, -0.87384033203125, -0.820465087890625, -0.76708984375, -0.713714599609375, -0.66033935546875, -0.606964111328125, -0.5535888671875, -0.500213623046875, -0.44683837890625, -0.393463134765625, -0.340087890625, -0.286712646484375, -0.23333740234375, -0.179962158203125, -0.1265869140625, -0.073211669921875, -0.01983642578125, 0.033538818359375, 0.0869140625, 0.140289306640625, 0.19366455078125, 0.247039794921875, 0.3004150390625, 0.353790283203125, 0.40716552734375, 0.460540771484375, 0.513916015625, 0.567291259765625, 0.62066650390625, 0.674041748046875, 0.7274169921875, 0.780792236328125, 0.83416748046875, 0.887542724609375, 0.94091796875, 0.994293212890625, 1.04766845703125, 1.101043701171875, 1.1544189453125, 1.207794189453125, 1.26116943359375, 1.314544677734375, 1.367919921875, 1.421295166015625, 1.47467041015625, 1.528045654296875, 1.5814208984375, 1.634796142578125, 1.68817138671875, 1.741546630859375, 1.794921875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 5.0, 8.0, 10.0, 14.0, 20.0, 35.0, 69.0, 72.0, 141.0, 190.0, 238.0, 390.0, 614.0, 1007.0, 1737.0, 2962.0, 5664.0, 12053.0, 37760.0, 334842.0, 3138212.0, 580833.0, 49973.0, 14073.0, 6258.0, 3018.0, 1691.0, 955.0, 569.0, 377.0, 212.0, 118.0, 53.0, 33.0, 27.0, 13.0, 15.0, 6.0, 3.0, 3.0, 0.0, 2.0], "bins": [-6.8671875, -6.7059326171875, -6.544677734375, -6.3834228515625, -6.22216796875, -6.0609130859375, -5.899658203125, -5.7384033203125, -5.5771484375, -5.4158935546875, -5.254638671875, -5.0933837890625, -4.93212890625, -4.7708740234375, -4.609619140625, -4.4483642578125, -4.287109375, -4.1258544921875, -3.964599609375, -3.8033447265625, -3.64208984375, -3.4808349609375, -3.319580078125, -3.1583251953125, -2.9970703125, -2.8358154296875, -2.674560546875, -2.5133056640625, -2.35205078125, -2.1907958984375, -2.029541015625, -1.8682861328125, -1.70703125, -1.5457763671875, -1.384521484375, -1.2232666015625, -1.06201171875, -0.9007568359375, -0.739501953125, -0.5782470703125, -0.4169921875, -0.2557373046875, -0.094482421875, 0.0667724609375, 0.22802734375, 0.3892822265625, 0.550537109375, 0.7117919921875, 0.873046875, 1.0343017578125, 1.195556640625, 1.3568115234375, 1.51806640625, 1.6793212890625, 1.840576171875, 2.0018310546875, 2.1630859375, 2.3243408203125, 2.485595703125, 2.6468505859375, 2.80810546875, 2.9693603515625, 3.130615234375, 3.2918701171875, 3.453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 15.0, 12.0, 16.0, 14.0, 28.0, 41.0, 48.0, 76.0, 146.0, 231.0, 408.0, 672.0, 809.0, 587.0, 368.0, 190.0, 129.0, 65.0, 42.0, 30.0, 32.0, 23.0, 10.0, 20.0, 9.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.986328125, -3.859375, -3.732421875, -3.60546875, -3.478515625, -3.3515625, -3.224609375, -3.09765625, -2.970703125, -2.84375, -2.716796875, -2.58984375, -2.462890625, -2.3359375, -2.208984375, -2.08203125, -1.955078125, -1.828125, -1.701171875, -1.57421875, -1.447265625, -1.3203125, -1.193359375, -1.06640625, -0.939453125, -0.8125, -0.685546875, -0.55859375, -0.431640625, -0.3046875, -0.177734375, -0.05078125, 0.076171875, 0.203125, 0.330078125, 0.45703125, 0.583984375, 0.7109375, 0.837890625, 0.96484375, 1.091796875, 1.21875, 1.345703125, 1.47265625, 1.599609375, 1.7265625, 1.853515625, 1.98046875, 2.107421875, 2.234375, 2.361328125, 2.48828125, 2.615234375, 2.7421875, 2.869140625, 2.99609375, 3.123046875, 3.25, 3.376953125, 3.50390625, 3.630859375, 3.7578125, 3.884765625, 4.01171875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 13.0, 24.0, 34.0, 52.0, 72.0, 142.0, 222.0, 522.0, 1063.0, 2350.0, 5965.0, 17427.0, 81580.0, 2355592.0, 1634983.0, 68814.0, 15758.0, 5404.0, 2271.0, 924.0, 464.0, 229.0, 121.0, 79.0, 44.0, 28.0, 15.0, 19.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9608154296875, -7.695068359375, -7.4293212890625, -7.16357421875, -6.8978271484375, -6.632080078125, -6.3663330078125, -6.1005859375, -5.8348388671875, -5.569091796875, -5.3033447265625, -5.03759765625, -4.7718505859375, -4.506103515625, -4.2403564453125, -3.974609375, -3.7088623046875, -3.443115234375, -3.1773681640625, -2.91162109375, -2.6458740234375, -2.380126953125, -2.1143798828125, -1.8486328125, -1.5828857421875, -1.317138671875, -1.0513916015625, -0.78564453125, -0.5198974609375, -0.254150390625, 0.0115966796875, 0.27734375, 0.5430908203125, 0.808837890625, 1.0745849609375, 1.34033203125, 1.6060791015625, 1.871826171875, 2.1375732421875, 2.4033203125, 2.6690673828125, 2.934814453125, 3.2005615234375, 3.46630859375, 3.7320556640625, 3.997802734375, 4.2635498046875, 4.529296875, 4.7950439453125, 5.060791015625, 5.3265380859375, 5.59228515625, 5.8580322265625, 6.123779296875, 6.3895263671875, 6.6552734375, 6.9210205078125, 7.186767578125, 7.4525146484375, 7.71826171875, 7.9840087890625, 8.249755859375, 8.5155029296875, 8.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 9.0, 25.0, 37.0, 65.0, 124.0, 210.0, 227.0, 162.0, 80.0, 30.0, 23.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.91034698486328, -40.867374420166016, -39.82440185546875, -38.78142547607422, -37.73845291137695, -36.69548034667969, -35.65250778198242, -34.609535217285156, -33.56656265258789, -32.523590087890625, -31.480615615844727, -30.43764305114746, -29.394670486450195, -28.351696014404297, -27.30872344970703, -26.265750885009766, -25.222776412963867, -24.1798038482666, -23.136829376220703, -22.093856811523438, -21.050884246826172, -20.007911682128906, -18.964937210083008, -17.921964645385742, -16.878990173339844, -15.836016654968262, -14.793044090270996, -13.750070571899414, -12.707098007202148, -11.664124488830566, -10.621150970458984, -9.578178405761719, -8.535207748413086, -7.492234706878662, -6.449261665344238, -5.406288146972656, -4.363315105438232, -3.3203420639038086, -2.2773685455322266, -1.2343955039978027, -0.1914224624633789, 0.8515506982803345, 1.8945238590240479, 2.937497138977051, 3.9804701805114746, 5.023443222045898, 6.0664167404174805, 7.109389781951904, 8.152362823486328, 9.19533634185791, 10.238308906555176, 11.281282424926758, 12.324254989624023, 13.367228507995605, 14.410202026367188, 15.453174591064453, 16.49614715576172, 17.539119720458984, 18.582094192504883, 19.62506675720215, 20.668039321899414, 21.711013793945312, 22.753986358642578, 23.796958923339844, 24.839933395385742]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 6.0, 5.0, 12.0, 8.0, 13.0, 20.0, 16.0, 9.0, 20.0, 18.0, 29.0, 25.0, 14.0, 28.0, 29.0, 42.0, 35.0, 31.0, 37.0, 38.0, 48.0, 40.0, 51.0, 28.0, 33.0, 38.0, 36.0, 29.0, 32.0, 23.0, 21.0, 23.0, 26.0, 18.0, 14.0, 19.0, 18.0, 9.0, 8.0, 11.0, 11.0, 7.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.15669059753418, -8.843356132507324, -8.530020713806152, -8.216686248779297, -7.903350830078125, -7.5900163650512695, -7.276681423187256, -6.963346481323242, -6.6500115394592285, -6.336676597595215, -6.023341655731201, -5.7100067138671875, -5.396672248840332, -5.08333683013916, -4.770002365112305, -4.456667423248291, -4.143332481384277, -3.8299975395202637, -3.51666259765625, -3.2033278942108154, -2.8899929523468018, -2.576658010482788, -2.2633233070373535, -1.9499883651733398, -1.6366534233093262, -1.3233184814453125, -1.0099836587905884, -0.6966487765312195, -0.3833138942718506, -0.06997895240783691, 0.2433558702468872, 0.5566906929016113, 0.8700265884399414, 1.183361530303955, 1.4966963529586792, 1.8100311756134033, 2.123366117477417, 2.4367010593414307, 2.7500357627868652, 3.063370704650879, 3.3767056465148926, 3.6900405883789062, 4.00337553024292, 4.316710472106934, 4.630044937133789, 4.943380355834961, 5.256714820861816, 5.57004976272583, 5.883384704589844, 6.196719646453857, 6.510054588317871, 6.823389530181885, 7.136724472045898, 7.450058937072754, 7.763393878936768, 8.076728820800781, 8.390064239501953, 8.703398704528809, 9.01673412322998, 9.330068588256836, 9.643404006958008, 9.956738471984863, 10.270073890686035, 10.58340835571289, 10.896742820739746]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 8.0, 7.0, 7.0, 8.0, 12.0, 15.0, 20.0, 21.0, 22.0, 29.0, 24.0, 34.0, 33.0, 37.0, 41.0, 51.0, 45.0, 35.0, 36.0, 46.0, 40.0, 52.0, 37.0, 42.0, 41.0, 33.0, 25.0, 30.0, 25.0, 25.0, 27.0, 18.0, 6.0, 10.0, 11.0, 6.0, 10.0, 6.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.845703125, -1.7945709228515625, -1.743438720703125, -1.6923065185546875, -1.64117431640625, -1.5900421142578125, -1.538909912109375, -1.4877777099609375, -1.4366455078125, -1.3855133056640625, -1.334381103515625, -1.2832489013671875, -1.23211669921875, -1.1809844970703125, -1.129852294921875, -1.0787200927734375, -1.027587890625, -0.9764556884765625, -0.925323486328125, -0.8741912841796875, -0.82305908203125, -0.7719268798828125, -0.720794677734375, -0.6696624755859375, -0.6185302734375, -0.5673980712890625, -0.516265869140625, -0.4651336669921875, -0.41400146484375, -0.3628692626953125, -0.311737060546875, -0.2606048583984375, -0.20947265625, -0.1583404541015625, -0.107208251953125, -0.0560760498046875, -0.00494384765625, 0.0461883544921875, 0.097320556640625, 0.1484527587890625, 0.1995849609375, 0.2507171630859375, 0.301849365234375, 0.3529815673828125, 0.40411376953125, 0.4552459716796875, 0.506378173828125, 0.5575103759765625, 0.608642578125, 0.6597747802734375, 0.710906982421875, 0.7620391845703125, 0.81317138671875, 0.8643035888671875, 0.915435791015625, 0.9665679931640625, 1.0177001953125, 1.0688323974609375, 1.119964599609375, 1.1710968017578125, 1.22222900390625, 1.2733612060546875, 1.324493408203125, 1.3756256103515625, 1.4267578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 8.0, 9.0, 16.0, 13.0, 24.0, 28.0, 47.0, 78.0, 101.0, 160.0, 225.0, 348.0, 630.0, 1202.0, 2333.0, 5262.0, 13144.0, 36534.0, 124518.0, 511434.0, 252398.0, 63608.0, 21132.0, 8066.0, 3474.0, 1618.0, 808.0, 487.0, 268.0, 189.0, 110.0, 92.0, 53.0, 39.0, 37.0, 18.0, 12.0, 8.0, 3.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2080078125, -1.167388916015625, -1.12677001953125, -1.086151123046875, -1.0455322265625, -1.004913330078125, -0.96429443359375, -0.923675537109375, -0.883056640625, -0.842437744140625, -0.80181884765625, -0.761199951171875, -0.7205810546875, -0.679962158203125, -0.63934326171875, -0.598724365234375, -0.55810546875, -0.517486572265625, -0.47686767578125, -0.436248779296875, -0.3956298828125, -0.355010986328125, -0.31439208984375, -0.273773193359375, -0.233154296875, -0.192535400390625, -0.15191650390625, -0.111297607421875, -0.0706787109375, -0.030059814453125, 0.01055908203125, 0.051177978515625, 0.091796875, 0.132415771484375, 0.17303466796875, 0.213653564453125, 0.2542724609375, 0.294891357421875, 0.33551025390625, 0.376129150390625, 0.416748046875, 0.457366943359375, 0.49798583984375, 0.538604736328125, 0.5792236328125, 0.619842529296875, 0.66046142578125, 0.701080322265625, 0.74169921875, 0.782318115234375, 0.82293701171875, 0.863555908203125, 0.9041748046875, 0.944793701171875, 0.98541259765625, 1.026031494140625, 1.066650390625, 1.107269287109375, 1.14788818359375, 1.188507080078125, 1.2291259765625, 1.269744873046875, 1.31036376953125, 1.350982666015625, 1.3916015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 5.0, 14.0, 16.0, 15.0, 13.0, 22.0, 20.0, 24.0, 24.0, 33.0, 43.0, 39.0, 27.0, 40.0, 33.0, 50.0, 46.0, 1078.0, 47.0, 36.0, 35.0, 41.0, 40.0, 38.0, 28.0, 30.0, 31.0, 25.0, 23.0, 15.0, 18.0, 12.0, 13.0, 11.0, 10.0, 4.0, 6.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2705078125, -1.230682373046875, -1.19085693359375, -1.151031494140625, -1.1112060546875, -1.071380615234375, -1.03155517578125, -0.991729736328125, -0.951904296875, -0.912078857421875, -0.87225341796875, -0.832427978515625, -0.7926025390625, -0.752777099609375, -0.71295166015625, -0.673126220703125, -0.63330078125, -0.593475341796875, -0.55364990234375, -0.513824462890625, -0.4739990234375, -0.434173583984375, -0.39434814453125, -0.354522705078125, -0.314697265625, -0.274871826171875, -0.23504638671875, -0.195220947265625, -0.1553955078125, -0.115570068359375, -0.07574462890625, -0.035919189453125, 0.00390625, 0.043731689453125, 0.08355712890625, 0.123382568359375, 0.1632080078125, 0.203033447265625, 0.24285888671875, 0.282684326171875, 0.322509765625, 0.362335205078125, 0.40216064453125, 0.441986083984375, 0.4818115234375, 0.521636962890625, 0.56146240234375, 0.601287841796875, 0.64111328125, 0.680938720703125, 0.72076416015625, 0.760589599609375, 0.8004150390625, 0.840240478515625, 0.88006591796875, 0.919891357421875, 0.959716796875, 0.999542236328125, 1.03936767578125, 1.079193115234375, 1.1190185546875, 1.158843994140625, 1.19866943359375, 1.238494873046875, 1.2783203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 14.0, 9.0, 28.0, 22.0, 36.0, 84.0, 142.0, 316.0, 636.0, 1505.0, 3806.0, 12000.0, 67150.0, 1959673.0, 37442.0, 8949.0, 2982.0, 1200.0, 559.0, 261.0, 126.0, 59.0, 37.0, 24.0, 23.0, 16.0, 14.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.799957275390625, -1.72296142578125, -1.645965576171875, -1.5689697265625, -1.491973876953125, -1.41497802734375, -1.337982177734375, -1.260986328125, -1.183990478515625, -1.10699462890625, -1.029998779296875, -0.9530029296875, -0.876007080078125, -0.79901123046875, -0.722015380859375, -0.64501953125, -0.568023681640625, -0.49102783203125, -0.414031982421875, -0.3370361328125, -0.260040283203125, -0.18304443359375, -0.106048583984375, -0.029052734375, 0.047943115234375, 0.12493896484375, 0.201934814453125, 0.2789306640625, 0.355926513671875, 0.43292236328125, 0.509918212890625, 0.5869140625, 0.663909912109375, 0.74090576171875, 0.817901611328125, 0.8948974609375, 0.971893310546875, 1.04888916015625, 1.125885009765625, 1.202880859375, 1.279876708984375, 1.35687255859375, 1.433868408203125, 1.5108642578125, 1.587860107421875, 1.66485595703125, 1.741851806640625, 1.81884765625, 1.895843505859375, 1.97283935546875, 2.049835205078125, 2.1268310546875, 2.203826904296875, 2.28082275390625, 2.357818603515625, 2.434814453125, 2.511810302734375, 2.58880615234375, 2.665802001953125, 2.7427978515625, 2.819793701171875, 2.89678955078125, 2.973785400390625, 3.05078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 9.0, 7.0, 8.0, 11.0, 16.0, 26.0, 33.0, 44.0, 73.0, 82.0, 105.0, 133.0, 89.0, 101.0, 59.0, 44.0, 33.0, 20.0, 19.0, 18.0, 12.0, 9.0, 8.0, 6.0, 10.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.06179618835449219, -0.059627532958984375, -0.05745887756347656, -0.05529022216796875, -0.05312156677246094, -0.050952911376953125, -0.04878425598144531, -0.0466156005859375, -0.04444694519042969, -0.042278289794921875, -0.04010963439941406, -0.03794097900390625, -0.03577232360839844, -0.033603668212890625, -0.03143501281738281, -0.029266357421875, -0.027097702026367188, -0.024929046630859375, -0.022760391235351562, -0.02059173583984375, -0.018423080444335938, -0.016254425048828125, -0.014085769653320312, -0.0119171142578125, -0.009748458862304688, -0.007579803466796875, -0.0054111480712890625, -0.00324249267578125, -0.0010738372802734375, 0.001094818115234375, 0.0032634735107421875, 0.00543212890625, 0.0076007843017578125, 0.009769439697265625, 0.011938095092773438, 0.01410675048828125, 0.016275405883789062, 0.018444061279296875, 0.020612716674804688, 0.0227813720703125, 0.024950027465820312, 0.027118682861328125, 0.029287338256835938, 0.03145599365234375, 0.03362464904785156, 0.035793304443359375, 0.03796195983886719, 0.040130615234375, 0.04229927062988281, 0.044467926025390625, 0.04663658142089844, 0.04880523681640625, 0.05097389221191406, 0.053142547607421875, 0.05531120300292969, 0.0574798583984375, 0.05964851379394531, 0.061817169189453125, 0.06398582458496094, 0.06615447998046875, 0.06832313537597656, 0.07049179077148438, 0.07266044616699219, 0.0748291015625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 9.0, 12.0, 11.0, 21.0, 27.0, 32.0, 46.0, 68.0, 90.0, 192.0, 487.0, 2019.0, 35650.0, 973862.0, 33041.0, 1970.0, 433.0, 193.0, 115.0, 71.0, 42.0, 29.0, 29.0, 25.0, 6.0, 13.0, 11.0, 6.0, 2.0, 3.0, 0.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0146255493164062, -0.9843292236328125, -0.9540328979492188, -0.923736572265625, -0.8934402465820312, -0.8631439208984375, -0.8328475952148438, -0.80255126953125, -0.7722549438476562, -0.7419586181640625, -0.7116622924804688, -0.681365966796875, -0.6510696411132812, -0.6207733154296875, -0.5904769897460938, -0.5601806640625, -0.5298843383789062, -0.4995880126953125, -0.46929168701171875, -0.438995361328125, -0.40869903564453125, -0.3784027099609375, -0.34810638427734375, -0.31781005859375, -0.28751373291015625, -0.2572174072265625, -0.22692108154296875, -0.196624755859375, -0.16632843017578125, -0.1360321044921875, -0.10573577880859375, -0.075439453125, -0.04514312744140625, -0.0148468017578125, 0.01544952392578125, 0.045745849609375, 0.07604217529296875, 0.1063385009765625, 0.13663482666015625, 0.16693115234375, 0.19722747802734375, 0.2275238037109375, 0.25782012939453125, 0.288116455078125, 0.31841278076171875, 0.3487091064453125, 0.37900543212890625, 0.4093017578125, 0.43959808349609375, 0.4698944091796875, 0.5001907348632812, 0.530487060546875, 0.5607833862304688, 0.5910797119140625, 0.6213760375976562, 0.65167236328125, 0.6819686889648438, 0.7122650146484375, 0.7425613403320312, 0.772857666015625, 0.8031539916992188, 0.8334503173828125, 0.8637466430664062, 0.89404296875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 31.0, 65.0, 320.0, 399.0, 140.0, 42.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4144311845302582, -0.4007175862789154, -0.387004017829895, -0.37329041957855225, -0.35957685112953186, -0.3458632528781891, -0.3321496844291687, -0.3184360861778259, -0.30472251772880554, -0.29100891947746277, -0.2772953510284424, -0.2635817527770996, -0.24986818432807922, -0.23615458607673645, -0.22244101762771606, -0.2087274193763733, -0.1950138360261917, -0.18130025267601013, -0.16758666932582855, -0.15387308597564697, -0.1401595026254654, -0.1264459192752838, -0.11273232847452164, -0.09901874512434006, -0.08530516177415848, -0.0715915784239769, -0.05787799507379532, -0.04416440799832344, -0.03045082464814186, -0.016737237572669983, -0.0030236542224884033, 0.010689929127693176, 0.024403512477874756, 0.038117095828056335, 0.051830679178237915, 0.0655442625284195, 0.07925784587860107, 0.09297143667936325, 0.10668502002954483, 0.12039860337972641, 0.1341121792793274, 0.14782576262950897, 0.16153934597969055, 0.17525292932987213, 0.1889665126800537, 0.20268011093139648, 0.21639367938041687, 0.23010727763175964, 0.24382086098194122, 0.2575344443321228, 0.2712480425834656, 0.28496161103248596, 0.29867520928382874, 0.3123887777328491, 0.3261023759841919, 0.3398159444332123, 0.35352954268455505, 0.3672431409358978, 0.3809567093849182, 0.394670307636261, 0.40838387608528137, 0.42209747433662415, 0.43581104278564453, 0.4495246410369873, 0.4632382094860077]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 11.0, 9.0, 15.0, 15.0, 20.0, 21.0, 23.0, 32.0, 21.0, 28.0, 28.0, 42.0, 36.0, 48.0, 43.0, 35.0, 39.0, 38.0, 36.0, 32.0, 48.0, 49.0, 29.0, 26.0, 29.0, 29.0, 28.0, 23.0, 15.0, 24.0, 14.0, 15.0, 13.0, 14.0, 9.0, 12.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06801897287368774, -0.06586844474077225, -0.06371791660785675, -0.061567388474941254, -0.05941686034202576, -0.05726633220911026, -0.05511580407619476, -0.052965275943279266, -0.05081474781036377, -0.04866421967744827, -0.046513691544532776, -0.04436316341161728, -0.04221263527870178, -0.040062107145786285, -0.03791157901287079, -0.03576105087995529, -0.033610522747039795, -0.0314599946141243, -0.0293094664812088, -0.027158938348293304, -0.025008410215377808, -0.02285788208246231, -0.020707353949546814, -0.018556825816631317, -0.01640629768371582, -0.014255769550800323, -0.012105241417884827, -0.00995471328496933, -0.007804185152053833, -0.005653657019138336, -0.0035031288862228394, -0.0013526007533073425, 0.0007979273796081543, 0.002948455512523651, 0.005098983645439148, 0.007249511778354645, 0.009400039911270142, 0.011550568044185638, 0.013701096177101135, 0.015851624310016632, 0.01800215244293213, 0.020152680575847626, 0.022303208708763123, 0.02445373684167862, 0.026604264974594116, 0.028754793107509613, 0.03090532124042511, 0.03305584937334061, 0.035206377506256104, 0.0373569056391716, 0.0395074337720871, 0.041657961905002594, 0.04380849003791809, 0.04595901817083359, 0.048109546303749084, 0.05026007443666458, 0.05241060256958008, 0.054561130702495575, 0.05671165883541107, 0.05886218696832657, 0.061012715101242065, 0.06316324323415756, 0.06531377136707306, 0.06746429949998856, 0.06961482763290405]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 3.0, 10.0, 11.0, 14.0, 20.0, 22.0, 22.0, 30.0, 25.0, 33.0, 33.0, 35.0, 43.0, 52.0, 44.0, 34.0, 37.0, 47.0, 38.0, 52.0, 37.0, 42.0, 41.0, 35.0, 23.0, 33.0, 24.0, 25.0, 26.0, 17.0, 8.0, 11.0, 11.0, 4.0, 11.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.8525390625, -1.8013153076171875, -1.750091552734375, -1.6988677978515625, -1.64764404296875, -1.5964202880859375, -1.545196533203125, -1.4939727783203125, -1.4427490234375, -1.3915252685546875, -1.340301513671875, -1.2890777587890625, -1.23785400390625, -1.1866302490234375, -1.135406494140625, -1.0841827392578125, -1.032958984375, -0.9817352294921875, -0.930511474609375, -0.8792877197265625, -0.82806396484375, -0.7768402099609375, -0.725616455078125, -0.6743927001953125, -0.6231689453125, -0.5719451904296875, -0.520721435546875, -0.4694976806640625, -0.41827392578125, -0.3670501708984375, -0.315826416015625, -0.2646026611328125, -0.21337890625, -0.1621551513671875, -0.110931396484375, -0.0597076416015625, -0.00848388671875, 0.0427398681640625, 0.093963623046875, 0.1451873779296875, 0.1964111328125, 0.2476348876953125, 0.298858642578125, 0.3500823974609375, 0.40130615234375, 0.4525299072265625, 0.503753662109375, 0.5549774169921875, 0.606201171875, 0.6574249267578125, 0.708648681640625, 0.7598724365234375, 0.81109619140625, 0.8623199462890625, 0.913543701171875, 0.9647674560546875, 1.0159912109375, 1.0672149658203125, 1.118438720703125, 1.1696624755859375, 1.22088623046875, 1.2721099853515625, 1.323333740234375, 1.3745574951171875, 1.42578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 2.0, 10.0, 18.0, 11.0, 25.0, 41.0, 45.0, 67.0, 109.0, 150.0, 187.0, 350.0, 500.0, 887.0, 1613.0, 3139.0, 8500.0, 34564.0, 327810.0, 596933.0, 53982.0, 11117.0, 3942.0, 1854.0, 970.0, 600.0, 332.0, 234.0, 165.0, 125.0, 77.0, 59.0, 46.0, 29.0, 21.0, 12.0, 14.0, 3.0, 4.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.43359375, -5.27886962890625, -5.1241455078125, -4.96942138671875, -4.814697265625, -4.65997314453125, -4.5052490234375, -4.35052490234375, -4.19580078125, -4.04107666015625, -3.8863525390625, -3.73162841796875, -3.576904296875, -3.42218017578125, -3.2674560546875, -3.11273193359375, -2.9580078125, -2.80328369140625, -2.6485595703125, -2.49383544921875, -2.339111328125, -2.18438720703125, -2.0296630859375, -1.87493896484375, -1.72021484375, -1.56549072265625, -1.4107666015625, -1.25604248046875, -1.101318359375, -0.94659423828125, -0.7918701171875, -0.63714599609375, -0.482421875, -0.32769775390625, -0.1729736328125, -0.01824951171875, 0.136474609375, 0.29119873046875, 0.4459228515625, 0.60064697265625, 0.75537109375, 0.91009521484375, 1.0648193359375, 1.21954345703125, 1.374267578125, 1.52899169921875, 1.6837158203125, 1.83843994140625, 1.9931640625, 2.14788818359375, 2.3026123046875, 2.45733642578125, 2.612060546875, 2.76678466796875, 2.9215087890625, 3.07623291015625, 3.23095703125, 3.38568115234375, 3.5404052734375, 3.69512939453125, 3.849853515625, 4.00457763671875, 4.1593017578125, 4.31402587890625, 4.46875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 8.0, 11.0, 9.0, 12.0, 10.0, 19.0, 19.0, 14.0, 19.0, 22.0, 32.0, 34.0, 37.0, 45.0, 61.0, 61.0, 107.0, 142.0, 274.0, 1375.0, 190.0, 89.0, 66.0, 51.0, 54.0, 45.0, 29.0, 18.0, 28.0, 20.0, 29.0, 15.0, 18.0, 12.0, 9.0, 10.0, 5.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.03436279296875, -3.9007568359375, -3.76715087890625, -3.633544921875, -3.49993896484375, -3.3663330078125, -3.23272705078125, -3.09912109375, -2.96551513671875, -2.8319091796875, -2.69830322265625, -2.564697265625, -2.43109130859375, -2.2974853515625, -2.16387939453125, -2.0302734375, -1.89666748046875, -1.7630615234375, -1.62945556640625, -1.495849609375, -1.36224365234375, -1.2286376953125, -1.09503173828125, -0.96142578125, -0.82781982421875, -0.6942138671875, -0.56060791015625, -0.427001953125, -0.29339599609375, -0.1597900390625, -0.02618408203125, 0.107421875, 0.24102783203125, 0.3746337890625, 0.50823974609375, 0.641845703125, 0.77545166015625, 0.9090576171875, 1.04266357421875, 1.17626953125, 1.30987548828125, 1.4434814453125, 1.57708740234375, 1.710693359375, 1.84429931640625, 1.9779052734375, 2.11151123046875, 2.2451171875, 2.37872314453125, 2.5123291015625, 2.64593505859375, 2.779541015625, 2.91314697265625, 3.0467529296875, 3.18035888671875, 3.31396484375, 3.44757080078125, 3.5811767578125, 3.71478271484375, 3.848388671875, 3.98199462890625, 4.1156005859375, 4.24920654296875, 4.3828125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 11.0, 18.0, 15.0, 21.0, 37.0, 46.0, 59.0, 91.0, 87.0, 108.0, 143.0, 241.0, 445.0, 1219.0, 5131.0, 45393.0, 2355133.0, 709177.0, 22827.0, 3296.0, 892.0, 374.0, 238.0, 153.0, 121.0, 96.0, 71.0, 55.0, 44.0, 31.0, 19.0, 16.0, 16.0, 18.0, 9.0, 5.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.3984375, -8.1348876953125, -7.871337890625, -7.6077880859375, -7.34423828125, -7.0806884765625, -6.817138671875, -6.5535888671875, -6.2900390625, -6.0264892578125, -5.762939453125, -5.4993896484375, -5.23583984375, -4.9722900390625, -4.708740234375, -4.4451904296875, -4.181640625, -3.9180908203125, -3.654541015625, -3.3909912109375, -3.12744140625, -2.8638916015625, -2.600341796875, -2.3367919921875, -2.0732421875, -1.8096923828125, -1.546142578125, -1.2825927734375, -1.01904296875, -0.7554931640625, -0.491943359375, -0.2283935546875, 0.03515625, 0.2987060546875, 0.562255859375, 0.8258056640625, 1.08935546875, 1.3529052734375, 1.616455078125, 1.8800048828125, 2.1435546875, 2.4071044921875, 2.670654296875, 2.9342041015625, 3.19775390625, 3.4613037109375, 3.724853515625, 3.9884033203125, 4.251953125, 4.5155029296875, 4.779052734375, 5.0426025390625, 5.30615234375, 5.5697021484375, 5.833251953125, 6.0968017578125, 6.3603515625, 6.6239013671875, 6.887451171875, 7.1510009765625, 7.41455078125, 7.6781005859375, 7.941650390625, 8.2052001953125, 8.46875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 117.0, 699.0, 181.0, 15.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.16944885253906, -117.10120391845703, -115.03295135498047, -112.96470642089844, -110.8964614868164, -108.82821655273438, -106.75996398925781, -104.69171905517578, -102.62347412109375, -100.55522918701172, -98.48697662353516, -96.41873168945312, -94.3504867553711, -92.28224182128906, -90.2139892578125, -88.14574432373047, -86.0774917602539, -84.00924682617188, -81.94099426269531, -79.87274932861328, -77.80450439453125, -75.73625183105469, -73.66800689697266, -71.59976196289062, -69.53150939941406, -67.46326446533203, -65.39501190185547, -63.32676696777344, -61.258522033691406, -59.19027328491211, -57.12202453613281, -55.05377960205078, -52.98554229736328, -50.917293548583984, -48.84904861450195, -46.780799865722656, -44.712554931640625, -42.64430618286133, -40.57605743408203, -38.5078125, -36.4395637512207, -34.371315002441406, -32.303070068359375, -30.234821319580078, -28.166574478149414, -26.09832763671875, -24.030078887939453, -21.96183204650879, -19.893585205078125, -17.82533836364746, -15.75709056854248, -13.6888427734375, -11.620595932006836, -9.552349090576172, -7.484101295471191, -5.415853500366211, -3.347606658935547, -1.2793593406677246, 0.7888879776000977, 2.85713529586792, 4.925382614135742, 6.993629455566406, 9.061877250671387, 11.130125045776367, 13.198371887207031]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 7.0, 9.0, 12.0, 12.0, 14.0, 13.0, 21.0, 11.0, 22.0, 39.0, 20.0, 34.0, 39.0, 38.0, 35.0, 40.0, 41.0, 36.0, 52.0, 42.0, 31.0, 32.0, 32.0, 37.0, 28.0, 33.0, 26.0, 30.0, 26.0, 20.0, 22.0, 27.0, 15.0, 12.0, 10.0, 12.0, 11.0, 10.0, 5.0, 7.0, 7.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.20268440246582, -10.823832511901855, -10.44498062133789, -10.06612777709961, -9.687275886535645, -9.30842399597168, -8.929572105407715, -8.55072021484375, -8.171867370605469, -7.793015480041504, -7.414163112640381, -7.035311222076416, -6.656458854675293, -6.277606964111328, -5.898755073547363, -5.519903182983398, -5.141051292419434, -4.762199401855469, -4.383347034454346, -4.004495143890381, -3.625643014907837, -3.246790885925293, -2.867938995361328, -2.489086866378784, -2.1102347373962402, -1.7313826084136963, -1.352530598640442, -0.9736785888671875, -0.5948264598846436, -0.2159743309020996, 0.16287755966186523, 0.5417296886444092, 0.9205808639526367, 1.2994329929351807, 1.678285002708435, 2.0571370124816895, 2.4359891414642334, 2.8148412704467773, 3.193693161010742, 3.572545289993286, 3.95139741897583, 4.330249309539795, 4.709101676940918, 5.087953567504883, 5.466805458068848, 5.845657825469971, 6.2245097160339355, 6.603362083435059, 6.982213973999023, 7.361065864562988, 7.739918231964111, 8.118770599365234, 8.4976224899292, 8.876474380493164, 9.255326271057129, 9.634178161621094, 10.013031005859375, 10.39188289642334, 10.770734786987305, 11.149587631225586, 11.52843952178955, 11.907291412353516, 12.28614330291748, 12.664995193481445, 13.04384708404541]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 10.0, 3.0, 14.0, 7.0, 11.0, 13.0, 17.0, 24.0, 28.0, 24.0, 30.0, 40.0, 32.0, 34.0, 42.0, 41.0, 37.0, 52.0, 40.0, 57.0, 43.0, 41.0, 49.0, 42.0, 31.0, 31.0, 34.0, 30.0, 29.0, 18.0, 19.0, 15.0, 10.0, 8.0, 8.0, 9.0, 7.0, 1.0, 6.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0], "bins": [-2.0625, -2.0079498291015625, -1.953399658203125, -1.8988494873046875, -1.84429931640625, -1.7897491455078125, -1.735198974609375, -1.6806488037109375, -1.6260986328125, -1.5715484619140625, -1.516998291015625, -1.4624481201171875, -1.40789794921875, -1.3533477783203125, -1.298797607421875, -1.2442474365234375, -1.189697265625, -1.1351470947265625, -1.080596923828125, -1.0260467529296875, -0.97149658203125, -0.9169464111328125, -0.862396240234375, -0.8078460693359375, -0.7532958984375, -0.6987457275390625, -0.644195556640625, -0.5896453857421875, -0.53509521484375, -0.4805450439453125, -0.425994873046875, -0.3714447021484375, -0.31689453125, -0.2623443603515625, -0.207794189453125, -0.1532440185546875, -0.09869384765625, -0.0441436767578125, 0.010406494140625, 0.0649566650390625, 0.1195068359375, 0.1740570068359375, 0.228607177734375, 0.2831573486328125, 0.33770751953125, 0.3922576904296875, 0.446807861328125, 0.5013580322265625, 0.555908203125, 0.6104583740234375, 0.665008544921875, 0.7195587158203125, 0.77410888671875, 0.8286590576171875, 0.883209228515625, 0.9377593994140625, 0.9923095703125, 1.0468597412109375, 1.101409912109375, 1.1559600830078125, 1.21051025390625, 1.2650604248046875, 1.319610595703125, 1.3741607666015625, 1.4287109375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 13.0, 14.0, 16.0, 25.0, 37.0, 50.0, 70.0, 117.0, 163.0, 233.0, 335.0, 574.0, 954.0, 1555.0, 2752.0, 5196.0, 10569.0, 26549.0, 135148.0, 2600766.0, 1294122.0, 76651.0, 19812.0, 8390.0, 4282.0, 2342.0, 1378.0, 788.0, 467.0, 309.0, 201.0, 143.0, 91.0, 50.0, 33.0, 22.0, 16.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-6.7421875, -6.56414794921875, -6.3861083984375, -6.20806884765625, -6.030029296875, -5.85198974609375, -5.6739501953125, -5.49591064453125, -5.31787109375, -5.13983154296875, -4.9617919921875, -4.78375244140625, -4.605712890625, -4.42767333984375, -4.2496337890625, -4.07159423828125, -3.8935546875, -3.71551513671875, -3.5374755859375, -3.35943603515625, -3.181396484375, -3.00335693359375, -2.8253173828125, -2.64727783203125, -2.46923828125, -2.29119873046875, -2.1131591796875, -1.93511962890625, -1.757080078125, -1.57904052734375, -1.4010009765625, -1.22296142578125, -1.044921875, -0.86688232421875, -0.6888427734375, -0.51080322265625, -0.332763671875, -0.15472412109375, 0.0233154296875, 0.20135498046875, 0.37939453125, 0.55743408203125, 0.7354736328125, 0.91351318359375, 1.091552734375, 1.26959228515625, 1.4476318359375, 1.62567138671875, 1.8037109375, 1.98175048828125, 2.1597900390625, 2.33782958984375, 2.515869140625, 2.69390869140625, 2.8719482421875, 3.04998779296875, 3.22802734375, 3.40606689453125, 3.5841064453125, 3.76214599609375, 3.940185546875, 4.11822509765625, 4.2962646484375, 4.47430419921875, 4.65234375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 6.0, 7.0, 7.0, 8.0, 4.0, 12.0, 13.0, 22.0, 30.0, 31.0, 40.0, 50.0, 82.0, 123.0, 175.0, 317.0, 519.0, 726.0, 640.0, 411.0, 268.0, 154.0, 116.0, 79.0, 57.0, 41.0, 30.0, 25.0, 20.0, 13.0, 9.0, 4.0, 11.0, 4.0, 4.0, 9.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.582611083984375, -3.46990966796875, -3.357208251953125, -3.2445068359375, -3.131805419921875, -3.01910400390625, -2.906402587890625, -2.793701171875, -2.680999755859375, -2.56829833984375, -2.455596923828125, -2.3428955078125, -2.230194091796875, -2.11749267578125, -2.004791259765625, -1.89208984375, -1.779388427734375, -1.66668701171875, -1.553985595703125, -1.4412841796875, -1.328582763671875, -1.21588134765625, -1.103179931640625, -0.990478515625, -0.877777099609375, -0.76507568359375, -0.652374267578125, -0.5396728515625, -0.426971435546875, -0.31427001953125, -0.201568603515625, -0.0888671875, 0.023834228515625, 0.13653564453125, 0.249237060546875, 0.3619384765625, 0.474639892578125, 0.58734130859375, 0.700042724609375, 0.812744140625, 0.925445556640625, 1.03814697265625, 1.150848388671875, 1.2635498046875, 1.376251220703125, 1.48895263671875, 1.601654052734375, 1.71435546875, 1.827056884765625, 1.93975830078125, 2.052459716796875, 2.1651611328125, 2.277862548828125, 2.39056396484375, 2.503265380859375, 2.615966796875, 2.728668212890625, 2.84136962890625, 2.954071044921875, 3.0667724609375, 3.179473876953125, 3.29217529296875, 3.404876708984375, 3.517578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 9.0, 15.0, 9.0, 10.0, 25.0, 34.0, 51.0, 84.0, 98.0, 192.0, 324.0, 641.0, 1296.0, 2725.0, 6261.0, 16421.0, 55957.0, 464007.0, 3324635.0, 256905.0, 41306.0, 13269.0, 5230.0, 2332.0, 1128.0, 547.0, 280.0, 159.0, 101.0, 74.0, 36.0, 37.0, 10.0, 10.0, 13.0, 11.0, 4.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.09375, -6.8677978515625, -6.641845703125, -6.4158935546875, -6.18994140625, -5.9639892578125, -5.738037109375, -5.5120849609375, -5.2861328125, -5.0601806640625, -4.834228515625, -4.6082763671875, -4.38232421875, -4.1563720703125, -3.930419921875, -3.7044677734375, -3.478515625, -3.2525634765625, -3.026611328125, -2.8006591796875, -2.57470703125, -2.3487548828125, -2.122802734375, -1.8968505859375, -1.6708984375, -1.4449462890625, -1.218994140625, -0.9930419921875, -0.76708984375, -0.5411376953125, -0.315185546875, -0.0892333984375, 0.13671875, 0.3626708984375, 0.588623046875, 0.8145751953125, 1.04052734375, 1.2664794921875, 1.492431640625, 1.7183837890625, 1.9443359375, 2.1702880859375, 2.396240234375, 2.6221923828125, 2.84814453125, 3.0740966796875, 3.300048828125, 3.5260009765625, 3.751953125, 3.9779052734375, 4.203857421875, 4.4298095703125, 4.65576171875, 4.8817138671875, 5.107666015625, 5.3336181640625, 5.5595703125, 5.7855224609375, 6.011474609375, 6.2374267578125, 6.46337890625, 6.6893310546875, 6.915283203125, 7.1412353515625, 7.3671875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 14.0, 26.0, 60.0, 114.0, 230.0, 296.0, 141.0, 76.0, 31.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.291709899902344, -50.13016891479492, -48.9686279296875, -47.80708694458008, -46.645545959472656, -45.484004974365234, -44.32246398925781, -43.160919189453125, -41.99938201904297, -40.83784103393555, -39.676300048828125, -38.5147590637207, -37.35321807861328, -36.19167709350586, -35.03013610839844, -33.86859130859375, -32.70705032348633, -31.545509338378906, -30.383968353271484, -29.222427368164062, -28.06088638305664, -26.89934539794922, -25.737802505493164, -24.576261520385742, -23.41472053527832, -22.2531795501709, -21.091638565063477, -19.930097579956055, -18.7685546875, -17.607013702392578, -16.445472717285156, -15.283931732177734, -14.122390747070312, -12.96084976196289, -11.799308776855469, -10.63776683807373, -9.476225852966309, -8.314684867858887, -7.153143405914307, -5.991601943969727, -4.830060958862305, -3.6685197353363037, -2.5069785118103027, -1.3454372882843018, -0.18389606475830078, 0.9776449203491211, 2.139186382293701, 3.3007278442382812, 4.462268829345703, 5.623809814453125, 6.785351276397705, 7.946892738342285, 9.108433723449707, 10.269974708557129, 11.431516647338867, 12.593057632446289, 13.754598617553711, 14.916139602661133, 16.077680587768555, 17.239221572875977, 18.40076446533203, 19.562305450439453, 20.723846435546875, 21.885387420654297, 23.04692840576172]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 8.0, 9.0, 10.0, 17.0, 18.0, 24.0, 20.0, 23.0, 24.0, 35.0, 39.0, 37.0, 38.0, 34.0, 58.0, 43.0, 42.0, 46.0, 30.0, 46.0, 36.0, 38.0, 37.0, 29.0, 34.0, 31.0, 23.0, 28.0, 22.0, 16.0, 17.0, 16.0, 15.0, 7.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.133099555969238, -9.810467720031738, -9.487835884094238, -9.165204048156738, -8.842572212219238, -8.519940376281738, -8.197308540344238, -7.8746771812438965, -7.5520453453063965, -7.2294135093688965, -6.9067816734313965, -6.5841498374938965, -6.261518478393555, -5.938886642456055, -5.616254806518555, -5.293622970581055, -4.970991134643555, -4.648359298706055, -4.325727462768555, -4.003095626831055, -3.680464029312134, -3.357832193374634, -3.035200595855713, -2.712568759918213, -2.389936923980713, -2.067305088043213, -1.7446733713150024, -1.422041654586792, -1.099409818649292, -0.776777982711792, -0.45414626598358154, -0.1315145492553711, 0.1911172866821289, 0.5137490630149841, 0.8363808393478394, 1.1590125560760498, 1.4816443920135498, 1.8042762279510498, 2.1269078254699707, 2.4495396614074707, 2.7721714973449707, 3.0948033332824707, 3.4174351692199707, 3.7400667667388916, 4.0626983642578125, 4.3853302001953125, 4.7079620361328125, 5.0305938720703125, 5.3532257080078125, 5.6758575439453125, 5.9984893798828125, 6.3211212158203125, 6.6437530517578125, 6.9663848876953125, 7.289016246795654, 7.611648082733154, 7.934279918670654, 8.256911277770996, 8.579543113708496, 8.902174949645996, 9.224806785583496, 9.547438621520996, 9.870070457458496, 10.192702293395996, 10.515334129333496]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 11.0, 10.0, 16.0, 11.0, 17.0, 22.0, 22.0, 28.0, 27.0, 31.0, 45.0, 52.0, 59.0, 42.0, 56.0, 61.0, 50.0, 46.0, 49.0, 51.0, 51.0, 40.0, 36.0, 46.0, 27.0, 19.0, 16.0, 13.0, 18.0, 9.0, 6.0, 5.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.500091552734375, -2.43572998046875, -2.371368408203125, -2.3070068359375, -2.242645263671875, -2.17828369140625, -2.113922119140625, -2.049560546875, -1.985198974609375, -1.92083740234375, -1.856475830078125, -1.7921142578125, -1.727752685546875, -1.66339111328125, -1.599029541015625, -1.53466796875, -1.470306396484375, -1.40594482421875, -1.341583251953125, -1.2772216796875, -1.212860107421875, -1.14849853515625, -1.084136962890625, -1.019775390625, -0.955413818359375, -0.89105224609375, -0.826690673828125, -0.7623291015625, -0.697967529296875, -0.63360595703125, -0.569244384765625, -0.5048828125, -0.440521240234375, -0.37615966796875, -0.311798095703125, -0.2474365234375, -0.183074951171875, -0.11871337890625, -0.054351806640625, 0.010009765625, 0.074371337890625, 0.13873291015625, 0.203094482421875, 0.2674560546875, 0.331817626953125, 0.39617919921875, 0.460540771484375, 0.52490234375, 0.589263916015625, 0.65362548828125, 0.717987060546875, 0.7823486328125, 0.846710205078125, 0.91107177734375, 0.975433349609375, 1.039794921875, 1.104156494140625, 1.16851806640625, 1.232879638671875, 1.2972412109375, 1.361602783203125, 1.42596435546875, 1.490325927734375, 1.5546875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 11.0, 9.0, 12.0, 16.0, 23.0, 34.0, 48.0, 97.0, 141.0, 210.0, 283.0, 472.0, 806.0, 1527.0, 2882.0, 6876.0, 17418.0, 52735.0, 225393.0, 562342.0, 121224.0, 33866.0, 11899.0, 4961.0, 2255.0, 1206.0, 646.0, 418.0, 265.0, 143.0, 106.0, 68.0, 50.0, 36.0, 26.0, 16.0, 10.0, 13.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.9640884399414062, -0.9359893798828125, -0.9078903198242188, -0.879791259765625, -0.8516921997070312, -0.8235931396484375, -0.7954940795898438, -0.76739501953125, -0.7392959594726562, -0.7111968994140625, -0.6830978393554688, -0.654998779296875, -0.6268997192382812, -0.5988006591796875, -0.5707015991210938, -0.5426025390625, -0.5145034790039062, -0.4864044189453125, -0.45830535888671875, -0.430206298828125, -0.40210723876953125, -0.3740081787109375, -0.34590911865234375, -0.31781005859375, -0.28971099853515625, -0.2616119384765625, -0.23351287841796875, -0.205413818359375, -0.17731475830078125, -0.1492156982421875, -0.12111663818359375, -0.093017578125, -0.06491851806640625, -0.0368194580078125, -0.00872039794921875, 0.019378662109375, 0.04747772216796875, 0.0755767822265625, 0.10367584228515625, 0.13177490234375, 0.15987396240234375, 0.1879730224609375, 0.21607208251953125, 0.244171142578125, 0.27227020263671875, 0.3003692626953125, 0.32846832275390625, 0.3565673828125, 0.38466644287109375, 0.4127655029296875, 0.44086456298828125, 0.468963623046875, 0.49706268310546875, 0.5251617431640625, 0.5532608032226562, 0.58135986328125, 0.6094589233398438, 0.6375579833984375, 0.6656570434570312, 0.693756103515625, 0.7218551635742188, 0.7499542236328125, 0.7780532836914062, 0.80615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 7.0, 11.0, 6.0, 10.0, 5.0, 10.0, 20.0, 18.0, 27.0, 11.0, 21.0, 21.0, 32.0, 8.0, 34.0, 31.0, 37.0, 38.0, 38.0, 35.0, 35.0, 1055.0, 35.0, 43.0, 37.0, 37.0, 38.0, 32.0, 29.0, 40.0, 22.0, 29.0, 23.0, 20.0, 22.0, 16.0, 17.0, 13.0, 6.0, 11.0, 11.0, 14.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.935546875, -0.9019317626953125, -0.868316650390625, -0.8347015380859375, -0.80108642578125, -0.7674713134765625, -0.733856201171875, -0.7002410888671875, -0.6666259765625, -0.6330108642578125, -0.599395751953125, -0.5657806396484375, -0.53216552734375, -0.4985504150390625, -0.464935302734375, -0.4313201904296875, -0.397705078125, -0.3640899658203125, -0.330474853515625, -0.2968597412109375, -0.26324462890625, -0.2296295166015625, -0.196014404296875, -0.1623992919921875, -0.1287841796875, -0.0951690673828125, -0.061553955078125, -0.0279388427734375, 0.00567626953125, 0.0392913818359375, 0.072906494140625, 0.1065216064453125, 0.14013671875, 0.1737518310546875, 0.207366943359375, 0.2409820556640625, 0.27459716796875, 0.3082122802734375, 0.341827392578125, 0.3754425048828125, 0.4090576171875, 0.4426727294921875, 0.476287841796875, 0.5099029541015625, 0.54351806640625, 0.5771331787109375, 0.610748291015625, 0.6443634033203125, 0.677978515625, 0.7115936279296875, 0.745208740234375, 0.7788238525390625, 0.81243896484375, 0.8460540771484375, 0.879669189453125, 0.9132843017578125, 0.9468994140625, 0.9805145263671875, 1.014129638671875, 1.0477447509765625, 1.08135986328125, 1.1149749755859375, 1.148590087890625, 1.1822052001953125, 1.2158203125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 14.0, 13.0, 21.0, 39.0, 53.0, 85.0, 121.0, 196.0, 334.0, 629.0, 1152.0, 2303.0, 5264.0, 13994.0, 65508.0, 1935170.0, 50376.0, 12465.0, 4711.0, 2141.0, 1054.0, 568.0, 359.0, 209.0, 111.0, 74.0, 51.0, 19.0, 32.0, 16.0, 11.0, 9.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3194427490234375, -1.274627685546875, -1.2298126220703125, -1.18499755859375, -1.1401824951171875, -1.095367431640625, -1.0505523681640625, -1.0057373046875, -0.9609222412109375, -0.916107177734375, -0.8712921142578125, -0.82647705078125, -0.7816619873046875, -0.736846923828125, -0.6920318603515625, -0.647216796875, -0.6024017333984375, -0.557586669921875, -0.5127716064453125, -0.46795654296875, -0.4231414794921875, -0.378326416015625, -0.3335113525390625, -0.2886962890625, -0.2438812255859375, -0.199066162109375, -0.1542510986328125, -0.10943603515625, -0.0646209716796875, -0.019805908203125, 0.0250091552734375, 0.06982421875, 0.1146392822265625, 0.159454345703125, 0.2042694091796875, 0.24908447265625, 0.2938995361328125, 0.338714599609375, 0.3835296630859375, 0.4283447265625, 0.4731597900390625, 0.517974853515625, 0.5627899169921875, 0.60760498046875, 0.6524200439453125, 0.697235107421875, 0.7420501708984375, 0.786865234375, 0.8316802978515625, 0.876495361328125, 0.9213104248046875, 0.96612548828125, 1.0109405517578125, 1.055755615234375, 1.1005706787109375, 1.1453857421875, 1.1902008056640625, 1.235015869140625, 1.2798309326171875, 1.32464599609375, 1.3694610595703125, 1.414276123046875, 1.4590911865234375, 1.50390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 10.0, 21.0, 24.0, 91.0, 188.0, 323.0, 197.0, 71.0, 30.0, 15.0, 10.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11505126953125, -0.1116180419921875, -0.108184814453125, -0.1047515869140625, -0.101318359375, -0.0978851318359375, -0.094451904296875, -0.0910186767578125, -0.08758544921875, -0.0841522216796875, -0.080718994140625, -0.0772857666015625, -0.0738525390625, -0.0704193115234375, -0.066986083984375, -0.0635528564453125, -0.06011962890625, -0.0566864013671875, -0.053253173828125, -0.0498199462890625, -0.04638671875, -0.0429534912109375, -0.039520263671875, -0.0360870361328125, -0.03265380859375, -0.0292205810546875, -0.025787353515625, -0.0223541259765625, -0.0189208984375, -0.0154876708984375, -0.012054443359375, -0.0086212158203125, -0.00518798828125, -0.0017547607421875, 0.001678466796875, 0.0051116943359375, 0.008544921875, 0.0119781494140625, 0.015411376953125, 0.0188446044921875, 0.02227783203125, 0.0257110595703125, 0.029144287109375, 0.0325775146484375, 0.0360107421875, 0.0394439697265625, 0.042877197265625, 0.0463104248046875, 0.04974365234375, 0.0531768798828125, 0.056610107421875, 0.0600433349609375, 0.0634765625, 0.0669097900390625, 0.070343017578125, 0.0737762451171875, 0.07720947265625, 0.0806427001953125, 0.084075927734375, 0.0875091552734375, 0.0909423828125, 0.0943756103515625, 0.097808837890625, 0.1012420654296875, 0.10467529296875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 10.0, 24.0, 58.0, 341.0, 4961.0, 1037046.0, 5590.0, 390.0, 64.0, 27.0, 7.0, 5.0, 7.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.157379150390625, -2.08428955078125, -2.011199951171875, -1.9381103515625, -1.865020751953125, -1.79193115234375, -1.718841552734375, -1.645751953125, -1.572662353515625, -1.49957275390625, -1.426483154296875, -1.3533935546875, -1.280303955078125, -1.20721435546875, -1.134124755859375, -1.06103515625, -0.987945556640625, -0.91485595703125, -0.841766357421875, -0.7686767578125, -0.695587158203125, -0.62249755859375, -0.549407958984375, -0.476318359375, -0.403228759765625, -0.33013916015625, -0.257049560546875, -0.1839599609375, -0.110870361328125, -0.03778076171875, 0.035308837890625, 0.1083984375, 0.181488037109375, 0.25457763671875, 0.327667236328125, 0.4007568359375, 0.473846435546875, 0.54693603515625, 0.620025634765625, 0.693115234375, 0.766204833984375, 0.83929443359375, 0.912384033203125, 0.9854736328125, 1.058563232421875, 1.13165283203125, 1.204742431640625, 1.27783203125, 1.350921630859375, 1.42401123046875, 1.497100830078125, 1.5701904296875, 1.643280029296875, 1.71636962890625, 1.789459228515625, 1.862548828125, 1.935638427734375, 2.00872802734375, 2.081817626953125, 2.1549072265625, 2.227996826171875, 2.30108642578125, 2.374176025390625, 2.447265625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 15.0, 33.0, 49.0, 76.0, 180.0, 196.0, 168.0, 116.0, 63.0, 42.0, 18.0, 18.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2827790677547455, -0.277199923992157, -0.27162081003189087, -0.26604166626930237, -0.26046252250671387, -0.25488340854644775, -0.24930426478385925, -0.24372512102127075, -0.23814599215984344, -0.23256686329841614, -0.22698771953582764, -0.22140859067440033, -0.21582946181297302, -0.21025031805038452, -0.20467118918895721, -0.1990920603275299, -0.1935129165649414, -0.1879337877035141, -0.1823546439409256, -0.1767755150794983, -0.1711963713169098, -0.16561724245548248, -0.16003811359405518, -0.15445896983146667, -0.14887984097003937, -0.14330071210861206, -0.13772156834602356, -0.13214243948459625, -0.12656331062316895, -0.12098416686058044, -0.11540503799915314, -0.10982590168714523, -0.10424675792455673, -0.09866762161254883, -0.09308849275112152, -0.08750935643911362, -0.08193022012710571, -0.07635108381509781, -0.0707719475030899, -0.0651928186416626, -0.059613682329654694, -0.05403454601764679, -0.048455413430929184, -0.04287628084421158, -0.037297144532203674, -0.03171800822019577, -0.026138875633478165, -0.02055974304676056, -0.014980606734752655, -0.0094014722853899, -0.0038223378360271454, 0.0017567966133356094, 0.007335931062698364, 0.012915065512061119, 0.018494199961423874, 0.02407333254814148, 0.029652468860149384, 0.03523160517215729, 0.04081073775887489, 0.0463898703455925, 0.0519690066576004, 0.05754814296960831, 0.06312727928161621, 0.06870640814304352, 0.07428554445505142]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 7.0, 11.0, 18.0, 23.0, 29.0, 36.0, 30.0, 37.0, 45.0, 53.0, 55.0, 51.0, 62.0, 53.0, 53.0, 58.0, 64.0, 63.0, 43.0, 37.0, 23.0, 30.0, 21.0, 25.0, 15.0, 15.0, 10.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11900782585144043, -0.11489129811525345, -0.11077477037906647, -0.10665824264287949, -0.1025417149066925, -0.09842517971992493, -0.09430865198373795, -0.09019212424755096, -0.08607559651136398, -0.081959068775177, -0.07784254103899002, -0.07372601330280304, -0.06960947811603546, -0.06549295783042908, -0.0613764226436615, -0.05725989490747452, -0.05314336717128754, -0.049026839435100555, -0.044910311698913574, -0.040793780237436295, -0.03667725250124931, -0.03256072476506233, -0.0284441951662302, -0.02432766556739807, -0.02021113783121109, -0.01609461009502411, -0.011978080496191978, -0.007861551828682423, -0.003745023161172867, 0.0003715045750141144, 0.004488034173846245, 0.008604563772678375, 0.012721091508865356, 0.016837619245052338, 0.020954148843884468, 0.0250706784427166, 0.02918720617890358, 0.03330373391509056, 0.03742026537656784, 0.04153679311275482, 0.0456533208489418, 0.049769848585128784, 0.053886376321315765, 0.058002907782793045, 0.062119435518980026, 0.06623595952987671, 0.07035249471664429, 0.07446902245283127, 0.07858555018901825, 0.08270207792520523, 0.08681860566139221, 0.0909351333975792, 0.09505166113376617, 0.09916819632053375, 0.10328472405672073, 0.10740125179290771, 0.1115177795290947, 0.11563430726528168, 0.11975083500146866, 0.12386736273765564, 0.12798389792442322, 0.1321004182100296, 0.13621695339679718, 0.14033347368240356, 0.14445000886917114]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 10.0, 11.0, 14.0, 13.0, 15.0, 23.0, 23.0, 27.0, 28.0, 30.0, 46.0, 52.0, 59.0, 43.0, 50.0, 66.0, 51.0, 44.0, 47.0, 53.0, 52.0, 40.0, 35.0, 46.0, 28.0, 19.0, 16.0, 13.0, 18.0, 9.0, 6.0, 5.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.5058135986328125, -2.441314697265625, -2.3768157958984375, -2.31231689453125, -2.2478179931640625, -2.183319091796875, -2.1188201904296875, -2.0543212890625, -1.9898223876953125, -1.925323486328125, -1.8608245849609375, -1.79632568359375, -1.7318267822265625, -1.667327880859375, -1.6028289794921875, -1.538330078125, -1.4738311767578125, -1.409332275390625, -1.3448333740234375, -1.28033447265625, -1.2158355712890625, -1.151336669921875, -1.0868377685546875, -1.0223388671875, -0.9578399658203125, -0.893341064453125, -0.8288421630859375, -0.76434326171875, -0.6998443603515625, -0.635345458984375, -0.5708465576171875, -0.50634765625, -0.4418487548828125, -0.377349853515625, -0.3128509521484375, -0.24835205078125, -0.1838531494140625, -0.119354248046875, -0.0548553466796875, 0.0096435546875, 0.0741424560546875, 0.138641357421875, 0.2031402587890625, 0.26763916015625, 0.3321380615234375, 0.396636962890625, 0.4611358642578125, 0.525634765625, 0.5901336669921875, 0.654632568359375, 0.7191314697265625, 0.78363037109375, 0.8481292724609375, 0.912628173828125, 0.9771270751953125, 1.0416259765625, 1.1061248779296875, 1.170623779296875, 1.2351226806640625, 1.29962158203125, 1.3641204833984375, 1.428619384765625, 1.4931182861328125, 1.5576171875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 4.0, 12.0, 10.0, 21.0, 22.0, 33.0, 61.0, 84.0, 127.0, 235.0, 405.0, 711.0, 1077.0, 2028.0, 4211.0, 10548.0, 48069.0, 660959.0, 276478.0, 28068.0, 7830.0, 3385.0, 1736.0, 984.0, 559.0, 346.0, 198.0, 126.0, 80.0, 40.0, 33.0, 25.0, 15.0, 10.0, 5.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0], "bins": [-8.6328125, -8.4215087890625, -8.210205078125, -7.9989013671875, -7.78759765625, -7.5762939453125, -7.364990234375, -7.1536865234375, -6.9423828125, -6.7310791015625, -6.519775390625, -6.3084716796875, -6.09716796875, -5.8858642578125, -5.674560546875, -5.4632568359375, -5.251953125, -5.0406494140625, -4.829345703125, -4.6180419921875, -4.40673828125, -4.1954345703125, -3.984130859375, -3.7728271484375, -3.5615234375, -3.3502197265625, -3.138916015625, -2.9276123046875, -2.71630859375, -2.5050048828125, -2.293701171875, -2.0823974609375, -1.87109375, -1.6597900390625, -1.448486328125, -1.2371826171875, -1.02587890625, -0.8145751953125, -0.603271484375, -0.3919677734375, -0.1806640625, 0.0306396484375, 0.241943359375, 0.4532470703125, 0.66455078125, 0.8758544921875, 1.087158203125, 1.2984619140625, 1.509765625, 1.7210693359375, 1.932373046875, 2.1436767578125, 2.35498046875, 2.5662841796875, 2.777587890625, 2.9888916015625, 3.2001953125, 3.4114990234375, 3.622802734375, 3.8341064453125, 4.04541015625, 4.2567138671875, 4.468017578125, 4.6793212890625, 4.890625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 11.0, 8.0, 14.0, 13.0, 19.0, 24.0, 24.0, 27.0, 41.0, 44.0, 35.0, 50.0, 64.0, 67.0, 104.0, 155.0, 1415.0, 250.0, 141.0, 90.0, 71.0, 62.0, 43.0, 40.0, 33.0, 30.0, 21.0, 22.0, 25.0, 12.0, 10.0, 12.0, 9.0, 7.0, 7.0, 5.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.33984375, -4.1990966796875, -4.058349609375, -3.9176025390625, -3.77685546875, -3.6361083984375, -3.495361328125, -3.3546142578125, -3.2138671875, -3.0731201171875, -2.932373046875, -2.7916259765625, -2.65087890625, -2.5101318359375, -2.369384765625, -2.2286376953125, -2.087890625, -1.9471435546875, -1.806396484375, -1.6656494140625, -1.52490234375, -1.3841552734375, -1.243408203125, -1.1026611328125, -0.9619140625, -0.8211669921875, -0.680419921875, -0.5396728515625, -0.39892578125, -0.2581787109375, -0.117431640625, 0.0233154296875, 0.1640625, 0.3048095703125, 0.445556640625, 0.5863037109375, 0.72705078125, 0.8677978515625, 1.008544921875, 1.1492919921875, 1.2900390625, 1.4307861328125, 1.571533203125, 1.7122802734375, 1.85302734375, 1.9937744140625, 2.134521484375, 2.2752685546875, 2.416015625, 2.5567626953125, 2.697509765625, 2.8382568359375, 2.97900390625, 3.1197509765625, 3.260498046875, 3.4012451171875, 3.5419921875, 3.6827392578125, 3.823486328125, 3.9642333984375, 4.10498046875, 4.2457275390625, 4.386474609375, 4.5272216796875, 4.66796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 3.0, 6.0, 4.0, 9.0, 22.0, 31.0, 40.0, 88.0, 112.0, 249.0, 527.0, 1382.0, 5365.0, 165932.0, 2950324.0, 17471.0, 2506.0, 828.0, 368.0, 180.0, 94.0, 62.0, 29.0, 21.0, 19.0, 7.0, 7.0, 5.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.9375, -20.343505859375, -19.74951171875, -19.155517578125, -18.5615234375, -17.967529296875, -17.37353515625, -16.779541015625, -16.185546875, -15.591552734375, -14.99755859375, -14.403564453125, -13.8095703125, -13.215576171875, -12.62158203125, -12.027587890625, -11.43359375, -10.839599609375, -10.24560546875, -9.651611328125, -9.0576171875, -8.463623046875, -7.86962890625, -7.275634765625, -6.681640625, -6.087646484375, -5.49365234375, -4.899658203125, -4.3056640625, -3.711669921875, -3.11767578125, -2.523681640625, -1.9296875, -1.335693359375, -0.74169921875, -0.147705078125, 0.4462890625, 1.040283203125, 1.63427734375, 2.228271484375, 2.822265625, 3.416259765625, 4.01025390625, 4.604248046875, 5.1982421875, 5.792236328125, 6.38623046875, 6.980224609375, 7.57421875, 8.168212890625, 8.76220703125, 9.356201171875, 9.9501953125, 10.544189453125, 11.13818359375, 11.732177734375, 12.326171875, 12.920166015625, 13.51416015625, 14.108154296875, 14.7021484375, 15.296142578125, 15.89013671875, 16.484130859375, 17.078125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 46.0, 215.0, 504.0, 208.0, 30.0, 5.0, 1.0, 1.0], "bins": [-91.44905090332031, -89.88472747802734, -88.32040405273438, -86.75608825683594, -85.19176483154297, -83.62744140625, -82.06311798095703, -80.49879455566406, -78.9344711303711, -77.37014770507812, -75.80582427978516, -74.24150085449219, -72.67718505859375, -71.11286163330078, -69.54853820800781, -67.98421478271484, -66.41989135742188, -64.8555679321289, -63.2912483215332, -61.726924896240234, -60.162601470947266, -58.59828186035156, -57.033958435058594, -55.469635009765625, -53.90531921386719, -52.34099578857422, -50.776676177978516, -49.21235275268555, -47.64802932739258, -46.083709716796875, -44.519386291503906, -42.95506286621094, -41.3907356262207, -39.826412200927734, -38.26209259033203, -36.69776916503906, -35.133445739746094, -33.569122314453125, -32.00480270385742, -30.440479278564453, -28.87615966796875, -27.311838150024414, -25.747514724731445, -24.18319320678711, -22.61886978149414, -21.054548263549805, -19.49022674560547, -17.9259033203125, -16.36157989501953, -14.797257423400879, -13.232934951782227, -11.66861343383789, -10.104290962219238, -8.539968490600586, -6.97564697265625, -5.411324501037598, -3.8470029830932617, -2.2826807498931885, -0.7183585166931152, 0.8459634780883789, 2.4102859497070312, 3.9746084213256836, 5.5389299392700195, 7.103252410888672, 8.667574882507324]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 14.0, 7.0, 19.0, 18.0, 16.0, 27.0, 25.0, 17.0, 29.0, 28.0, 36.0, 40.0, 35.0, 43.0, 37.0, 56.0, 49.0, 31.0, 47.0, 46.0, 40.0, 47.0, 27.0, 37.0, 36.0, 29.0, 21.0, 21.0, 26.0, 15.0, 21.0, 23.0, 7.0, 6.0, 6.0, 7.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.397384643554688, -11.978484153747559, -11.559584617614746, -11.140684127807617, -10.721783638000488, -10.302884101867676, -9.883983612060547, -9.465084075927734, -9.046183586120605, -8.627283096313477, -8.208383560180664, -7.789483070373535, -7.3705830574035645, -6.951683044433594, -6.532782554626465, -6.113882541656494, -5.694982051849365, -5.2760820388793945, -4.857181549072266, -4.438281536102295, -4.019381523132324, -3.6004812717437744, -3.1815810203552246, -2.762681007385254, -2.343780755996704, -1.9248806238174438, -1.5059804916381836, -1.0870802402496338, -0.6681801080703735, -0.24927997589111328, 0.16962027549743652, 0.5885202884674072, 1.007420539855957, 1.4263206720352173, 1.8452208042144775, 2.2641210556030273, 2.683021068572998, 3.101921319961548, 3.5208215713500977, 3.9397215843200684, 4.358621597290039, 4.77752161026001, 5.196422100067139, 5.615322113037109, 6.03422212600708, 6.453122138977051, 6.87202262878418, 7.29092264175415, 7.709823131561279, 8.12872314453125, 8.547623634338379, 8.966524124145508, 9.38542366027832, 9.80432415008545, 10.223224639892578, 10.64212417602539, 11.06102466583252, 11.479925155639648, 11.898824691772461, 12.31772518157959, 12.736625671386719, 13.155525207519531, 13.57442569732666, 13.993326187133789, 14.412225723266602]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 4.0, 9.0, 11.0, 10.0, 19.0, 20.0, 19.0, 19.0, 19.0, 38.0, 33.0, 36.0, 45.0, 45.0, 46.0, 49.0, 55.0, 47.0, 59.0, 49.0, 49.0, 53.0, 45.0, 29.0, 34.0, 31.0, 20.0, 16.0, 19.0, 21.0, 11.0, 11.0, 9.0, 2.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-2.61328125, -2.54840087890625, -2.4835205078125, -2.41864013671875, -2.353759765625, -2.28887939453125, -2.2239990234375, -2.15911865234375, -2.09423828125, -2.02935791015625, -1.9644775390625, -1.89959716796875, -1.834716796875, -1.76983642578125, -1.7049560546875, -1.64007568359375, -1.5751953125, -1.51031494140625, -1.4454345703125, -1.38055419921875, -1.315673828125, -1.25079345703125, -1.1859130859375, -1.12103271484375, -1.05615234375, -0.99127197265625, -0.9263916015625, -0.86151123046875, -0.796630859375, -0.73175048828125, -0.6668701171875, -0.60198974609375, -0.537109375, -0.47222900390625, -0.4073486328125, -0.34246826171875, -0.277587890625, -0.21270751953125, -0.1478271484375, -0.08294677734375, -0.01806640625, 0.04681396484375, 0.1116943359375, 0.17657470703125, 0.241455078125, 0.30633544921875, 0.3712158203125, 0.43609619140625, 0.5009765625, 0.56585693359375, 0.6307373046875, 0.69561767578125, 0.760498046875, 0.82537841796875, 0.8902587890625, 0.95513916015625, 1.02001953125, 1.08489990234375, 1.1497802734375, 1.21466064453125, 1.279541015625, 1.34442138671875, 1.4093017578125, 1.47418212890625, 1.5390625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 11.0, 20.0, 17.0, 36.0, 60.0, 78.0, 132.0, 189.0, 266.0, 491.0, 793.0, 1343.0, 2452.0, 4732.0, 10977.0, 33363.0, 236001.0, 2913592.0, 888643.0, 69369.0, 17775.0, 6808.0, 3171.0, 1669.0, 918.0, 561.0, 303.0, 183.0, 103.0, 75.0, 48.0, 33.0, 14.0, 15.0, 13.0, 3.0, 2.0], "bins": [-7.34375, -7.1795654296875, -7.015380859375, -6.8511962890625, -6.68701171875, -6.5228271484375, -6.358642578125, -6.1944580078125, -6.0302734375, -5.8660888671875, -5.701904296875, -5.5377197265625, -5.37353515625, -5.2093505859375, -5.045166015625, -4.8809814453125, -4.716796875, -4.5526123046875, -4.388427734375, -4.2242431640625, -4.06005859375, -3.8958740234375, -3.731689453125, -3.5675048828125, -3.4033203125, -3.2391357421875, -3.074951171875, -2.9107666015625, -2.74658203125, -2.5823974609375, -2.418212890625, -2.2540283203125, -2.08984375, -1.9256591796875, -1.761474609375, -1.5972900390625, -1.43310546875, -1.2689208984375, -1.104736328125, -0.9405517578125, -0.7763671875, -0.6121826171875, -0.447998046875, -0.2838134765625, -0.11962890625, 0.0445556640625, 0.208740234375, 0.3729248046875, 0.537109375, 0.7012939453125, 0.865478515625, 1.0296630859375, 1.19384765625, 1.3580322265625, 1.522216796875, 1.6864013671875, 1.8505859375, 2.0147705078125, 2.178955078125, 2.3431396484375, 2.50732421875, 2.6715087890625, 2.835693359375, 2.9998779296875, 3.1640625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 11.0, 11.0, 17.0, 16.0, 25.0, 31.0, 42.0, 50.0, 77.0, 104.0, 178.0, 267.0, 483.0, 684.0, 736.0, 471.0, 254.0, 171.0, 105.0, 73.0, 54.0, 36.0, 30.0, 30.0, 20.0, 17.0, 7.0, 6.0, 12.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.01953125, -3.904693603515625, -3.78985595703125, -3.675018310546875, -3.5601806640625, -3.445343017578125, -3.33050537109375, -3.215667724609375, -3.100830078125, -2.985992431640625, -2.87115478515625, -2.756317138671875, -2.6414794921875, -2.526641845703125, -2.41180419921875, -2.296966552734375, -2.18212890625, -2.067291259765625, -1.95245361328125, -1.837615966796875, -1.7227783203125, -1.607940673828125, -1.49310302734375, -1.378265380859375, -1.263427734375, -1.148590087890625, -1.03375244140625, -0.918914794921875, -0.8040771484375, -0.689239501953125, -0.57440185546875, -0.459564208984375, -0.3447265625, -0.229888916015625, -0.11505126953125, -0.000213623046875, 0.1146240234375, 0.229461669921875, 0.34429931640625, 0.459136962890625, 0.573974609375, 0.688812255859375, 0.80364990234375, 0.918487548828125, 1.0333251953125, 1.148162841796875, 1.26300048828125, 1.377838134765625, 1.49267578125, 1.607513427734375, 1.72235107421875, 1.837188720703125, 1.9520263671875, 2.066864013671875, 2.18170166015625, 2.296539306640625, 2.411376953125, 2.526214599609375, 2.64105224609375, 2.755889892578125, 2.8707275390625, 2.985565185546875, 3.10040283203125, 3.215240478515625, 3.330078125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 7.0, 9.0, 9.0, 13.0, 10.0, 23.0, 19.0, 38.0, 38.0, 52.0, 87.0, 159.0, 379.0, 1086.0, 4562.0, 24410.0, 465834.0, 3609961.0, 74478.0, 9773.0, 2076.0, 636.0, 230.0, 126.0, 63.0, 49.0, 33.0, 27.0, 22.0, 18.0, 11.0, 12.0, 3.0, 2.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8359375, -11.444580078125, -11.05322265625, -10.661865234375, -10.2705078125, -9.879150390625, -9.48779296875, -9.096435546875, -8.705078125, -8.313720703125, -7.92236328125, -7.531005859375, -7.1396484375, -6.748291015625, -6.35693359375, -5.965576171875, -5.57421875, -5.182861328125, -4.79150390625, -4.400146484375, -4.0087890625, -3.617431640625, -3.22607421875, -2.834716796875, -2.443359375, -2.052001953125, -1.66064453125, -1.269287109375, -0.8779296875, -0.486572265625, -0.09521484375, 0.296142578125, 0.6875, 1.078857421875, 1.47021484375, 1.861572265625, 2.2529296875, 2.644287109375, 3.03564453125, 3.427001953125, 3.818359375, 4.209716796875, 4.60107421875, 4.992431640625, 5.3837890625, 5.775146484375, 6.16650390625, 6.557861328125, 6.94921875, 7.340576171875, 7.73193359375, 8.123291015625, 8.5146484375, 8.906005859375, 9.29736328125, 9.688720703125, 10.080078125, 10.471435546875, 10.86279296875, 11.254150390625, 11.6455078125, 12.036865234375, 12.42822265625, 12.819580078125, 13.2109375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 10.0, 51.0, 125.0, 301.0, 306.0, 148.0, 43.0, 12.0, 12.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.43632125854492, -42.90555953979492, -41.37479782104492, -39.84403991699219, -38.31327819824219, -36.78251647949219, -35.25175476074219, -33.72099304199219, -32.19023513793945, -30.659473419189453, -29.128713607788086, -27.597951889038086, -26.06719207763672, -24.53643035888672, -23.00566864013672, -21.47490882873535, -19.94414710998535, -18.41338539123535, -16.882625579833984, -15.351863861083984, -13.821104049682617, -12.290342330932617, -10.759581565856934, -9.22882080078125, -7.698060035705566, -6.167299270629883, -4.636538505554199, -3.1057772636413574, -1.5750164985656738, -0.044255733489990234, 1.4865055084228516, 3.017266273498535, 4.548027038574219, 6.078787803649902, 7.609548568725586, 9.140310287475586, 10.671070098876953, 12.201831817626953, 13.732592582702637, 15.26335334777832, 16.794113159179688, 18.324874877929688, 19.855634689331055, 21.386396408081055, 22.917156219482422, 24.447917938232422, 25.978679656982422, 27.50943946838379, 29.04020118713379, 30.57096290588379, 32.101722717285156, 33.632484436035156, 35.163246154785156, 36.69400405883789, 38.22476577758789, 39.75552749633789, 41.28628921508789, 42.81705093383789, 44.34781265258789, 45.878570556640625, 47.409332275390625, 48.940093994140625, 50.470855712890625, 52.001617431640625, 53.53237533569336]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 6.0, 9.0, 9.0, 13.0, 13.0, 13.0, 17.0, 27.0, 18.0, 24.0, 24.0, 18.0, 35.0, 30.0, 27.0, 31.0, 36.0, 51.0, 42.0, 34.0, 39.0, 38.0, 43.0, 34.0, 34.0, 37.0, 48.0, 31.0, 33.0, 20.0, 21.0, 26.0, 26.0, 28.0, 11.0, 12.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.662485122680664, -10.342297554016113, -10.022109985351562, -9.701922416687012, -9.381734848022461, -9.061546325683594, -8.741358757019043, -8.421171188354492, -8.100983619689941, -7.780796051025391, -7.46060848236084, -7.140420436859131, -6.82023286819458, -6.500045299530029, -6.17985725402832, -5.8596696853637695, -5.539482116699219, -5.219294548034668, -4.899106979370117, -4.578918933868408, -4.258731365203857, -3.9385437965393066, -3.6183559894561768, -3.298168182373047, -2.977980613708496, -2.6577930450439453, -2.3376052379608154, -2.0174174308776855, -1.6972298622131348, -1.3770421743392944, -1.056854486465454, -0.7366666793823242, -0.41647815704345703, -0.0962904691696167, 0.22389721870422363, 0.544084906578064, 0.8642725944519043, 1.1844602823257446, 1.504647970199585, 1.8248357772827148, 2.1450233459472656, 2.4652109146118164, 2.7853987216949463, 3.105586528778076, 3.425774097442627, 3.7459616661071777, 4.066149711608887, 4.3863372802734375, 4.706524848937988, 5.026712417602539, 5.34689998626709, 5.667088031768799, 5.98727560043335, 6.3074631690979, 6.627651214599609, 6.94783878326416, 7.268026351928711, 7.588213920593262, 7.9084014892578125, 8.228589057922363, 8.548776626586914, 8.868965148925781, 9.189152717590332, 9.509340286254883, 9.829527854919434]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 2.0, 8.0, 9.0, 6.0, 7.0, 13.0, 10.0, 17.0, 23.0, 26.0, 26.0, 30.0, 37.0, 39.0, 33.0, 40.0, 46.0, 42.0, 57.0, 44.0, 43.0, 47.0, 41.0, 37.0, 47.0, 38.0, 32.0, 28.0, 29.0, 21.0, 22.0, 21.0, 18.0, 19.0, 7.0, 9.0, 5.0, 4.0, 6.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7448883056640625, -1.689971923828125, -1.6350555419921875, -1.58013916015625, -1.5252227783203125, -1.470306396484375, -1.4153900146484375, -1.3604736328125, -1.3055572509765625, -1.250640869140625, -1.1957244873046875, -1.14080810546875, -1.0858917236328125, -1.030975341796875, -0.9760589599609375, -0.921142578125, -0.8662261962890625, -0.811309814453125, -0.7563934326171875, -0.70147705078125, -0.6465606689453125, -0.591644287109375, -0.5367279052734375, -0.4818115234375, -0.4268951416015625, -0.371978759765625, -0.3170623779296875, -0.26214599609375, -0.2072296142578125, -0.152313232421875, -0.0973968505859375, -0.04248046875, 0.0124359130859375, 0.067352294921875, 0.1222686767578125, 0.17718505859375, 0.2321014404296875, 0.287017822265625, 0.3419342041015625, 0.3968505859375, 0.4517669677734375, 0.506683349609375, 0.5615997314453125, 0.61651611328125, 0.6714324951171875, 0.726348876953125, 0.7812652587890625, 0.836181640625, 0.8910980224609375, 0.946014404296875, 1.0009307861328125, 1.05584716796875, 1.1107635498046875, 1.165679931640625, 1.2205963134765625, 1.2755126953125, 1.3304290771484375, 1.385345458984375, 1.4402618408203125, 1.49517822265625, 1.5500946044921875, 1.605010986328125, 1.6599273681640625, 1.71484375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 12.0, 5.0, 15.0, 29.0, 33.0, 68.0, 89.0, 117.0, 201.0, 335.0, 569.0, 920.0, 1626.0, 2788.0, 5061.0, 9450.0, 18494.0, 37451.0, 84228.0, 217727.0, 369113.0, 167840.0, 67697.0, 31105.0, 15360.0, 8074.0, 4284.0, 2378.0, 1351.0, 811.0, 485.0, 313.0, 168.0, 127.0, 91.0, 44.0, 30.0, 23.0, 10.0, 12.0, 4.0, 7.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.372802734375, -0.3622627258300781, -0.35172271728515625, -0.3411827087402344, -0.3306427001953125, -0.3201026916503906, -0.30956268310546875, -0.2990226745605469, -0.288482666015625, -0.2779426574707031, -0.26740264892578125, -0.2568626403808594, -0.2463226318359375, -0.23578262329101562, -0.22524261474609375, -0.21470260620117188, -0.20416259765625, -0.19362258911132812, -0.18308258056640625, -0.17254257202148438, -0.1620025634765625, -0.15146255493164062, -0.14092254638671875, -0.13038253784179688, -0.119842529296875, -0.10930252075195312, -0.09876251220703125, -0.08822250366210938, -0.0776824951171875, -0.06714248657226562, -0.05660247802734375, -0.046062469482421875, -0.0355224609375, -0.024982452392578125, -0.01444244384765625, -0.003902435302734375, 0.0066375732421875, 0.017177581787109375, 0.02771759033203125, 0.038257598876953125, 0.048797607421875, 0.059337615966796875, 0.06987762451171875, 0.08041763305664062, 0.0909576416015625, 0.10149765014648438, 0.11203765869140625, 0.12257766723632812, 0.13311767578125, 0.14365768432617188, 0.15419769287109375, 0.16473770141601562, 0.1752777099609375, 0.18581771850585938, 0.19635772705078125, 0.20689773559570312, 0.217437744140625, 0.22797775268554688, 0.23851776123046875, 0.24905776977539062, 0.2595977783203125, 0.2701377868652344, 0.28067779541015625, 0.2912178039550781, 0.3017578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 1.0, 8.0, 7.0, 3.0, 2.0, 12.0, 12.0, 11.0, 17.0, 18.0, 9.0, 22.0, 17.0, 22.0, 30.0, 26.0, 32.0, 33.0, 31.0, 27.0, 41.0, 46.0, 47.0, 1056.0, 37.0, 39.0, 38.0, 38.0, 36.0, 41.0, 41.0, 31.0, 29.0, 22.0, 18.0, 18.0, 14.0, 22.0, 10.0, 13.0, 8.0, 9.0, 9.0, 5.0, 3.0, 7.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9097061157226562, -0.8755645751953125, -0.8414230346679688, -0.807281494140625, -0.7731399536132812, -0.7389984130859375, -0.7048568725585938, -0.67071533203125, -0.6365737915039062, -0.6024322509765625, -0.5682907104492188, -0.534149169921875, -0.5000076293945312, -0.4658660888671875, -0.43172454833984375, -0.3975830078125, -0.36344146728515625, -0.3292999267578125, -0.29515838623046875, -0.261016845703125, -0.22687530517578125, -0.1927337646484375, -0.15859222412109375, -0.12445068359375, -0.09030914306640625, -0.0561676025390625, -0.02202606201171875, 0.012115478515625, 0.04625701904296875, 0.0803985595703125, 0.11454010009765625, 0.148681640625, 0.18282318115234375, 0.2169647216796875, 0.25110626220703125, 0.285247802734375, 0.31938934326171875, 0.3535308837890625, 0.38767242431640625, 0.42181396484375, 0.45595550537109375, 0.4900970458984375, 0.5242385864257812, 0.558380126953125, 0.5925216674804688, 0.6266632080078125, 0.6608047485351562, 0.6949462890625, 0.7290878295898438, 0.7632293701171875, 0.7973709106445312, 0.831512451171875, 0.8656539916992188, 0.8997955322265625, 0.9339370727539062, 0.96807861328125, 1.0022201538085938, 1.0363616943359375, 1.0705032348632812, 1.104644775390625, 1.1387863159179688, 1.1729278564453125, 1.2070693969726562, 1.2412109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 12.0, 13.0, 17.0, 28.0, 56.0, 55.0, 78.0, 107.0, 234.0, 370.0, 687.0, 1311.0, 2654.0, 5600.0, 13093.0, 44420.0, 1878037.0, 115750.0, 19419.0, 7765.0, 3476.0, 1728.0, 928.0, 459.0, 303.0, 180.0, 114.0, 75.0, 52.0, 28.0, 19.0, 21.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6388702392578125, -0.616607666015625, -0.5943450927734375, -0.57208251953125, -0.5498199462890625, -0.527557373046875, -0.5052947998046875, -0.4830322265625, -0.4607696533203125, -0.438507080078125, -0.4162445068359375, -0.39398193359375, -0.3717193603515625, -0.349456787109375, -0.3271942138671875, -0.304931640625, -0.2826690673828125, -0.260406494140625, -0.2381439208984375, -0.21588134765625, -0.1936187744140625, -0.171356201171875, -0.1490936279296875, -0.1268310546875, -0.1045684814453125, -0.082305908203125, -0.0600433349609375, -0.03778076171875, -0.0155181884765625, 0.006744384765625, 0.0290069580078125, 0.05126953125, 0.0735321044921875, 0.095794677734375, 0.1180572509765625, 0.14031982421875, 0.1625823974609375, 0.184844970703125, 0.2071075439453125, 0.2293701171875, 0.2516326904296875, 0.273895263671875, 0.2961578369140625, 0.31842041015625, 0.3406829833984375, 0.362945556640625, 0.3852081298828125, 0.407470703125, 0.4297332763671875, 0.451995849609375, 0.4742584228515625, 0.49652099609375, 0.5187835693359375, 0.541046142578125, 0.5633087158203125, 0.5855712890625, 0.6078338623046875, 0.630096435546875, 0.6523590087890625, 0.67462158203125, 0.6968841552734375, 0.719146728515625, 0.7414093017578125, 0.763671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 8.0, 7.0, 20.0, 17.0, 29.0, 40.0, 40.0, 63.0, 62.0, 79.0, 91.0, 85.0, 78.0, 62.0, 74.0, 47.0, 29.0, 29.0, 19.0, 22.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0189361572265625, -0.018323421478271484, -0.01771068572998047, -0.017097949981689453, -0.016485214233398438, -0.015872478485107422, -0.015259742736816406, -0.01464700698852539, -0.014034271240234375, -0.01342153549194336, -0.012808799743652344, -0.012196063995361328, -0.011583328247070312, -0.010970592498779297, -0.010357856750488281, -0.009745121002197266, -0.00913238525390625, -0.008519649505615234, -0.007906913757324219, -0.007294178009033203, -0.0066814422607421875, -0.006068706512451172, -0.005455970764160156, -0.004843235015869141, -0.004230499267578125, -0.0036177635192871094, -0.0030050277709960938, -0.002392292022705078, -0.0017795562744140625, -0.0011668205261230469, -0.0005540847778320312, 5.8650970458984375e-05, 0.00067138671875, 0.0012841224670410156, 0.0018968582153320312, 0.002509593963623047, 0.0031223297119140625, 0.003735065460205078, 0.004347801208496094, 0.004960536956787109, 0.005573272705078125, 0.006186008453369141, 0.006798744201660156, 0.007411479949951172, 0.008024215698242188, 0.008636951446533203, 0.009249687194824219, 0.009862422943115234, 0.01047515869140625, 0.011087894439697266, 0.011700630187988281, 0.012313365936279297, 0.012926101684570312, 0.013538837432861328, 0.014151573181152344, 0.01476430892944336, 0.015377044677734375, 0.01598978042602539, 0.016602516174316406, 0.017215251922607422, 0.017827987670898438, 0.018440723419189453, 0.01905345916748047, 0.019666194915771484, 0.0202789306640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 12.0, 13.0, 10.0, 21.0, 22.0, 30.0, 28.0, 49.0, 88.0, 124.0, 209.0, 346.0, 989.0, 9356.0, 698326.0, 331680.0, 5590.0, 747.0, 328.0, 158.0, 133.0, 82.0, 45.0, 39.0, 24.0, 24.0, 8.0, 14.0, 13.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3115234375, -0.3017616271972656, -0.29199981689453125, -0.2822380065917969, -0.2724761962890625, -0.2627143859863281, -0.25295257568359375, -0.24319076538085938, -0.233428955078125, -0.22366714477539062, -0.21390533447265625, -0.20414352416992188, -0.1943817138671875, -0.18461990356445312, -0.17485809326171875, -0.16509628295898438, -0.15533447265625, -0.14557266235351562, -0.13581085205078125, -0.12604904174804688, -0.1162872314453125, -0.10652542114257812, -0.09676361083984375, -0.08700180053710938, -0.077239990234375, -0.06747817993164062, -0.05771636962890625, -0.047954559326171875, -0.0381927490234375, -0.028430938720703125, -0.01866912841796875, -0.008907318115234375, 0.0008544921875, 0.010616302490234375, 0.02037811279296875, 0.030139923095703125, 0.0399017333984375, 0.049663543701171875, 0.05942535400390625, 0.06918716430664062, 0.078948974609375, 0.08871078491210938, 0.09847259521484375, 0.10823440551757812, 0.1179962158203125, 0.12775802612304688, 0.13751983642578125, 0.14728164672851562, 0.15704345703125, 0.16680526733398438, 0.17656707763671875, 0.18632888793945312, 0.1960906982421875, 0.20585250854492188, 0.21561431884765625, 0.22537612915039062, 0.235137939453125, 0.24489974975585938, 0.25466156005859375, 0.2644233703613281, 0.2741851806640625, 0.2839469909667969, 0.29370880126953125, 0.3034706115722656, 0.313232421875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 22.0, 117.0, 529.0, 284.0, 43.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2698521912097931, -0.26323044300079346, -0.25660866498947144, -0.2499869167804718, -0.24336516857147217, -0.23674340546131134, -0.2301216423511505, -0.22349989414215088, -0.21687813103199005, -0.21025636792182922, -0.2036346197128296, -0.19701285660266876, -0.19039110839366913, -0.1837693452835083, -0.17714759707450867, -0.17052583396434784, -0.163904070854187, -0.15728230774402618, -0.15066055953502655, -0.14403879642486572, -0.1374170482158661, -0.13079528510570526, -0.12417352944612503, -0.1175517737865448, -0.11093002557754517, -0.10430826991796494, -0.0976865142583847, -0.09106475114822388, -0.08444299548864365, -0.07782123982906342, -0.07119948416948318, -0.06457772850990295, -0.057955965399742126, -0.051334209740161896, -0.04471245035529137, -0.038090694695711136, -0.03146893531084061, -0.024847179651260376, -0.018225423991680145, -0.011603664606809616, -0.004981908947229385, 0.0016398481093347073, 0.0082616051658988, 0.014883361756801605, 0.021505119279026985, 0.028126876801252365, 0.034748632460832596, 0.041370391845703125, 0.047992147505283356, 0.054613903164863586, 0.061235662549734116, 0.06785741448402405, 0.07447917759418488, 0.0811009332537651, 0.08772268891334534, 0.09434445202350616, 0.1009662002325058, 0.10758795589208603, 0.11420971155166626, 0.12083147466182709, 0.12745322287082672, 0.13407498598098755, 0.14069673418998718, 0.147318497300148, 0.15394026041030884]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 5.0, 10.0, 14.0, 11.0, 15.0, 14.0, 25.0, 23.0, 31.0, 27.0, 23.0, 29.0, 36.0, 38.0, 34.0, 47.0, 34.0, 44.0, 45.0, 47.0, 33.0, 42.0, 44.0, 31.0, 33.0, 30.0, 36.0, 31.0, 27.0, 23.0, 26.0, 15.0, 12.0, 17.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.021211862564086914, -0.020591430366039276, -0.019971000030636787, -0.0193505696952343, -0.01873013749718666, -0.018109705299139023, -0.017489274963736534, -0.016868844628334045, -0.016248412430286407, -0.01562798023223877, -0.01500754989683628, -0.014387118630111217, -0.013766687363386154, -0.01314625609666109, -0.012525824829936028, -0.011905393563210964, -0.011284962296485901, -0.010664531029760838, -0.010044099763035774, -0.009423668496310711, -0.008803237229585648, -0.008182805962860584, -0.007562374696135521, -0.006941943429410458, -0.006321512162685394, -0.005701080895960331, -0.005080649629235268, -0.004460218362510204, -0.003839787095785141, -0.0032193558290600777, -0.0025989245623350143, -0.001978493295609951, -0.0013580620288848877, -0.0007376307621598244, -0.00011719949543476105, 0.0005032317712903023, 0.0011236630380153656, 0.001744094304740429, 0.0023645255714654922, 0.0029849568381905556, 0.003605388104915619, 0.004225819371640682, 0.0048462506383657455, 0.005466681905090809, 0.006087113171815872, 0.0067075444385409355, 0.007327975705265999, 0.007948406971991062, 0.008568838238716125, 0.009189269505441189, 0.009809700772166252, 0.010430132038891315, 0.011050563305616379, 0.011670994572341442, 0.012291425839066505, 0.012911857105791569, 0.013532288372516632, 0.014152719639241695, 0.014773150905966759, 0.015393582172691822, 0.016014013439416885, 0.016634445637464523, 0.017254875972867012, 0.0178753063082695, 0.01849573850631714]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 2.0, 8.0, 10.0, 5.0, 7.0, 13.0, 10.0, 17.0, 24.0, 26.0, 25.0, 31.0, 37.0, 38.0, 33.0, 40.0, 48.0, 43.0, 54.0, 44.0, 44.0, 46.0, 44.0, 37.0, 44.0, 37.0, 33.0, 30.0, 26.0, 23.0, 21.0, 21.0, 18.0, 19.0, 7.0, 9.0, 5.0, 4.0, 6.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798828125, -1.7439117431640625, -1.688995361328125, -1.6340789794921875, -1.57916259765625, -1.5242462158203125, -1.469329833984375, -1.4144134521484375, -1.3594970703125, -1.3045806884765625, -1.249664306640625, -1.1947479248046875, -1.13983154296875, -1.0849151611328125, -1.029998779296875, -0.9750823974609375, -0.920166015625, -0.8652496337890625, -0.810333251953125, -0.7554168701171875, -0.70050048828125, -0.6455841064453125, -0.590667724609375, -0.5357513427734375, -0.4808349609375, -0.4259185791015625, -0.371002197265625, -0.3160858154296875, -0.26116943359375, -0.2062530517578125, -0.151336669921875, -0.0964202880859375, -0.04150390625, 0.0134124755859375, 0.068328857421875, 0.1232452392578125, 0.17816162109375, 0.2330780029296875, 0.287994384765625, 0.3429107666015625, 0.3978271484375, 0.4527435302734375, 0.507659912109375, 0.5625762939453125, 0.61749267578125, 0.6724090576171875, 0.727325439453125, 0.7822418212890625, 0.837158203125, 0.8920745849609375, 0.946990966796875, 1.0019073486328125, 1.05682373046875, 1.1117401123046875, 1.166656494140625, 1.2215728759765625, 1.2764892578125, 1.3314056396484375, 1.386322021484375, 1.4412384033203125, 1.49615478515625, 1.5510711669921875, 1.605987548828125, 1.6609039306640625, 1.7158203125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 13.0, 10.0, 14.0, 20.0, 25.0, 63.0, 74.0, 131.0, 205.0, 343.0, 641.0, 1197.0, 2208.0, 4454.0, 9225.0, 20994.0, 56662.0, 192424.0, 514247.0, 160816.0, 49074.0, 18827.0, 8311.0, 3998.0, 2069.0, 1045.0, 602.0, 303.0, 235.0, 114.0, 76.0, 35.0, 24.0, 16.0, 13.0, 12.0, 10.0, 12.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.822265625, -2.73785400390625, -2.6534423828125, -2.56903076171875, -2.484619140625, -2.40020751953125, -2.3157958984375, -2.23138427734375, -2.14697265625, -2.06256103515625, -1.9781494140625, -1.89373779296875, -1.809326171875, -1.72491455078125, -1.6405029296875, -1.55609130859375, -1.4716796875, -1.38726806640625, -1.3028564453125, -1.21844482421875, -1.134033203125, -1.04962158203125, -0.9652099609375, -0.88079833984375, -0.79638671875, -0.71197509765625, -0.6275634765625, -0.54315185546875, -0.458740234375, -0.37432861328125, -0.2899169921875, -0.20550537109375, -0.12109375, -0.03668212890625, 0.0477294921875, 0.13214111328125, 0.216552734375, 0.30096435546875, 0.3853759765625, 0.46978759765625, 0.55419921875, 0.63861083984375, 0.7230224609375, 0.80743408203125, 0.891845703125, 0.97625732421875, 1.0606689453125, 1.14508056640625, 1.2294921875, 1.31390380859375, 1.3983154296875, 1.48272705078125, 1.567138671875, 1.65155029296875, 1.7359619140625, 1.82037353515625, 1.90478515625, 1.98919677734375, 2.0736083984375, 2.15802001953125, 2.242431640625, 2.32684326171875, 2.4112548828125, 2.49566650390625, 2.580078125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 7.0, 17.0, 12.0, 16.0, 15.0, 11.0, 21.0, 30.0, 26.0, 37.0, 29.0, 41.0, 44.0, 54.0, 73.0, 95.0, 173.0, 1359.0, 285.0, 177.0, 98.0, 58.0, 41.0, 30.0, 25.0, 33.0, 26.0, 29.0, 25.0, 24.0, 21.0, 15.0, 11.0, 13.0, 7.0, 7.0, 8.0, 9.0, 3.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.37109375, -4.2340087890625, -4.096923828125, -3.9598388671875, -3.82275390625, -3.6856689453125, -3.548583984375, -3.4114990234375, -3.2744140625, -3.1373291015625, -3.000244140625, -2.8631591796875, -2.72607421875, -2.5889892578125, -2.451904296875, -2.3148193359375, -2.177734375, -2.0406494140625, -1.903564453125, -1.7664794921875, -1.62939453125, -1.4923095703125, -1.355224609375, -1.2181396484375, -1.0810546875, -0.9439697265625, -0.806884765625, -0.6697998046875, -0.53271484375, -0.3956298828125, -0.258544921875, -0.1214599609375, 0.015625, 0.1527099609375, 0.289794921875, 0.4268798828125, 0.56396484375, 0.7010498046875, 0.838134765625, 0.9752197265625, 1.1123046875, 1.2493896484375, 1.386474609375, 1.5235595703125, 1.66064453125, 1.7977294921875, 1.934814453125, 2.0718994140625, 2.208984375, 2.3460693359375, 2.483154296875, 2.6202392578125, 2.75732421875, 2.8944091796875, 3.031494140625, 3.1685791015625, 3.3056640625, 3.4427490234375, 3.579833984375, 3.7169189453125, 3.85400390625, 3.9910888671875, 4.128173828125, 4.2652587890625, 4.40234375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 5.0, 6.0, 4.0, 1.0, 9.0, 7.0, 6.0, 7.0, 14.0, 19.0, 13.0, 18.0, 25.0, 26.0, 53.0, 47.0, 70.0, 85.0, 95.0, 115.0, 207.0, 403.0, 1065.0, 4586.0, 42310.0, 2136986.0, 927291.0, 26631.0, 3552.0, 880.0, 357.0, 222.0, 128.0, 104.0, 74.0, 63.0, 55.0, 24.0, 27.0, 26.0, 21.0, 16.0, 12.0, 11.0, 10.0, 5.0, 7.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.1171875, -7.8458251953125, -7.574462890625, -7.3031005859375, -7.03173828125, -6.7603759765625, -6.489013671875, -6.2176513671875, -5.9462890625, -5.6749267578125, -5.403564453125, -5.1322021484375, -4.86083984375, -4.5894775390625, -4.318115234375, -4.0467529296875, -3.775390625, -3.5040283203125, -3.232666015625, -2.9613037109375, -2.68994140625, -2.4185791015625, -2.147216796875, -1.8758544921875, -1.6044921875, -1.3331298828125, -1.061767578125, -0.7904052734375, -0.51904296875, -0.2476806640625, 0.023681640625, 0.2950439453125, 0.56640625, 0.8377685546875, 1.109130859375, 1.3804931640625, 1.65185546875, 1.9232177734375, 2.194580078125, 2.4659423828125, 2.7373046875, 3.0086669921875, 3.280029296875, 3.5513916015625, 3.82275390625, 4.0941162109375, 4.365478515625, 4.6368408203125, 4.908203125, 5.1795654296875, 5.450927734375, 5.7222900390625, 5.99365234375, 6.2650146484375, 6.536376953125, 6.8077392578125, 7.0791015625, 7.3504638671875, 7.621826171875, 7.8931884765625, 8.16455078125, 8.4359130859375, 8.707275390625, 8.9786376953125, 9.25]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 5.0, 22.0, 101.0, 309.0, 375.0, 162.0, 33.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.595501899719238, -3.6967477798461914, -2.7979938983917236, -1.8992400169372559, -1.000485897064209, -0.10173177719116211, 0.7970218658447266, 1.6957759857177734, 2.5945301055908203, 3.493284225463867, 4.392038345336914, 5.290791988372803, 6.18954610824585, 7.0883002281188965, 7.987053871154785, 8.885807991027832, 9.784562110900879, 10.683316230773926, 11.582070350646973, 12.480823516845703, 13.37957763671875, 14.278331756591797, 15.177085876464844, 16.07583999633789, 16.974594116210938, 17.873348236083984, 18.77210235595703, 19.670856475830078, 20.569610595703125, 21.468364715576172, 22.36711883544922, 23.265872955322266, 24.164627075195312, 25.06338119506836, 25.962135314941406, 26.860889434814453, 27.7596435546875, 28.658397674560547, 29.557151794433594, 30.45590591430664, 31.354660034179688, 32.253414154052734, 33.15216827392578, 34.05092239379883, 34.949676513671875, 35.84843063354492, 36.74718475341797, 37.645938873291016, 38.54469299316406, 39.44344711303711, 40.342201232910156, 41.2409553527832, 42.13970947265625, 43.0384635925293, 43.937217712402344, 44.83597183227539, 45.73472213745117, 46.63347625732422, 47.532230377197266, 48.43098449707031, 49.32973861694336, 50.228492736816406, 51.12724685668945, 52.0260009765625, 52.92475509643555]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 3.0, 3.0, 11.0, 16.0, 15.0, 16.0, 14.0, 19.0, 19.0, 23.0, 29.0, 26.0, 32.0, 28.0, 25.0, 40.0, 51.0, 38.0, 40.0, 47.0, 47.0, 32.0, 57.0, 49.0, 48.0, 40.0, 32.0, 25.0, 32.0, 27.0, 23.0, 12.0, 12.0, 9.0, 6.0, 4.0, 11.0, 3.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.108867645263672, -10.720108032226562, -10.331348419189453, -9.942587852478027, -9.553828239440918, -9.165068626403809, -8.7763090133667, -8.387548446655273, -7.998788833618164, -7.610029220581055, -7.221269130706787, -6.832509517669678, -6.44374942779541, -6.054989814758301, -5.666230201721191, -5.277470111846924, -4.8887104988098145, -4.499950885772705, -4.1111907958984375, -3.722431182861328, -3.3336710929870605, -2.944911479949951, -2.5561516284942627, -2.167391777038574, -1.7786319255828857, -1.3898720741271973, -1.0011122226715088, -0.6123524904251099, -0.2235926389694214, 0.1651672124862671, 0.553926944732666, 0.9426867961883545, 1.331446647644043, 1.7202064990997314, 2.10896635055542, 2.4977259635925293, 2.886486053466797, 3.2752456665039062, 3.6640055179595947, 4.052765369415283, 4.441525459289551, 4.83028507232666, 5.219045162200928, 5.607804775238037, 5.996564865112305, 6.385324478149414, 6.774084091186523, 7.162844181060791, 7.5516037940979, 7.94036340713501, 8.329123497009277, 8.717883110046387, 9.106642723083496, 9.495403289794922, 9.884162902832031, 10.27292251586914, 10.66168212890625, 11.05044174194336, 11.439201354980469, 11.827961921691895, 12.216721534729004, 12.605481147766113, 12.994240760803223, 13.383001327514648, 13.771760940551758]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 6.0, 7.0, 4.0, 2.0, 11.0, 9.0, 12.0, 15.0, 16.0, 25.0, 24.0, 19.0, 38.0, 35.0, 32.0, 36.0, 45.0, 36.0, 36.0, 51.0, 43.0, 43.0, 48.0, 38.0, 45.0, 33.0, 26.0, 43.0, 35.0, 28.0, 22.0, 19.0, 28.0, 17.0, 14.0, 13.0, 8.0, 10.0, 6.0, 5.0, 8.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.791015625, -1.7367095947265625, -1.682403564453125, -1.6280975341796875, -1.57379150390625, -1.5194854736328125, -1.465179443359375, -1.4108734130859375, -1.3565673828125, -1.3022613525390625, -1.247955322265625, -1.1936492919921875, -1.13934326171875, -1.0850372314453125, -1.030731201171875, -0.9764251708984375, -0.922119140625, -0.8678131103515625, -0.813507080078125, -0.7592010498046875, -0.70489501953125, -0.6505889892578125, -0.596282958984375, -0.5419769287109375, -0.4876708984375, -0.4333648681640625, -0.379058837890625, -0.3247528076171875, -0.27044677734375, -0.2161407470703125, -0.161834716796875, -0.1075286865234375, -0.05322265625, 0.0010833740234375, 0.055389404296875, 0.1096954345703125, 0.16400146484375, 0.2183074951171875, 0.272613525390625, 0.3269195556640625, 0.3812255859375, 0.4355316162109375, 0.489837646484375, 0.5441436767578125, 0.59844970703125, 0.6527557373046875, 0.707061767578125, 0.7613677978515625, 0.815673828125, 0.8699798583984375, 0.924285888671875, 0.9785919189453125, 1.03289794921875, 1.0872039794921875, 1.141510009765625, 1.1958160400390625, 1.2501220703125, 1.3044281005859375, 1.358734130859375, 1.4130401611328125, 1.46734619140625, 1.5216522216796875, 1.575958251953125, 1.6302642822265625, 1.6845703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 19.0, 26.0, 25.0, 33.0, 65.0, 98.0, 108.0, 160.0, 266.0, 443.0, 724.0, 1338.0, 2466.0, 5047.0, 11331.0, 31320.0, 168459.0, 2289596.0, 1521732.0, 116287.0, 25565.0, 9528.0, 4423.0, 2290.0, 1154.0, 702.0, 353.0, 239.0, 123.0, 92.0, 68.0, 52.0, 36.0, 19.0, 20.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-5.3046875, -5.156982421875, -5.00927734375, -4.861572265625, -4.7138671875, -4.566162109375, -4.41845703125, -4.270751953125, -4.123046875, -3.975341796875, -3.82763671875, -3.679931640625, -3.5322265625, -3.384521484375, -3.23681640625, -3.089111328125, -2.94140625, -2.793701171875, -2.64599609375, -2.498291015625, -2.3505859375, -2.202880859375, -2.05517578125, -1.907470703125, -1.759765625, -1.612060546875, -1.46435546875, -1.316650390625, -1.1689453125, -1.021240234375, -0.87353515625, -0.725830078125, -0.578125, -0.430419921875, -0.28271484375, -0.135009765625, 0.0126953125, 0.160400390625, 0.30810546875, 0.455810546875, 0.603515625, 0.751220703125, 0.89892578125, 1.046630859375, 1.1943359375, 1.342041015625, 1.48974609375, 1.637451171875, 1.78515625, 1.932861328125, 2.08056640625, 2.228271484375, 2.3759765625, 2.523681640625, 2.67138671875, 2.819091796875, 2.966796875, 3.114501953125, 3.26220703125, 3.409912109375, 3.5576171875, 3.705322265625, 3.85302734375, 4.000732421875, 4.1484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 8.0, 5.0, 12.0, 6.0, 14.0, 25.0, 37.0, 62.0, 83.0, 136.0, 243.0, 461.0, 835.0, 913.0, 502.0, 265.0, 149.0, 92.0, 64.0, 37.0, 31.0, 26.0, 15.0, 17.0, 12.0, 9.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -2.98699951171875, -2.8450927734375, -2.70318603515625, -2.561279296875, -2.41937255859375, -2.2774658203125, -2.13555908203125, -1.99365234375, -1.85174560546875, -1.7098388671875, -1.56793212890625, -1.426025390625, -1.28411865234375, -1.1422119140625, -1.00030517578125, -0.8583984375, -0.71649169921875, -0.5745849609375, -0.43267822265625, -0.290771484375, -0.14886474609375, -0.0069580078125, 0.13494873046875, 0.27685546875, 0.41876220703125, 0.5606689453125, 0.70257568359375, 0.844482421875, 0.98638916015625, 1.1282958984375, 1.27020263671875, 1.412109375, 1.55401611328125, 1.6959228515625, 1.83782958984375, 1.979736328125, 2.12164306640625, 2.2635498046875, 2.40545654296875, 2.54736328125, 2.68927001953125, 2.8311767578125, 2.97308349609375, 3.114990234375, 3.25689697265625, 3.3988037109375, 3.54071044921875, 3.6826171875, 3.82452392578125, 3.9664306640625, 4.10833740234375, 4.250244140625, 4.39215087890625, 4.5340576171875, 4.67596435546875, 4.81787109375, 4.95977783203125, 5.1016845703125, 5.24359130859375, 5.385498046875, 5.52740478515625, 5.6693115234375, 5.81121826171875, 5.953125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 4.0, 9.0, 15.0, 16.0, 26.0, 31.0, 42.0, 64.0, 115.0, 180.0, 396.0, 1156.0, 6662.0, 87499.0, 3951117.0, 136115.0, 8533.0, 1393.0, 411.0, 187.0, 110.0, 76.0, 38.0, 25.0, 15.0, 12.0, 11.0, 6.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.359375, -19.8809814453125, -19.402587890625, -18.9241943359375, -18.44580078125, -17.9674072265625, -17.489013671875, -17.0106201171875, -16.5322265625, -16.0538330078125, -15.575439453125, -15.0970458984375, -14.61865234375, -14.1402587890625, -13.661865234375, -13.1834716796875, -12.705078125, -12.2266845703125, -11.748291015625, -11.2698974609375, -10.79150390625, -10.3131103515625, -9.834716796875, -9.3563232421875, -8.8779296875, -8.3995361328125, -7.921142578125, -7.4427490234375, -6.96435546875, -6.4859619140625, -6.007568359375, -5.5291748046875, -5.05078125, -4.5723876953125, -4.093994140625, -3.6156005859375, -3.13720703125, -2.6588134765625, -2.180419921875, -1.7020263671875, -1.2236328125, -0.7452392578125, -0.266845703125, 0.2115478515625, 0.68994140625, 1.1683349609375, 1.646728515625, 2.1251220703125, 2.603515625, 3.0819091796875, 3.560302734375, 4.0386962890625, 4.51708984375, 4.9954833984375, 5.473876953125, 5.9522705078125, 6.4306640625, 6.9090576171875, 7.387451171875, 7.8658447265625, 8.34423828125, 8.8226318359375, 9.301025390625, 9.7794189453125, 10.2578125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 11.0, 23.0, 40.0, 114.0, 242.0, 254.0, 174.0, 69.0, 45.0, 17.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0], "bins": [-56.02861404418945, -54.97510528564453, -53.921592712402344, -52.868080139160156, -51.814571380615234, -50.76106262207031, -49.707550048828125, -48.65403747558594, -47.600528717041016, -46.547019958496094, -45.493507385253906, -44.43999481201172, -43.3864860534668, -42.332977294921875, -41.27946472167969, -40.2259521484375, -39.17244338989258, -38.118934631347656, -37.06542205810547, -36.01190948486328, -34.95840072631836, -33.90489196777344, -32.85137939453125, -31.797868728637695, -30.74435806274414, -29.690847396850586, -28.63733673095703, -27.583826065063477, -26.530315399169922, -25.476804733276367, -24.423294067382812, -23.369783401489258, -22.316268920898438, -21.262758255004883, -20.209247589111328, -19.155736923217773, -18.10222625732422, -17.048715591430664, -15.99520492553711, -14.941694259643555, -13.888184547424316, -12.834673881530762, -11.781163215637207, -10.727652549743652, -9.674141883850098, -8.620631217956543, -7.567120552062988, -6.513609886169434, -5.460099220275879, -4.406588554382324, -3.3530778884887695, -2.299567222595215, -1.2460565567016602, -0.19254589080810547, 0.8609647750854492, 1.914475440979004, 2.9679861068725586, 4.021496772766113, 5.075007438659668, 6.128518104553223, 7.182028770446777, 8.235539436340332, 9.289050102233887, 10.342560768127441, 11.396071434020996]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 13.0, 5.0, 6.0, 9.0, 15.0, 13.0, 9.0, 16.0, 12.0, 25.0, 24.0, 28.0, 31.0, 33.0, 37.0, 39.0, 38.0, 43.0, 35.0, 51.0, 43.0, 40.0, 55.0, 37.0, 45.0, 39.0, 36.0, 35.0, 24.0, 20.0, 24.0, 22.0, 29.0, 13.0, 10.0, 8.0, 4.0, 9.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-11.01626205444336, -10.68095874786377, -10.34565544128418, -10.010353088378906, -9.675049781799316, -9.339746475219727, -9.004444122314453, -8.669140815734863, -8.333837509155273, -7.998534202575684, -7.663231372833252, -7.32792854309082, -6.9926252365112305, -6.657321929931641, -6.322019100189209, -5.986716270446777, -5.6514129638671875, -5.316109657287598, -4.980806827545166, -4.645503997802734, -4.3102006912231445, -3.974897623062134, -3.639594554901123, -3.3042914867401123, -2.9689884185791016, -2.633685350418091, -2.29838228225708, -1.9630792140960693, -1.6277761459350586, -1.2924730777740479, -0.9571700096130371, -0.6218669414520264, -0.2865629196166992, 0.04874014854431152, 0.38404321670532227, 0.719346284866333, 1.0546493530273438, 1.3899524211883545, 1.7252554893493652, 2.060558557510376, 2.3958616256713867, 2.7311646938323975, 3.066467761993408, 3.401770830154419, 3.7370738983154297, 4.0723772048950195, 4.407680034637451, 4.742982864379883, 5.078286170959473, 5.4135894775390625, 5.748892307281494, 6.084195137023926, 6.419498443603516, 6.7548017501831055, 7.090104579925537, 7.425407409667969, 7.760710716247559, 8.096014022827148, 8.431316375732422, 8.766619682312012, 9.101922988891602, 9.437226295471191, 9.772529602050781, 10.107831954956055, 10.443135261535645]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 6.0, 8.0, 10.0, 9.0, 18.0, 10.0, 13.0, 13.0, 21.0, 18.0, 24.0, 26.0, 29.0, 37.0, 32.0, 44.0, 38.0, 47.0, 43.0, 45.0, 35.0, 49.0, 45.0, 30.0, 30.0, 30.0, 36.0, 29.0, 26.0, 25.0, 34.0, 21.0, 13.0, 15.0, 18.0, 14.0, 10.0, 9.0, 13.0, 3.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5830078125, -1.53399658203125, -1.4849853515625, -1.43597412109375, -1.386962890625, -1.33795166015625, -1.2889404296875, -1.23992919921875, -1.19091796875, -1.14190673828125, -1.0928955078125, -1.04388427734375, -0.994873046875, -0.94586181640625, -0.8968505859375, -0.84783935546875, -0.798828125, -0.74981689453125, -0.7008056640625, -0.65179443359375, -0.602783203125, -0.55377197265625, -0.5047607421875, -0.45574951171875, -0.40673828125, -0.35772705078125, -0.3087158203125, -0.25970458984375, -0.210693359375, -0.16168212890625, -0.1126708984375, -0.06365966796875, -0.0146484375, 0.03436279296875, 0.0833740234375, 0.13238525390625, 0.181396484375, 0.23040771484375, 0.2794189453125, 0.32843017578125, 0.37744140625, 0.42645263671875, 0.4754638671875, 0.52447509765625, 0.573486328125, 0.62249755859375, 0.6715087890625, 0.72052001953125, 0.76953125, 0.81854248046875, 0.8675537109375, 0.91656494140625, 0.965576171875, 1.01458740234375, 1.0635986328125, 1.11260986328125, 1.16162109375, 1.21063232421875, 1.2596435546875, 1.30865478515625, 1.357666015625, 1.40667724609375, 1.4556884765625, 1.50469970703125, 1.5537109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 7.0, 9.0, 12.0, 29.0, 23.0, 53.0, 71.0, 118.0, 164.0, 228.0, 347.0, 491.0, 695.0, 1068.0, 1649.0, 2435.0, 3589.0, 5430.0, 8144.0, 12688.0, 19314.0, 29694.0, 49245.0, 87938.0, 178056.0, 264582.0, 167946.0, 84240.0, 46944.0, 28860.0, 18580.0, 11928.0, 8009.0, 5341.0, 3460.0, 2321.0, 1580.0, 1043.0, 677.0, 479.0, 345.0, 250.0, 158.0, 106.0, 77.0, 43.0, 25.0, 20.0, 18.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.180908203125, -0.17533493041992188, -0.16976165771484375, -0.16418838500976562, -0.1586151123046875, -0.15304183959960938, -0.14746856689453125, -0.14189529418945312, -0.136322021484375, -0.13074874877929688, -0.12517547607421875, -0.11960220336914062, -0.1140289306640625, -0.10845565795898438, -0.10288238525390625, -0.09730911254882812, -0.09173583984375, -0.08616256713867188, -0.08058929443359375, -0.07501602172851562, -0.0694427490234375, -0.06386947631835938, -0.05829620361328125, -0.052722930908203125, -0.047149658203125, -0.041576385498046875, -0.03600311279296875, -0.030429840087890625, -0.0248565673828125, -0.019283294677734375, -0.01371002197265625, -0.008136749267578125, -0.0025634765625, 0.003009796142578125, 0.00858306884765625, 0.014156341552734375, 0.0197296142578125, 0.025302886962890625, 0.03087615966796875, 0.036449432373046875, 0.042022705078125, 0.047595977783203125, 0.05316925048828125, 0.058742523193359375, 0.0643157958984375, 0.06988906860351562, 0.07546234130859375, 0.08103561401367188, 0.08660888671875, 0.09218215942382812, 0.09775543212890625, 0.10332870483398438, 0.1089019775390625, 0.11447525024414062, 0.12004852294921875, 0.12562179565429688, 0.131195068359375, 0.13676834106445312, 0.14234161376953125, 0.14791488647460938, 0.1534881591796875, 0.15906143188476562, 0.16463470458984375, 0.17020797729492188, 0.17578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 11.0, 8.0, 11.0, 10.0, 17.0, 18.0, 23.0, 17.0, 24.0, 40.0, 31.0, 41.0, 36.0, 33.0, 35.0, 40.0, 40.0, 38.0, 1065.0, 36.0, 40.0, 44.0, 36.0, 43.0, 44.0, 34.0, 22.0, 32.0, 18.0, 20.0, 19.0, 20.0, 22.0, 13.0, 4.0, 12.0, 6.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9748687744140625, -0.938995361328125, -0.9031219482421875, -0.86724853515625, -0.8313751220703125, -0.795501708984375, -0.7596282958984375, -0.7237548828125, -0.6878814697265625, -0.652008056640625, -0.6161346435546875, -0.58026123046875, -0.5443878173828125, -0.508514404296875, -0.4726409912109375, -0.436767578125, -0.4008941650390625, -0.365020751953125, -0.3291473388671875, -0.29327392578125, -0.2574005126953125, -0.221527099609375, -0.1856536865234375, -0.1497802734375, -0.1139068603515625, -0.078033447265625, -0.0421600341796875, -0.00628662109375, 0.0295867919921875, 0.065460205078125, 0.1013336181640625, 0.13720703125, 0.1730804443359375, 0.208953857421875, 0.2448272705078125, 0.28070068359375, 0.3165740966796875, 0.352447509765625, 0.3883209228515625, 0.4241943359375, 0.4600677490234375, 0.495941162109375, 0.5318145751953125, 0.56768798828125, 0.6035614013671875, 0.639434814453125, 0.6753082275390625, 0.711181640625, 0.7470550537109375, 0.782928466796875, 0.8188018798828125, 0.85467529296875, 0.8905487060546875, 0.926422119140625, 0.9622955322265625, 0.9981689453125, 1.0340423583984375, 1.069915771484375, 1.1057891845703125, 1.14166259765625, 1.1775360107421875, 1.213409423828125, 1.2492828369140625, 1.28515625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 15.0, 17.0, 29.0, 40.0, 58.0, 77.0, 143.0, 227.0, 364.0, 548.0, 968.0, 1732.0, 3047.0, 5567.0, 11101.0, 26912.0, 195873.0, 1767901.0, 49579.0, 15920.0, 7657.0, 3937.0, 2263.0, 1237.0, 748.0, 457.0, 224.0, 170.0, 95.0, 75.0, 46.0, 37.0, 11.0, 11.0, 7.0, 6.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.392578125, -0.3800048828125, -0.367431640625, -0.3548583984375, -0.34228515625, -0.3297119140625, -0.317138671875, -0.3045654296875, -0.2919921875, -0.2794189453125, -0.266845703125, -0.2542724609375, -0.24169921875, -0.2291259765625, -0.216552734375, -0.2039794921875, -0.19140625, -0.1788330078125, -0.166259765625, -0.1536865234375, -0.14111328125, -0.1285400390625, -0.115966796875, -0.1033935546875, -0.0908203125, -0.0782470703125, -0.065673828125, -0.0531005859375, -0.04052734375, -0.0279541015625, -0.015380859375, -0.0028076171875, 0.009765625, 0.0223388671875, 0.034912109375, 0.0474853515625, 0.06005859375, 0.0726318359375, 0.085205078125, 0.0977783203125, 0.1103515625, 0.1229248046875, 0.135498046875, 0.1480712890625, 0.16064453125, 0.1732177734375, 0.185791015625, 0.1983642578125, 0.2109375, 0.2235107421875, 0.236083984375, 0.2486572265625, 0.26123046875, 0.2738037109375, 0.286376953125, 0.2989501953125, 0.3115234375, 0.3240966796875, 0.336669921875, 0.3492431640625, 0.36181640625, 0.3743896484375, 0.386962890625, 0.3995361328125, 0.412109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 6.0, 8.0, 5.0, 13.0, 19.0, 17.0, 19.0, 25.0, 31.0, 36.0, 41.0, 38.0, 60.0, 51.0, 67.0, 53.0, 67.0, 59.0, 50.0, 53.0, 36.0, 45.0, 34.0, 24.0, 29.0, 24.0, 11.0, 8.0, 12.0, 7.0, 9.0, 1.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01267242431640625, -0.012281060218811035, -0.01188969612121582, -0.011498332023620605, -0.01110696792602539, -0.010715603828430176, -0.010324239730834961, -0.009932875633239746, -0.009541511535644531, -0.009150147438049316, -0.008758783340454102, -0.008367419242858887, -0.007976055145263672, -0.007584691047668457, -0.007193326950073242, -0.006801962852478027, -0.0064105987548828125, -0.006019234657287598, -0.005627870559692383, -0.005236506462097168, -0.004845142364501953, -0.004453778266906738, -0.0040624141693115234, -0.0036710500717163086, -0.0032796859741210938, -0.002888321876525879, -0.002496957778930664, -0.0021055936813354492, -0.0017142295837402344, -0.0013228654861450195, -0.0009315013885498047, -0.0005401372909545898, -0.000148773193359375, 0.00024259090423583984, 0.0006339550018310547, 0.0010253190994262695, 0.0014166831970214844, 0.0018080472946166992, 0.002199411392211914, 0.002590775489807129, 0.0029821395874023438, 0.0033735036849975586, 0.0037648677825927734, 0.004156231880187988, 0.004547595977783203, 0.004938960075378418, 0.005330324172973633, 0.005721688270568848, 0.0061130523681640625, 0.006504416465759277, 0.006895780563354492, 0.007287144660949707, 0.007678508758544922, 0.008069872856140137, 0.008461236953735352, 0.008852601051330566, 0.009243965148925781, 0.009635329246520996, 0.010026693344116211, 0.010418057441711426, 0.01080942153930664, 0.011200785636901855, 0.01159214973449707, 0.011983513832092285, 0.0123748779296875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 10.0, 11.0, 15.0, 17.0, 22.0, 29.0, 22.0, 58.0, 67.0, 96.0, 133.0, 186.0, 378.0, 1410.0, 16779.0, 786266.0, 234996.0, 6331.0, 789.0, 295.0, 176.0, 125.0, 86.0, 61.0, 38.0, 29.0, 31.0, 19.0, 10.0, 11.0, 5.0, 8.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21142578125, -0.20433807373046875, -0.1972503662109375, -0.19016265869140625, -0.183074951171875, -0.17598724365234375, -0.1688995361328125, -0.16181182861328125, -0.15472412109375, -0.14763641357421875, -0.1405487060546875, -0.13346099853515625, -0.126373291015625, -0.11928558349609375, -0.1121978759765625, -0.10511016845703125, -0.0980224609375, -0.09093475341796875, -0.0838470458984375, -0.07675933837890625, -0.069671630859375, -0.06258392333984375, -0.0554962158203125, -0.04840850830078125, -0.04132080078125, -0.03423309326171875, -0.0271453857421875, -0.02005767822265625, -0.012969970703125, -0.00588226318359375, 0.0012054443359375, 0.00829315185546875, 0.015380859375, 0.02246856689453125, 0.0295562744140625, 0.03664398193359375, 0.043731689453125, 0.05081939697265625, 0.0579071044921875, 0.06499481201171875, 0.07208251953125, 0.07917022705078125, 0.0862579345703125, 0.09334564208984375, 0.100433349609375, 0.10752105712890625, 0.1146087646484375, 0.12169647216796875, 0.1287841796875, 0.13587188720703125, 0.1429595947265625, 0.15004730224609375, 0.157135009765625, 0.16422271728515625, 0.1713104248046875, 0.17839813232421875, 0.18548583984375, 0.19257354736328125, 0.1996612548828125, 0.20674896240234375, 0.213836669921875, 0.22092437744140625, 0.2280120849609375, 0.23509979248046875, 0.2421875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 21.0, 93.0, 306.0, 413.0, 117.0, 40.0, 12.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09588763862848282, -0.09281691908836365, -0.08974619954824448, -0.0866754800081253, -0.08360475301742554, -0.08053403347730637, -0.0774633139371872, -0.07439259439706802, -0.07132187485694885, -0.06825115531682968, -0.06518043577671051, -0.06210971251130104, -0.05903898924589157, -0.0559682697057724, -0.05289755016565323, -0.04982683062553406, -0.04675610363483429, -0.04368538409471512, -0.04061466082930565, -0.03754394128918648, -0.03447321802377701, -0.03140249848365784, -0.028331778943538666, -0.025261057540774345, -0.022190336138010025, -0.019119614735245705, -0.016048893332481384, -0.012978173792362213, -0.009907452389597893, -0.006836730986833572, -0.0037660114467144012, -0.0006952900439500809, 0.0023754239082336426, 0.005446144845336676, 0.008516865782439709, 0.011587586253881454, 0.014658307656645775, 0.017729029059410095, 0.020799748599529266, 0.023870470002293587, 0.026941191405057907, 0.030011912807822227, 0.03308263421058655, 0.03615335375070572, 0.03922407329082489, 0.04229479655623436, 0.04536551609635353, 0.048436239361763, 0.05150695890188217, 0.05457767844200134, 0.05764840170741081, 0.060719121247529984, 0.06378984451293945, 0.06686056405305862, 0.0699312835931778, 0.07300200313329697, 0.07607272267341614, 0.07914344221353531, 0.08221416175365448, 0.08528488874435425, 0.08835560828447342, 0.09142632782459259, 0.09449704736471176, 0.09756776690483093, 0.1006384938955307]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 9.0, 7.0, 13.0, 12.0, 10.0, 17.0, 26.0, 15.0, 21.0, 30.0, 29.0, 41.0, 28.0, 34.0, 38.0, 40.0, 42.0, 48.0, 40.0, 39.0, 39.0, 39.0, 39.0, 39.0, 23.0, 24.0, 28.0, 28.0, 20.0, 25.0, 30.0, 16.0, 13.0, 12.0, 19.0, 11.0, 12.0, 14.0, 7.0, 2.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010076463222503662, -0.009728092700242996, -0.00937972217798233, -0.009031351655721664, -0.008682981133460999, -0.008334610611200333, -0.007986240088939667, -0.007637869566679001, -0.007289499044418335, -0.006941128522157669, -0.006592757999897003, -0.006244387477636337, -0.005896016955375671, -0.0055476464331150055, -0.00519927591085434, -0.004850905388593674, -0.004502534866333008, -0.004154164344072342, -0.003805793821811676, -0.00345742329955101, -0.0031090527772903442, -0.0027606822550296783, -0.0024123117327690125, -0.0020639412105083466, -0.0017155706882476807, -0.0013672001659870148, -0.0010188296437263489, -0.000670459121465683, -0.0003220885992050171, 2.6281923055648804e-05, 0.0003746524453163147, 0.0007230229675769806, 0.0010713934898376465, 0.0014197640120983124, 0.0017681345343589783, 0.002116505056619644, 0.00246487557888031, 0.002813246101140976, 0.003161616623401642, 0.0035099871456623077, 0.0038583576679229736, 0.0042067281901836395, 0.004555098712444305, 0.004903469234704971, 0.005251839756965637, 0.005600210279226303, 0.005948580801486969, 0.006296951323747635, 0.006645321846008301, 0.006993692368268967, 0.007342062890529633, 0.0076904334127902985, 0.008038803935050964, 0.00838717445731163, 0.008735544979572296, 0.009083915501832962, 0.009432286024093628, 0.009780656546354294, 0.01012902706861496, 0.010477397590875626, 0.010825768113136292, 0.011174138635396957, 0.011522509157657623, 0.01187087967991829, 0.012219250202178955]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 1.0, 6.0, 7.0, 12.0, 8.0, 18.0, 10.0, 13.0, 12.0, 22.0, 18.0, 24.0, 26.0, 29.0, 36.0, 33.0, 44.0, 37.0, 48.0, 43.0, 45.0, 34.0, 47.0, 47.0, 31.0, 29.0, 31.0, 35.0, 29.0, 27.0, 25.0, 34.0, 21.0, 13.0, 15.0, 18.0, 14.0, 10.0, 9.0, 13.0, 3.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5830078125, -1.5340118408203125, -1.485015869140625, -1.4360198974609375, -1.38702392578125, -1.3380279541015625, -1.289031982421875, -1.2400360107421875, -1.1910400390625, -1.1420440673828125, -1.093048095703125, -1.0440521240234375, -0.99505615234375, -0.9460601806640625, -0.897064208984375, -0.8480682373046875, -0.799072265625, -0.7500762939453125, -0.701080322265625, -0.6520843505859375, -0.60308837890625, -0.5540924072265625, -0.505096435546875, -0.4561004638671875, -0.4071044921875, -0.3581085205078125, -0.309112548828125, -0.2601165771484375, -0.21112060546875, -0.1621246337890625, -0.113128662109375, -0.0641326904296875, -0.01513671875, 0.0338592529296875, 0.082855224609375, 0.1318511962890625, 0.18084716796875, 0.2298431396484375, 0.278839111328125, 0.3278350830078125, 0.3768310546875, 0.4258270263671875, 0.474822998046875, 0.5238189697265625, 0.57281494140625, 0.6218109130859375, 0.670806884765625, 0.7198028564453125, 0.768798828125, 0.8177947998046875, 0.866790771484375, 0.9157867431640625, 0.96478271484375, 1.0137786865234375, 1.062774658203125, 1.1117706298828125, 1.1607666015625, 1.2097625732421875, 1.258758544921875, 1.3077545166015625, 1.35675048828125, 1.4057464599609375, 1.454742431640625, 1.5037384033203125, 1.552734375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 21.0, 24.0, 47.0, 49.0, 82.0, 139.0, 181.0, 297.0, 414.0, 676.0, 1100.0, 1859.0, 3234.0, 6213.0, 12498.0, 27238.0, 64924.0, 173715.0, 437887.0, 190002.0, 70565.0, 29026.0, 13146.0, 6518.0, 3554.0, 1898.0, 1133.0, 703.0, 479.0, 285.0, 205.0, 146.0, 85.0, 60.0, 46.0, 22.0, 25.0, 19.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0], "bins": [-2.859375, -2.7811279296875, -2.702880859375, -2.6246337890625, -2.54638671875, -2.4681396484375, -2.389892578125, -2.3116455078125, -2.2333984375, -2.1551513671875, -2.076904296875, -1.9986572265625, -1.92041015625, -1.8421630859375, -1.763916015625, -1.6856689453125, -1.607421875, -1.5291748046875, -1.450927734375, -1.3726806640625, -1.29443359375, -1.2161865234375, -1.137939453125, -1.0596923828125, -0.9814453125, -0.9031982421875, -0.824951171875, -0.7467041015625, -0.66845703125, -0.5902099609375, -0.511962890625, -0.4337158203125, -0.35546875, -0.2772216796875, -0.198974609375, -0.1207275390625, -0.04248046875, 0.0357666015625, 0.114013671875, 0.1922607421875, 0.2705078125, 0.3487548828125, 0.427001953125, 0.5052490234375, 0.58349609375, 0.6617431640625, 0.739990234375, 0.8182373046875, 0.896484375, 0.9747314453125, 1.052978515625, 1.1312255859375, 1.20947265625, 1.2877197265625, 1.365966796875, 1.4442138671875, 1.5224609375, 1.6007080078125, 1.678955078125, 1.7572021484375, 1.83544921875, 1.9136962890625, 1.991943359375, 2.0701904296875, 2.1484375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 6.0, 8.0, 13.0, 22.0, 14.0, 10.0, 33.0, 25.0, 30.0, 30.0, 29.0, 36.0, 37.0, 55.0, 69.0, 94.0, 169.0, 1388.0, 294.0, 161.0, 112.0, 68.0, 41.0, 42.0, 27.0, 39.0, 26.0, 18.0, 22.0, 15.0, 14.0, 18.0, 12.0, 13.0, 8.0, 10.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.2635498046875, -4.120849609375, -3.9781494140625, -3.83544921875, -3.6927490234375, -3.550048828125, -3.4073486328125, -3.2646484375, -3.1219482421875, -2.979248046875, -2.8365478515625, -2.69384765625, -2.5511474609375, -2.408447265625, -2.2657470703125, -2.123046875, -1.9803466796875, -1.837646484375, -1.6949462890625, -1.55224609375, -1.4095458984375, -1.266845703125, -1.1241455078125, -0.9814453125, -0.8387451171875, -0.696044921875, -0.5533447265625, -0.41064453125, -0.2679443359375, -0.125244140625, 0.0174560546875, 0.16015625, 0.3028564453125, 0.445556640625, 0.5882568359375, 0.73095703125, 0.8736572265625, 1.016357421875, 1.1590576171875, 1.3017578125, 1.4444580078125, 1.587158203125, 1.7298583984375, 1.87255859375, 2.0152587890625, 2.157958984375, 2.3006591796875, 2.443359375, 2.5860595703125, 2.728759765625, 2.8714599609375, 3.01416015625, 3.1568603515625, 3.299560546875, 3.4422607421875, 3.5849609375, 3.7276611328125, 3.870361328125, 4.0130615234375, 4.15576171875, 4.2984619140625, 4.441162109375, 4.5838623046875, 4.7265625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 13.0, 24.0, 66.0, 132.0, 330.0, 1082.0, 4769.0, 3083446.0, 52972.0, 1854.0, 610.0, 219.0, 92.0, 36.0, 24.0, 6.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.703125, -29.79296875, -28.8828125, -27.97265625, -27.0625, -26.15234375, -25.2421875, -24.33203125, -23.421875, -22.51171875, -21.6015625, -20.69140625, -19.78125, -18.87109375, -17.9609375, -17.05078125, -16.140625, -15.23046875, -14.3203125, -13.41015625, -12.5, -11.58984375, -10.6796875, -9.76953125, -8.859375, -7.94921875, -7.0390625, -6.12890625, -5.21875, -4.30859375, -3.3984375, -2.48828125, -1.578125, -0.66796875, 0.2421875, 1.15234375, 2.0625, 2.97265625, 3.8828125, 4.79296875, 5.703125, 6.61328125, 7.5234375, 8.43359375, 9.34375, 10.25390625, 11.1640625, 12.07421875, 12.984375, 13.89453125, 14.8046875, 15.71484375, 16.625, 17.53515625, 18.4453125, 19.35546875, 20.265625, 21.17578125, 22.0859375, 22.99609375, 23.90625, 24.81640625, 25.7265625, 26.63671875, 27.546875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 208.0, 797.0, 12.0, 0.0, 1.0, 0.0, 1.0], "bins": [-206.1995391845703, -202.65684509277344, -199.11415100097656, -195.5714569091797, -192.02877807617188, -188.486083984375, -184.94338989257812, -181.40069580078125, -177.85800170898438, -174.3153076171875, -170.77261352539062, -167.22991943359375, -163.68724060058594, -160.14454650878906, -156.6018524169922, -153.0591583251953, -149.51646423339844, -145.97377014160156, -142.4310760498047, -138.8883819580078, -135.345703125, -131.80300903320312, -128.26031494140625, -124.71762084960938, -121.17493438720703, -117.63224029541016, -114.08955383300781, -110.54685974121094, -107.00416564941406, -103.46147155761719, -99.91878509521484, -96.37609100341797, -92.83340454101562, -89.29071044921875, -85.7480239868164, -82.20532989501953, -78.66263580322266, -75.11994934082031, -71.57725524902344, -68.03456115722656, -64.49186706542969, -60.94917678833008, -57.4064826965332, -53.863792419433594, -50.32109832763672, -46.77840805053711, -43.2357177734375, -39.693023681640625, -36.15032958984375, -32.60763931274414, -29.064945220947266, -25.522254943847656, -21.97956085205078, -18.436870574951172, -14.89417839050293, -11.351486206054688, -7.808795928955078, -4.266103744506836, -0.723412036895752, 2.819279670715332, 6.361971855163574, 9.9046630859375, 13.447355270385742, 16.990047454833984, 20.532739639282227]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 7.0, 3.0, 10.0, 13.0, 12.0, 17.0, 29.0, 32.0, 26.0, 25.0, 35.0, 39.0, 34.0, 53.0, 45.0, 59.0, 53.0, 48.0, 36.0, 32.0, 51.0, 43.0, 32.0, 33.0, 38.0, 23.0, 33.0, 21.0, 14.0, 21.0, 15.0, 11.0, 3.0, 14.0, 8.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.119260787963867, -10.709782600402832, -10.300304412841797, -9.890826225280762, -9.481348037719727, -9.071868896484375, -8.66239070892334, -8.252912521362305, -7.8434343338012695, -7.433956146240234, -7.024477958679199, -6.614999294281006, -6.205521106719971, -5.7960429191589355, -5.386564254760742, -4.977086067199707, -4.567607879638672, -4.158129692077637, -3.7486512660980225, -3.339172840118408, -2.929694652557373, -2.520216464996338, -2.1107380390167236, -1.7012596130371094, -1.2917814254760742, -0.8823031187057495, -0.4728248119354248, -0.0633465051651001, 0.3461318016052246, 0.7556099891662598, 1.165088415145874, 1.5745668411254883, 1.9840459823608398, 2.393524169921875, 2.8030025959014893, 3.2124810218811035, 3.6219592094421387, 4.031437397003174, 4.440916061401367, 4.850394248962402, 5.2598724365234375, 5.669350624084473, 6.078828811645508, 6.488307476043701, 6.897785663604736, 7.3072638511657715, 7.716742515563965, 8.126220703125, 8.535698890686035, 8.94517707824707, 9.354655265808105, 9.76413345336914, 10.173612594604492, 10.583089828491211, 10.992568969726562, 11.402047157287598, 11.811525344848633, 12.221003532409668, 12.630481719970703, 13.039959907531738, 13.449438095092773, 13.858917236328125, 14.26839542388916, 14.677873611450195, 15.08735179901123]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 10.0, 16.0, 14.0, 11.0, 14.0, 16.0, 17.0, 33.0, 22.0, 30.0, 32.0, 29.0, 37.0, 38.0, 44.0, 45.0, 40.0, 39.0, 48.0, 40.0, 33.0, 41.0, 37.0, 30.0, 30.0, 25.0, 19.0, 23.0, 22.0, 23.0, 16.0, 14.0, 15.0, 12.0, 17.0, 7.0, 8.0, 8.0, 8.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.75390625, -1.7021942138671875, -1.650482177734375, -1.5987701416015625, -1.54705810546875, -1.4953460693359375, -1.443634033203125, -1.3919219970703125, -1.3402099609375, -1.2884979248046875, -1.236785888671875, -1.1850738525390625, -1.13336181640625, -1.0816497802734375, -1.029937744140625, -0.9782257080078125, -0.926513671875, -0.8748016357421875, -0.823089599609375, -0.7713775634765625, -0.71966552734375, -0.6679534912109375, -0.616241455078125, -0.5645294189453125, -0.5128173828125, -0.4611053466796875, -0.409393310546875, -0.3576812744140625, -0.30596923828125, -0.2542572021484375, -0.202545166015625, -0.1508331298828125, -0.09912109375, -0.0474090576171875, 0.004302978515625, 0.0560150146484375, 0.10772705078125, 0.1594390869140625, 0.211151123046875, 0.2628631591796875, 0.3145751953125, 0.3662872314453125, 0.417999267578125, 0.4697113037109375, 0.52142333984375, 0.5731353759765625, 0.624847412109375, 0.6765594482421875, 0.728271484375, 0.7799835205078125, 0.831695556640625, 0.8834075927734375, 0.93511962890625, 0.9868316650390625, 1.038543701171875, 1.0902557373046875, 1.1419677734375, 1.1936798095703125, 1.245391845703125, 1.2971038818359375, 1.34881591796875, 1.4005279541015625, 1.452239990234375, 1.5039520263671875, 1.5556640625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 22.0, 10.0, 28.0, 37.0, 64.0, 81.0, 111.0, 168.0, 229.0, 387.0, 725.0, 1293.0, 2490.0, 5740.0, 14930.0, 54424.0, 568860.0, 3138494.0, 340458.0, 41856.0, 13100.0, 5287.0, 2468.0, 1224.0, 654.0, 392.0, 230.0, 151.0, 97.0, 80.0, 56.0, 38.0, 29.0, 18.0, 16.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.83203125, -5.6673583984375, -5.502685546875, -5.3380126953125, -5.17333984375, -5.0086669921875, -4.843994140625, -4.6793212890625, -4.5146484375, -4.3499755859375, -4.185302734375, -4.0206298828125, -3.85595703125, -3.6912841796875, -3.526611328125, -3.3619384765625, -3.197265625, -3.0325927734375, -2.867919921875, -2.7032470703125, -2.53857421875, -2.3739013671875, -2.209228515625, -2.0445556640625, -1.8798828125, -1.7152099609375, -1.550537109375, -1.3858642578125, -1.22119140625, -1.0565185546875, -0.891845703125, -0.7271728515625, -0.5625, -0.3978271484375, -0.233154296875, -0.0684814453125, 0.09619140625, 0.2608642578125, 0.425537109375, 0.5902099609375, 0.7548828125, 0.9195556640625, 1.084228515625, 1.2489013671875, 1.41357421875, 1.5782470703125, 1.742919921875, 1.9075927734375, 2.072265625, 2.2369384765625, 2.401611328125, 2.5662841796875, 2.73095703125, 2.8956298828125, 3.060302734375, 3.2249755859375, 3.3896484375, 3.5543212890625, 3.718994140625, 3.8836669921875, 4.04833984375, 4.2130126953125, 4.377685546875, 4.5423583984375, 4.70703125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 20.0, 13.0, 21.0, 13.0, 36.0, 36.0, 39.0, 67.0, 125.0, 175.0, 251.0, 458.0, 695.0, 755.0, 489.0, 311.0, 177.0, 105.0, 70.0, 48.0, 31.0, 28.0, 22.0, 15.0, 11.0, 9.0, 6.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.15234375, -4.03729248046875, -3.9222412109375, -3.80718994140625, -3.692138671875, -3.57708740234375, -3.4620361328125, -3.34698486328125, -3.23193359375, -3.11688232421875, -3.0018310546875, -2.88677978515625, -2.771728515625, -2.65667724609375, -2.5416259765625, -2.42657470703125, -2.3115234375, -2.19647216796875, -2.0814208984375, -1.96636962890625, -1.851318359375, -1.73626708984375, -1.6212158203125, -1.50616455078125, -1.39111328125, -1.27606201171875, -1.1610107421875, -1.04595947265625, -0.930908203125, -0.81585693359375, -0.7008056640625, -0.58575439453125, -0.470703125, -0.35565185546875, -0.2406005859375, -0.12554931640625, -0.010498046875, 0.10455322265625, 0.2196044921875, 0.33465576171875, 0.44970703125, 0.56475830078125, 0.6798095703125, 0.79486083984375, 0.909912109375, 1.02496337890625, 1.1400146484375, 1.25506591796875, 1.3701171875, 1.48516845703125, 1.6002197265625, 1.71527099609375, 1.830322265625, 1.94537353515625, 2.0604248046875, 2.17547607421875, 2.29052734375, 2.40557861328125, 2.5206298828125, 2.63568115234375, 2.750732421875, 2.86578369140625, 2.9808349609375, 3.09588623046875, 3.2109375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 14.0, 14.0, 10.0, 24.0, 37.0, 51.0, 63.0, 113.0, 243.0, 790.0, 4084.0, 60105.0, 3977975.0, 142159.0, 6755.0, 1043.0, 330.0, 155.0, 88.0, 45.0, 29.0, 31.0, 24.0, 20.0, 16.0, 6.0, 11.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.3406982421875, -12.798583984375, -12.2564697265625, -11.71435546875, -11.1722412109375, -10.630126953125, -10.0880126953125, -9.5458984375, -9.0037841796875, -8.461669921875, -7.9195556640625, -7.37744140625, -6.8353271484375, -6.293212890625, -5.7510986328125, -5.208984375, -4.6668701171875, -4.124755859375, -3.5826416015625, -3.04052734375, -2.4984130859375, -1.956298828125, -1.4141845703125, -0.8720703125, -0.3299560546875, 0.212158203125, 0.7542724609375, 1.29638671875, 1.8385009765625, 2.380615234375, 2.9227294921875, 3.46484375, 4.0069580078125, 4.549072265625, 5.0911865234375, 5.63330078125, 6.1754150390625, 6.717529296875, 7.2596435546875, 7.8017578125, 8.3438720703125, 8.885986328125, 9.4281005859375, 9.97021484375, 10.5123291015625, 11.054443359375, 11.5965576171875, 12.138671875, 12.6807861328125, 13.222900390625, 13.7650146484375, 14.30712890625, 14.8492431640625, 15.391357421875, 15.9334716796875, 16.4755859375, 17.0177001953125, 17.559814453125, 18.1019287109375, 18.64404296875, 19.1861572265625, 19.728271484375, 20.2703857421875, 20.8125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 20.0, 40.0, 115.0, 212.0, 293.0, 176.0, 88.0, 37.0, 18.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4249382019043, -33.33045959472656, -32.23598098754883, -31.141502380371094, -30.04702377319336, -28.952545166015625, -27.85806655883789, -26.763587951660156, -25.669109344482422, -24.574630737304688, -23.480152130126953, -22.38567352294922, -21.291194915771484, -20.19671630859375, -19.102237701416016, -18.00775909423828, -16.913280487060547, -15.818801879882812, -14.724323272705078, -13.629844665527344, -12.53536605834961, -11.440887451171875, -10.34640884399414, -9.251930236816406, -8.157451629638672, -7.0629730224609375, -5.968494415283203, -4.874015808105469, -3.7795372009277344, -2.68505859375, -1.5905799865722656, -0.49610137939453125, 0.5983772277832031, 1.6928558349609375, 2.787334442138672, 3.8818130493164062, 4.976291656494141, 6.070770263671875, 7.165248870849609, 8.259727478027344, 9.354206085205078, 10.448684692382812, 11.543163299560547, 12.637641906738281, 13.732120513916016, 14.82659912109375, 15.921077728271484, 17.01555633544922, 18.110034942626953, 19.204513549804688, 20.298992156982422, 21.393470764160156, 22.48794937133789, 23.582427978515625, 24.67690658569336, 25.771385192871094, 26.865863800048828, 27.960342407226562, 29.054821014404297, 30.14929962158203, 31.243778228759766, 32.3382568359375, 33.432735443115234, 34.52721405029297, 35.6216926574707]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 3.0, 6.0, 14.0, 8.0, 15.0, 15.0, 12.0, 14.0, 12.0, 22.0, 12.0, 26.0, 40.0, 28.0, 33.0, 33.0, 47.0, 33.0, 31.0, 35.0, 40.0, 33.0, 36.0, 42.0, 44.0, 36.0, 40.0, 35.0, 29.0, 31.0, 25.0, 17.0, 22.0, 17.0, 20.0, 22.0, 9.0, 11.0, 10.0, 5.0, 8.0, 4.0, 2.0, 6.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577730178833008, -8.27817440032959, -7.978619575500488, -7.6790642738342285, -7.379508972167969, -7.079953193664551, -6.780397891998291, -6.480842590332031, -6.1812872886657715, -5.881731986999512, -5.582176685333252, -5.282621383666992, -4.983065605163574, -4.683510780334473, -4.383955001831055, -4.084399700164795, -3.784844398498535, -3.4852890968322754, -3.1857337951660156, -2.8861782550811768, -2.586622953414917, -2.2870676517486572, -1.987512230873108, -1.6879568099975586, -1.3884015083312988, -1.088846206665039, -0.7892907857894897, -0.4897354245185852, -0.19018006324768066, 0.1093752384185791, 0.4089306592941284, 0.7084860801696777, 1.008042335510254, 1.3075976371765137, 1.607153058052063, 1.9067084789276123, 2.206263780593872, 2.505819082260132, 2.8053746223449707, 3.1049299240112305, 3.4044852256774902, 3.70404052734375, 4.00359582901001, 4.3031511306762695, 4.6027069091796875, 4.902261734008789, 5.201817512512207, 5.501372814178467, 5.800928115844727, 6.100483417510986, 6.400038719177246, 6.699594020843506, 6.999149322509766, 7.298705101013184, 7.598260402679443, 7.897815704345703, 8.197370529174805, 8.496926307678223, 8.796481132507324, 9.096036911010742, 9.395591735839844, 9.695147514343262, 9.994702339172363, 10.294258117675781, 10.5938138961792]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 8.0, 7.0, 11.0, 10.0, 19.0, 9.0, 17.0, 26.0, 26.0, 22.0, 26.0, 25.0, 41.0, 38.0, 41.0, 43.0, 52.0, 45.0, 45.0, 50.0, 40.0, 47.0, 31.0, 28.0, 31.0, 32.0, 31.0, 22.0, 20.0, 30.0, 22.0, 21.0, 18.0, 18.0, 8.0, 8.0, 11.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8896484375, -1.83514404296875, -1.7806396484375, -1.72613525390625, -1.671630859375, -1.61712646484375, -1.5626220703125, -1.50811767578125, -1.45361328125, -1.39910888671875, -1.3446044921875, -1.29010009765625, -1.235595703125, -1.18109130859375, -1.1265869140625, -1.07208251953125, -1.017578125, -0.96307373046875, -0.9085693359375, -0.85406494140625, -0.799560546875, -0.74505615234375, -0.6905517578125, -0.63604736328125, -0.58154296875, -0.52703857421875, -0.4725341796875, -0.41802978515625, -0.363525390625, -0.30902099609375, -0.2545166015625, -0.20001220703125, -0.1455078125, -0.09100341796875, -0.0364990234375, 0.01800537109375, 0.072509765625, 0.12701416015625, 0.1815185546875, 0.23602294921875, 0.29052734375, 0.34503173828125, 0.3995361328125, 0.45404052734375, 0.508544921875, 0.56304931640625, 0.6175537109375, 0.67205810546875, 0.7265625, 0.78106689453125, 0.8355712890625, 0.89007568359375, 0.944580078125, 0.99908447265625, 1.0535888671875, 1.10809326171875, 1.16259765625, 1.21710205078125, 1.2716064453125, 1.32611083984375, 1.380615234375, 1.43511962890625, 1.4896240234375, 1.54412841796875, 1.5986328125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 16.0, 22.0, 23.0, 44.0, 57.0, 98.0, 120.0, 193.0, 361.0, 535.0, 964.0, 1590.0, 2875.0, 4781.0, 8501.0, 15071.0, 26729.0, 49874.0, 103395.0, 245019.0, 306036.0, 141733.0, 63881.0, 33602.0, 18282.0, 10401.0, 5933.0, 3450.0, 1935.0, 1169.0, 677.0, 426.0, 263.0, 169.0, 105.0, 68.0, 38.0, 33.0, 24.0, 21.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2254638671875, -0.21923255920410156, -0.21300125122070312, -0.2067699432373047, -0.20053863525390625, -0.1943073272705078, -0.18807601928710938, -0.18184471130371094, -0.1756134033203125, -0.16938209533691406, -0.16315078735351562, -0.1569194793701172, -0.15068817138671875, -0.1444568634033203, -0.13822555541992188, -0.13199424743652344, -0.125762939453125, -0.11953163146972656, -0.11330032348632812, -0.10706901550292969, -0.10083770751953125, -0.09460639953613281, -0.08837509155273438, -0.08214378356933594, -0.0759124755859375, -0.06968116760253906, -0.06344985961914062, -0.05721855163574219, -0.05098724365234375, -0.04475593566894531, -0.038524627685546875, -0.03229331970214844, -0.02606201171875, -0.019830703735351562, -0.013599395751953125, -0.0073680877685546875, -0.00113677978515625, 0.0050945281982421875, 0.011325836181640625, 0.017557144165039062, 0.0237884521484375, 0.030019760131835938, 0.036251068115234375, 0.04248237609863281, 0.04871368408203125, 0.05494499206542969, 0.061176300048828125, 0.06740760803222656, 0.073638916015625, 0.07987022399902344, 0.08610153198242188, 0.09233283996582031, 0.09856414794921875, 0.10479545593261719, 0.11102676391601562, 0.11725807189941406, 0.1234893798828125, 0.12972068786621094, 0.13595199584960938, 0.1421833038330078, 0.14841461181640625, 0.1546459197998047, 0.16087722778320312, 0.16710853576660156, 0.17333984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 7.0, 9.0, 13.0, 21.0, 22.0, 20.0, 26.0, 20.0, 35.0, 26.0, 28.0, 23.0, 29.0, 34.0, 41.0, 50.0, 48.0, 1066.0, 50.0, 44.0, 32.0, 37.0, 35.0, 36.0, 30.0, 35.0, 22.0, 34.0, 19.0, 18.0, 22.0, 12.0, 9.0, 12.0, 7.0, 13.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.2880859375, -1.2519378662109375, -1.215789794921875, -1.1796417236328125, -1.14349365234375, -1.1073455810546875, -1.071197509765625, -1.0350494384765625, -0.9989013671875, -0.9627532958984375, -0.926605224609375, -0.8904571533203125, -0.85430908203125, -0.8181610107421875, -0.782012939453125, -0.7458648681640625, -0.709716796875, -0.6735687255859375, -0.637420654296875, -0.6012725830078125, -0.56512451171875, -0.5289764404296875, -0.492828369140625, -0.4566802978515625, -0.4205322265625, -0.3843841552734375, -0.348236083984375, -0.3120880126953125, -0.27593994140625, -0.2397918701171875, -0.203643798828125, -0.1674957275390625, -0.13134765625, -0.0951995849609375, -0.059051513671875, -0.0229034423828125, 0.01324462890625, 0.0493927001953125, 0.085540771484375, 0.1216888427734375, 0.1578369140625, 0.1939849853515625, 0.230133056640625, 0.2662811279296875, 0.30242919921875, 0.3385772705078125, 0.374725341796875, 0.4108734130859375, 0.447021484375, 0.4831695556640625, 0.519317626953125, 0.5554656982421875, 0.59161376953125, 0.6277618408203125, 0.663909912109375, 0.7000579833984375, 0.7362060546875, 0.7723541259765625, 0.808502197265625, 0.8446502685546875, 0.88079833984375, 0.9169464111328125, 0.953094482421875, 0.9892425537109375, 1.025390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 12.0, 20.0, 23.0, 34.0, 52.0, 56.0, 86.0, 118.0, 139.0, 204.0, 334.0, 413.0, 588.0, 862.0, 1291.0, 1735.0, 2651.0, 4248.0, 6790.0, 11613.0, 24023.0, 83404.0, 1703325.0, 182776.0, 34550.0, 14768.0, 8176.0, 4865.0, 3132.0, 2100.0, 1395.0, 918.0, 641.0, 496.0, 359.0, 261.0, 188.0, 125.0, 95.0, 67.0, 45.0, 35.0, 24.0, 27.0, 23.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.25439453125, -0.2468414306640625, -0.239288330078125, -0.2317352294921875, -0.22418212890625, -0.2166290283203125, -0.209075927734375, -0.2015228271484375, -0.1939697265625, -0.1864166259765625, -0.178863525390625, -0.1713104248046875, -0.16375732421875, -0.1562042236328125, -0.148651123046875, -0.1410980224609375, -0.133544921875, -0.1259918212890625, -0.118438720703125, -0.1108856201171875, -0.10333251953125, -0.0957794189453125, -0.088226318359375, -0.0806732177734375, -0.0731201171875, -0.0655670166015625, -0.058013916015625, -0.0504608154296875, -0.04290771484375, -0.0353546142578125, -0.027801513671875, -0.0202484130859375, -0.0126953125, -0.0051422119140625, 0.002410888671875, 0.0099639892578125, 0.01751708984375, 0.0250701904296875, 0.032623291015625, 0.0401763916015625, 0.0477294921875, 0.0552825927734375, 0.062835693359375, 0.0703887939453125, 0.07794189453125, 0.0854949951171875, 0.093048095703125, 0.1006011962890625, 0.108154296875, 0.1157073974609375, 0.123260498046875, 0.1308135986328125, 0.13836669921875, 0.1459197998046875, 0.153472900390625, 0.1610260009765625, 0.1685791015625, 0.1761322021484375, 0.183685302734375, 0.1912384033203125, 0.19879150390625, 0.2063446044921875, 0.213897705078125, 0.2214508056640625, 0.22900390625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 2.0, 3.0, 6.0, 8.0, 15.0, 15.0, 21.0, 31.0, 35.0, 50.0, 57.0, 70.0, 99.0, 109.0, 95.0, 70.0, 65.0, 67.0, 41.0, 34.0, 24.0, 12.0, 15.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016693115234375, -0.0160677433013916, -0.015442371368408203, -0.014816999435424805, -0.014191627502441406, -0.013566255569458008, -0.01294088363647461, -0.012315511703491211, -0.011690139770507812, -0.011064767837524414, -0.010439395904541016, -0.009814023971557617, -0.009188652038574219, -0.00856328010559082, -0.007937908172607422, -0.0073125362396240234, -0.006687164306640625, -0.0060617923736572266, -0.005436420440673828, -0.00481104850769043, -0.004185676574707031, -0.003560304641723633, -0.0029349327087402344, -0.002309560775756836, -0.0016841888427734375, -0.001058816909790039, -0.0004334449768066406, 0.0001919269561767578, 0.0008172988891601562, 0.0014426708221435547, 0.002068042755126953, 0.0026934146881103516, 0.00331878662109375, 0.0039441585540771484, 0.004569530487060547, 0.005194902420043945, 0.005820274353027344, 0.006445646286010742, 0.007071018218994141, 0.007696390151977539, 0.008321762084960938, 0.008947134017944336, 0.009572505950927734, 0.010197877883911133, 0.010823249816894531, 0.01144862174987793, 0.012073993682861328, 0.012699365615844727, 0.013324737548828125, 0.013950109481811523, 0.014575481414794922, 0.01520085334777832, 0.01582622528076172, 0.016451597213745117, 0.017076969146728516, 0.017702341079711914, 0.018327713012695312, 0.01895308494567871, 0.01957845687866211, 0.020203828811645508, 0.020829200744628906, 0.021454572677612305, 0.022079944610595703, 0.0227053165435791, 0.0233306884765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 15.0, 21.0, 27.0, 45.0, 61.0, 91.0, 170.0, 285.0, 949.0, 97336.0, 945882.0, 2690.0, 393.0, 205.0, 108.0, 59.0, 55.0, 38.0, 25.0, 20.0, 11.0, 7.0, 3.0, 5.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.464111328125, -0.45195770263671875, -0.4398040771484375, -0.42765045166015625, -0.415496826171875, -0.40334320068359375, -0.3911895751953125, -0.37903594970703125, -0.36688232421875, -0.35472869873046875, -0.3425750732421875, -0.33042144775390625, -0.318267822265625, -0.30611419677734375, -0.2939605712890625, -0.28180694580078125, -0.2696533203125, -0.25749969482421875, -0.2453460693359375, -0.23319244384765625, -0.221038818359375, -0.20888519287109375, -0.1967315673828125, -0.18457794189453125, -0.17242431640625, -0.16027069091796875, -0.1481170654296875, -0.13596343994140625, -0.123809814453125, -0.11165618896484375, -0.0995025634765625, -0.08734893798828125, -0.0751953125, -0.06304168701171875, -0.0508880615234375, -0.03873443603515625, -0.026580810546875, -0.01442718505859375, -0.0022735595703125, 0.00988006591796875, 0.02203369140625, 0.03418731689453125, 0.0463409423828125, 0.05849456787109375, 0.070648193359375, 0.08280181884765625, 0.0949554443359375, 0.10710906982421875, 0.1192626953125, 0.13141632080078125, 0.1435699462890625, 0.15572357177734375, 0.167877197265625, 0.18003082275390625, 0.1921844482421875, 0.20433807373046875, 0.21649169921875, 0.22864532470703125, 0.2407989501953125, 0.25295257568359375, 0.265106201171875, 0.27725982666015625, 0.2894134521484375, 0.30156707763671875, 0.313720703125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 41.0, 248.0, 512.0, 173.0, 29.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1556091010570526, -0.1524580419063568, -0.149306982755661, -0.1461559236049652, -0.1430048793554306, -0.1398538202047348, -0.136702761054039, -0.1335517019033432, -0.1304006427526474, -0.1272495836019516, -0.1240985319018364, -0.1209474727511406, -0.1177964136004448, -0.11464536190032959, -0.11149430274963379, -0.10834324359893799, -0.10519219189882278, -0.10204113274812698, -0.09889008104801178, -0.09573902189731598, -0.09258796274662018, -0.08943690359592438, -0.08628585189580917, -0.08313479274511337, -0.07998374104499817, -0.07683268189430237, -0.07368163019418716, -0.07053057104349136, -0.06737951189279556, -0.06422846019268036, -0.06107740104198456, -0.05792634189128876, -0.05477527901530266, -0.051624223589897156, -0.048473164439201355, -0.04532210901379585, -0.04217105358839035, -0.03901999443769455, -0.03586893901228905, -0.032717883586883545, -0.029566824436187744, -0.026415767148137093, -0.02326470986008644, -0.02011365443468094, -0.016962597146630287, -0.013811539858579636, -0.010660484433174133, -0.007509427145123482, -0.00435836985707283, -0.001207313034683466, 0.0019437437877058983, 0.005094800144433975, 0.008245857432484627, 0.011396914720535278, 0.01454797014594078, 0.017699027433991432, 0.020850084722042084, 0.024001142010092735, 0.027152199298143387, 0.03030325472354889, 0.03345431387424469, 0.03660536929965019, 0.039756424725055695, 0.042907483875751495, 0.046058539301157]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 2.0, 5.0, 12.0, 14.0, 17.0, 27.0, 21.0, 32.0, 32.0, 29.0, 45.0, 53.0, 50.0, 55.0, 41.0, 63.0, 64.0, 56.0, 56.0, 38.0, 36.0, 63.0, 33.0, 29.0, 28.0, 18.0, 22.0, 14.0, 8.0, 13.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019090771675109863, -0.018468519672751427, -0.01784626767039299, -0.017224015668034554, -0.016601763665676117, -0.01597951166331768, -0.015357259660959244, -0.014735007658600807, -0.01411275565624237, -0.013490503653883934, -0.012868251651525497, -0.01224599964916706, -0.011623747646808624, -0.011001495644450188, -0.010379243642091751, -0.009756991639733315, -0.009134739637374878, -0.008512487635016441, -0.007890235632658005, -0.007267983630299568, -0.006645731627941132, -0.006023479625582695, -0.005401227623224258, -0.004778975620865822, -0.004156723618507385, -0.0035344716161489487, -0.002912219613790512, -0.0022899676114320755, -0.001667715609073639, -0.0010454636067152023, -0.00042321160435676575, 0.00019904039800167084, 0.0008212924003601074, 0.001443544402718544, 0.0020657964050769806, 0.002688048407435417, 0.0033103004097938538, 0.00393255241215229, 0.004554804414510727, 0.0051770564168691635, 0.0057993084192276, 0.006421560421586037, 0.007043812423944473, 0.00766606442630291, 0.008288316428661346, 0.008910568431019783, 0.00953282043337822, 0.010155072435736656, 0.010777324438095093, 0.01139957644045353, 0.012021828442811966, 0.012644080445170403, 0.013266332447528839, 0.013888584449887276, 0.014510836452245712, 0.015133088454604149, 0.015755340456962585, 0.016377592459321022, 0.01699984446167946, 0.017622096464037895, 0.018244348466396332, 0.01886660046875477, 0.019488852471113205, 0.02011110447347164, 0.020733356475830078]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 8.0, 7.0, 11.0, 12.0, 18.0, 8.0, 17.0, 26.0, 26.0, 23.0, 25.0, 25.0, 42.0, 37.0, 42.0, 42.0, 52.0, 45.0, 46.0, 49.0, 41.0, 47.0, 30.0, 29.0, 30.0, 32.0, 32.0, 21.0, 20.0, 30.0, 22.0, 21.0, 18.0, 18.0, 8.0, 9.0, 10.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8896484375, -1.8351287841796875, -1.780609130859375, -1.7260894775390625, -1.67156982421875, -1.6170501708984375, -1.562530517578125, -1.5080108642578125, -1.4534912109375, -1.3989715576171875, -1.344451904296875, -1.2899322509765625, -1.23541259765625, -1.1808929443359375, -1.126373291015625, -1.0718536376953125, -1.017333984375, -0.9628143310546875, -0.908294677734375, -0.8537750244140625, -0.79925537109375, -0.7447357177734375, -0.690216064453125, -0.6356964111328125, -0.5811767578125, -0.5266571044921875, -0.472137451171875, -0.4176177978515625, -0.36309814453125, -0.3085784912109375, -0.254058837890625, -0.1995391845703125, -0.14501953125, -0.0904998779296875, -0.035980224609375, 0.0185394287109375, 0.07305908203125, 0.1275787353515625, 0.182098388671875, 0.2366180419921875, 0.2911376953125, 0.3456573486328125, 0.400177001953125, 0.4546966552734375, 0.50921630859375, 0.5637359619140625, 0.618255615234375, 0.6727752685546875, 0.727294921875, 0.7818145751953125, 0.836334228515625, 0.8908538818359375, 0.94537353515625, 0.9998931884765625, 1.054412841796875, 1.1089324951171875, 1.1634521484375, 1.2179718017578125, 1.272491455078125, 1.3270111083984375, 1.38153076171875, 1.4360504150390625, 1.490570068359375, 1.5450897216796875, 1.599609375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 4.0, 23.0, 30.0, 54.0, 69.0, 105.0, 173.0, 312.0, 526.0, 953.0, 1763.0, 3474.0, 7488.0, 17570.0, 49466.0, 303859.0, 551740.0, 70481.0, 22188.0, 9270.0, 4164.0, 2123.0, 1109.0, 602.0, 399.0, 243.0, 133.0, 66.0, 61.0, 31.0, 20.0, 14.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.7703857421875, -4.630615234375, -4.4908447265625, -4.35107421875, -4.2113037109375, -4.071533203125, -3.9317626953125, -3.7919921875, -3.6522216796875, -3.512451171875, -3.3726806640625, -3.23291015625, -3.0931396484375, -2.953369140625, -2.8135986328125, -2.673828125, -2.5340576171875, -2.394287109375, -2.2545166015625, -2.11474609375, -1.9749755859375, -1.835205078125, -1.6954345703125, -1.5556640625, -1.4158935546875, -1.276123046875, -1.1363525390625, -0.99658203125, -0.8568115234375, -0.717041015625, -0.5772705078125, -0.4375, -0.2977294921875, -0.157958984375, -0.0181884765625, 0.12158203125, 0.2613525390625, 0.401123046875, 0.5408935546875, 0.6806640625, 0.8204345703125, 0.960205078125, 1.0999755859375, 1.23974609375, 1.3795166015625, 1.519287109375, 1.6590576171875, 1.798828125, 1.9385986328125, 2.078369140625, 2.2181396484375, 2.35791015625, 2.4976806640625, 2.637451171875, 2.7772216796875, 2.9169921875, 3.0567626953125, 3.196533203125, 3.3363037109375, 3.47607421875, 3.6158447265625, 3.755615234375, 3.8953857421875, 4.03515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 14.0, 10.0, 15.0, 20.0, 22.0, 32.0, 34.0, 43.0, 54.0, 64.0, 57.0, 89.0, 187.0, 1449.0, 356.0, 148.0, 80.0, 52.0, 59.0, 50.0, 42.0, 28.0, 34.0, 23.0, 14.0, 15.0, 12.0, 7.0, 10.0, 6.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.140625, -6.95208740234375, -6.7635498046875, -6.57501220703125, -6.386474609375, -6.19793701171875, -6.0093994140625, -5.82086181640625, -5.63232421875, -5.44378662109375, -5.2552490234375, -5.06671142578125, -4.878173828125, -4.68963623046875, -4.5010986328125, -4.31256103515625, -4.1240234375, -3.93548583984375, -3.7469482421875, -3.55841064453125, -3.369873046875, -3.18133544921875, -2.9927978515625, -2.80426025390625, -2.61572265625, -2.42718505859375, -2.2386474609375, -2.05010986328125, -1.861572265625, -1.67303466796875, -1.4844970703125, -1.29595947265625, -1.107421875, -0.91888427734375, -0.7303466796875, -0.54180908203125, -0.353271484375, -0.16473388671875, 0.0238037109375, 0.21234130859375, 0.40087890625, 0.58941650390625, 0.7779541015625, 0.96649169921875, 1.155029296875, 1.34356689453125, 1.5321044921875, 1.72064208984375, 1.9091796875, 2.09771728515625, 2.2862548828125, 2.47479248046875, 2.663330078125, 2.85186767578125, 3.0404052734375, 3.22894287109375, 3.41748046875, 3.60601806640625, 3.7945556640625, 3.98309326171875, 4.171630859375, 4.36016845703125, 4.5487060546875, 4.73724365234375, 4.92578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 7.0, 16.0, 11.0, 24.0, 28.0, 30.0, 50.0, 49.0, 75.0, 96.0, 170.0, 226.0, 465.0, 2096.0, 25404.0, 2853868.0, 254834.0, 6273.0, 965.0, 343.0, 200.0, 120.0, 74.0, 64.0, 52.0, 44.0, 27.0, 21.0, 24.0, 7.0, 13.0, 9.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7734375, -10.355224609375, -9.93701171875, -9.518798828125, -9.1005859375, -8.682373046875, -8.26416015625, -7.845947265625, -7.427734375, -7.009521484375, -6.59130859375, -6.173095703125, -5.7548828125, -5.336669921875, -4.91845703125, -4.500244140625, -4.08203125, -3.663818359375, -3.24560546875, -2.827392578125, -2.4091796875, -1.990966796875, -1.57275390625, -1.154541015625, -0.736328125, -0.318115234375, 0.10009765625, 0.518310546875, 0.9365234375, 1.354736328125, 1.77294921875, 2.191162109375, 2.609375, 3.027587890625, 3.44580078125, 3.864013671875, 4.2822265625, 4.700439453125, 5.11865234375, 5.536865234375, 5.955078125, 6.373291015625, 6.79150390625, 7.209716796875, 7.6279296875, 8.046142578125, 8.46435546875, 8.882568359375, 9.30078125, 9.718994140625, 10.13720703125, 10.555419921875, 10.9736328125, 11.391845703125, 11.81005859375, 12.228271484375, 12.646484375, 13.064697265625, 13.48291015625, 13.901123046875, 14.3193359375, 14.737548828125, 15.15576171875, 15.573974609375, 15.9921875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 290.0, 679.0, 40.0], "bins": [-137.56814575195312, -135.35604858398438, -133.1439666748047, -130.93186950683594, -128.7197723388672, -126.50768280029297, -124.29559326171875, -122.08350372314453, -119.87140655517578, -117.65931701660156, -115.44721984863281, -113.2351303100586, -111.02304077148438, -108.81094360351562, -106.5988540649414, -104.38676452636719, -102.17466735839844, -99.96257781982422, -97.75048065185547, -95.53839111328125, -93.32630157470703, -91.11420440673828, -88.90211486816406, -86.69002532958984, -84.47793579101562, -82.2658462524414, -80.05374908447266, -77.84165954589844, -75.62957000732422, -73.41747283935547, -71.20538330078125, -68.99329376220703, -66.78119659423828, -64.56910705566406, -62.35701370239258, -60.144920349121094, -57.93282699584961, -55.720733642578125, -53.508644104003906, -51.29655075073242, -49.08445739746094, -46.87236404418945, -44.660274505615234, -42.44818115234375, -40.236087799072266, -38.02399444580078, -35.81190490722656, -33.59981155395508, -31.387718200683594, -29.175626754760742, -26.963533401489258, -24.751441955566406, -22.539348602294922, -20.32725715637207, -18.11516571044922, -15.90307331085205, -13.690980911254883, -11.478888511657715, -9.266796112060547, -7.054704666137695, -4.842612266540527, -2.6305198669433594, -0.4184284210205078, 1.7936639785766602, 4.00575590133667]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 14.0, 11.0, 16.0, 13.0, 18.0, 23.0, 29.0, 25.0, 31.0, 35.0, 33.0, 40.0, 47.0, 46.0, 42.0, 41.0, 40.0, 47.0, 47.0, 43.0, 32.0, 40.0, 31.0, 34.0, 24.0, 38.0, 32.0, 22.0, 19.0, 14.0, 17.0, 13.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.153592109680176, -14.691743850708008, -14.22989559173584, -13.768047332763672, -13.30620002746582, -12.844351768493652, -12.382503509521484, -11.920655250549316, -11.458806991577148, -10.99695873260498, -10.535110473632812, -10.073263168334961, -9.611414909362793, -9.149566650390625, -8.687718391418457, -8.225870132446289, -7.764022350311279, -7.302174091339111, -6.840326309204102, -6.378478050231934, -5.916629791259766, -5.454781532287598, -4.992933750152588, -4.53108549118042, -4.06923770904541, -3.6073896884918213, -3.1455414295196533, -2.6836934089660645, -2.2218451499938965, -1.7599971294403076, -1.2981491088867188, -0.8363008499145508, -0.3744525909423828, 0.08739551901817322, 0.5492436289787292, 1.011091709136963, 1.4729398488998413, 1.9347879886627197, 2.3966360092163086, 2.8584842681884766, 3.3203322887420654, 3.7821803092956543, 4.244028568267822, 4.705876350402832, 5.167724609375, 5.629572868347168, 6.091421127319336, 6.553269386291504, 7.015117168426514, 7.476965427398682, 7.938813209533691, 8.40066146850586, 8.862509727478027, 9.324357986450195, 9.786205291748047, 10.248054504394531, 10.709901809692383, 11.17175006866455, 11.633598327636719, 12.09544563293457, 12.557293891906738, 13.019142150878906, 13.480990409851074, 13.942838668823242, 14.40468692779541]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 9.0, 6.0, 11.0, 18.0, 13.0, 12.0, 16.0, 20.0, 30.0, 21.0, 30.0, 29.0, 33.0, 43.0, 35.0, 43.0, 46.0, 42.0, 36.0, 37.0, 37.0, 40.0, 35.0, 34.0, 17.0, 36.0, 36.0, 21.0, 27.0, 27.0, 21.0, 26.0, 17.0, 19.0, 10.0, 14.0, 11.0, 8.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.8671875, -1.8124847412109375, -1.757781982421875, -1.7030792236328125, -1.64837646484375, -1.5936737060546875, -1.538970947265625, -1.4842681884765625, -1.4295654296875, -1.3748626708984375, -1.320159912109375, -1.2654571533203125, -1.21075439453125, -1.1560516357421875, -1.101348876953125, -1.0466461181640625, -0.991943359375, -0.9372406005859375, -0.882537841796875, -0.8278350830078125, -0.77313232421875, -0.7184295654296875, -0.663726806640625, -0.6090240478515625, -0.5543212890625, -0.4996185302734375, -0.444915771484375, -0.3902130126953125, -0.33551025390625, -0.2808074951171875, -0.226104736328125, -0.1714019775390625, -0.11669921875, -0.0619964599609375, -0.007293701171875, 0.0474090576171875, 0.10211181640625, 0.1568145751953125, 0.211517333984375, 0.2662200927734375, 0.3209228515625, 0.3756256103515625, 0.430328369140625, 0.4850311279296875, 0.53973388671875, 0.5944366455078125, 0.649139404296875, 0.7038421630859375, 0.758544921875, 0.8132476806640625, 0.867950439453125, 0.9226531982421875, 0.97735595703125, 1.0320587158203125, 1.086761474609375, 1.1414642333984375, 1.1961669921875, 1.2508697509765625, 1.305572509765625, 1.3602752685546875, 1.41497802734375, 1.4696807861328125, 1.524383544921875, 1.5790863037109375, 1.6337890625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 8.0, 6.0, 14.0, 20.0, 30.0, 60.0, 80.0, 112.0, 216.0, 354.0, 539.0, 947.0, 1697.0, 3340.0, 7094.0, 18096.0, 64589.0, 402884.0, 2162796.0, 1285230.0, 183262.0, 38115.0, 12919.0, 5508.0, 2752.0, 1408.0, 874.0, 501.0, 325.0, 205.0, 106.0, 57.0, 46.0, 24.0, 19.0, 10.0, 4.0, 7.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.533203125, -3.422119140625, -3.31103515625, -3.199951171875, -3.0888671875, -2.977783203125, -2.86669921875, -2.755615234375, -2.64453125, -2.533447265625, -2.42236328125, -2.311279296875, -2.2001953125, -2.089111328125, -1.97802734375, -1.866943359375, -1.755859375, -1.644775390625, -1.53369140625, -1.422607421875, -1.3115234375, -1.200439453125, -1.08935546875, -0.978271484375, -0.8671875, -0.756103515625, -0.64501953125, -0.533935546875, -0.4228515625, -0.311767578125, -0.20068359375, -0.089599609375, 0.021484375, 0.132568359375, 0.24365234375, 0.354736328125, 0.4658203125, 0.576904296875, 0.68798828125, 0.799072265625, 0.91015625, 1.021240234375, 1.13232421875, 1.243408203125, 1.3544921875, 1.465576171875, 1.57666015625, 1.687744140625, 1.798828125, 1.909912109375, 2.02099609375, 2.132080078125, 2.2431640625, 2.354248046875, 2.46533203125, 2.576416015625, 2.6875, 2.798583984375, 2.90966796875, 3.020751953125, 3.1318359375, 3.242919921875, 3.35400390625, 3.465087890625, 3.576171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 9.0, 12.0, 10.0, 24.0, 21.0, 21.0, 25.0, 32.0, 30.0, 46.0, 70.0, 92.0, 138.0, 197.0, 317.0, 444.0, 635.0, 549.0, 443.0, 281.0, 172.0, 154.0, 102.0, 67.0, 42.0, 36.0, 19.0, 22.0, 21.0, 6.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.5703125, -3.46832275390625, -3.3663330078125, -3.26434326171875, -3.162353515625, -3.06036376953125, -2.9583740234375, -2.85638427734375, -2.75439453125, -2.65240478515625, -2.5504150390625, -2.44842529296875, -2.346435546875, -2.24444580078125, -2.1424560546875, -2.04046630859375, -1.9384765625, -1.83648681640625, -1.7344970703125, -1.63250732421875, -1.530517578125, -1.42852783203125, -1.3265380859375, -1.22454833984375, -1.12255859375, -1.02056884765625, -0.9185791015625, -0.81658935546875, -0.714599609375, -0.61260986328125, -0.5106201171875, -0.40863037109375, -0.306640625, -0.20465087890625, -0.1026611328125, -0.00067138671875, 0.101318359375, 0.20330810546875, 0.3052978515625, 0.40728759765625, 0.50927734375, 0.61126708984375, 0.7132568359375, 0.81524658203125, 0.917236328125, 1.01922607421875, 1.1212158203125, 1.22320556640625, 1.3251953125, 1.42718505859375, 1.5291748046875, 1.63116455078125, 1.733154296875, 1.83514404296875, 1.9371337890625, 2.03912353515625, 2.14111328125, 2.24310302734375, 2.3450927734375, 2.44708251953125, 2.549072265625, 2.65106201171875, 2.7530517578125, 2.85504150390625, 2.95703125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 15.0, 22.0, 33.0, 40.0, 54.0, 80.0, 142.0, 194.0, 396.0, 849.0, 2539.0, 13479.0, 187421.0, 3811258.0, 161018.0, 12541.0, 2377.0, 801.0, 356.0, 202.0, 120.0, 68.0, 53.0, 29.0, 38.0, 25.0, 23.0, 22.0, 12.0, 17.0, 4.0, 2.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.060791015625, -9.70751953125, -9.354248046875, -9.0009765625, -8.647705078125, -8.29443359375, -7.941162109375, -7.587890625, -7.234619140625, -6.88134765625, -6.528076171875, -6.1748046875, -5.821533203125, -5.46826171875, -5.114990234375, -4.76171875, -4.408447265625, -4.05517578125, -3.701904296875, -3.3486328125, -2.995361328125, -2.64208984375, -2.288818359375, -1.935546875, -1.582275390625, -1.22900390625, -0.875732421875, -0.5224609375, -0.169189453125, 0.18408203125, 0.537353515625, 0.890625, 1.243896484375, 1.59716796875, 1.950439453125, 2.3037109375, 2.656982421875, 3.01025390625, 3.363525390625, 3.716796875, 4.070068359375, 4.42333984375, 4.776611328125, 5.1298828125, 5.483154296875, 5.83642578125, 6.189697265625, 6.54296875, 6.896240234375, 7.24951171875, 7.602783203125, 7.9560546875, 8.309326171875, 8.66259765625, 9.015869140625, 9.369140625, 9.722412109375, 10.07568359375, 10.428955078125, 10.7822265625, 11.135498046875, 11.48876953125, 11.842041015625, 12.1953125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 25.0, 109.0, 387.0, 381.0, 91.0, 18.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.964784622192383, -27.04119300842285, -25.117603302001953, -23.194011688232422, -21.27042007446289, -19.346830368041992, -17.42323875427246, -15.499648094177246, -13.576057434082031, -11.652466773986816, -9.728876113891602, -7.80528450012207, -5.8816938400268555, -3.9581031799316406, -2.0345115661621094, -0.11092090606689453, 1.8126697540283203, 3.7362606525421143, 5.659851551055908, 7.583442687988281, 9.507033348083496, 11.430624008178711, 13.354215621948242, 15.277806282043457, 17.201396942138672, 19.124988555908203, 21.0485782623291, 22.972169876098633, 24.89575958251953, 26.819351196289062, 28.742942810058594, 30.666534423828125, 32.590126037597656, 34.51371765136719, 36.43730926513672, 38.36090087890625, 40.284488677978516, 42.20808029174805, 44.13167190551758, 46.05526351928711, 47.978851318359375, 49.902442932128906, 51.82603454589844, 53.74962615966797, 55.673213958740234, 57.596805572509766, 59.5203971862793, 61.44398880004883, 63.36758041381836, 65.29116821289062, 67.21475982666016, 69.13835144042969, 71.06194305419922, 72.98553466796875, 74.90912628173828, 76.83271789550781, 78.75630950927734, 80.67990112304688, 82.6034927368164, 84.52708435058594, 86.45067596435547, 88.374267578125, 90.2978515625, 92.22144317626953, 94.14503479003906]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 18.0, 10.0, 17.0, 17.0, 18.0, 22.0, 27.0, 17.0, 27.0, 32.0, 39.0, 36.0, 36.0, 42.0, 40.0, 49.0, 39.0, 52.0, 44.0, 45.0, 47.0, 42.0, 36.0, 34.0, 27.0, 30.0, 18.0, 22.0, 25.0, 12.0, 18.0, 13.0, 10.0, 7.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.081873893737793, -12.705885887145996, -12.3298978805542, -11.953910827636719, -11.577922821044922, -11.201934814453125, -10.825946807861328, -10.449958801269531, -10.073970794677734, -9.697982788085938, -9.32199478149414, -8.946006774902344, -8.570019721984863, -8.194031715393066, -7.8180437088012695, -7.442055702209473, -7.066068172454834, -6.690080165863037, -6.314092636108398, -5.938104629516602, -5.562116622924805, -5.186128616333008, -4.810141086578369, -4.434153079986572, -4.058165550231934, -3.682177782058716, -3.306189775466919, -2.930202007293701, -2.5542140007019043, -2.1782262325286865, -1.8022384643554688, -1.4262504577636719, -1.050262451171875, -0.6742745637893677, -0.2982867360115051, 0.07770109176635742, 0.45368897914886475, 0.8296768665313721, 1.2056646347045898, 1.5816526412963867, 1.9576404094696045, 2.3336281776428223, 2.709616184234619, 3.085603952407837, 3.4615917205810547, 3.8375797271728516, 4.213567733764648, 4.589555740356445, 4.965543270111084, 5.341531276702881, 5.7175188064575195, 6.093506813049316, 6.469494819641113, 6.84548282623291, 7.221470355987549, 7.597458362579346, 7.973445892333984, 8.349433898925781, 8.725421905517578, 9.101409912109375, 9.477396965026855, 9.853384971618652, 10.22937297821045, 10.605360984802246, 10.981348991394043]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 10.0, 5.0, 5.0, 11.0, 4.0, 11.0, 14.0, 8.0, 19.0, 15.0, 21.0, 32.0, 24.0, 24.0, 38.0, 31.0, 36.0, 45.0, 43.0, 37.0, 51.0, 33.0, 43.0, 36.0, 43.0, 41.0, 38.0, 33.0, 30.0, 28.0, 37.0, 25.0, 25.0, 15.0, 17.0, 18.0, 13.0, 7.0, 7.0, 7.0, 10.0, 7.0, 1.0, 1.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.912109375, -1.8584136962890625, -1.804718017578125, -1.7510223388671875, -1.69732666015625, -1.6436309814453125, -1.589935302734375, -1.5362396240234375, -1.4825439453125, -1.4288482666015625, -1.375152587890625, -1.3214569091796875, -1.26776123046875, -1.2140655517578125, -1.160369873046875, -1.1066741943359375, -1.052978515625, -0.9992828369140625, -0.945587158203125, -0.8918914794921875, -0.83819580078125, -0.7845001220703125, -0.730804443359375, -0.6771087646484375, -0.6234130859375, -0.5697174072265625, -0.516021728515625, -0.4623260498046875, -0.40863037109375, -0.3549346923828125, -0.301239013671875, -0.2475433349609375, -0.19384765625, -0.1401519775390625, -0.086456298828125, -0.0327606201171875, 0.02093505859375, 0.0746307373046875, 0.128326416015625, 0.1820220947265625, 0.2357177734375, 0.2894134521484375, 0.343109130859375, 0.3968048095703125, 0.45050048828125, 0.5041961669921875, 0.557891845703125, 0.6115875244140625, 0.665283203125, 0.7189788818359375, 0.772674560546875, 0.8263702392578125, 0.88006591796875, 0.9337615966796875, 0.987457275390625, 1.0411529541015625, 1.0948486328125, 1.1485443115234375, 1.202239990234375, 1.2559356689453125, 1.30963134765625, 1.3633270263671875, 1.417022705078125, 1.4707183837890625, 1.5244140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 7.0, 17.0, 22.0, 27.0, 56.0, 76.0, 108.0, 195.0, 290.0, 437.0, 701.0, 1100.0, 1715.0, 2725.0, 4203.0, 6236.0, 10149.0, 15776.0, 25372.0, 41814.0, 73441.0, 139865.0, 246891.0, 212506.0, 111167.0, 59895.0, 35096.0, 21080.0, 13374.0, 8490.0, 5608.0, 3595.0, 2365.0, 1473.0, 960.0, 612.0, 399.0, 263.0, 153.0, 96.0, 61.0, 46.0, 33.0, 10.0, 16.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.176025390625, -0.171112060546875, -0.16619873046875, -0.161285400390625, -0.1563720703125, -0.151458740234375, -0.14654541015625, -0.141632080078125, -0.13671875, -0.131805419921875, -0.12689208984375, -0.121978759765625, -0.1170654296875, -0.112152099609375, -0.10723876953125, -0.102325439453125, -0.097412109375, -0.092498779296875, -0.08758544921875, -0.082672119140625, -0.0777587890625, -0.072845458984375, -0.06793212890625, -0.063018798828125, -0.05810546875, -0.053192138671875, -0.04827880859375, -0.043365478515625, -0.0384521484375, -0.033538818359375, -0.02862548828125, -0.023712158203125, -0.018798828125, -0.013885498046875, -0.00897216796875, -0.004058837890625, 0.0008544921875, 0.005767822265625, 0.01068115234375, 0.015594482421875, 0.0205078125, 0.025421142578125, 0.03033447265625, 0.035247802734375, 0.0401611328125, 0.045074462890625, 0.04998779296875, 0.054901123046875, 0.059814453125, 0.064727783203125, 0.06964111328125, 0.074554443359375, 0.0794677734375, 0.084381103515625, 0.08929443359375, 0.094207763671875, 0.09912109375, 0.104034423828125, 0.10894775390625, 0.113861083984375, 0.1187744140625, 0.123687744140625, 0.12860107421875, 0.133514404296875, 0.138427734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 1.0, 6.0, 7.0, 6.0, 7.0, 18.0, 11.0, 18.0, 20.0, 24.0, 27.0, 28.0, 32.0, 39.0, 28.0, 36.0, 54.0, 52.0, 47.0, 1059.0, 43.0, 35.0, 42.0, 37.0, 43.0, 32.0, 36.0, 30.0, 31.0, 22.0, 31.0, 13.0, 18.0, 12.0, 19.0, 14.0, 8.0, 10.0, 6.0, 2.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.240234375, -1.2025299072265625, -1.164825439453125, -1.1271209716796875, -1.08941650390625, -1.0517120361328125, -1.014007568359375, -0.9763031005859375, -0.9385986328125, -0.9008941650390625, -0.863189697265625, -0.8254852294921875, -0.78778076171875, -0.7500762939453125, -0.712371826171875, -0.6746673583984375, -0.636962890625, -0.5992584228515625, -0.561553955078125, -0.5238494873046875, -0.48614501953125, -0.4484405517578125, -0.410736083984375, -0.3730316162109375, -0.3353271484375, -0.2976226806640625, -0.259918212890625, -0.2222137451171875, -0.18450927734375, -0.1468048095703125, -0.109100341796875, -0.0713958740234375, -0.03369140625, 0.0040130615234375, 0.041717529296875, 0.0794219970703125, 0.11712646484375, 0.1548309326171875, 0.192535400390625, 0.2302398681640625, 0.2679443359375, 0.3056488037109375, 0.343353271484375, 0.3810577392578125, 0.41876220703125, 0.4564666748046875, 0.494171142578125, 0.5318756103515625, 0.569580078125, 0.6072845458984375, 0.644989013671875, 0.6826934814453125, 0.72039794921875, 0.7581024169921875, 0.795806884765625, 0.8335113525390625, 0.8712158203125, 0.9089202880859375, 0.946624755859375, 0.9843292236328125, 1.02203369140625, 1.0597381591796875, 1.097442626953125, 1.1351470947265625, 1.1728515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 7.0, 7.0, 8.0, 13.0, 10.0, 26.0, 28.0, 34.0, 59.0, 78.0, 101.0, 141.0, 201.0, 267.0, 415.0, 531.0, 866.0, 1194.0, 1724.0, 2736.0, 4146.0, 6647.0, 11720.0, 24952.0, 101334.0, 1747985.0, 130946.0, 28165.0, 12572.0, 6996.0, 4445.0, 2736.0, 1825.0, 1291.0, 859.0, 651.0, 424.0, 268.0, 208.0, 148.0, 110.0, 80.0, 45.0, 38.0, 25.0, 25.0, 12.0, 12.0, 6.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.24560546875, -0.23806190490722656, -0.23051834106445312, -0.2229747772216797, -0.21543121337890625, -0.2078876495361328, -0.20034408569335938, -0.19280052185058594, -0.1852569580078125, -0.17771339416503906, -0.17016983032226562, -0.1626262664794922, -0.15508270263671875, -0.1475391387939453, -0.13999557495117188, -0.13245201110839844, -0.124908447265625, -0.11736488342285156, -0.10982131958007812, -0.10227775573730469, -0.09473419189453125, -0.08719062805175781, -0.07964706420898438, -0.07210350036621094, -0.0645599365234375, -0.05701637268066406, -0.049472808837890625, -0.04192924499511719, -0.03438568115234375, -0.026842117309570312, -0.019298553466796875, -0.011754989624023438, -0.00421142578125, 0.0033321380615234375, 0.010875701904296875, 0.018419265747070312, 0.02596282958984375, 0.03350639343261719, 0.041049957275390625, 0.04859352111816406, 0.0561370849609375, 0.06368064880371094, 0.07122421264648438, 0.07876777648925781, 0.08631134033203125, 0.09385490417480469, 0.10139846801757812, 0.10894203186035156, 0.116485595703125, 0.12402915954589844, 0.13157272338867188, 0.1391162872314453, 0.14665985107421875, 0.1542034149169922, 0.16174697875976562, 0.16929054260253906, 0.1768341064453125, 0.18437767028808594, 0.19192123413085938, 0.1994647979736328, 0.20700836181640625, 0.2145519256591797, 0.22209548950195312, 0.22963905334472656, 0.2371826171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 9.0, 3.0, 17.0, 13.0, 17.0, 25.0, 26.0, 36.0, 35.0, 42.0, 51.0, 62.0, 61.0, 61.0, 62.0, 67.0, 56.0, 53.0, 53.0, 50.0, 34.0, 41.0, 19.0, 18.0, 22.0, 11.0, 10.0, 8.0, 6.0, 4.0, 7.0, 3.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01386260986328125, -0.013446688652038574, -0.013030767440795898, -0.012614846229553223, -0.012198925018310547, -0.011783003807067871, -0.011367082595825195, -0.01095116138458252, -0.010535240173339844, -0.010119318962097168, -0.009703397750854492, -0.009287476539611816, -0.00887155532836914, -0.008455634117126465, -0.008039712905883789, -0.007623791694641113, -0.0072078704833984375, -0.006791949272155762, -0.006376028060913086, -0.00596010684967041, -0.005544185638427734, -0.005128264427185059, -0.004712343215942383, -0.004296422004699707, -0.0038805007934570312, -0.0034645795822143555, -0.0030486583709716797, -0.002632737159729004, -0.002216815948486328, -0.0018008947372436523, -0.0013849735260009766, -0.0009690523147583008, -0.000553131103515625, -0.00013720989227294922, 0.00027871131896972656, 0.0006946325302124023, 0.0011105537414550781, 0.001526474952697754, 0.0019423961639404297, 0.0023583173751831055, 0.0027742385864257812, 0.003190159797668457, 0.003606081008911133, 0.004022002220153809, 0.004437923431396484, 0.00485384464263916, 0.005269765853881836, 0.005685687065124512, 0.0061016082763671875, 0.006517529487609863, 0.006933450698852539, 0.007349371910095215, 0.007765293121337891, 0.008181214332580566, 0.008597135543823242, 0.009013056755065918, 0.009428977966308594, 0.00984489917755127, 0.010260820388793945, 0.010676741600036621, 0.011092662811279297, 0.011508584022521973, 0.011924505233764648, 0.012340426445007324, 0.01275634765625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 16.0, 16.0, 22.0, 25.0, 39.0, 60.0, 68.0, 107.0, 168.0, 326.0, 974.0, 130210.0, 912699.0, 2664.0, 463.0, 211.0, 131.0, 80.0, 46.0, 51.0, 31.0, 25.0, 26.0, 13.0, 14.0, 8.0, 7.0, 4.0, 1.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.25092315673828125, -0.2423248291015625, -0.23372650146484375, -0.225128173828125, -0.21652984619140625, -0.2079315185546875, -0.19933319091796875, -0.19073486328125, -0.18213653564453125, -0.1735382080078125, -0.16493988037109375, -0.156341552734375, -0.14774322509765625, -0.1391448974609375, -0.13054656982421875, -0.1219482421875, -0.11334991455078125, -0.1047515869140625, -0.09615325927734375, -0.087554931640625, -0.07895660400390625, -0.0703582763671875, -0.06175994873046875, -0.05316162109375, -0.04456329345703125, -0.0359649658203125, -0.02736663818359375, -0.018768310546875, -0.01016998291015625, -0.0015716552734375, 0.00702667236328125, 0.015625, 0.02422332763671875, 0.0328216552734375, 0.04141998291015625, 0.050018310546875, 0.05861663818359375, 0.0672149658203125, 0.07581329345703125, 0.08441162109375, 0.09300994873046875, 0.1016082763671875, 0.11020660400390625, 0.118804931640625, 0.12740325927734375, 0.1360015869140625, 0.14459991455078125, 0.1531982421875, 0.16179656982421875, 0.1703948974609375, 0.17899322509765625, 0.187591552734375, 0.19618988037109375, 0.2047882080078125, 0.21338653564453125, 0.22198486328125, 0.23058319091796875, 0.2391815185546875, 0.24777984619140625, 0.256378173828125, 0.26497650146484375, 0.2735748291015625, 0.28217315673828125, 0.290771484375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 16.0, 29.0, 53.0, 81.0, 140.0, 173.0, 191.0, 120.0, 79.0, 40.0, 30.0, 22.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028109299018979073, -0.027230020612478256, -0.02635074220597744, -0.025471463799476624, -0.024592185392975807, -0.02371290698647499, -0.022833628579974174, -0.021954350173473358, -0.021075071766972542, -0.020195793360471725, -0.01931651495397091, -0.018437236547470093, -0.017557958140969276, -0.01667867973446846, -0.015799401327967644, -0.014920122921466827, -0.014040844514966011, -0.013161566108465195, -0.012282287701964378, -0.011403009295463562, -0.010523730888962746, -0.00964445248246193, -0.008765174075961113, -0.007885895669460297, -0.00700661726295948, -0.006127338856458664, -0.005248060449957848, -0.004368782043457031, -0.003489503636956215, -0.0026102252304553986, -0.0017309468239545822, -0.0008516684174537659, 2.7609989047050476e-05, 0.0009068883955478668, 0.0017861668020486832, 0.0026654452085494995, 0.003544723615050316, 0.004424002021551132, 0.0053032804280519485, 0.006182558834552765, 0.007061837241053581, 0.007941115647554398, 0.008820394054055214, 0.00969967246055603, 0.010578950867056847, 0.011458229273557663, 0.01233750768005848, 0.013216786086559296, 0.014096064493060112, 0.014975342899560928, 0.015854621306061745, 0.01673389971256256, 0.017613178119063377, 0.018492456525564194, 0.01937173493206501, 0.020251013338565826, 0.021130291745066643, 0.02200957015156746, 0.022888848558068275, 0.023768126964569092, 0.024647405371069908, 0.025526683777570724, 0.02640596218407154, 0.027285240590572357, 0.028164518997073174]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 7.0, 16.0, 23.0, 30.0, 34.0, 38.0, 39.0, 49.0, 55.0, 69.0, 63.0, 64.0, 43.0, 55.0, 50.0, 50.0, 52.0, 42.0, 43.0, 29.0, 33.0, 23.0, 23.0, 17.0, 11.0, 7.0, 5.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01929992437362671, -0.018780957907438278, -0.018261991441249847, -0.017743024975061417, -0.017224058508872986, -0.016705092042684555, -0.016186125576496124, -0.015667159110307693, -0.015148192644119263, -0.014629226177930832, -0.014110259711742401, -0.01359129324555397, -0.01307232677936554, -0.012553360313177109, -0.012034393846988678, -0.011515427380800247, -0.010996460914611816, -0.010477494448423386, -0.009958527982234955, -0.009439561516046524, -0.008920595049858093, -0.008401628583669662, -0.007882662117481232, -0.007363695651292801, -0.00684472918510437, -0.006325762718915939, -0.0058067962527275085, -0.005287829786539078, -0.004768863320350647, -0.004249896854162216, -0.0037309303879737854, -0.0032119639217853546, -0.002692997455596924, -0.002174030989408493, -0.0016550645232200623, -0.0011360980570316315, -0.0006171315908432007, -9.81651246547699e-05, 0.0004208013415336609, 0.0009397678077220917, 0.0014587342739105225, 0.0019777007400989532, 0.002496667206287384, 0.003015633672475815, 0.0035346001386642456, 0.004053566604852676, 0.004572533071041107, 0.005091499537229538, 0.005610466003417969, 0.0061294324696063995, 0.00664839893579483, 0.007167365401983261, 0.007686331868171692, 0.008205298334360123, 0.008724264800548553, 0.009243231266736984, 0.009762197732925415, 0.010281164199113846, 0.010800130665302277, 0.011319097131490707, 0.011838063597679138, 0.012357030063867569, 0.012875996530056, 0.01339496299624443, 0.013913929462432861]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 9.0, 5.0, 5.0, 11.0, 5.0, 11.0, 13.0, 8.0, 19.0, 15.0, 20.0, 33.0, 24.0, 23.0, 39.0, 32.0, 35.0, 45.0, 42.0, 38.0, 52.0, 32.0, 44.0, 35.0, 43.0, 39.0, 40.0, 33.0, 30.0, 28.0, 37.0, 25.0, 25.0, 15.0, 17.0, 18.0, 13.0, 7.0, 7.0, 7.0, 10.0, 7.0, 1.0, 1.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.912109375, -1.8584136962890625, -1.804718017578125, -1.7510223388671875, -1.69732666015625, -1.6436309814453125, -1.589935302734375, -1.5362396240234375, -1.4825439453125, -1.4288482666015625, -1.375152587890625, -1.3214569091796875, -1.26776123046875, -1.2140655517578125, -1.160369873046875, -1.1066741943359375, -1.052978515625, -0.9992828369140625, -0.945587158203125, -0.8918914794921875, -0.83819580078125, -0.7845001220703125, -0.730804443359375, -0.6771087646484375, -0.6234130859375, -0.5697174072265625, -0.516021728515625, -0.4623260498046875, -0.40863037109375, -0.3549346923828125, -0.301239013671875, -0.2475433349609375, -0.19384765625, -0.1401519775390625, -0.086456298828125, -0.0327606201171875, 0.02093505859375, 0.0746307373046875, 0.128326416015625, 0.1820220947265625, 0.2357177734375, 0.2894134521484375, 0.343109130859375, 0.3968048095703125, 0.45050048828125, 0.5041961669921875, 0.557891845703125, 0.6115875244140625, 0.665283203125, 0.7189788818359375, 0.772674560546875, 0.8263702392578125, 0.88006591796875, 0.9337615966796875, 0.987457275390625, 1.0411529541015625, 1.0948486328125, 1.1485443115234375, 1.202239990234375, 1.2559356689453125, 1.30963134765625, 1.3633270263671875, 1.417022705078125, 1.4707183837890625, 1.5244140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 9.0, 42.0, 57.0, 73.0, 144.0, 227.0, 327.0, 554.0, 1012.0, 1815.0, 3635.0, 7132.0, 14861.0, 33509.0, 85410.0, 277150.0, 408084.0, 127956.0, 47137.0, 19972.0, 9148.0, 4706.0, 2537.0, 1259.0, 701.0, 417.0, 250.0, 161.0, 95.0, 52.0, 30.0, 25.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7265625, -2.6444091796875, -2.562255859375, -2.4801025390625, -2.39794921875, -2.3157958984375, -2.233642578125, -2.1514892578125, -2.0693359375, -1.9871826171875, -1.905029296875, -1.8228759765625, -1.74072265625, -1.6585693359375, -1.576416015625, -1.4942626953125, -1.412109375, -1.3299560546875, -1.247802734375, -1.1656494140625, -1.08349609375, -1.0013427734375, -0.919189453125, -0.8370361328125, -0.7548828125, -0.6727294921875, -0.590576171875, -0.5084228515625, -0.42626953125, -0.3441162109375, -0.261962890625, -0.1798095703125, -0.09765625, -0.0155029296875, 0.066650390625, 0.1488037109375, 0.23095703125, 0.3131103515625, 0.395263671875, 0.4774169921875, 0.5595703125, 0.6417236328125, 0.723876953125, 0.8060302734375, 0.88818359375, 0.9703369140625, 1.052490234375, 1.1346435546875, 1.216796875, 1.2989501953125, 1.381103515625, 1.4632568359375, 1.54541015625, 1.6275634765625, 1.709716796875, 1.7918701171875, 1.8740234375, 1.9561767578125, 2.038330078125, 2.1204833984375, 2.20263671875, 2.2847900390625, 2.366943359375, 2.4490966796875, 2.53125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 8.0, 14.0, 11.0, 18.0, 14.0, 15.0, 32.0, 31.0, 41.0, 36.0, 48.0, 37.0, 71.0, 73.0, 138.0, 358.0, 1425.0, 175.0, 88.0, 58.0, 43.0, 43.0, 30.0, 26.0, 29.0, 22.0, 21.0, 25.0, 17.0, 22.0, 14.0, 8.0, 7.0, 8.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.9019775390625, -4.733642578125, -4.5653076171875, -4.39697265625, -4.2286376953125, -4.060302734375, -3.8919677734375, -3.7236328125, -3.5552978515625, -3.386962890625, -3.2186279296875, -3.05029296875, -2.8819580078125, -2.713623046875, -2.5452880859375, -2.376953125, -2.2086181640625, -2.040283203125, -1.8719482421875, -1.70361328125, -1.5352783203125, -1.366943359375, -1.1986083984375, -1.0302734375, -0.8619384765625, -0.693603515625, -0.5252685546875, -0.35693359375, -0.1885986328125, -0.020263671875, 0.1480712890625, 0.31640625, 0.4847412109375, 0.653076171875, 0.8214111328125, 0.98974609375, 1.1580810546875, 1.326416015625, 1.4947509765625, 1.6630859375, 1.8314208984375, 1.999755859375, 2.1680908203125, 2.33642578125, 2.5047607421875, 2.673095703125, 2.8414306640625, 3.009765625, 3.1781005859375, 3.346435546875, 3.5147705078125, 3.68310546875, 3.8514404296875, 4.019775390625, 4.1881103515625, 4.3564453125, 4.5247802734375, 4.693115234375, 4.8614501953125, 5.02978515625, 5.1981201171875, 5.366455078125, 5.5347900390625, 5.703125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 10.0, 6.0, 12.0, 15.0, 16.0, 19.0, 35.0, 46.0, 45.0, 62.0, 86.0, 107.0, 201.0, 358.0, 761.0, 2296.0, 10886.0, 117957.0, 2752767.0, 238903.0, 16084.0, 3013.0, 881.0, 375.0, 234.0, 154.0, 105.0, 50.0, 53.0, 42.0, 32.0, 28.0, 21.0, 9.0, 10.0, 7.0, 7.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8125, -7.5728759765625, -7.333251953125, -7.0936279296875, -6.85400390625, -6.6143798828125, -6.374755859375, -6.1351318359375, -5.8955078125, -5.6558837890625, -5.416259765625, -5.1766357421875, -4.93701171875, -4.6973876953125, -4.457763671875, -4.2181396484375, -3.978515625, -3.7388916015625, -3.499267578125, -3.2596435546875, -3.02001953125, -2.7803955078125, -2.540771484375, -2.3011474609375, -2.0615234375, -1.8218994140625, -1.582275390625, -1.3426513671875, -1.10302734375, -0.8634033203125, -0.623779296875, -0.3841552734375, -0.14453125, 0.0950927734375, 0.334716796875, 0.5743408203125, 0.81396484375, 1.0535888671875, 1.293212890625, 1.5328369140625, 1.7724609375, 2.0120849609375, 2.251708984375, 2.4913330078125, 2.73095703125, 2.9705810546875, 3.210205078125, 3.4498291015625, 3.689453125, 3.9290771484375, 4.168701171875, 4.4083251953125, 4.64794921875, 4.8875732421875, 5.127197265625, 5.3668212890625, 5.6064453125, 5.8460693359375, 6.085693359375, 6.3253173828125, 6.56494140625, 6.8045654296875, 7.044189453125, 7.2838134765625, 7.5234375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 41.0, 556.0, 401.0, 17.0, 0.0, 0.0, 1.0, 1.0], "bins": [-123.47514343261719, -121.34172821044922, -119.20831298828125, -117.07489776611328, -114.94148254394531, -112.80806732177734, -110.67465209960938, -108.5412368774414, -106.40782165527344, -104.27440643310547, -102.1409912109375, -100.00757598876953, -97.87416076660156, -95.7407455444336, -93.60733032226562, -91.47391510009766, -89.34049987792969, -87.20708465576172, -85.07366943359375, -82.94025421142578, -80.80683898925781, -78.67342376708984, -76.54000854492188, -74.4065933227539, -72.27317810058594, -70.13976287841797, -68.00634765625, -65.87293243408203, -63.73951721191406, -61.606101989746094, -59.472686767578125, -57.339271545410156, -55.20586395263672, -53.07244873046875, -50.93903350830078, -48.80561828613281, -46.672203063964844, -44.538787841796875, -42.405372619628906, -40.27195739746094, -38.13854217529297, -36.005126953125, -33.87171173095703, -31.738296508789062, -29.604881286621094, -27.471466064453125, -25.338050842285156, -23.204635620117188, -21.07122039794922, -18.93780517578125, -16.80438995361328, -14.670974731445312, -12.537559509277344, -10.404144287109375, -8.270729064941406, -6.1373138427734375, -4.003898620605469, -1.8704833984375, 0.26293182373046875, 2.3963470458984375, 4.529762268066406, 6.663177490234375, 8.796592712402344, 10.930007934570312, 13.063423156738281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 5.0, 11.0, 21.0, 12.0, 17.0, 15.0, 22.0, 28.0, 24.0, 26.0, 29.0, 41.0, 40.0, 31.0, 38.0, 42.0, 43.0, 52.0, 40.0, 51.0, 39.0, 34.0, 38.0, 33.0, 39.0, 29.0, 29.0, 26.0, 25.0, 21.0, 13.0, 8.0, 12.0, 12.0, 10.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.946799278259277, -11.505130767822266, -11.063461303710938, -10.62179183959961, -10.180123329162598, -9.738454818725586, -9.296785354614258, -8.85511589050293, -8.413447380065918, -7.971778392791748, -7.530109405517578, -7.088440418243408, -6.646771430969238, -6.205102443695068, -5.763433456420898, -5.3217644691467285, -4.880095481872559, -4.438426494598389, -3.9967575073242188, -3.555088520050049, -3.113419532775879, -2.671750545501709, -2.230081558227539, -1.7884125709533691, -1.3467435836791992, -0.9050745964050293, -0.4634056091308594, -0.021736621856689453, 0.41993236541748047, 0.8616013526916504, 1.3032703399658203, 1.7449393272399902, 2.1866092681884766, 2.6282782554626465, 3.0699472427368164, 3.5116162300109863, 3.9532852172851562, 4.394954204559326, 4.836623191833496, 5.278292179107666, 5.719961166381836, 6.161630153656006, 6.603299140930176, 7.044968128204346, 7.486637115478516, 7.9283061027526855, 8.369975090026855, 8.811643600463867, 9.253313064575195, 9.694982528686523, 10.136651039123535, 10.578319549560547, 11.019989013671875, 11.461658477783203, 11.903326988220215, 12.344995498657227, 12.786664962768555, 13.228334426879883, 13.670002937316895, 14.111671447753906, 14.553340911865234, 14.995010375976562, 15.436678886413574, 15.878347396850586, 16.320016860961914]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 9.0, 15.0, 10.0, 13.0, 18.0, 25.0, 25.0, 17.0, 27.0, 37.0, 39.0, 41.0, 52.0, 40.0, 47.0, 37.0, 36.0, 44.0, 41.0, 53.0, 29.0, 41.0, 29.0, 30.0, 31.0, 32.0, 26.0, 25.0, 23.0, 19.0, 11.0, 10.0, 8.0, 7.0, 7.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.083984375, -2.0269775390625, -1.969970703125, -1.9129638671875, -1.85595703125, -1.7989501953125, -1.741943359375, -1.6849365234375, -1.6279296875, -1.5709228515625, -1.513916015625, -1.4569091796875, -1.39990234375, -1.3428955078125, -1.285888671875, -1.2288818359375, -1.171875, -1.1148681640625, -1.057861328125, -1.0008544921875, -0.94384765625, -0.8868408203125, -0.829833984375, -0.7728271484375, -0.7158203125, -0.6588134765625, -0.601806640625, -0.5447998046875, -0.48779296875, -0.4307861328125, -0.373779296875, -0.3167724609375, -0.259765625, -0.2027587890625, -0.145751953125, -0.0887451171875, -0.03173828125, 0.0252685546875, 0.082275390625, 0.1392822265625, 0.1962890625, 0.2532958984375, 0.310302734375, 0.3673095703125, 0.42431640625, 0.4813232421875, 0.538330078125, 0.5953369140625, 0.65234375, 0.7093505859375, 0.766357421875, 0.8233642578125, 0.88037109375, 0.9373779296875, 0.994384765625, 1.0513916015625, 1.1083984375, 1.1654052734375, 1.222412109375, 1.2794189453125, 1.33642578125, 1.3934326171875, 1.450439453125, 1.5074462890625, 1.564453125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 4.0, 9.0, 11.0, 12.0, 12.0, 13.0, 24.0, 31.0, 68.0, 77.0, 153.0, 326.0, 562.0, 1154.0, 2237.0, 4900.0, 13972.0, 66300.0, 984143.0, 2881900.0, 196794.0, 26923.0, 8005.0, 3236.0, 1622.0, 783.0, 397.0, 240.0, 143.0, 72.0, 51.0, 31.0, 17.0, 10.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-6.3671875, -6.20892333984375, -6.0506591796875, -5.89239501953125, -5.734130859375, -5.57586669921875, -5.4176025390625, -5.25933837890625, -5.10107421875, -4.94281005859375, -4.7845458984375, -4.62628173828125, -4.468017578125, -4.30975341796875, -4.1514892578125, -3.99322509765625, -3.8349609375, -3.67669677734375, -3.5184326171875, -3.36016845703125, -3.201904296875, -3.04364013671875, -2.8853759765625, -2.72711181640625, -2.56884765625, -2.41058349609375, -2.2523193359375, -2.09405517578125, -1.935791015625, -1.77752685546875, -1.6192626953125, -1.46099853515625, -1.302734375, -1.14447021484375, -0.9862060546875, -0.82794189453125, -0.669677734375, -0.51141357421875, -0.3531494140625, -0.19488525390625, -0.03662109375, 0.12164306640625, 0.2799072265625, 0.43817138671875, 0.596435546875, 0.75469970703125, 0.9129638671875, 1.07122802734375, 1.2294921875, 1.38775634765625, 1.5460205078125, 1.70428466796875, 1.862548828125, 2.02081298828125, 2.1790771484375, 2.33734130859375, 2.49560546875, 2.65386962890625, 2.8121337890625, 2.97039794921875, 3.128662109375, 3.28692626953125, 3.4451904296875, 3.60345458984375, 3.76171875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 5.0, 9.0, 8.0, 18.0, 20.0, 42.0, 40.0, 57.0, 63.0, 88.0, 145.0, 235.0, 317.0, 545.0, 665.0, 551.0, 388.0, 229.0, 171.0, 103.0, 71.0, 69.0, 44.0, 32.0, 35.0, 24.0, 11.0, 11.0, 15.0, 8.0, 12.0, 11.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.80682373046875, -2.7152099609375, -2.62359619140625, -2.531982421875, -2.44036865234375, -2.3487548828125, -2.25714111328125, -2.16552734375, -2.07391357421875, -1.9822998046875, -1.89068603515625, -1.799072265625, -1.70745849609375, -1.6158447265625, -1.52423095703125, -1.4326171875, -1.34100341796875, -1.2493896484375, -1.15777587890625, -1.066162109375, -0.97454833984375, -0.8829345703125, -0.79132080078125, -0.69970703125, -0.60809326171875, -0.5164794921875, -0.42486572265625, -0.333251953125, -0.24163818359375, -0.1500244140625, -0.05841064453125, 0.033203125, 0.12481689453125, 0.2164306640625, 0.30804443359375, 0.399658203125, 0.49127197265625, 0.5828857421875, 0.67449951171875, 0.76611328125, 0.85772705078125, 0.9493408203125, 1.04095458984375, 1.132568359375, 1.22418212890625, 1.3157958984375, 1.40740966796875, 1.4990234375, 1.59063720703125, 1.6822509765625, 1.77386474609375, 1.865478515625, 1.95709228515625, 2.0487060546875, 2.14031982421875, 2.23193359375, 2.32354736328125, 2.4151611328125, 2.50677490234375, 2.598388671875, 2.69000244140625, 2.7816162109375, 2.87322998046875, 2.96484375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 11.0, 17.0, 14.0, 16.0, 17.0, 22.0, 26.0, 64.0, 76.0, 98.0, 145.0, 278.0, 665.0, 1839.0, 6508.0, 38725.0, 1320344.0, 2757817.0, 55509.0, 8432.0, 2095.0, 750.0, 315.0, 146.0, 91.0, 66.0, 47.0, 48.0, 28.0, 17.0, 10.0, 13.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.8671875, -9.5595703125, -9.251953125, -8.9443359375, -8.63671875, -8.3291015625, -8.021484375, -7.7138671875, -7.40625, -7.0986328125, -6.791015625, -6.4833984375, -6.17578125, -5.8681640625, -5.560546875, -5.2529296875, -4.9453125, -4.6376953125, -4.330078125, -4.0224609375, -3.71484375, -3.4072265625, -3.099609375, -2.7919921875, -2.484375, -2.1767578125, -1.869140625, -1.5615234375, -1.25390625, -0.9462890625, -0.638671875, -0.3310546875, -0.0234375, 0.2841796875, 0.591796875, 0.8994140625, 1.20703125, 1.5146484375, 1.822265625, 2.1298828125, 2.4375, 2.7451171875, 3.052734375, 3.3603515625, 3.66796875, 3.9755859375, 4.283203125, 4.5908203125, 4.8984375, 5.2060546875, 5.513671875, 5.8212890625, 6.12890625, 6.4365234375, 6.744140625, 7.0517578125, 7.359375, 7.6669921875, 7.974609375, 8.2822265625, 8.58984375, 8.8974609375, 9.205078125, 9.5126953125, 9.8203125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 10.0, 35.0, 81.0, 155.0, 198.0, 231.0, 144.0, 86.0, 35.0, 14.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.028812408447266, -19.28589630126953, -18.542980194091797, -17.800064086914062, -17.05714988708496, -16.314233779907227, -15.571317672729492, -14.828401565551758, -14.08548641204834, -13.342570304870605, -12.599655151367188, -11.856739044189453, -11.113822937011719, -10.3709077835083, -9.627991676330566, -8.885076522827148, -8.142160415649414, -7.399244785308838, -6.656329154968262, -5.913413047790527, -5.170497417449951, -4.427581787109375, -3.6846656799316406, -2.9417500495910645, -2.1988344192504883, -1.4559186697006226, -0.7130029201507568, 0.029912948608398438, 0.7728285789489746, 1.5157442092895508, 2.258660316467285, 3.0015759468078613, 3.7444915771484375, 4.487407207489014, 5.23032283782959, 5.973238945007324, 6.7161545753479, 7.459070205688477, 8.201986312866211, 8.944902420043945, 9.687817573547363, 10.430733680725098, 11.173648834228516, 11.91656494140625, 12.659481048583984, 13.402396202087402, 14.145312309265137, 14.888227462768555, 15.631143569946289, 16.374059677124023, 17.116975784301758, 17.85988998413086, 18.602806091308594, 19.345722198486328, 20.088638305664062, 20.831554412841797, 21.57447052001953, 22.317386627197266, 23.060302734375, 23.803218841552734, 24.546133041381836, 25.28904914855957, 26.031965255737305, 26.77488136291504, 27.51779556274414]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 10.0, 6.0, 8.0, 18.0, 14.0, 24.0, 17.0, 14.0, 30.0, 37.0, 27.0, 30.0, 41.0, 32.0, 51.0, 29.0, 35.0, 46.0, 42.0, 47.0, 47.0, 43.0, 44.0, 28.0, 37.0, 33.0, 30.0, 26.0, 17.0, 24.0, 19.0, 9.0, 14.0, 18.0, 12.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.780767440795898, -8.489815711975098, -8.198864936828613, -7.9079132080078125, -7.61696195602417, -7.326010704040527, -7.035058975219727, -6.744107723236084, -6.453156471252441, -6.162205219268799, -5.871253967285156, -5.5803022384643555, -5.289350986480713, -4.99839973449707, -4.7074480056762695, -4.416496753692627, -4.125545501708984, -3.834594249725342, -3.54364275932312, -3.2526912689208984, -2.961740016937256, -2.6707887649536133, -2.3798372745513916, -2.08888578414917, -1.7979345321655273, -1.5069831609725952, -1.216031789779663, -0.925080418586731, -0.6341290473937988, -0.3431776762008667, -0.05222630500793457, 0.2387251853942871, 0.5296764373779297, 0.8206278085708618, 1.111579179763794, 1.402530550956726, 1.6934819221496582, 1.9844332933425903, 2.2753846645355225, 2.566336154937744, 2.8572874069213867, 3.1482386589050293, 3.439190149307251, 3.7301416397094727, 4.021092891693115, 4.312044143676758, 4.602995872497559, 4.893947124481201, 5.184898376464844, 5.475849628448486, 5.766800880432129, 6.05775260925293, 6.348703861236572, 6.639655113220215, 6.930606842041016, 7.221558094024658, 7.512509346008301, 7.803460597991943, 8.094411849975586, 8.385363578796387, 8.676315307617188, 8.967266082763672, 9.258217811584473, 9.549169540405273, 9.840120315551758]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 4.0, 5.0, 8.0, 8.0, 10.0, 10.0, 18.0, 28.0, 25.0, 23.0, 24.0, 28.0, 41.0, 43.0, 35.0, 46.0, 32.0, 47.0, 44.0, 46.0, 41.0, 38.0, 37.0, 35.0, 36.0, 30.0, 36.0, 23.0, 38.0, 28.0, 28.0, 12.0, 23.0, 16.0, 11.0, 11.0, 6.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.8318023681640625, -1.776885986328125, -1.7219696044921875, -1.66705322265625, -1.6121368408203125, -1.557220458984375, -1.5023040771484375, -1.4473876953125, -1.3924713134765625, -1.337554931640625, -1.2826385498046875, -1.22772216796875, -1.1728057861328125, -1.117889404296875, -1.0629730224609375, -1.008056640625, -0.9531402587890625, -0.898223876953125, -0.8433074951171875, -0.78839111328125, -0.7334747314453125, -0.678558349609375, -0.6236419677734375, -0.5687255859375, -0.5138092041015625, -0.458892822265625, -0.4039764404296875, -0.34906005859375, -0.2941436767578125, -0.239227294921875, -0.1843109130859375, -0.12939453125, -0.0744781494140625, -0.019561767578125, 0.0353546142578125, 0.09027099609375, 0.1451873779296875, 0.200103759765625, 0.2550201416015625, 0.3099365234375, 0.3648529052734375, 0.419769287109375, 0.4746856689453125, 0.52960205078125, 0.5845184326171875, 0.639434814453125, 0.6943511962890625, 0.749267578125, 0.8041839599609375, 0.859100341796875, 0.9140167236328125, 0.96893310546875, 1.0238494873046875, 1.078765869140625, 1.1336822509765625, 1.1885986328125, 1.2435150146484375, 1.298431396484375, 1.3533477783203125, 1.40826416015625, 1.4631805419921875, 1.518096923828125, 1.5730133056640625, 1.6279296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 15.0, 17.0, 25.0, 39.0, 62.0, 89.0, 118.0, 196.0, 334.0, 400.0, 602.0, 916.0, 1316.0, 2075.0, 2898.0, 4485.0, 6865.0, 10366.0, 16426.0, 26357.0, 43815.0, 78623.0, 156798.0, 267882.0, 194796.0, 95891.0, 52294.0, 30582.0, 19063.0, 12055.0, 7711.0, 5171.0, 3330.0, 2265.0, 1493.0, 987.0, 751.0, 458.0, 308.0, 219.0, 148.0, 86.0, 69.0, 48.0, 29.0, 20.0, 16.0, 13.0, 12.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15673828125, -0.15178680419921875, -0.1468353271484375, -0.14188385009765625, -0.136932373046875, -0.13198089599609375, -0.1270294189453125, -0.12207794189453125, -0.11712646484375, -0.11217498779296875, -0.1072235107421875, -0.10227203369140625, -0.097320556640625, -0.09236907958984375, -0.0874176025390625, -0.08246612548828125, -0.0775146484375, -0.07256317138671875, -0.0676116943359375, -0.06266021728515625, -0.057708740234375, -0.05275726318359375, -0.0478057861328125, -0.04285430908203125, -0.03790283203125, -0.03295135498046875, -0.0279998779296875, -0.02304840087890625, -0.018096923828125, -0.01314544677734375, -0.0081939697265625, -0.00324249267578125, 0.001708984375, 0.00666046142578125, 0.0116119384765625, 0.01656341552734375, 0.021514892578125, 0.02646636962890625, 0.0314178466796875, 0.03636932373046875, 0.04132080078125, 0.04627227783203125, 0.0512237548828125, 0.05617523193359375, 0.061126708984375, 0.06607818603515625, 0.0710296630859375, 0.07598114013671875, 0.0809326171875, 0.08588409423828125, 0.0908355712890625, 0.09578704833984375, 0.100738525390625, 0.10569000244140625, 0.1106414794921875, 0.11559295654296875, 0.12054443359375, 0.12549591064453125, 0.1304473876953125, 0.13539886474609375, 0.140350341796875, 0.14530181884765625, 0.1502532958984375, 0.15520477294921875, 0.16015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 10.0, 11.0, 16.0, 14.0, 14.0, 21.0, 20.0, 27.0, 25.0, 33.0, 43.0, 39.0, 44.0, 39.0, 47.0, 50.0, 1067.0, 40.0, 43.0, 40.0, 41.0, 51.0, 36.0, 33.0, 26.0, 31.0, 23.0, 16.0, 23.0, 18.0, 16.0, 10.0, 8.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2275390625, -1.1878509521484375, -1.148162841796875, -1.1084747314453125, -1.06878662109375, -1.0290985107421875, -0.989410400390625, -0.9497222900390625, -0.9100341796875, -0.8703460693359375, -0.830657958984375, -0.7909698486328125, -0.75128173828125, -0.7115936279296875, -0.671905517578125, -0.6322174072265625, -0.592529296875, -0.5528411865234375, -0.513153076171875, -0.4734649658203125, -0.43377685546875, -0.3940887451171875, -0.354400634765625, -0.3147125244140625, -0.2750244140625, -0.2353363037109375, -0.195648193359375, -0.1559600830078125, -0.11627197265625, -0.0765838623046875, -0.036895751953125, 0.0027923583984375, 0.04248046875, 0.0821685791015625, 0.121856689453125, 0.1615447998046875, 0.20123291015625, 0.2409210205078125, 0.280609130859375, 0.3202972412109375, 0.3599853515625, 0.3996734619140625, 0.439361572265625, 0.4790496826171875, 0.51873779296875, 0.5584259033203125, 0.598114013671875, 0.6378021240234375, 0.677490234375, 0.7171783447265625, 0.756866455078125, 0.7965545654296875, 0.83624267578125, 0.8759307861328125, 0.915618896484375, 0.9553070068359375, 0.9949951171875, 1.0346832275390625, 1.074371337890625, 1.1140594482421875, 1.15374755859375, 1.1934356689453125, 1.233123779296875, 1.2728118896484375, 1.3125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 5.0, 12.0, 17.0, 22.0, 32.0, 51.0, 69.0, 82.0, 121.0, 193.0, 267.0, 346.0, 537.0, 772.0, 1238.0, 1898.0, 2874.0, 4737.0, 7746.0, 15170.0, 39440.0, 407791.0, 1525045.0, 49105.0, 16765.0, 8657.0, 5067.0, 3062.0, 1986.0, 1320.0, 828.0, 592.0, 398.0, 267.0, 187.0, 131.0, 95.0, 62.0, 36.0, 31.0, 19.0, 15.0, 12.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.255615234375, -0.2473907470703125, -0.239166259765625, -0.2309417724609375, -0.22271728515625, -0.2144927978515625, -0.206268310546875, -0.1980438232421875, -0.1898193359375, -0.1815948486328125, -0.173370361328125, -0.1651458740234375, -0.15692138671875, -0.1486968994140625, -0.140472412109375, -0.1322479248046875, -0.1240234375, -0.1157989501953125, -0.107574462890625, -0.0993499755859375, -0.09112548828125, -0.0829010009765625, -0.074676513671875, -0.0664520263671875, -0.0582275390625, -0.0500030517578125, -0.041778564453125, -0.0335540771484375, -0.02532958984375, -0.0171051025390625, -0.008880615234375, -0.0006561279296875, 0.007568359375, 0.0157928466796875, 0.024017333984375, 0.0322418212890625, 0.04046630859375, 0.0486907958984375, 0.056915283203125, 0.0651397705078125, 0.0733642578125, 0.0815887451171875, 0.089813232421875, 0.0980377197265625, 0.10626220703125, 0.1144866943359375, 0.122711181640625, 0.1309356689453125, 0.13916015625, 0.1473846435546875, 0.155609130859375, 0.1638336181640625, 0.17205810546875, 0.1802825927734375, 0.188507080078125, 0.1967315673828125, 0.2049560546875, 0.2131805419921875, 0.221405029296875, 0.2296295166015625, 0.23785400390625, 0.2460784912109375, 0.254302978515625, 0.2625274658203125, 0.270751953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 4.0, 11.0, 9.0, 10.0, 23.0, 26.0, 22.0, 25.0, 31.0, 32.0, 42.0, 51.0, 57.0, 58.0, 63.0, 63.0, 59.0, 49.0, 67.0, 43.0, 51.0, 44.0, 23.0, 28.0, 22.0, 11.0, 19.0, 14.0, 8.0, 9.0, 6.0, 2.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01129913330078125, -0.010962724685668945, -0.01062631607055664, -0.010289907455444336, -0.009953498840332031, -0.009617090225219727, -0.009280681610107422, -0.008944272994995117, -0.008607864379882812, -0.008271455764770508, -0.007935047149658203, -0.0075986385345458984, -0.007262229919433594, -0.006925821304321289, -0.006589412689208984, -0.00625300407409668, -0.005916595458984375, -0.00558018684387207, -0.005243778228759766, -0.004907369613647461, -0.004570960998535156, -0.0042345523834228516, -0.003898143768310547, -0.003561735153198242, -0.0032253265380859375, -0.002888917922973633, -0.002552509307861328, -0.0022161006927490234, -0.0018796920776367188, -0.001543283462524414, -0.0012068748474121094, -0.0008704662322998047, -0.0005340576171875, -0.0001976490020751953, 0.00013875961303710938, 0.00047516822814941406, 0.0008115768432617188, 0.0011479854583740234, 0.0014843940734863281, 0.0018208026885986328, 0.0021572113037109375, 0.002493619918823242, 0.002830028533935547, 0.0031664371490478516, 0.0035028457641601562, 0.003839254379272461, 0.004175662994384766, 0.00451207160949707, 0.004848480224609375, 0.00518488883972168, 0.005521297454833984, 0.005857706069946289, 0.006194114685058594, 0.0065305233001708984, 0.006866931915283203, 0.007203340530395508, 0.0075397491455078125, 0.007876157760620117, 0.008212566375732422, 0.008548974990844727, 0.008885383605957031, 0.009221792221069336, 0.00955820083618164, 0.009894609451293945, 0.01023101806640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 13.0, 11.0, 15.0, 13.0, 26.0, 25.0, 34.0, 51.0, 73.0, 117.0, 149.0, 259.0, 484.0, 2863.0, 548332.0, 492133.0, 2647.0, 503.0, 216.0, 166.0, 108.0, 76.0, 42.0, 43.0, 27.0, 27.0, 26.0, 17.0, 12.0, 11.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2001953125, -0.19351959228515625, -0.1868438720703125, -0.18016815185546875, -0.173492431640625, -0.16681671142578125, -0.1601409912109375, -0.15346527099609375, -0.14678955078125, -0.14011383056640625, -0.1334381103515625, -0.12676239013671875, -0.120086669921875, -0.11341094970703125, -0.1067352294921875, -0.10005950927734375, -0.0933837890625, -0.08670806884765625, -0.0800323486328125, -0.07335662841796875, -0.066680908203125, -0.06000518798828125, -0.0533294677734375, -0.04665374755859375, -0.03997802734375, -0.03330230712890625, -0.0266265869140625, -0.01995086669921875, -0.013275146484375, -0.00659942626953125, 7.62939453125e-05, 0.00675201416015625, 0.013427734375, 0.02010345458984375, 0.0267791748046875, 0.03345489501953125, 0.040130615234375, 0.04680633544921875, 0.0534820556640625, 0.06015777587890625, 0.06683349609375, 0.07350921630859375, 0.0801849365234375, 0.08686065673828125, 0.093536376953125, 0.10021209716796875, 0.1068878173828125, 0.11356353759765625, 0.1202392578125, 0.12691497802734375, 0.1335906982421875, 0.14026641845703125, 0.146942138671875, 0.15361785888671875, 0.1602935791015625, 0.16696929931640625, 0.17364501953125, 0.18032073974609375, 0.1869964599609375, 0.19367218017578125, 0.200347900390625, 0.20702362060546875, 0.2136993408203125, 0.22037506103515625, 0.22705078125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 19.0, 53.0, 107.0, 234.0, 262.0, 199.0, 82.0, 32.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013863466680049896, -0.012639275752007961, -0.011415084823966026, -0.010190894827246666, -0.008966703899204731, -0.007742512971162796, -0.006518322508782148, -0.005294132046401501, -0.004069941118359566, -0.0028457504231482744, -0.0016215597279369831, -0.0003973690327256918, 0.0008268216624855995, 0.0020510125905275345, 0.003275203052908182, 0.00449939351528883, 0.005723584443330765, 0.0069477753713727, 0.008171966299414635, 0.009396156296133995, 0.01062034722417593, 0.011844538152217865, 0.013068728148937225, 0.01429291907697916, 0.015517110005021095, 0.016741300001740456, 0.017965491861104965, 0.019189681857824326, 0.020413871854543686, 0.021638063713908195, 0.022862253710627556, 0.024086445569992065, 0.025310635566711426, 0.026534825563430786, 0.027759017422795296, 0.028983207419514656, 0.030207399278879166, 0.031431589275598526, 0.032655779272317886, 0.03387996926903725, 0.035104162991046906, 0.036328352987766266, 0.037552542984485626, 0.038776736706495285, 0.040000926703214645, 0.041225116699934006, 0.042449306696653366, 0.043673496693372726, 0.04489768669009209, 0.04612187668681145, 0.04734606668353081, 0.048570260405540466, 0.04979445040225983, 0.05101864039897919, 0.05224283039569855, 0.05346702039241791, 0.05469121038913727, 0.05591540038585663, 0.05713959038257599, 0.05836378410458565, 0.05958797410130501, 0.06081216409802437, 0.06203635409474373, 0.06326054781675339, 0.06448473781347275]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 7.0, 7.0, 6.0, 13.0, 11.0, 20.0, 13.0, 23.0, 18.0, 27.0, 37.0, 28.0, 31.0, 31.0, 39.0, 45.0, 44.0, 40.0, 54.0, 33.0, 57.0, 43.0, 44.0, 28.0, 24.0, 29.0, 27.0, 29.0, 39.0, 30.0, 17.0, 16.0, 9.0, 9.0, 14.0, 13.0, 8.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009587585926055908, -0.009299896657466888, -0.009012207388877869, -0.008724518120288849, -0.008436828851699829, -0.00814913958311081, -0.00786145031452179, -0.00757376104593277, -0.00728607177734375, -0.00699838250875473, -0.0067106932401657104, -0.006423003971576691, -0.006135314702987671, -0.005847625434398651, -0.005559936165809631, -0.005272246897220612, -0.004984557628631592, -0.004696868360042572, -0.004409179091453552, -0.0041214898228645325, -0.0038338005542755127, -0.003546111285686493, -0.003258422017097473, -0.0029707327485084534, -0.0026830434799194336, -0.002395354211330414, -0.002107664942741394, -0.0018199756741523743, -0.0015322864055633545, -0.0012445971369743347, -0.0009569078683853149, -0.0006692185997962952, -0.0003815293312072754, -9.384006261825562e-05, 0.00019384920597076416, 0.00048153847455978394, 0.0007692277431488037, 0.0010569170117378235, 0.0013446062803268433, 0.001632295548915863, 0.0019199848175048828, 0.0022076740860939026, 0.0024953633546829224, 0.002783052623271942, 0.003070741891860962, 0.0033584311604499817, 0.0036461204290390015, 0.003933809697628021, 0.004221498966217041, 0.004509188234806061, 0.004796877503395081, 0.0050845667719841, 0.00537225604057312, 0.00565994530916214, 0.00594763457775116, 0.0062353238463401794, 0.006523013114929199, 0.006810702383518219, 0.007098391652107239, 0.0073860809206962585, 0.007673770189285278, 0.007961459457874298, 0.008249148726463318, 0.008536837995052338, 0.008824527263641357]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 4.0, 5.0, 8.0, 8.0, 9.0, 11.0, 18.0, 27.0, 26.0, 22.0, 25.0, 28.0, 41.0, 43.0, 36.0, 45.0, 32.0, 47.0, 44.0, 46.0, 41.0, 38.0, 37.0, 35.0, 36.0, 29.0, 37.0, 23.0, 38.0, 29.0, 26.0, 13.0, 23.0, 16.0, 11.0, 11.0, 6.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.8318023681640625, -1.776885986328125, -1.7219696044921875, -1.66705322265625, -1.6121368408203125, -1.557220458984375, -1.5023040771484375, -1.4473876953125, -1.3924713134765625, -1.337554931640625, -1.2826385498046875, -1.22772216796875, -1.1728057861328125, -1.117889404296875, -1.0629730224609375, -1.008056640625, -0.9531402587890625, -0.898223876953125, -0.8433074951171875, -0.78839111328125, -0.7334747314453125, -0.678558349609375, -0.6236419677734375, -0.5687255859375, -0.5138092041015625, -0.458892822265625, -0.4039764404296875, -0.34906005859375, -0.2941436767578125, -0.239227294921875, -0.1843109130859375, -0.12939453125, -0.0744781494140625, -0.019561767578125, 0.0353546142578125, 0.09027099609375, 0.1451873779296875, 0.200103759765625, 0.2550201416015625, 0.3099365234375, 0.3648529052734375, 0.419769287109375, 0.4746856689453125, 0.52960205078125, 0.5845184326171875, 0.639434814453125, 0.6943511962890625, 0.749267578125, 0.8041839599609375, 0.859100341796875, 0.9140167236328125, 0.96893310546875, 1.0238494873046875, 1.078765869140625, 1.1336822509765625, 1.1885986328125, 1.2435150146484375, 1.298431396484375, 1.3533477783203125, 1.40826416015625, 1.4631805419921875, 1.518096923828125, 1.5730133056640625, 1.6279296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 13.0, 17.0, 17.0, 36.0, 54.0, 58.0, 103.0, 151.0, 225.0, 413.0, 734.0, 1374.0, 2581.0, 5273.0, 11941.0, 31997.0, 113927.0, 622320.0, 185926.0, 42501.0, 15410.0, 6631.0, 3047.0, 1644.0, 823.0, 480.0, 297.0, 156.0, 112.0, 77.0, 58.0, 33.0, 33.0, 34.0, 16.0, 10.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.943359375, -3.83270263671875, -3.7220458984375, -3.61138916015625, -3.500732421875, -3.39007568359375, -3.2794189453125, -3.16876220703125, -3.05810546875, -2.94744873046875, -2.8367919921875, -2.72613525390625, -2.615478515625, -2.50482177734375, -2.3941650390625, -2.28350830078125, -2.1728515625, -2.06219482421875, -1.9515380859375, -1.84088134765625, -1.730224609375, -1.61956787109375, -1.5089111328125, -1.39825439453125, -1.28759765625, -1.17694091796875, -1.0662841796875, -0.95562744140625, -0.844970703125, -0.73431396484375, -0.6236572265625, -0.51300048828125, -0.40234375, -0.29168701171875, -0.1810302734375, -0.07037353515625, 0.040283203125, 0.15093994140625, 0.2615966796875, 0.37225341796875, 0.48291015625, 0.59356689453125, 0.7042236328125, 0.81488037109375, 0.925537109375, 1.03619384765625, 1.1468505859375, 1.25750732421875, 1.3681640625, 1.47882080078125, 1.5894775390625, 1.70013427734375, 1.810791015625, 1.92144775390625, 2.0321044921875, 2.14276123046875, 2.25341796875, 2.36407470703125, 2.4747314453125, 2.58538818359375, 2.696044921875, 2.80670166015625, 2.9173583984375, 3.02801513671875, 3.138671875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 3.0, 8.0, 4.0, 8.0, 11.0, 11.0, 6.0, 22.0, 25.0, 33.0, 29.0, 36.0, 37.0, 57.0, 51.0, 60.0, 83.0, 129.0, 1458.0, 406.0, 124.0, 62.0, 43.0, 39.0, 29.0, 37.0, 37.0, 35.0, 21.0, 30.0, 21.0, 7.0, 17.0, 12.0, 9.0, 13.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.40625, -5.2559814453125, -5.105712890625, -4.9554443359375, -4.80517578125, -4.6549072265625, -4.504638671875, -4.3543701171875, -4.2041015625, -4.0538330078125, -3.903564453125, -3.7532958984375, -3.60302734375, -3.4527587890625, -3.302490234375, -3.1522216796875, -3.001953125, -2.8516845703125, -2.701416015625, -2.5511474609375, -2.40087890625, -2.2506103515625, -2.100341796875, -1.9500732421875, -1.7998046875, -1.6495361328125, -1.499267578125, -1.3489990234375, -1.19873046875, -1.0484619140625, -0.898193359375, -0.7479248046875, -0.59765625, -0.4473876953125, -0.297119140625, -0.1468505859375, 0.00341796875, 0.1536865234375, 0.303955078125, 0.4542236328125, 0.6044921875, 0.7547607421875, 0.905029296875, 1.0552978515625, 1.20556640625, 1.3558349609375, 1.506103515625, 1.6563720703125, 1.806640625, 1.9569091796875, 2.107177734375, 2.2574462890625, 2.40771484375, 2.5579833984375, 2.708251953125, 2.8585205078125, 3.0087890625, 3.1590576171875, 3.309326171875, 3.4595947265625, 3.60986328125, 3.7601318359375, 3.910400390625, 4.0606689453125, 4.2109375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 6.0, 11.0, 6.0, 18.0, 14.0, 17.0, 18.0, 39.0, 43.0, 40.0, 57.0, 76.0, 103.0, 150.0, 251.0, 581.0, 1799.0, 8127.0, 74199.0, 2901607.0, 142927.0, 11470.0, 2455.0, 697.0, 329.0, 177.0, 104.0, 76.0, 55.0, 51.0, 40.0, 42.0, 20.0, 12.0, 15.0, 15.0, 9.0, 11.0, 4.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.52734375, -7.27301025390625, -7.0186767578125, -6.76434326171875, -6.510009765625, -6.25567626953125, -6.0013427734375, -5.74700927734375, -5.49267578125, -5.23834228515625, -4.9840087890625, -4.72967529296875, -4.475341796875, -4.22100830078125, -3.9666748046875, -3.71234130859375, -3.4580078125, -3.20367431640625, -2.9493408203125, -2.69500732421875, -2.440673828125, -2.18634033203125, -1.9320068359375, -1.67767333984375, -1.42333984375, -1.16900634765625, -0.9146728515625, -0.66033935546875, -0.406005859375, -0.15167236328125, 0.1026611328125, 0.35699462890625, 0.611328125, 0.86566162109375, 1.1199951171875, 1.37432861328125, 1.628662109375, 1.88299560546875, 2.1373291015625, 2.39166259765625, 2.64599609375, 2.90032958984375, 3.1546630859375, 3.40899658203125, 3.663330078125, 3.91766357421875, 4.1719970703125, 4.42633056640625, 4.6806640625, 4.93499755859375, 5.1893310546875, 5.44366455078125, 5.697998046875, 5.95233154296875, 6.2066650390625, 6.46099853515625, 6.71533203125, 6.96966552734375, 7.2239990234375, 7.47833251953125, 7.732666015625, 7.98699951171875, 8.2413330078125, 8.49566650390625, 8.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 60.0, 229.0, 388.0, 228.0, 84.0, 16.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.815099716186523, -23.12384605407715, -22.432594299316406, -21.74134063720703, -21.050086975097656, -20.35883331298828, -19.667579650878906, -18.976327896118164, -18.28507423400879, -17.593820571899414, -16.902568817138672, -16.211315155029297, -15.520061492919922, -14.828807830810547, -14.137555122375488, -13.44630241394043, -12.755048751831055, -12.06379508972168, -11.372542381286621, -10.681289672851562, -9.990036010742188, -9.298782348632812, -8.607529640197754, -7.916276454925537, -7.22502326965332, -6.5337700843811035, -5.842516899108887, -5.15126371383667, -4.460010528564453, -3.7687573432922363, -3.0775041580200195, -2.3862509727478027, -1.694997787475586, -1.0037446022033691, -0.31249141693115234, 0.37876176834106445, 1.0700149536132812, 1.761268138885498, 2.452521324157715, 3.1437745094299316, 3.8350276947021484, 4.526280879974365, 5.217534065246582, 5.908787250518799, 6.600040435791016, 7.291293621063232, 7.982546806335449, 8.673799514770508, 9.365053176879883, 10.056306838989258, 10.747559547424316, 11.438812255859375, 12.13006591796875, 12.821319580078125, 13.512572288513184, 14.203824996948242, 14.895078659057617, 15.586332321166992, 16.277584075927734, 16.96883773803711, 17.660091400146484, 18.35134506225586, 19.042598724365234, 19.733850479125977, 20.42510414123535]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 5.0, 7.0, 9.0, 5.0, 15.0, 14.0, 20.0, 17.0, 21.0, 26.0, 32.0, 24.0, 37.0, 42.0, 31.0, 32.0, 51.0, 40.0, 29.0, 31.0, 48.0, 32.0, 38.0, 28.0, 37.0, 39.0, 41.0, 35.0, 28.0, 26.0, 21.0, 27.0, 12.0, 13.0, 17.0, 7.0, 11.0, 7.0, 4.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.588260650634766, -11.221020698547363, -10.853780746459961, -10.486541748046875, -10.119301795959473, -9.75206184387207, -9.384821891784668, -9.017581939697266, -8.65034294128418, -8.283102989196777, -7.915863513946533, -7.548623561859131, -7.181384086608887, -6.814144134521484, -6.446904182434082, -6.079664707183838, -5.7124247550964355, -5.345184803009033, -4.977945327758789, -4.610705375671387, -4.243465900421143, -3.8762259483337402, -3.508986234664917, -3.1417465209960938, -2.7745068073272705, -2.4072670936584473, -2.040027379989624, -1.6727875471115112, -1.305547833442688, -0.9383081197738647, -0.571068286895752, -0.2038285732269287, 0.16341114044189453, 0.5306508541107178, 0.8978906273841858, 1.2651304006576538, 1.632370114326477, 1.9996098279953003, 2.366849660873413, 2.7340893745422363, 3.1013290882110596, 3.468568801879883, 3.835808515548706, 4.203048229217529, 4.570288181304932, 4.937527656555176, 5.304767608642578, 5.6720075607299805, 6.039247035980225, 6.406486988067627, 6.773726463317871, 7.140966415405273, 7.508205890655518, 7.87544584274292, 8.242685317993164, 8.609925270080566, 8.977165222167969, 9.344405174255371, 9.711645126342773, 10.07888412475586, 10.446124076843262, 10.813364028930664, 11.180603981018066, 11.547843933105469, 11.915082931518555]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 9.0, 12.0, 13.0, 13.0, 12.0, 27.0, 28.0, 22.0, 23.0, 31.0, 40.0, 43.0, 35.0, 42.0, 31.0, 48.0, 46.0, 34.0, 42.0, 47.0, 34.0, 36.0, 28.0, 21.0, 37.0, 31.0, 42.0, 22.0, 22.0, 23.0, 16.0, 13.0, 13.0, 14.0, 7.0, 8.0, 4.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8291015625, -1.775634765625, -1.72216796875, -1.668701171875, -1.615234375, -1.561767578125, -1.50830078125, -1.454833984375, -1.4013671875, -1.347900390625, -1.29443359375, -1.240966796875, -1.1875, -1.134033203125, -1.08056640625, -1.027099609375, -0.9736328125, -0.920166015625, -0.86669921875, -0.813232421875, -0.759765625, -0.706298828125, -0.65283203125, -0.599365234375, -0.5458984375, -0.492431640625, -0.43896484375, -0.385498046875, -0.33203125, -0.278564453125, -0.22509765625, -0.171630859375, -0.1181640625, -0.064697265625, -0.01123046875, 0.042236328125, 0.095703125, 0.149169921875, 0.20263671875, 0.256103515625, 0.3095703125, 0.363037109375, 0.41650390625, 0.469970703125, 0.5234375, 0.576904296875, 0.63037109375, 0.683837890625, 0.7373046875, 0.790771484375, 0.84423828125, 0.897705078125, 0.951171875, 1.004638671875, 1.05810546875, 1.111572265625, 1.1650390625, 1.218505859375, 1.27197265625, 1.325439453125, 1.37890625, 1.432373046875, 1.48583984375, 1.539306640625, 1.5927734375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 3.0, 8.0, 9.0, 7.0, 12.0, 25.0, 40.0, 58.0, 76.0, 115.0, 197.0, 274.0, 420.0, 659.0, 1082.0, 1993.0, 3362.0, 6913.0, 15659.0, 45861.0, 242806.0, 2222061.0, 1439468.0, 151872.0, 34816.0, 12784.0, 5882.0, 3135.0, 1735.0, 1049.0, 616.0, 451.0, 264.0, 178.0, 128.0, 74.0, 56.0, 42.0, 25.0, 24.0, 16.0, 5.0, 1.0, 5.0, 5.0, 7.0], "bins": [-4.89453125, -4.771820068359375, -4.64910888671875, -4.526397705078125, -4.4036865234375, -4.280975341796875, -4.15826416015625, -4.035552978515625, -3.912841796875, -3.790130615234375, -3.66741943359375, -3.544708251953125, -3.4219970703125, -3.299285888671875, -3.17657470703125, -3.053863525390625, -2.93115234375, -2.808441162109375, -2.68572998046875, -2.563018798828125, -2.4403076171875, -2.317596435546875, -2.19488525390625, -2.072174072265625, -1.949462890625, -1.826751708984375, -1.70404052734375, -1.581329345703125, -1.4586181640625, -1.335906982421875, -1.21319580078125, -1.090484619140625, -0.9677734375, -0.845062255859375, -0.72235107421875, -0.599639892578125, -0.4769287109375, -0.354217529296875, -0.23150634765625, -0.108795166015625, 0.013916015625, 0.136627197265625, 0.25933837890625, 0.382049560546875, 0.5047607421875, 0.627471923828125, 0.75018310546875, 0.872894287109375, 0.99560546875, 1.118316650390625, 1.24102783203125, 1.363739013671875, 1.4864501953125, 1.609161376953125, 1.73187255859375, 1.854583740234375, 1.977294921875, 2.100006103515625, 2.22271728515625, 2.345428466796875, 2.4681396484375, 2.590850830078125, 2.71356201171875, 2.836273193359375, 2.958984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 3.0, 10.0, 10.0, 15.0, 13.0, 10.0, 19.0, 21.0, 34.0, 39.0, 50.0, 94.0, 127.0, 200.0, 273.0, 457.0, 595.0, 613.0, 485.0, 306.0, 169.0, 147.0, 99.0, 60.0, 51.0, 33.0, 23.0, 18.0, 21.0, 13.0, 15.0, 13.0, 5.0, 5.0, 0.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.794921875, -2.704833984375, -2.61474609375, -2.524658203125, -2.4345703125, -2.344482421875, -2.25439453125, -2.164306640625, -2.07421875, -1.984130859375, -1.89404296875, -1.803955078125, -1.7138671875, -1.623779296875, -1.53369140625, -1.443603515625, -1.353515625, -1.263427734375, -1.17333984375, -1.083251953125, -0.9931640625, -0.903076171875, -0.81298828125, -0.722900390625, -0.6328125, -0.542724609375, -0.45263671875, -0.362548828125, -0.2724609375, -0.182373046875, -0.09228515625, -0.002197265625, 0.087890625, 0.177978515625, 0.26806640625, 0.358154296875, 0.4482421875, 0.538330078125, 0.62841796875, 0.718505859375, 0.80859375, 0.898681640625, 0.98876953125, 1.078857421875, 1.1689453125, 1.259033203125, 1.34912109375, 1.439208984375, 1.529296875, 1.619384765625, 1.70947265625, 1.799560546875, 1.8896484375, 1.979736328125, 2.06982421875, 2.159912109375, 2.25, 2.340087890625, 2.43017578125, 2.520263671875, 2.6103515625, 2.700439453125, 2.79052734375, 2.880615234375, 2.970703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 6.0, 7.0, 8.0, 15.0, 27.0, 21.0, 32.0, 47.0, 48.0, 70.0, 106.0, 162.0, 370.0, 774.0, 1735.0, 4633.0, 14825.0, 73904.0, 1652180.0, 2331720.0, 88218.0, 16522.0, 5213.0, 1886.0, 765.0, 372.0, 186.0, 122.0, 71.0, 56.0, 32.0, 24.0, 25.0, 18.0, 12.0, 13.0, 12.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33203125, -7.10321044921875, -6.8743896484375, -6.64556884765625, -6.416748046875, -6.18792724609375, -5.9591064453125, -5.73028564453125, -5.50146484375, -5.27264404296875, -5.0438232421875, -4.81500244140625, -4.586181640625, -4.35736083984375, -4.1285400390625, -3.89971923828125, -3.6708984375, -3.44207763671875, -3.2132568359375, -2.98443603515625, -2.755615234375, -2.52679443359375, -2.2979736328125, -2.06915283203125, -1.84033203125, -1.61151123046875, -1.3826904296875, -1.15386962890625, -0.925048828125, -0.69622802734375, -0.4674072265625, -0.23858642578125, -0.009765625, 0.21905517578125, 0.4478759765625, 0.67669677734375, 0.905517578125, 1.13433837890625, 1.3631591796875, 1.59197998046875, 1.82080078125, 2.04962158203125, 2.2784423828125, 2.50726318359375, 2.736083984375, 2.96490478515625, 3.1937255859375, 3.42254638671875, 3.6513671875, 3.88018798828125, 4.1090087890625, 4.33782958984375, 4.566650390625, 4.79547119140625, 5.0242919921875, 5.25311279296875, 5.48193359375, 5.71075439453125, 5.9395751953125, 6.16839599609375, 6.397216796875, 6.62603759765625, 6.8548583984375, 7.08367919921875, 7.3125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 10.0, 41.0, 112.0, 306.0, 344.0, 137.0, 40.0, 16.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.64571475982666, -8.462753295898438, -7.279791355133057, -6.096829414367676, -4.913867950439453, -3.7309064865112305, -2.5479445457458496, -1.3649826049804688, -0.1820211410522461, 1.0009405612945557, 2.1839022636413574, 3.366863965988159, 4.549825668334961, 5.732787132263184, 6.9157490730285645, 8.098711013793945, 9.281672477722168, 10.46463394165039, 11.64759635925293, 12.830557823181152, 14.013519287109375, 15.196480751037598, 16.37944221496582, 17.56240463256836, 18.745365142822266, 19.928327560424805, 21.11128807067871, 22.29425048828125, 23.477210998535156, 24.660173416137695, 25.843135833740234, 27.02609634399414, 28.209060668945312, 29.39202308654785, 30.574983596801758, 31.757946014404297, 32.9409065246582, 34.123870849609375, 35.30683135986328, 36.48979187011719, 37.672752380371094, 38.855712890625, 40.03867721557617, 41.22163772583008, 42.404598236083984, 43.587562561035156, 44.77052307128906, 45.95348358154297, 47.13644790649414, 48.31940841674805, 49.50237274169922, 50.685333251953125, 51.86829376220703, 53.05125427246094, 54.23421859741211, 55.417179107666016, 56.60014343261719, 57.783103942871094, 58.966068267822266, 60.14902877807617, 61.33198928833008, 62.51495361328125, 63.697914123535156, 64.88087463378906, 66.06383514404297]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 5.0, 14.0, 16.0, 18.0, 19.0, 25.0, 21.0, 23.0, 29.0, 27.0, 19.0, 28.0, 37.0, 34.0, 37.0, 35.0, 34.0, 35.0, 29.0, 32.0, 34.0, 35.0, 30.0, 47.0, 36.0, 31.0, 28.0, 29.0, 22.0, 23.0, 14.0, 20.0, 18.0, 9.0, 9.0, 27.0, 9.0, 9.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.9060821533203125, -7.661905288696289, -7.417728424072266, -7.173551559448242, -6.929374694824219, -6.685197830200195, -6.441020965576172, -6.196844100952148, -5.952667236328125, -5.708490371704102, -5.464313507080078, -5.220136642456055, -4.975959777832031, -4.731782913208008, -4.487606048583984, -4.243429183959961, -3.9992520809173584, -3.755075216293335, -3.5108983516693115, -3.266721487045288, -3.0225446224212646, -2.778367519378662, -2.5341906547546387, -2.2900137901306152, -2.045836925506592, -1.8016600608825684, -1.557483196258545, -1.3133063316345215, -1.069129467010498, -0.8249524831771851, -0.5807756185531616, -0.3365987539291382, -0.0924220085144043, 0.15175487101078033, 0.39593175053596497, 0.6401086449623108, 0.8842855095863342, 1.1284624338150024, 1.3726392984390259, 1.6168161630630493, 1.8609930276870728, 2.1051700115203857, 2.349346876144409, 2.5935237407684326, 2.837700605392456, 3.0818774700164795, 3.326054334640503, 3.5702311992645264, 3.81440806388855, 4.058585166931152, 4.302762031555176, 4.546938896179199, 4.791115760803223, 5.035292625427246, 5.2794694900512695, 5.523646354675293, 5.767823219299316, 6.01200008392334, 6.256176948547363, 6.500353813171387, 6.74453067779541, 6.988707542419434, 7.232884407043457, 7.4770612716674805, 7.721238136291504]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 5.0, 6.0, 3.0, 13.0, 14.0, 14.0, 16.0, 19.0, 23.0, 32.0, 25.0, 32.0, 38.0, 33.0, 37.0, 37.0, 36.0, 52.0, 54.0, 43.0, 35.0, 45.0, 38.0, 46.0, 36.0, 40.0, 20.0, 21.0, 33.0, 27.0, 16.0, 21.0, 18.0, 14.0, 12.0, 11.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.8422698974609375, -1.788055419921875, -1.7338409423828125, -1.67962646484375, -1.6254119873046875, -1.571197509765625, -1.5169830322265625, -1.4627685546875, -1.4085540771484375, -1.354339599609375, -1.3001251220703125, -1.24591064453125, -1.1916961669921875, -1.137481689453125, -1.0832672119140625, -1.029052734375, -0.9748382568359375, -0.920623779296875, -0.8664093017578125, -0.81219482421875, -0.7579803466796875, -0.703765869140625, -0.6495513916015625, -0.5953369140625, -0.5411224365234375, -0.486907958984375, -0.4326934814453125, -0.37847900390625, -0.3242645263671875, -0.270050048828125, -0.2158355712890625, -0.16162109375, -0.1074066162109375, -0.053192138671875, 0.0010223388671875, 0.05523681640625, 0.1094512939453125, 0.163665771484375, 0.2178802490234375, 0.2720947265625, 0.3263092041015625, 0.380523681640625, 0.4347381591796875, 0.48895263671875, 0.5431671142578125, 0.597381591796875, 0.6515960693359375, 0.705810546875, 0.7600250244140625, 0.814239501953125, 0.8684539794921875, 0.92266845703125, 0.9768829345703125, 1.031097412109375, 1.0853118896484375, 1.1395263671875, 1.1937408447265625, 1.247955322265625, 1.3021697998046875, 1.35638427734375, 1.4105987548828125, 1.464813232421875, 1.5190277099609375, 1.5732421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 16.0, 24.0, 43.0, 48.0, 64.0, 126.0, 150.0, 270.0, 391.0, 585.0, 911.0, 1398.0, 2144.0, 3383.0, 5153.0, 8111.0, 13044.0, 21048.0, 35226.0, 61544.0, 111976.0, 217723.0, 248853.0, 136688.0, 72543.0, 41465.0, 24664.0, 15001.0, 9372.0, 6012.0, 3645.0, 2358.0, 1506.0, 1015.0, 712.0, 423.0, 298.0, 188.0, 142.0, 86.0, 59.0, 52.0, 29.0, 25.0, 11.0, 9.0, 1.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.147216796875, -0.14249038696289062, -0.13776397705078125, -0.13303756713867188, -0.1283111572265625, -0.12358474731445312, -0.11885833740234375, -0.11413192749023438, -0.109405517578125, -0.10467910766601562, -0.09995269775390625, -0.09522628784179688, -0.0904998779296875, -0.08577346801757812, -0.08104705810546875, -0.07632064819335938, -0.07159423828125, -0.06686782836914062, -0.06214141845703125, -0.057415008544921875, -0.0526885986328125, -0.047962188720703125, -0.04323577880859375, -0.038509368896484375, -0.033782958984375, -0.029056549072265625, -0.02433013916015625, -0.019603729248046875, -0.0148773193359375, -0.010150909423828125, -0.00542449951171875, -0.000698089599609375, 0.0040283203125, 0.008754730224609375, 0.01348114013671875, 0.018207550048828125, 0.0229339599609375, 0.027660369873046875, 0.03238677978515625, 0.037113189697265625, 0.041839599609375, 0.046566009521484375, 0.05129241943359375, 0.056018829345703125, 0.0607452392578125, 0.06547164916992188, 0.07019805908203125, 0.07492446899414062, 0.07965087890625, 0.08437728881835938, 0.08910369873046875, 0.09383010864257812, 0.0985565185546875, 0.10328292846679688, 0.10800933837890625, 0.11273574829101562, 0.117462158203125, 0.12218856811523438, 0.12691497802734375, 0.13164138793945312, 0.1363677978515625, 0.14109420776367188, 0.14582061767578125, 0.15054702758789062, 0.1552734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 11.0, 11.0, 10.0, 11.0, 10.0, 12.0, 10.0, 20.0, 17.0, 28.0, 30.0, 29.0, 28.0, 32.0, 39.0, 31.0, 23.0, 45.0, 28.0, 49.0, 1066.0, 34.0, 39.0, 37.0, 29.0, 38.0, 27.0, 32.0, 31.0, 26.0, 18.0, 28.0, 25.0, 15.0, 12.0, 9.0, 8.0, 9.0, 10.0, 18.0, 8.0, 3.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 5.0, 1.0, 1.0], "bins": [-1.10546875, -1.0726547241210938, -1.0398406982421875, -1.0070266723632812, -0.974212646484375, -0.9413986206054688, -0.9085845947265625, -0.8757705688476562, -0.84295654296875, -0.8101425170898438, -0.7773284912109375, -0.7445144653320312, -0.711700439453125, -0.6788864135742188, -0.6460723876953125, -0.6132583618164062, -0.5804443359375, -0.5476303100585938, -0.5148162841796875, -0.48200225830078125, -0.449188232421875, -0.41637420654296875, -0.3835601806640625, -0.35074615478515625, -0.31793212890625, -0.28511810302734375, -0.2523040771484375, -0.21949005126953125, -0.186676025390625, -0.15386199951171875, -0.1210479736328125, -0.08823394775390625, -0.055419921875, -0.02260589599609375, 0.0102081298828125, 0.04302215576171875, 0.075836181640625, 0.10865020751953125, 0.1414642333984375, 0.17427825927734375, 0.20709228515625, 0.23990631103515625, 0.2727203369140625, 0.30553436279296875, 0.338348388671875, 0.37116241455078125, 0.4039764404296875, 0.43679046630859375, 0.4696044921875, 0.5024185180664062, 0.5352325439453125, 0.5680465698242188, 0.600860595703125, 0.6336746215820312, 0.6664886474609375, 0.6993026733398438, 0.73211669921875, 0.7649307250976562, 0.7977447509765625, 0.8305587768554688, 0.863372802734375, 0.8961868286132812, 0.9290008544921875, 0.9618148803710938, 0.99462890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 6.0, 14.0, 19.0, 31.0, 45.0, 49.0, 70.0, 113.0, 118.0, 183.0, 243.0, 364.0, 461.0, 628.0, 908.0, 1221.0, 1852.0, 2588.0, 3798.0, 5753.0, 9120.0, 16251.0, 38971.0, 251923.0, 1636534.0, 70382.0, 22356.0, 11404.0, 6926.0, 4362.0, 3114.0, 2071.0, 1439.0, 1017.0, 777.0, 563.0, 391.0, 252.0, 244.0, 172.0, 96.0, 74.0, 75.0, 33.0, 30.0, 20.0, 17.0, 15.0, 11.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2109375, -0.2043895721435547, -0.19784164428710938, -0.19129371643066406, -0.18474578857421875, -0.17819786071777344, -0.17164993286132812, -0.1651020050048828, -0.1585540771484375, -0.1520061492919922, -0.14545822143554688, -0.13891029357910156, -0.13236236572265625, -0.12581443786621094, -0.11926651000976562, -0.11271858215332031, -0.106170654296875, -0.09962272644042969, -0.09307479858398438, -0.08652687072753906, -0.07997894287109375, -0.07343101501464844, -0.06688308715820312, -0.06033515930175781, -0.0537872314453125, -0.04723930358886719, -0.040691375732421875, -0.03414344787597656, -0.02759552001953125, -0.021047592163085938, -0.014499664306640625, -0.007951736450195312, -0.00140380859375, 0.0051441192626953125, 0.011692047119140625, 0.018239974975585938, 0.02478790283203125, 0.03133583068847656, 0.037883758544921875, 0.04443168640136719, 0.0509796142578125, 0.05752754211425781, 0.06407546997070312, 0.07062339782714844, 0.07717132568359375, 0.08371925354003906, 0.09026718139648438, 0.09681510925292969, 0.103363037109375, 0.10991096496582031, 0.11645889282226562, 0.12300682067871094, 0.12955474853515625, 0.13610267639160156, 0.14265060424804688, 0.1491985321044922, 0.1557464599609375, 0.1622943878173828, 0.16884231567382812, 0.17539024353027344, 0.18193817138671875, 0.18848609924316406, 0.19503402709960938, 0.2015819549560547, 0.2081298828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 8.0, 7.0, 6.0, 13.0, 16.0, 14.0, 27.0, 24.0, 24.0, 22.0, 36.0, 47.0, 45.0, 57.0, 46.0, 50.0, 54.0, 53.0, 56.0, 60.0, 52.0, 40.0, 38.0, 32.0, 42.0, 27.0, 19.0, 20.0, 14.0, 11.0, 7.0, 6.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01045989990234375, -0.010142207145690918, -0.009824514389038086, -0.009506821632385254, -0.009189128875732422, -0.00887143611907959, -0.008553743362426758, -0.008236050605773926, -0.007918357849121094, -0.007600665092468262, -0.00728297233581543, -0.006965279579162598, -0.006647586822509766, -0.006329894065856934, -0.0060122013092041016, -0.0056945085525512695, -0.0053768157958984375, -0.0050591230392456055, -0.0047414302825927734, -0.004423737525939941, -0.004106044769287109, -0.0037883520126342773, -0.0034706592559814453, -0.0031529664993286133, -0.0028352737426757812, -0.0025175809860229492, -0.002199888229370117, -0.0018821954727172852, -0.0015645027160644531, -0.001246809959411621, -0.0009291172027587891, -0.000611424446105957, -0.000293731689453125, 2.396106719970703e-05, 0.00034165382385253906, 0.0006593465805053711, 0.0009770393371582031, 0.0012947320938110352, 0.0016124248504638672, 0.0019301176071166992, 0.0022478103637695312, 0.0025655031204223633, 0.0028831958770751953, 0.0032008886337280273, 0.0035185813903808594, 0.0038362741470336914, 0.0041539669036865234, 0.0044716596603393555, 0.0047893524169921875, 0.0051070451736450195, 0.0054247379302978516, 0.005742430686950684, 0.006060123443603516, 0.006377816200256348, 0.00669550895690918, 0.007013201713562012, 0.007330894470214844, 0.007648587226867676, 0.007966279983520508, 0.00828397274017334, 0.008601665496826172, 0.008919358253479004, 0.009237051010131836, 0.009554743766784668, 0.0098724365234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 13.0, 14.0, 11.0, 19.0, 25.0, 31.0, 42.0, 63.0, 78.0, 127.0, 157.0, 259.0, 577.0, 4154.0, 774550.0, 265129.0, 2011.0, 484.0, 217.0, 157.0, 113.0, 59.0, 50.0, 44.0, 30.0, 27.0, 20.0, 15.0, 16.0, 12.0, 5.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1995849609375, -0.19312286376953125, -0.1866607666015625, -0.18019866943359375, -0.173736572265625, -0.16727447509765625, -0.1608123779296875, -0.15435028076171875, -0.14788818359375, -0.14142608642578125, -0.1349639892578125, -0.12850189208984375, -0.122039794921875, -0.11557769775390625, -0.1091156005859375, -0.10265350341796875, -0.09619140625, -0.08972930908203125, -0.0832672119140625, -0.07680511474609375, -0.070343017578125, -0.06388092041015625, -0.0574188232421875, -0.05095672607421875, -0.04449462890625, -0.03803253173828125, -0.0315704345703125, -0.02510833740234375, -0.018646240234375, -0.01218414306640625, -0.0057220458984375, 0.00074005126953125, 0.0072021484375, 0.01366424560546875, 0.0201263427734375, 0.02658843994140625, 0.033050537109375, 0.03951263427734375, 0.0459747314453125, 0.05243682861328125, 0.05889892578125, 0.06536102294921875, 0.0718231201171875, 0.07828521728515625, 0.084747314453125, 0.09120941162109375, 0.0976715087890625, 0.10413360595703125, 0.110595703125, 0.11705780029296875, 0.1235198974609375, 0.12998199462890625, 0.136444091796875, 0.14290618896484375, 0.1493682861328125, 0.15583038330078125, 0.16229248046875, 0.16875457763671875, 0.1752166748046875, 0.18167877197265625, 0.188140869140625, 0.19460296630859375, 0.2010650634765625, 0.20752716064453125, 0.2139892578125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 13.0, 74.0, 274.0, 438.0, 177.0, 36.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00814780406653881, -0.006315184757113457, -0.004482565447688103, -0.0026499456726014614, -0.0008173263631761074, 0.001015293411910534, 0.002847912721335888, 0.004680532030761242, 0.006513151340186596, 0.00834577064961195, 0.010178389959037304, 0.012011010199785233, 0.013843629509210587, 0.01567624881863594, 0.017508868128061295, 0.01934148743748665, 0.021174106746912003, 0.023006726056337357, 0.02483934536576271, 0.026671964675188065, 0.02850458398461342, 0.030337203294038773, 0.03216982260346413, 0.03400244191288948, 0.035835061222314835, 0.03766768053174019, 0.03950029984116554, 0.0413329191505909, 0.04316553846001625, 0.044998157769441605, 0.04683077707886696, 0.04866339638829231, 0.05049601569771767, 0.05232863500714302, 0.054161254316568375, 0.05599387362599373, 0.05782649293541908, 0.05965911224484444, 0.06149173155426979, 0.06332435458898544, 0.0651569738984108, 0.06698959320783615, 0.0688222125172615, 0.07065483182668686, 0.07248745113611221, 0.07432007044553757, 0.07615268975496292, 0.07798530906438828, 0.07981792837381363, 0.08165054768323898, 0.08348316699266434, 0.08531578630208969, 0.08714840561151505, 0.0889810249209404, 0.09081364423036575, 0.09264626353979111, 0.09447888284921646, 0.09631150215864182, 0.09814412146806717, 0.09997674077749252, 0.10180936008691788, 0.10364197939634323, 0.10547459870576859, 0.10730721801519394, 0.1091398373246193]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 6.0, 8.0, 7.0, 15.0, 10.0, 9.0, 20.0, 24.0, 29.0, 27.0, 18.0, 41.0, 34.0, 42.0, 38.0, 50.0, 49.0, 49.0, 36.0, 53.0, 38.0, 51.0, 30.0, 33.0, 29.0, 44.0, 28.0, 24.0, 26.0, 20.0, 20.0, 17.0, 14.0, 8.0, 11.0, 9.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00837773084640503, -0.008094369433820248, -0.007811008021235466, -0.007527646608650684, -0.007244285196065903, -0.006960923783481121, -0.006677562370896339, -0.006394200958311558, -0.006110839545726776, -0.0058274781331419945, -0.005544116720557213, -0.005260755307972431, -0.0049773938953876495, -0.004694032482802868, -0.004410671070218086, -0.004127309657633305, -0.003843948245048523, -0.0035605868324637413, -0.0032772254198789597, -0.002993864007294178, -0.0027105025947093964, -0.0024271411821246147, -0.002143779769539833, -0.0018604183569550514, -0.0015770569443702698, -0.0012936955317854881, -0.0010103341192007065, -0.0007269727066159248, -0.0004436112940311432, -0.00016024988144636154, 0.0001231115311384201, 0.00040647294372320175, 0.0006898343563079834, 0.000973195768892765, 0.0012565571814775467, 0.0015399185940623283, 0.00182328000664711, 0.0021066414192318916, 0.0023900028318166733, 0.002673364244401455, 0.0029567256569862366, 0.0032400870695710182, 0.0035234484821558, 0.0038068098947405815, 0.004090171307325363, 0.004373532719910145, 0.0046568941324949265, 0.004940255545079708, 0.00522361695766449, 0.005506978370249271, 0.005790339782834053, 0.006073701195418835, 0.006357062608003616, 0.006640424020588398, 0.00692378543317318, 0.007207146845757961, 0.007490508258342743, 0.007773869670927525, 0.008057231083512306, 0.008340592496097088, 0.00862395390868187, 0.008907315321266651, 0.009190676733851433, 0.009474038146436214, 0.009757399559020996]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 5.0, 6.0, 3.0, 13.0, 13.0, 15.0, 16.0, 19.0, 23.0, 32.0, 25.0, 31.0, 39.0, 32.0, 37.0, 37.0, 37.0, 51.0, 52.0, 45.0, 36.0, 45.0, 38.0, 45.0, 37.0, 40.0, 20.0, 21.0, 33.0, 27.0, 16.0, 21.0, 18.0, 14.0, 12.0, 11.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.843231201171875, -1.78900146484375, -1.734771728515625, -1.6805419921875, -1.626312255859375, -1.57208251953125, -1.517852783203125, -1.463623046875, -1.409393310546875, -1.35516357421875, -1.300933837890625, -1.2467041015625, -1.192474365234375, -1.13824462890625, -1.084014892578125, -1.02978515625, -0.975555419921875, -0.92132568359375, -0.867095947265625, -0.8128662109375, -0.758636474609375, -0.70440673828125, -0.650177001953125, -0.595947265625, -0.541717529296875, -0.48748779296875, -0.433258056640625, -0.3790283203125, -0.324798583984375, -0.27056884765625, -0.216339111328125, -0.162109375, -0.107879638671875, -0.05364990234375, 0.000579833984375, 0.0548095703125, 0.109039306640625, 0.16326904296875, 0.217498779296875, 0.271728515625, 0.325958251953125, 0.38018798828125, 0.434417724609375, 0.4886474609375, 0.542877197265625, 0.59710693359375, 0.651336669921875, 0.70556640625, 0.759796142578125, 0.81402587890625, 0.868255615234375, 0.9224853515625, 0.976715087890625, 1.03094482421875, 1.085174560546875, 1.139404296875, 1.193634033203125, 1.24786376953125, 1.302093505859375, 1.3563232421875, 1.410552978515625, 1.46478271484375, 1.519012451171875, 1.5732421875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 10.0, 12.0, 20.0, 16.0, 36.0, 48.0, 64.0, 84.0, 101.0, 214.0, 326.0, 485.0, 865.0, 1473.0, 2478.0, 4796.0, 9456.0, 20963.0, 54681.0, 180023.0, 576105.0, 121348.0, 41270.0, 16621.0, 7734.0, 3914.0, 2187.0, 1183.0, 710.0, 427.0, 291.0, 173.0, 144.0, 80.0, 61.0, 46.0, 30.0, 17.0, 18.0, 8.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.474609375, -3.3763427734375, -3.278076171875, -3.1798095703125, -3.08154296875, -2.9832763671875, -2.885009765625, -2.7867431640625, -2.6884765625, -2.5902099609375, -2.491943359375, -2.3936767578125, -2.29541015625, -2.1971435546875, -2.098876953125, -2.0006103515625, -1.90234375, -1.8040771484375, -1.705810546875, -1.6075439453125, -1.50927734375, -1.4110107421875, -1.312744140625, -1.2144775390625, -1.1162109375, -1.0179443359375, -0.919677734375, -0.8214111328125, -0.72314453125, -0.6248779296875, -0.526611328125, -0.4283447265625, -0.330078125, -0.2318115234375, -0.133544921875, -0.0352783203125, 0.06298828125, 0.1612548828125, 0.259521484375, 0.3577880859375, 0.4560546875, 0.5543212890625, 0.652587890625, 0.7508544921875, 0.84912109375, 0.9473876953125, 1.045654296875, 1.1439208984375, 1.2421875, 1.3404541015625, 1.438720703125, 1.5369873046875, 1.63525390625, 1.7335205078125, 1.831787109375, 1.9300537109375, 2.0283203125, 2.1265869140625, 2.224853515625, 2.3231201171875, 2.42138671875, 2.5196533203125, 2.617919921875, 2.7161865234375, 2.814453125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 10.0, 5.0, 16.0, 17.0, 25.0, 21.0, 24.0, 45.0, 45.0, 52.0, 72.0, 114.0, 140.0, 1512.0, 336.0, 145.0, 90.0, 70.0, 54.0, 55.0, 42.0, 32.0, 23.0, 21.0, 20.0, 15.0, 19.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.7705078125, -5.583984375, -5.3974609375, -5.2109375, -5.0244140625, -4.837890625, -4.6513671875, -4.46484375, -4.2783203125, -4.091796875, -3.9052734375, -3.71875, -3.5322265625, -3.345703125, -3.1591796875, -2.97265625, -2.7861328125, -2.599609375, -2.4130859375, -2.2265625, -2.0400390625, -1.853515625, -1.6669921875, -1.48046875, -1.2939453125, -1.107421875, -0.9208984375, -0.734375, -0.5478515625, -0.361328125, -0.1748046875, 0.01171875, 0.1982421875, 0.384765625, 0.5712890625, 0.7578125, 0.9443359375, 1.130859375, 1.3173828125, 1.50390625, 1.6904296875, 1.876953125, 2.0634765625, 2.25, 2.4365234375, 2.623046875, 2.8095703125, 2.99609375, 3.1826171875, 3.369140625, 3.5556640625, 3.7421875, 3.9287109375, 4.115234375, 4.3017578125, 4.48828125, 4.6748046875, 4.861328125, 5.0478515625, 5.234375, 5.4208984375, 5.607421875, 5.7939453125, 5.98046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 3.0, 12.0, 14.0, 27.0, 30.0, 36.0, 40.0, 49.0, 95.0, 130.0, 214.0, 384.0, 913.0, 3590.0, 34686.0, 2820280.0, 272032.0, 10098.0, 1661.0, 583.0, 285.0, 165.0, 116.0, 62.0, 52.0, 43.0, 29.0, 17.0, 20.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0390625, -10.7021484375, -10.365234375, -10.0283203125, -9.69140625, -9.3544921875, -9.017578125, -8.6806640625, -8.34375, -8.0068359375, -7.669921875, -7.3330078125, -6.99609375, -6.6591796875, -6.322265625, -5.9853515625, -5.6484375, -5.3115234375, -4.974609375, -4.6376953125, -4.30078125, -3.9638671875, -3.626953125, -3.2900390625, -2.953125, -2.6162109375, -2.279296875, -1.9423828125, -1.60546875, -1.2685546875, -0.931640625, -0.5947265625, -0.2578125, 0.0791015625, 0.416015625, 0.7529296875, 1.08984375, 1.4267578125, 1.763671875, 2.1005859375, 2.4375, 2.7744140625, 3.111328125, 3.4482421875, 3.78515625, 4.1220703125, 4.458984375, 4.7958984375, 5.1328125, 5.4697265625, 5.806640625, 6.1435546875, 6.48046875, 6.8173828125, 7.154296875, 7.4912109375, 7.828125, 8.1650390625, 8.501953125, 8.8388671875, 9.17578125, 9.5126953125, 9.849609375, 10.1865234375, 10.5234375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 173.0, 697.0, 131.0, 8.0, 0.0, 1.0], "bins": [-101.06002044677734, -99.35868835449219, -97.65735626220703, -95.9560317993164, -94.25469970703125, -92.5533676147461, -90.85203552246094, -89.15071105957031, -87.44937896728516, -85.748046875, -84.04671478271484, -82.34539031982422, -80.64405822753906, -78.9427261352539, -77.24139404296875, -75.54006958007812, -73.83872985839844, -72.13739776611328, -70.43606567382812, -68.7347412109375, -67.03340911865234, -65.33207702636719, -63.63074493408203, -61.92941665649414, -60.22808837890625, -58.526756286621094, -56.8254280090332, -55.12409591674805, -53.422767639160156, -51.721435546875, -50.020103454589844, -48.31877517700195, -46.61744689941406, -44.916114807128906, -43.214786529541016, -41.51345443725586, -39.81212615966797, -38.11079406738281, -36.409461975097656, -34.708133697509766, -33.006805419921875, -31.30547523498535, -29.604145050048828, -27.902812957763672, -26.20148468017578, -24.500152587890625, -22.7988224029541, -21.097492218017578, -19.396162033081055, -17.69483184814453, -15.993501663208008, -14.292170524597168, -12.590840339660645, -10.889510154724121, -9.188179016113281, -7.486848831176758, -5.785518646240234, -4.084188461303711, -2.3828577995300293, -0.6815271377563477, 1.0198030471801758, 2.721133232116699, 4.422464370727539, 6.1237945556640625, 7.825124740600586]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 5.0, 4.0, 6.0, 10.0, 7.0, 19.0, 18.0, 16.0, 20.0, 33.0, 28.0, 27.0, 34.0, 37.0, 38.0, 48.0, 42.0, 32.0, 38.0, 42.0, 40.0, 31.0, 32.0, 36.0, 41.0, 38.0, 32.0, 31.0, 25.0, 33.0, 16.0, 29.0, 10.0, 15.0, 17.0, 10.0, 9.0, 12.0, 8.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.426677703857422, -11.073619842529297, -10.720561981201172, -10.367504119873047, -10.014446258544922, -9.661388397216797, -9.308330535888672, -8.955272674560547, -8.602214813232422, -8.249156951904297, -7.896099090576172, -7.543041229248047, -7.189983367919922, -6.836925506591797, -6.48386812210083, -6.130810260772705, -5.777752876281738, -5.424695014953613, -5.071637153625488, -4.718579292297363, -4.365521430969238, -4.012463569641113, -3.6594061851501465, -3.3063483238220215, -2.9532904624938965, -2.6002326011657715, -2.2471747398376465, -1.8941171169281006, -1.5410592555999756, -1.1880013942718506, -0.8349437713623047, -0.4818859100341797, -0.12882709503173828, 0.22423070669174194, 0.5772885084152222, 0.9303462505340576, 1.2834041118621826, 1.6364619731903076, 1.9895195960998535, 2.3425774574279785, 2.6956353187561035, 3.0486931800842285, 3.4017510414123535, 3.7548086643218994, 4.107866287231445, 4.46092414855957, 4.813982009887695, 5.16703987121582, 5.520097732543945, 5.87315559387207, 6.226213455200195, 6.57927131652832, 6.932329177856445, 7.28538703918457, 7.638444423675537, 7.991502285003662, 8.344560623168945, 8.69761848449707, 9.050676345825195, 9.40373420715332, 9.756792068481445, 10.10984992980957, 10.462907791137695, 10.81596565246582, 11.169022560119629]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 8.0, 10.0, 14.0, 22.0, 6.0, 21.0, 16.0, 25.0, 25.0, 26.0, 23.0, 47.0, 43.0, 34.0, 39.0, 48.0, 39.0, 45.0, 45.0, 40.0, 40.0, 35.0, 43.0, 32.0, 32.0, 40.0, 20.0, 24.0, 23.0, 19.0, 20.0, 13.0, 18.0, 12.0, 6.0, 5.0, 6.0, 3.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8878021240234375, -1.833221435546875, -1.7786407470703125, -1.72406005859375, -1.6694793701171875, -1.614898681640625, -1.5603179931640625, -1.5057373046875, -1.4511566162109375, -1.396575927734375, -1.3419952392578125, -1.28741455078125, -1.2328338623046875, -1.178253173828125, -1.1236724853515625, -1.069091796875, -1.0145111083984375, -0.959930419921875, -0.9053497314453125, -0.85076904296875, -0.7961883544921875, -0.741607666015625, -0.6870269775390625, -0.6324462890625, -0.5778656005859375, -0.523284912109375, -0.4687042236328125, -0.41412353515625, -0.3595428466796875, -0.304962158203125, -0.2503814697265625, -0.19580078125, -0.1412200927734375, -0.086639404296875, -0.0320587158203125, 0.02252197265625, 0.0771026611328125, 0.131683349609375, 0.1862640380859375, 0.2408447265625, 0.2954254150390625, 0.350006103515625, 0.4045867919921875, 0.45916748046875, 0.5137481689453125, 0.568328857421875, 0.6229095458984375, 0.677490234375, 0.7320709228515625, 0.786651611328125, 0.8412322998046875, 0.89581298828125, 0.9503936767578125, 1.004974365234375, 1.0595550537109375, 1.1141357421875, 1.1687164306640625, 1.223297119140625, 1.2778778076171875, 1.33245849609375, 1.3870391845703125, 1.441619873046875, 1.4962005615234375, 1.55078125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 7.0, 15.0, 33.0, 19.0, 56.0, 85.0, 99.0, 155.0, 205.0, 306.0, 440.0, 685.0, 998.0, 1555.0, 2513.0, 4177.0, 7800.0, 16432.0, 41427.0, 146928.0, 815967.0, 2361899.0, 607661.0, 116543.0, 35614.0, 14692.0, 7115.0, 3910.0, 2350.0, 1479.0, 988.0, 679.0, 417.0, 274.0, 207.0, 165.0, 99.0, 82.0, 58.0, 35.0, 27.0, 18.0, 13.0, 8.0, 15.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.193359375, -3.1005859375, -3.0078125, -2.9150390625, -2.822265625, -2.7294921875, -2.63671875, -2.5439453125, -2.451171875, -2.3583984375, -2.265625, -2.1728515625, -2.080078125, -1.9873046875, -1.89453125, -1.8017578125, -1.708984375, -1.6162109375, -1.5234375, -1.4306640625, -1.337890625, -1.2451171875, -1.15234375, -1.0595703125, -0.966796875, -0.8740234375, -0.78125, -0.6884765625, -0.595703125, -0.5029296875, -0.41015625, -0.3173828125, -0.224609375, -0.1318359375, -0.0390625, 0.0537109375, 0.146484375, 0.2392578125, 0.33203125, 0.4248046875, 0.517578125, 0.6103515625, 0.703125, 0.7958984375, 0.888671875, 0.9814453125, 1.07421875, 1.1669921875, 1.259765625, 1.3525390625, 1.4453125, 1.5380859375, 1.630859375, 1.7236328125, 1.81640625, 1.9091796875, 2.001953125, 2.0947265625, 2.1875, 2.2802734375, 2.373046875, 2.4658203125, 2.55859375, 2.6513671875, 2.744140625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 10.0, 11.0, 13.0, 24.0, 23.0, 25.0, 36.0, 53.0, 80.0, 116.0, 189.0, 277.0, 480.0, 717.0, 678.0, 463.0, 301.0, 177.0, 117.0, 75.0, 46.0, 36.0, 23.0, 21.0, 17.0, 11.0, 12.0, 4.0, 10.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.986328125, -3.881500244140625, -3.77667236328125, -3.671844482421875, -3.5670166015625, -3.462188720703125, -3.35736083984375, -3.252532958984375, -3.147705078125, -3.042877197265625, -2.93804931640625, -2.833221435546875, -2.7283935546875, -2.623565673828125, -2.51873779296875, -2.413909912109375, -2.30908203125, -2.204254150390625, -2.09942626953125, -1.994598388671875, -1.8897705078125, -1.784942626953125, -1.68011474609375, -1.575286865234375, -1.470458984375, -1.365631103515625, -1.26080322265625, -1.155975341796875, -1.0511474609375, -0.946319580078125, -0.84149169921875, -0.736663818359375, -0.6318359375, -0.527008056640625, -0.42218017578125, -0.317352294921875, -0.2125244140625, -0.107696533203125, -0.00286865234375, 0.101959228515625, 0.206787109375, 0.311614990234375, 0.41644287109375, 0.521270751953125, 0.6260986328125, 0.730926513671875, 0.83575439453125, 0.940582275390625, 1.04541015625, 1.150238037109375, 1.25506591796875, 1.359893798828125, 1.4647216796875, 1.569549560546875, 1.67437744140625, 1.779205322265625, 1.884033203125, 1.988861083984375, 2.09368896484375, 2.198516845703125, 2.3033447265625, 2.408172607421875, 2.51300048828125, 2.617828369140625, 2.72265625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 9.0, 20.0, 18.0, 26.0, 41.0, 55.0, 94.0, 139.0, 275.0, 606.0, 1720.0, 6010.0, 33402.0, 954455.0, 3124477.0, 60353.0, 8823.0, 2184.0, 771.0, 320.0, 176.0, 90.0, 60.0, 44.0, 27.0, 20.0, 17.0, 8.0, 9.0, 5.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.953125, -9.643310546875, -9.33349609375, -9.023681640625, -8.7138671875, -8.404052734375, -8.09423828125, -7.784423828125, -7.474609375, -7.164794921875, -6.85498046875, -6.545166015625, -6.2353515625, -5.925537109375, -5.61572265625, -5.305908203125, -4.99609375, -4.686279296875, -4.37646484375, -4.066650390625, -3.7568359375, -3.447021484375, -3.13720703125, -2.827392578125, -2.517578125, -2.207763671875, -1.89794921875, -1.588134765625, -1.2783203125, -0.968505859375, -0.65869140625, -0.348876953125, -0.0390625, 0.270751953125, 0.58056640625, 0.890380859375, 1.2001953125, 1.510009765625, 1.81982421875, 2.129638671875, 2.439453125, 2.749267578125, 3.05908203125, 3.368896484375, 3.6787109375, 3.988525390625, 4.29833984375, 4.608154296875, 4.91796875, 5.227783203125, 5.53759765625, 5.847412109375, 6.1572265625, 6.467041015625, 6.77685546875, 7.086669921875, 7.396484375, 7.706298828125, 8.01611328125, 8.325927734375, 8.6357421875, 8.945556640625, 9.25537109375, 9.565185546875, 9.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 229.0, 624.0, 129.0, 15.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.62740325927734, -99.2317886352539, -96.83617401123047, -94.44056701660156, -92.04495239257812, -89.64933776855469, -87.25372314453125, -84.85810852050781, -82.46249389648438, -80.06687927246094, -77.6712646484375, -75.2756576538086, -72.88004302978516, -70.48442840576172, -68.08881378173828, -65.69319915771484, -63.29759216308594, -60.9019775390625, -58.50636672973633, -56.11075210571289, -53.71514129638672, -51.31952667236328, -48.923912048339844, -46.528297424316406, -44.132686614990234, -41.7370719909668, -39.341461181640625, -36.94584655761719, -34.55023193359375, -32.15462112426758, -29.75900650024414, -27.363393783569336, -24.967788696289062, -22.572175979614258, -20.176563262939453, -17.780948638916016, -15.385335922241211, -12.989723205566406, -10.594109535217285, -8.198495864868164, -5.802883148193359, -3.4072699546813965, -1.0116567611694336, 1.3839564323425293, 3.779569625854492, 6.175182342529297, 8.570796012878418, 10.966409683227539, 13.362022399902344, 15.757635116577148, 18.153247833251953, 20.54886245727539, 22.944475173950195, 25.340087890625, 27.735702514648438, 30.131315231323242, 32.52692794799805, 34.922542572021484, 37.318153381347656, 39.713768005371094, 42.10938262939453, 44.5049934387207, 46.90060806274414, 49.29621887207031, 51.69183349609375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 9.0, 6.0, 5.0, 14.0, 11.0, 11.0, 24.0, 18.0, 37.0, 29.0, 26.0, 39.0, 36.0, 38.0, 53.0, 43.0, 48.0, 51.0, 44.0, 46.0, 47.0, 38.0, 41.0, 37.0, 39.0, 32.0, 34.0, 29.0, 15.0, 14.0, 15.0, 14.0, 15.0, 12.0, 6.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.871389389038086, -9.507628440856934, -9.143867492675781, -8.780106544494629, -8.416345596313477, -8.05258560180664, -7.688824653625488, -7.325063705444336, -6.961302757263184, -6.597541809082031, -6.233780860900879, -5.870020389556885, -5.506259441375732, -5.14249849319458, -4.778738021850586, -4.414977073669434, -4.051216125488281, -3.687455177307129, -3.3236944675445557, -2.9599337577819824, -2.59617280960083, -2.2324118614196777, -1.8686511516571045, -1.5048904418945312, -1.141129493713379, -0.7773686647415161, -0.4136078357696533, -0.04984700679779053, 0.31391382217407227, 0.6776746511459351, 1.0414354801177979, 1.405196189880371, 1.7689571380615234, 2.132718086242676, 2.496478796005249, 2.8602395057678223, 3.2240004539489746, 3.587761402130127, 3.9515221118927, 4.315282821655273, 4.679043769836426, 5.042804718017578, 5.4065656661987305, 5.770326137542725, 6.134087085723877, 6.497848033905029, 6.861608505249023, 7.225369453430176, 7.589130401611328, 7.9528913497924805, 8.316652297973633, 8.680413246154785, 9.044174194335938, 9.407934188842773, 9.771695137023926, 10.135456085205078, 10.49921703338623, 10.862977981567383, 11.226738929748535, 11.590499877929688, 11.954259872436523, 12.318020820617676, 12.681781768798828, 13.04554271697998, 13.409303665161133]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 14.0, 22.0, 11.0, 26.0, 21.0, 26.0, 31.0, 36.0, 41.0, 46.0, 41.0, 43.0, 42.0, 38.0, 40.0, 51.0, 42.0, 51.0, 42.0, 42.0, 41.0, 28.0, 30.0, 23.0, 25.0, 12.0, 21.0, 21.0, 16.0, 8.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9765625, -1.91876220703125, -1.8609619140625, -1.80316162109375, -1.745361328125, -1.68756103515625, -1.6297607421875, -1.57196044921875, -1.51416015625, -1.45635986328125, -1.3985595703125, -1.34075927734375, -1.282958984375, -1.22515869140625, -1.1673583984375, -1.10955810546875, -1.0517578125, -0.99395751953125, -0.9361572265625, -0.87835693359375, -0.820556640625, -0.76275634765625, -0.7049560546875, -0.64715576171875, -0.58935546875, -0.53155517578125, -0.4737548828125, -0.41595458984375, -0.358154296875, -0.30035400390625, -0.2425537109375, -0.18475341796875, -0.126953125, -0.06915283203125, -0.0113525390625, 0.04644775390625, 0.104248046875, 0.16204833984375, 0.2198486328125, 0.27764892578125, 0.33544921875, 0.39324951171875, 0.4510498046875, 0.50885009765625, 0.566650390625, 0.62445068359375, 0.6822509765625, 0.74005126953125, 0.7978515625, 0.85565185546875, 0.9134521484375, 0.97125244140625, 1.029052734375, 1.08685302734375, 1.1446533203125, 1.20245361328125, 1.26025390625, 1.31805419921875, 1.3758544921875, 1.43365478515625, 1.491455078125, 1.54925537109375, 1.6070556640625, 1.66485595703125, 1.72265625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 9.0, 12.0, 23.0, 24.0, 46.0, 52.0, 82.0, 127.0, 169.0, 207.0, 348.0, 478.0, 720.0, 1084.0, 1685.0, 2486.0, 3619.0, 5523.0, 8903.0, 14384.0, 23292.0, 39508.0, 70552.0, 135599.0, 248369.0, 222865.0, 115702.0, 60997.0, 34857.0, 21007.0, 12778.0, 7808.0, 5042.0, 3357.0, 2164.0, 1493.0, 941.0, 662.0, 476.0, 332.0, 226.0, 161.0, 112.0, 75.0, 55.0, 43.0, 30.0, 17.0, 18.0, 17.0, 3.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.1417236328125, -0.13713455200195312, -0.13254547119140625, -0.12795639038085938, -0.1233673095703125, -0.11877822875976562, -0.11418914794921875, -0.10960006713867188, -0.105010986328125, -0.10042190551757812, -0.09583282470703125, -0.09124374389648438, -0.0866546630859375, -0.08206558227539062, -0.07747650146484375, -0.07288742065429688, -0.06829833984375, -0.06370925903320312, -0.05912017822265625, -0.054531097412109375, -0.0499420166015625, -0.045352935791015625, -0.04076385498046875, -0.036174774169921875, -0.031585693359375, -0.026996612548828125, -0.02240753173828125, -0.017818450927734375, -0.0132293701171875, -0.008640289306640625, -0.00405120849609375, 0.000537872314453125, 0.005126953125, 0.009716033935546875, 0.01430511474609375, 0.018894195556640625, 0.0234832763671875, 0.028072357177734375, 0.03266143798828125, 0.037250518798828125, 0.041839599609375, 0.046428680419921875, 0.05101776123046875, 0.055606842041015625, 0.0601959228515625, 0.06478500366210938, 0.06937408447265625, 0.07396316528320312, 0.07855224609375, 0.08314132690429688, 0.08773040771484375, 0.09231948852539062, 0.0969085693359375, 0.10149765014648438, 0.10608673095703125, 0.11067581176757812, 0.115264892578125, 0.11985397338867188, 0.12444305419921875, 0.12903213500976562, 0.1336212158203125, 0.13821029663085938, 0.14279937744140625, 0.14738845825195312, 0.1519775390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 9.0, 9.0, 14.0, 15.0, 18.0, 18.0, 20.0, 28.0, 20.0, 26.0, 39.0, 35.0, 34.0, 42.0, 34.0, 26.0, 53.0, 1070.0, 48.0, 40.0, 48.0, 42.0, 37.0, 40.0, 32.0, 20.0, 29.0, 24.0, 23.0, 13.0, 12.0, 17.0, 16.0, 13.0, 10.0, 6.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0], "bins": [-1.2861328125, -1.2495269775390625, -1.212921142578125, -1.1763153076171875, -1.13970947265625, -1.1031036376953125, -1.066497802734375, -1.0298919677734375, -0.9932861328125, -0.9566802978515625, -0.920074462890625, -0.8834686279296875, -0.84686279296875, -0.8102569580078125, -0.773651123046875, -0.7370452880859375, -0.700439453125, -0.6638336181640625, -0.627227783203125, -0.5906219482421875, -0.55401611328125, -0.5174102783203125, -0.480804443359375, -0.4441986083984375, -0.4075927734375, -0.3709869384765625, -0.334381103515625, -0.2977752685546875, -0.26116943359375, -0.2245635986328125, -0.187957763671875, -0.1513519287109375, -0.11474609375, -0.0781402587890625, -0.041534423828125, -0.0049285888671875, 0.03167724609375, 0.0682830810546875, 0.104888916015625, 0.1414947509765625, 0.1781005859375, 0.2147064208984375, 0.251312255859375, 0.2879180908203125, 0.32452392578125, 0.3611297607421875, 0.397735595703125, 0.4343414306640625, 0.470947265625, 0.5075531005859375, 0.544158935546875, 0.5807647705078125, 0.61737060546875, 0.6539764404296875, 0.690582275390625, 0.7271881103515625, 0.7637939453125, 0.8003997802734375, 0.837005615234375, 0.8736114501953125, 0.91021728515625, 0.9468231201171875, 0.983428955078125, 1.0200347900390625, 1.056640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 11.0, 23.0, 26.0, 29.0, 36.0, 63.0, 89.0, 152.0, 171.0, 258.0, 361.0, 542.0, 806.0, 1153.0, 1772.0, 2774.0, 4429.0, 7404.0, 13968.0, 34372.0, 243121.0, 1681785.0, 59795.0, 19162.0, 9554.0, 5300.0, 3351.0, 2048.0, 1442.0, 951.0, 663.0, 457.0, 299.0, 211.0, 162.0, 92.0, 81.0, 60.0, 41.0, 30.0, 23.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.255615234375, -0.24791526794433594, -0.24021530151367188, -0.2325153350830078, -0.22481536865234375, -0.2171154022216797, -0.20941543579101562, -0.20171546936035156, -0.1940155029296875, -0.18631553649902344, -0.17861557006835938, -0.1709156036376953, -0.16321563720703125, -0.1555156707763672, -0.14781570434570312, -0.14011573791503906, -0.132415771484375, -0.12471580505371094, -0.11701583862304688, -0.10931587219238281, -0.10161590576171875, -0.09391593933105469, -0.08621597290039062, -0.07851600646972656, -0.0708160400390625, -0.06311607360839844, -0.055416107177734375, -0.04771614074707031, -0.04001617431640625, -0.03231620788574219, -0.024616241455078125, -0.016916275024414062, -0.00921630859375, -0.0015163421630859375, 0.006183624267578125, 0.013883590698242188, 0.02158355712890625, 0.029283523559570312, 0.036983489990234375, 0.04468345642089844, 0.0523834228515625, 0.06008338928222656, 0.06778335571289062, 0.07548332214355469, 0.08318328857421875, 0.09088325500488281, 0.09858322143554688, 0.10628318786621094, 0.113983154296875, 0.12168312072753906, 0.12938308715820312, 0.1370830535888672, 0.14478302001953125, 0.1524829864501953, 0.16018295288085938, 0.16788291931152344, 0.1755828857421875, 0.18328285217285156, 0.19098281860351562, 0.1986827850341797, 0.20638275146484375, 0.2140827178955078, 0.22178268432617188, 0.22948265075683594, 0.2371826171875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 9.0, 5.0, 7.0, 12.0, 15.0, 20.0, 20.0, 24.0, 26.0, 38.0, 36.0, 48.0, 52.0, 41.0, 46.0, 62.0, 44.0, 53.0, 51.0, 37.0, 46.0, 43.0, 36.0, 43.0, 34.0, 24.0, 28.0, 24.0, 12.0, 15.0, 9.0, 14.0, 4.0, 8.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00978851318359375, -0.009512186050415039, -0.009235858917236328, -0.008959531784057617, -0.008683204650878906, -0.008406877517700195, -0.008130550384521484, -0.007854223251342773, -0.0075778961181640625, -0.0073015689849853516, -0.007025241851806641, -0.00674891471862793, -0.006472587585449219, -0.006196260452270508, -0.005919933319091797, -0.005643606185913086, -0.005367279052734375, -0.005090951919555664, -0.004814624786376953, -0.004538297653198242, -0.004261970520019531, -0.00398564338684082, -0.0037093162536621094, -0.0034329891204833984, -0.0031566619873046875, -0.0028803348541259766, -0.0026040077209472656, -0.0023276805877685547, -0.0020513534545898438, -0.0017750263214111328, -0.0014986991882324219, -0.001222372055053711, -0.000946044921875, -0.0006697177886962891, -0.0003933906555175781, -0.00011706352233886719, 0.00015926361083984375, 0.0004355907440185547, 0.0007119178771972656, 0.0009882450103759766, 0.0012645721435546875, 0.0015408992767333984, 0.0018172264099121094, 0.0020935535430908203, 0.0023698806762695312, 0.002646207809448242, 0.002922534942626953, 0.003198862075805664, 0.003475189208984375, 0.003751516342163086, 0.004027843475341797, 0.004304170608520508, 0.004580497741699219, 0.00485682487487793, 0.005133152008056641, 0.0054094791412353516, 0.0056858062744140625, 0.0059621334075927734, 0.006238460540771484, 0.006514787673950195, 0.006791114807128906, 0.007067441940307617, 0.007343769073486328, 0.007620096206665039, 0.00789642333984375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 9.0, 14.0, 14.0, 12.0, 22.0, 35.0, 25.0, 51.0, 66.0, 82.0, 119.0, 139.0, 234.0, 411.0, 1120.0, 46329.0, 983793.0, 14181.0, 752.0, 376.0, 208.0, 144.0, 108.0, 75.0, 61.0, 32.0, 34.0, 23.0, 13.0, 14.0, 11.0, 9.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1600341796875, -0.15439796447753906, -0.14876174926757812, -0.1431255340576172, -0.13748931884765625, -0.1318531036376953, -0.12621688842773438, -0.12058067321777344, -0.1149444580078125, -0.10930824279785156, -0.10367202758789062, -0.09803581237792969, -0.09239959716796875, -0.08676338195800781, -0.08112716674804688, -0.07549095153808594, -0.069854736328125, -0.06421852111816406, -0.058582305908203125, -0.05294609069824219, -0.04730987548828125, -0.04167366027832031, -0.036037445068359375, -0.030401229858398438, -0.0247650146484375, -0.019128799438476562, -0.013492584228515625, -0.007856369018554688, -0.00222015380859375, 0.0034160614013671875, 0.009052276611328125, 0.014688491821289062, 0.02032470703125, 0.025960922241210938, 0.031597137451171875, 0.03723335266113281, 0.04286956787109375, 0.04850578308105469, 0.054141998291015625, 0.05977821350097656, 0.0654144287109375, 0.07105064392089844, 0.07668685913085938, 0.08232307434082031, 0.08795928955078125, 0.09359550476074219, 0.09923171997070312, 0.10486793518066406, 0.110504150390625, 0.11614036560058594, 0.12177658081054688, 0.1274127960205078, 0.13304901123046875, 0.1386852264404297, 0.14432144165039062, 0.14995765686035156, 0.1555938720703125, 0.16123008728027344, 0.16686630249023438, 0.1725025177001953, 0.17813873291015625, 0.1837749481201172, 0.18941116333007812, 0.19504737854003906, 0.20068359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 34.0, 128.0, 392.0, 323.0, 103.0, 22.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06382698565721512, -0.06222875788807869, -0.06063053384423256, -0.05903230607509613, -0.05743408203125, -0.05583585426211357, -0.05423762649297714, -0.05263940244913101, -0.05104117840528488, -0.04944295063614845, -0.04784472659230232, -0.046246498823165894, -0.04464827477931976, -0.043050047010183334, -0.041451819241046906, -0.039853595197200775, -0.038255367428064346, -0.03665713965892792, -0.03505891561508179, -0.03346068784594536, -0.03186246380209923, -0.0302642360329628, -0.02866601012647152, -0.02706778421998024, -0.02546955831348896, -0.02387133240699768, -0.0222731065005064, -0.02067488059401512, -0.019076652824878693, -0.017478428781032562, -0.015880201011896133, -0.014281975105404854, -0.012683752924203873, -0.011085527017712593, -0.009487301111221313, -0.00788907427340746, -0.00629084836691618, -0.0046926224604249, -0.003094395622611046, -0.0014961697161197662, 0.00010205619037151337, 0.0017002823296934366, 0.00329850846901536, 0.004896734841167927, 0.006494960747659206, 0.008093186654150486, 0.00969141349196434, 0.01128963939845562, 0.0128878653049469, 0.014486091211438179, 0.01608431711792946, 0.017682544887065887, 0.019280768930912018, 0.020878996700048447, 0.022477222606539726, 0.024075448513031006, 0.025673674419522285, 0.027271900326013565, 0.028870126232504845, 0.030468352138996124, 0.03206657990813255, 0.033664803951978683, 0.03526303172111511, 0.03686125576496124, 0.03845948353409767]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 7.0, 2.0, 12.0, 12.0, 5.0, 12.0, 7.0, 13.0, 16.0, 20.0, 25.0, 40.0, 31.0, 37.0, 31.0, 38.0, 40.0, 27.0, 49.0, 34.0, 39.0, 43.0, 45.0, 38.0, 46.0, 39.0, 40.0, 32.0, 28.0, 27.0, 23.0, 34.0, 17.0, 20.0, 11.0, 8.0, 13.0, 9.0, 7.0, 4.0, 6.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008288741111755371, -0.008021315559744835, -0.007753890007734299, -0.0074864644557237625, -0.007219038903713226, -0.00695161335170269, -0.006684187799692154, -0.006416762247681618, -0.0061493366956710815, -0.005881911143660545, -0.005614485591650009, -0.005347060039639473, -0.005079634487628937, -0.004812208935618401, -0.004544783383607864, -0.004277357831597328, -0.004009932279586792, -0.003742506727576256, -0.0034750811755657196, -0.0032076556235551834, -0.002940230071544647, -0.002672804519534111, -0.002405378967523575, -0.0021379534155130386, -0.0018705278635025024, -0.0016031023114919662, -0.00133567675948143, -0.0010682512074708939, -0.0008008256554603577, -0.0005334001034498215, -0.0002659745514392853, 1.4510005712509155e-06, 0.0002688765525817871, 0.0005363021045923233, 0.0008037276566028595, 0.0010711532086133957, 0.0013385787606239319, 0.001606004312634468, 0.0018734298646450043, 0.0021408554166555405, 0.0024082809686660767, 0.002675706520676613, 0.002943132072687149, 0.0032105576246976852, 0.0034779831767082214, 0.0037454087287187576, 0.004012834280729294, 0.00428025983273983, 0.004547685384750366, 0.004815110936760902, 0.005082536488771439, 0.005349962040781975, 0.005617387592792511, 0.005884813144803047, 0.006152238696813583, 0.00641966424882412, 0.006687089800834656, 0.006954515352845192, 0.007221940904855728, 0.007489366456866264, 0.0077567920088768005, 0.008024217560887337, 0.008291643112897873, 0.008559068664908409, 0.008826494216918945]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 14.0, 22.0, 11.0, 26.0, 20.0, 27.0, 31.0, 36.0, 41.0, 46.0, 41.0, 43.0, 42.0, 40.0, 37.0, 52.0, 42.0, 51.0, 42.0, 42.0, 41.0, 28.0, 30.0, 23.0, 25.0, 12.0, 20.0, 22.0, 16.0, 8.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9765625, -1.91876220703125, -1.8609619140625, -1.80316162109375, -1.745361328125, -1.68756103515625, -1.6297607421875, -1.57196044921875, -1.51416015625, -1.45635986328125, -1.3985595703125, -1.34075927734375, -1.282958984375, -1.22515869140625, -1.1673583984375, -1.10955810546875, -1.0517578125, -0.99395751953125, -0.9361572265625, -0.87835693359375, -0.820556640625, -0.76275634765625, -0.7049560546875, -0.64715576171875, -0.58935546875, -0.53155517578125, -0.4737548828125, -0.41595458984375, -0.358154296875, -0.30035400390625, -0.2425537109375, -0.18475341796875, -0.126953125, -0.06915283203125, -0.0113525390625, 0.04644775390625, 0.104248046875, 0.16204833984375, 0.2198486328125, 0.27764892578125, 0.33544921875, 0.39324951171875, 0.4510498046875, 0.50885009765625, 0.566650390625, 0.62445068359375, 0.6822509765625, 0.74005126953125, 0.7978515625, 0.85565185546875, 0.9134521484375, 0.97125244140625, 1.029052734375, 1.08685302734375, 1.1446533203125, 1.20245361328125, 1.26025390625, 1.31805419921875, 1.3758544921875, 1.43365478515625, 1.491455078125, 1.54925537109375, 1.6070556640625, 1.66485595703125, 1.72265625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 9.0, 18.0, 28.0, 28.0, 39.0, 67.0, 92.0, 147.0, 192.0, 267.0, 405.0, 584.0, 847.0, 1230.0, 1960.0, 3278.0, 5289.0, 9499.0, 18100.0, 36584.0, 79185.0, 184917.0, 335959.0, 200288.0, 85771.0, 39266.0, 19225.0, 10106.0, 5688.0, 3359.0, 2082.0, 1333.0, 846.0, 562.0, 343.0, 285.0, 188.0, 143.0, 109.0, 58.0, 48.0, 32.0, 32.0, 23.0, 10.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.083770751953125, -2.01324462890625, -1.942718505859375, -1.8721923828125, -1.801666259765625, -1.73114013671875, -1.660614013671875, -1.590087890625, -1.519561767578125, -1.44903564453125, -1.378509521484375, -1.3079833984375, -1.237457275390625, -1.16693115234375, -1.096405029296875, -1.02587890625, -0.955352783203125, -0.88482666015625, -0.814300537109375, -0.7437744140625, -0.673248291015625, -0.60272216796875, -0.532196044921875, -0.461669921875, -0.391143798828125, -0.32061767578125, -0.250091552734375, -0.1795654296875, -0.109039306640625, -0.03851318359375, 0.032012939453125, 0.1025390625, 0.173065185546875, 0.24359130859375, 0.314117431640625, 0.3846435546875, 0.455169677734375, 0.52569580078125, 0.596221923828125, 0.666748046875, 0.737274169921875, 0.80780029296875, 0.878326416015625, 0.9488525390625, 1.019378662109375, 1.08990478515625, 1.160430908203125, 1.23095703125, 1.301483154296875, 1.37200927734375, 1.442535400390625, 1.5130615234375, 1.583587646484375, 1.65411376953125, 1.724639892578125, 1.795166015625, 1.865692138671875, 1.93621826171875, 2.006744384765625, 2.0772705078125, 2.147796630859375, 2.21832275390625, 2.288848876953125, 2.359375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 4.0, 8.0, 8.0, 9.0, 13.0, 12.0, 17.0, 17.0, 22.0, 14.0, 20.0, 25.0, 39.0, 45.0, 47.0, 39.0, 43.0, 87.0, 126.0, 235.0, 1416.0, 203.0, 108.0, 81.0, 56.0, 35.0, 32.0, 36.0, 38.0, 19.0, 26.0, 30.0, 26.0, 26.0, 11.0, 24.0, 15.0, 4.0, 11.0, 2.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.0919189453125, -3.957275390625, -3.8226318359375, -3.68798828125, -3.5533447265625, -3.418701171875, -3.2840576171875, -3.1494140625, -3.0147705078125, -2.880126953125, -2.7454833984375, -2.61083984375, -2.4761962890625, -2.341552734375, -2.2069091796875, -2.072265625, -1.9376220703125, -1.802978515625, -1.6683349609375, -1.53369140625, -1.3990478515625, -1.264404296875, -1.1297607421875, -0.9951171875, -0.8604736328125, -0.725830078125, -0.5911865234375, -0.45654296875, -0.3218994140625, -0.187255859375, -0.0526123046875, 0.08203125, 0.2166748046875, 0.351318359375, 0.4859619140625, 0.62060546875, 0.7552490234375, 0.889892578125, 1.0245361328125, 1.1591796875, 1.2938232421875, 1.428466796875, 1.5631103515625, 1.69775390625, 1.8323974609375, 1.967041015625, 2.1016845703125, 2.236328125, 2.3709716796875, 2.505615234375, 2.6402587890625, 2.77490234375, 2.9095458984375, 3.044189453125, 3.1788330078125, 3.3134765625, 3.4481201171875, 3.582763671875, 3.7174072265625, 3.85205078125, 3.9866943359375, 4.121337890625, 4.2559814453125, 4.390625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 6.0, 8.0, 9.0, 23.0, 18.0, 36.0, 52.0, 83.0, 98.0, 140.0, 297.0, 528.0, 1282.0, 3720.0, 16905.0, 182873.0, 2751952.0, 165441.0, 16245.0, 3494.0, 1184.0, 502.0, 292.0, 155.0, 98.0, 71.0, 59.0, 29.0, 23.0, 26.0, 14.0, 7.0, 5.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.59765625, -7.36376953125, -7.1298828125, -6.89599609375, -6.662109375, -6.42822265625, -6.1943359375, -5.96044921875, -5.7265625, -5.49267578125, -5.2587890625, -5.02490234375, -4.791015625, -4.55712890625, -4.3232421875, -4.08935546875, -3.85546875, -3.62158203125, -3.3876953125, -3.15380859375, -2.919921875, -2.68603515625, -2.4521484375, -2.21826171875, -1.984375, -1.75048828125, -1.5166015625, -1.28271484375, -1.048828125, -0.81494140625, -0.5810546875, -0.34716796875, -0.11328125, 0.12060546875, 0.3544921875, 0.58837890625, 0.822265625, 1.05615234375, 1.2900390625, 1.52392578125, 1.7578125, 1.99169921875, 2.2255859375, 2.45947265625, 2.693359375, 2.92724609375, 3.1611328125, 3.39501953125, 3.62890625, 3.86279296875, 4.0966796875, 4.33056640625, 4.564453125, 4.79833984375, 5.0322265625, 5.26611328125, 5.5, 5.73388671875, 5.9677734375, 6.20166015625, 6.435546875, 6.66943359375, 6.9033203125, 7.13720703125, 7.37109375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 67.0, 522.0, 379.0, 42.0, 6.0], "bins": [-96.9349594116211, -95.34323120117188, -93.75150299072266, -92.15978240966797, -90.56805419921875, -88.97632598876953, -87.38459777832031, -85.79287719726562, -84.2011489868164, -82.60942077636719, -81.01769256591797, -79.42597198486328, -77.83424377441406, -76.24251556396484, -74.65078735351562, -73.05906677246094, -71.46733856201172, -69.8756103515625, -68.28388214111328, -66.6921615600586, -65.10043334960938, -63.508705139160156, -61.9169807434082, -60.325252532958984, -58.733524322509766, -57.14179611206055, -55.550071716308594, -53.958343505859375, -52.36661911010742, -50.7748908996582, -49.18316650390625, -47.59143829345703, -45.99971389770508, -44.40798568725586, -42.816261291503906, -41.22453308105469, -39.632808685302734, -38.041080474853516, -36.44935607910156, -34.857627868652344, -33.265899658203125, -31.67417335510254, -30.082447052001953, -28.490720748901367, -26.89899444580078, -25.307268142700195, -23.71554183959961, -22.12381362915039, -20.532089233398438, -18.94036293029785, -17.348636627197266, -15.75691032409668, -14.165184020996094, -12.573457717895508, -10.981730461120605, -9.39000415802002, -7.79827880859375, -6.206552505493164, -4.614826202392578, -3.023099422454834, -1.431373119354248, 0.1603531837463379, 1.752079963684082, 3.343806266784668, 4.935532569885254]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 1.0, 10.0, 7.0, 9.0, 6.0, 9.0, 15.0, 9.0, 12.0, 8.0, 25.0, 23.0, 19.0, 18.0, 37.0, 33.0, 31.0, 34.0, 45.0, 41.0, 48.0, 31.0, 34.0, 46.0, 43.0, 37.0, 33.0, 41.0, 37.0, 26.0, 35.0, 27.0, 25.0, 25.0, 17.0, 16.0, 10.0, 10.0, 14.0, 15.0, 14.0, 5.0, 1.0, 6.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.162988662719727, -9.855522155761719, -9.548054695129395, -9.240588188171387, -8.933121681213379, -8.625654220581055, -8.318187713623047, -8.010721206665039, -7.703254222869873, -7.395787239074707, -7.088320732116699, -6.780853748321533, -6.473386764526367, -6.165920257568359, -5.858453273773193, -5.550986289978027, -5.2435197830200195, -4.9360527992248535, -4.628586292266846, -4.32111930847168, -4.013652801513672, -3.706185817718506, -3.39871883392334, -3.091252088546753, -2.783785343170166, -2.476318597793579, -2.168851852416992, -1.8613848686218262, -1.5539181232452393, -1.2464513778686523, -0.9389845132827759, -0.6315176486968994, -0.3240499496459961, -0.016583144664764404, 0.2908836603164673, 0.598350465297699, 0.9058172702789307, 1.2132840156555176, 1.520750880241394, 1.8282177448272705, 2.1356844902038574, 2.4431512355804443, 2.7506179809570312, 3.0580849647521973, 3.365551710128784, 3.673018455505371, 3.980485439300537, 4.287952423095703, 4.595418930053711, 4.902885913848877, 5.210352420806885, 5.517819404602051, 5.825285911560059, 6.132752895355225, 6.440219879150391, 6.747686386108398, 7.0551533699035645, 7.3626203536987305, 7.670086860656738, 7.977553844451904, 8.28502082824707, 8.592487335205078, 8.899953842163086, 9.20742130279541, 9.514887809753418]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 7.0, 11.0, 7.0, 5.0, 12.0, 13.0, 24.0, 27.0, 18.0, 20.0, 28.0, 35.0, 30.0, 52.0, 52.0, 44.0, 50.0, 55.0, 31.0, 50.0, 48.0, 47.0, 45.0, 50.0, 40.0, 25.0, 30.0, 27.0, 14.0, 22.0, 18.0, 15.0, 16.0, 12.0, 8.0, 10.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.134765625, -2.074249267578125, -2.01373291015625, -1.953216552734375, -1.8927001953125, -1.832183837890625, -1.77166748046875, -1.711151123046875, -1.650634765625, -1.590118408203125, -1.52960205078125, -1.469085693359375, -1.4085693359375, -1.348052978515625, -1.28753662109375, -1.227020263671875, -1.16650390625, -1.105987548828125, -1.04547119140625, -0.984954833984375, -0.9244384765625, -0.863922119140625, -0.80340576171875, -0.742889404296875, -0.682373046875, -0.621856689453125, -0.56134033203125, -0.500823974609375, -0.4403076171875, -0.379791259765625, -0.31927490234375, -0.258758544921875, -0.1982421875, -0.137725830078125, -0.07720947265625, -0.016693115234375, 0.0438232421875, 0.104339599609375, 0.16485595703125, 0.225372314453125, 0.285888671875, 0.346405029296875, 0.40692138671875, 0.467437744140625, 0.5279541015625, 0.588470458984375, 0.64898681640625, 0.709503173828125, 0.77001953125, 0.830535888671875, 0.89105224609375, 0.951568603515625, 1.0120849609375, 1.072601318359375, 1.13311767578125, 1.193634033203125, 1.254150390625, 1.314666748046875, 1.37518310546875, 1.435699462890625, 1.4962158203125, 1.556732177734375, 1.61724853515625, 1.677764892578125, 1.73828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 9.0, 9.0, 18.0, 20.0, 30.0, 42.0, 66.0, 101.0, 137.0, 208.0, 293.0, 468.0, 702.0, 1032.0, 1822.0, 3347.0, 6876.0, 18254.0, 94538.0, 1795745.0, 2127949.0, 107023.0, 19419.0, 7167.0, 3450.0, 2017.0, 1153.0, 730.0, 503.0, 336.0, 241.0, 174.0, 108.0, 90.0, 63.0, 40.0, 26.0, 19.0, 18.0, 11.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.46343994140625, -4.3096923828125, -4.15594482421875, -4.002197265625, -3.84844970703125, -3.6947021484375, -3.54095458984375, -3.38720703125, -3.23345947265625, -3.0797119140625, -2.92596435546875, -2.772216796875, -2.61846923828125, -2.4647216796875, -2.31097412109375, -2.1572265625, -2.00347900390625, -1.8497314453125, -1.69598388671875, -1.542236328125, -1.38848876953125, -1.2347412109375, -1.08099365234375, -0.92724609375, -0.77349853515625, -0.6197509765625, -0.46600341796875, -0.312255859375, -0.15850830078125, -0.0047607421875, 0.14898681640625, 0.302734375, 0.45648193359375, 0.6102294921875, 0.76397705078125, 0.917724609375, 1.07147216796875, 1.2252197265625, 1.37896728515625, 1.53271484375, 1.68646240234375, 1.8402099609375, 1.99395751953125, 2.147705078125, 2.30145263671875, 2.4552001953125, 2.60894775390625, 2.7626953125, 2.91644287109375, 3.0701904296875, 3.22393798828125, 3.377685546875, 3.53143310546875, 3.6851806640625, 3.83892822265625, 3.99267578125, 4.14642333984375, 4.3001708984375, 4.45391845703125, 4.607666015625, 4.76141357421875, 4.9151611328125, 5.06890869140625, 5.22265625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 12.0, 10.0, 16.0, 18.0, 23.0, 45.0, 66.0, 126.0, 276.0, 563.0, 1091.0, 875.0, 423.0, 188.0, 122.0, 65.0, 45.0, 32.0, 30.0, 18.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.5709228515625, -3.427001953125, -3.2830810546875, -3.13916015625, -2.9952392578125, -2.851318359375, -2.7073974609375, -2.5634765625, -2.4195556640625, -2.275634765625, -2.1317138671875, -1.98779296875, -1.8438720703125, -1.699951171875, -1.5560302734375, -1.412109375, -1.2681884765625, -1.124267578125, -0.9803466796875, -0.83642578125, -0.6925048828125, -0.548583984375, -0.4046630859375, -0.2607421875, -0.1168212890625, 0.027099609375, 0.1710205078125, 0.31494140625, 0.4588623046875, 0.602783203125, 0.7467041015625, 0.890625, 1.0345458984375, 1.178466796875, 1.3223876953125, 1.46630859375, 1.6102294921875, 1.754150390625, 1.8980712890625, 2.0419921875, 2.1859130859375, 2.329833984375, 2.4737548828125, 2.61767578125, 2.7615966796875, 2.905517578125, 3.0494384765625, 3.193359375, 3.3372802734375, 3.481201171875, 3.6251220703125, 3.76904296875, 3.9129638671875, 4.056884765625, 4.2008056640625, 4.3447265625, 4.4886474609375, 4.632568359375, 4.7764892578125, 4.92041015625, 5.0643310546875, 5.208251953125, 5.3521728515625, 5.49609375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 5.0, 18.0, 15.0, 32.0, 60.0, 85.0, 143.0, 219.0, 510.0, 1199.0, 3585.0, 13930.0, 132231.0, 3836505.0, 182948.0, 16325.0, 4002.0, 1293.0, 532.0, 241.0, 146.0, 99.0, 57.0, 33.0, 23.0, 14.0, 13.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.7694091796875, -7.452880859375, -7.1363525390625, -6.81982421875, -6.5032958984375, -6.186767578125, -5.8702392578125, -5.5537109375, -5.2371826171875, -4.920654296875, -4.6041259765625, -4.28759765625, -3.9710693359375, -3.654541015625, -3.3380126953125, -3.021484375, -2.7049560546875, -2.388427734375, -2.0718994140625, -1.75537109375, -1.4388427734375, -1.122314453125, -0.8057861328125, -0.4892578125, -0.1727294921875, 0.143798828125, 0.4603271484375, 0.77685546875, 1.0933837890625, 1.409912109375, 1.7264404296875, 2.04296875, 2.3594970703125, 2.676025390625, 2.9925537109375, 3.30908203125, 3.6256103515625, 3.942138671875, 4.2586669921875, 4.5751953125, 4.8917236328125, 5.208251953125, 5.5247802734375, 5.84130859375, 6.1578369140625, 6.474365234375, 6.7908935546875, 7.107421875, 7.4239501953125, 7.740478515625, 8.0570068359375, 8.37353515625, 8.6900634765625, 9.006591796875, 9.3231201171875, 9.6396484375, 9.9561767578125, 10.272705078125, 10.5892333984375, 10.90576171875, 11.2222900390625, 11.538818359375, 11.8553466796875, 12.171875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 8.0, 33.0, 110.0, 291.0, 311.0, 168.0, 63.0, 16.0, 9.0, 2.0, 2.0, 1.0, 1.0], "bins": [-60.73704147338867, -59.63462829589844, -58.53221893310547, -57.429805755615234, -56.327392578125, -55.224979400634766, -54.1225700378418, -53.02015686035156, -51.91774368286133, -50.815330505371094, -49.712921142578125, -48.61050796508789, -47.508094787597656, -46.40568161010742, -45.30327224731445, -44.20085906982422, -43.09844970703125, -41.996036529541016, -40.89362716674805, -39.79121398925781, -38.68880081176758, -37.586387634277344, -36.483978271484375, -35.38156509399414, -34.279151916503906, -33.17673873901367, -32.0743293762207, -30.97191619873047, -29.869503021240234, -28.767091751098633, -27.66468048095703, -26.562267303466797, -25.459854125976562, -24.35744285583496, -23.255029678344727, -22.152618408203125, -21.05020523071289, -19.94779396057129, -18.845382690429688, -17.742969512939453, -16.64055633544922, -15.5381441116333, -14.435731887817383, -13.333320617675781, -12.230907440185547, -11.128496170043945, -10.026083946228027, -8.92367172241211, -7.821259498596191, -6.718847274780273, -5.6164350509643555, -4.514023303985596, -3.4116110801696777, -2.3091988563537598, -1.206787109375, -0.10437488555908203, 0.9980373382568359, 2.100449562072754, 3.2028615474700928, 4.305273532867432, 5.40768575668335, 6.510097980499268, 7.612509727478027, 8.714921951293945, 9.817334175109863]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 10.0, 11.0, 7.0, 13.0, 18.0, 18.0, 18.0, 24.0, 26.0, 25.0, 27.0, 42.0, 41.0, 34.0, 36.0, 49.0, 52.0, 41.0, 41.0, 42.0, 41.0, 20.0, 33.0, 27.0, 33.0, 25.0, 37.0, 25.0, 30.0, 18.0, 24.0, 20.0, 13.0, 14.0, 6.0, 15.0, 9.0, 6.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.630743026733398, -10.321427345275879, -10.01211166381836, -9.70279598236084, -9.39348030090332, -9.0841646194458, -8.774848937988281, -8.465534210205078, -8.156217575073242, -7.846901893615723, -7.537586212158203, -7.228270530700684, -6.918954849243164, -6.6096391677856445, -6.300323963165283, -5.991008281707764, -5.681693077087402, -5.372377395629883, -5.063061714172363, -4.753746032714844, -4.444430351257324, -4.135114669799805, -3.8257994651794434, -3.516483783721924, -3.2071681022644043, -2.8978524208068848, -2.5885367393493652, -2.279221296310425, -1.9699056148529053, -1.6605899333953857, -1.3512743711471558, -1.0419588088989258, -0.7326421737670898, -0.4233265519142151, -0.11401093006134033, 0.19530469179153442, 0.5046203136444092, 0.8139359951019287, 1.1232515573501587, 1.4325671195983887, 1.7418828010559082, 2.0511984825134277, 2.3605141639709473, 2.6698296070098877, 2.9791452884674072, 3.2884609699249268, 3.597776412963867, 3.9070920944213867, 4.216407775878906, 4.525723457336426, 4.835039138793945, 5.144354820251465, 5.453670501708984, 5.762986183166504, 6.072301387786865, 6.381617069244385, 6.690932750701904, 7.000248432159424, 7.309564113616943, 7.618879795074463, 7.928194999694824, 8.237510681152344, 8.546826362609863, 8.856142044067383, 9.165457725524902]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 11.0, 8.0, 13.0, 14.0, 28.0, 25.0, 25.0, 28.0, 40.0, 41.0, 38.0, 40.0, 56.0, 49.0, 50.0, 38.0, 43.0, 53.0, 43.0, 47.0, 50.0, 25.0, 29.0, 41.0, 32.0, 26.0, 22.0, 13.0, 14.0, 14.0, 13.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.291259765625, -2.22509765625, -2.158935546875, -2.0927734375, -2.026611328125, -1.96044921875, -1.894287109375, -1.828125, -1.761962890625, -1.69580078125, -1.629638671875, -1.5634765625, -1.497314453125, -1.43115234375, -1.364990234375, -1.298828125, -1.232666015625, -1.16650390625, -1.100341796875, -1.0341796875, -0.968017578125, -0.90185546875, -0.835693359375, -0.76953125, -0.703369140625, -0.63720703125, -0.571044921875, -0.5048828125, -0.438720703125, -0.37255859375, -0.306396484375, -0.240234375, -0.174072265625, -0.10791015625, -0.041748046875, 0.0244140625, 0.090576171875, 0.15673828125, 0.222900390625, 0.2890625, 0.355224609375, 0.42138671875, 0.487548828125, 0.5537109375, 0.619873046875, 0.68603515625, 0.752197265625, 0.818359375, 0.884521484375, 0.95068359375, 1.016845703125, 1.0830078125, 1.149169921875, 1.21533203125, 1.281494140625, 1.34765625, 1.413818359375, 1.47998046875, 1.546142578125, 1.6123046875, 1.678466796875, 1.74462890625, 1.810791015625, 1.876953125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 12.0, 16.0, 16.0, 24.0, 59.0, 81.0, 148.0, 242.0, 436.0, 700.0, 1238.0, 2344.0, 4367.0, 7989.0, 15394.0, 30305.0, 60862.0, 137821.0, 325845.0, 257795.0, 103951.0, 47867.0, 24114.0, 12502.0, 6582.0, 3521.0, 1816.0, 1034.0, 609.0, 344.0, 196.0, 105.0, 81.0, 48.0, 24.0, 14.0, 20.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17582130432128906, -0.16926956176757812, -0.1627178192138672, -0.15616607666015625, -0.1496143341064453, -0.14306259155273438, -0.13651084899902344, -0.1299591064453125, -0.12340736389160156, -0.11685562133789062, -0.11030387878417969, -0.10375213623046875, -0.09720039367675781, -0.09064865112304688, -0.08409690856933594, -0.077545166015625, -0.07099342346191406, -0.06444168090820312, -0.05788993835449219, -0.05133819580078125, -0.04478645324707031, -0.038234710693359375, -0.03168296813964844, -0.0251312255859375, -0.018579483032226562, -0.012027740478515625, -0.0054759979248046875, 0.00107574462890625, 0.0076274871826171875, 0.014179229736328125, 0.020730972290039062, 0.02728271484375, 0.03383445739746094, 0.040386199951171875, 0.04693794250488281, 0.05348968505859375, 0.06004142761230469, 0.06659317016601562, 0.07314491271972656, 0.0796966552734375, 0.08624839782714844, 0.09280014038085938, 0.09935188293457031, 0.10590362548828125, 0.11245536804199219, 0.11900711059570312, 0.12555885314941406, 0.132110595703125, 0.13866233825683594, 0.14521408081054688, 0.1517658233642578, 0.15831756591796875, 0.1648693084716797, 0.17142105102539062, 0.17797279357910156, 0.1845245361328125, 0.19107627868652344, 0.19762802124023438, 0.2041797637939453, 0.21073150634765625, 0.2172832489013672, 0.22383499145507812, 0.23038673400878906, 0.2369384765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 8.0, 1.0, 8.0, 13.0, 10.0, 12.0, 17.0, 23.0, 14.0, 21.0, 19.0, 29.0, 19.0, 31.0, 25.0, 39.0, 31.0, 31.0, 36.0, 39.0, 29.0, 1071.0, 35.0, 31.0, 40.0, 33.0, 32.0, 31.0, 28.0, 22.0, 32.0, 24.0, 21.0, 22.0, 17.0, 16.0, 13.0, 9.0, 14.0, 11.0, 6.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.9404296875, -0.907501220703125, -0.87457275390625, -0.841644287109375, -0.8087158203125, -0.775787353515625, -0.74285888671875, -0.709930419921875, -0.677001953125, -0.644073486328125, -0.61114501953125, -0.578216552734375, -0.5452880859375, -0.512359619140625, -0.47943115234375, -0.446502685546875, -0.41357421875, -0.380645751953125, -0.34771728515625, -0.314788818359375, -0.2818603515625, -0.248931884765625, -0.21600341796875, -0.183074951171875, -0.150146484375, -0.117218017578125, -0.08428955078125, -0.051361083984375, -0.0184326171875, 0.014495849609375, 0.04742431640625, 0.080352783203125, 0.11328125, 0.146209716796875, 0.17913818359375, 0.212066650390625, 0.2449951171875, 0.277923583984375, 0.31085205078125, 0.343780517578125, 0.376708984375, 0.409637451171875, 0.44256591796875, 0.475494384765625, 0.5084228515625, 0.541351318359375, 0.57427978515625, 0.607208251953125, 0.64013671875, 0.673065185546875, 0.70599365234375, 0.738922119140625, 0.7718505859375, 0.804779052734375, 0.83770751953125, 0.870635986328125, 0.903564453125, 0.936492919921875, 0.96942138671875, 1.002349853515625, 1.0352783203125, 1.068206787109375, 1.10113525390625, 1.134063720703125, 1.1669921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 10.0, 29.0, 25.0, 30.0, 40.0, 69.0, 71.0, 126.0, 159.0, 214.0, 281.0, 406.0, 548.0, 724.0, 1055.0, 1456.0, 2082.0, 2949.0, 4385.0, 6630.0, 11141.0, 21794.0, 67169.0, 1595024.0, 293142.0, 42375.0, 17038.0, 9347.0, 5821.0, 3749.0, 2625.0, 1825.0, 1286.0, 925.0, 719.0, 493.0, 348.0, 247.0, 183.0, 158.0, 104.0, 82.0, 57.0, 42.0, 30.0, 29.0, 22.0, 14.0, 11.0, 12.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.19677734375, -0.19039535522460938, -0.18401336669921875, -0.17763137817382812, -0.1712493896484375, -0.16486740112304688, -0.15848541259765625, -0.15210342407226562, -0.145721435546875, -0.13933944702148438, -0.13295745849609375, -0.12657546997070312, -0.1201934814453125, -0.11381149291992188, -0.10742950439453125, -0.10104751586914062, -0.09466552734375, -0.08828353881835938, -0.08190155029296875, -0.07551956176757812, -0.0691375732421875, -0.06275558471679688, -0.05637359619140625, -0.049991607666015625, -0.043609619140625, -0.037227630615234375, -0.03084564208984375, -0.024463653564453125, -0.0180816650390625, -0.011699676513671875, -0.00531768798828125, 0.001064300537109375, 0.0074462890625, 0.013828277587890625, 0.02021026611328125, 0.026592254638671875, 0.0329742431640625, 0.039356231689453125, 0.04573822021484375, 0.052120208740234375, 0.058502197265625, 0.06488418579101562, 0.07126617431640625, 0.07764816284179688, 0.0840301513671875, 0.09041213989257812, 0.09679412841796875, 0.10317611694335938, 0.10955810546875, 0.11594009399414062, 0.12232208251953125, 0.12870407104492188, 0.1350860595703125, 0.14146804809570312, 0.14785003662109375, 0.15423202514648438, 0.160614013671875, 0.16699600219726562, 0.17337799072265625, 0.17975997924804688, 0.1861419677734375, 0.19252395629882812, 0.19890594482421875, 0.20528793334960938, 0.211669921875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 15.0, 10.0, 9.0, 7.0, 24.0, 19.0, 20.0, 32.0, 38.0, 50.0, 51.0, 51.0, 49.0, 71.0, 69.0, 58.0, 53.0, 55.0, 55.0, 39.0, 29.0, 40.0, 33.0, 22.0, 19.0, 20.0, 10.0, 10.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008453369140625, -0.008178114891052246, -0.007902860641479492, -0.007627606391906738, -0.007352352142333984, -0.0070770978927612305, -0.0068018436431884766, -0.006526589393615723, -0.006251335144042969, -0.005976080894470215, -0.005700826644897461, -0.005425572395324707, -0.005150318145751953, -0.004875063896179199, -0.004599809646606445, -0.004324555397033691, -0.0040493011474609375, -0.0037740468978881836, -0.0034987926483154297, -0.0032235383987426758, -0.002948284149169922, -0.002673029899597168, -0.002397775650024414, -0.00212252140045166, -0.0018472671508789062, -0.0015720129013061523, -0.0012967586517333984, -0.0010215044021606445, -0.0007462501525878906, -0.0004709959030151367, -0.0001957416534423828, 7.95125961303711e-05, 0.000354766845703125, 0.0006300210952758789, 0.0009052753448486328, 0.0011805295944213867, 0.0014557838439941406, 0.0017310380935668945, 0.0020062923431396484, 0.0022815465927124023, 0.0025568008422851562, 0.00283205509185791, 0.003107309341430664, 0.003382563591003418, 0.003657817840576172, 0.003933072090148926, 0.00420832633972168, 0.004483580589294434, 0.0047588348388671875, 0.005034089088439941, 0.005309343338012695, 0.005584597587585449, 0.005859851837158203, 0.006135106086730957, 0.006410360336303711, 0.006685614585876465, 0.006960868835449219, 0.007236123085021973, 0.0075113773345947266, 0.0077866315841674805, 0.008061885833740234, 0.008337140083312988, 0.008612394332885742, 0.008887648582458496, 0.00916290283203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 14.0, 10.0, 17.0, 16.0, 15.0, 30.0, 31.0, 67.0, 76.0, 113.0, 162.0, 231.0, 414.0, 1157.0, 66174.0, 968089.0, 10134.0, 733.0, 335.0, 220.0, 155.0, 106.0, 57.0, 58.0, 29.0, 27.0, 25.0, 12.0, 14.0, 7.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1834716796875, -0.1777973175048828, -0.17212295532226562, -0.16644859313964844, -0.16077423095703125, -0.15509986877441406, -0.14942550659179688, -0.1437511444091797, -0.1380767822265625, -0.1324024200439453, -0.12672805786132812, -0.12105369567871094, -0.11537933349609375, -0.10970497131347656, -0.10403060913085938, -0.09835624694824219, -0.092681884765625, -0.08700752258300781, -0.08133316040039062, -0.07565879821777344, -0.06998443603515625, -0.06431007385253906, -0.058635711669921875, -0.05296134948730469, -0.0472869873046875, -0.04161262512207031, -0.035938262939453125, -0.030263900756835938, -0.02458953857421875, -0.018915176391601562, -0.013240814208984375, -0.0075664520263671875, -0.00189208984375, 0.0037822723388671875, 0.009456634521484375, 0.015130996704101562, 0.02080535888671875, 0.026479721069335938, 0.032154083251953125, 0.03782844543457031, 0.0435028076171875, 0.04917716979980469, 0.054851531982421875, 0.06052589416503906, 0.06620025634765625, 0.07187461853027344, 0.07754898071289062, 0.08322334289550781, 0.088897705078125, 0.09457206726074219, 0.10024642944335938, 0.10592079162597656, 0.11159515380859375, 0.11726951599121094, 0.12294387817382812, 0.1286182403564453, 0.1342926025390625, 0.1399669647216797, 0.14564132690429688, 0.15131568908691406, 0.15699005126953125, 0.16266441345214844, 0.16833877563476562, 0.1740131378173828, 0.1796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 12.0, 14.0, 19.0, 28.0, 51.0, 79.0, 121.0, 172.0, 164.0, 128.0, 86.0, 51.0, 37.0, 13.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010169223882257938, -0.009605241008102894, -0.00904125813394785, -0.00847727619111538, -0.007913293316960335, -0.00734931044280529, -0.006785327568650246, -0.006221345160156488, -0.005657362286001444, -0.005093379411846399, -0.004529397003352642, -0.0039654141291975975, -0.0034014314878731966, -0.0028374488465487957, -0.002273465972393751, -0.001709483563899994, -0.0011455006897449493, -0.0005815179902128875, -1.753529068082571e-05, 0.000546447467058897, 0.001110430108383298, 0.0016744127497076988, 0.0022383956238627434, 0.0028023780323565006, 0.003366360906511545, 0.00393034378066659, 0.004494326189160347, 0.0050583090633153915, 0.005622291937470436, 0.006186274345964193, 0.006750257220119238, 0.007314239628612995, 0.007878221571445465, 0.00844220444560051, 0.009006187319755554, 0.009570170193910599, 0.010134152136743069, 0.010698135010898113, 0.011262117885053158, 0.011826099827885628, 0.012390082702040672, 0.012954065576195717, 0.013518048450350761, 0.014082031324505806, 0.014646013267338276, 0.01520999614149332, 0.01577397808432579, 0.016337960958480835, 0.01690194383263588, 0.017465926706790924, 0.01802990958094597, 0.018593892455101013, 0.019157875329256058, 0.019721858203411102, 0.020285841077566147, 0.020849822089076042, 0.021413806825876236, 0.02197778970003128, 0.022541772574186325, 0.02310575544834137, 0.023669738322496414, 0.02423372119665146, 0.024797704070806503, 0.0253616850823164, 0.025925667956471443]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 4.0, 5.0, 7.0, 9.0, 7.0, 14.0, 15.0, 16.0, 21.0, 22.0, 27.0, 25.0, 38.0, 42.0, 35.0, 52.0, 51.0, 47.0, 41.0, 45.0, 48.0, 38.0, 34.0, 36.0, 27.0, 36.0, 37.0, 36.0, 24.0, 28.0, 21.0, 18.0, 25.0, 14.0, 13.0, 6.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006122410297393799, -0.005922614596784115, -0.005722818896174431, -0.005523023195564747, -0.005323227494955063, -0.005123431794345379, -0.004923636093735695, -0.004723840393126011, -0.004524044692516327, -0.004324248991906643, -0.004124453291296959, -0.003924657590687275, -0.003724861890077591, -0.003525066189467907, -0.003325270488858223, -0.003125474788248539, -0.002925679087638855, -0.002725883387029171, -0.002526087686419487, -0.002326291985809803, -0.002126496285200119, -0.001926700584590435, -0.001726904883980751, -0.001527109183371067, -0.001327313482761383, -0.001127517782151699, -0.0009277220815420151, -0.0007279263809323311, -0.0005281306803226471, -0.0003283349797129631, -0.00012853927910327911, 7.125642150640488e-05, 0.00027105212211608887, 0.00047084782272577286, 0.0006706435233354568, 0.0008704392239451408, 0.0010702349245548248, 0.0012700306251645088, 0.0014698263257741928, 0.0016696220263838768, 0.0018694177269935608, 0.0020692134276032448, 0.0022690091282129288, 0.0024688048288226128, 0.0026686005294322968, 0.0028683962300419807, 0.0030681919306516647, 0.0032679876312613487, 0.0034677833318710327, 0.0036675790324807167, 0.0038673747330904007, 0.004067170433700085, 0.004266966134309769, 0.004466761834919453, 0.004666557535529137, 0.004866353236138821, 0.005066148936748505, 0.005265944637358189, 0.005465740337967873, 0.005665536038577557, 0.005865331739187241, 0.006065127439796925, 0.006264923140406609, 0.006464718841016293, 0.0066645145416259766]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 11.0, 8.0, 13.0, 14.0, 28.0, 25.0, 26.0, 27.0, 40.0, 41.0, 38.0, 40.0, 56.0, 49.0, 49.0, 39.0, 43.0, 53.0, 43.0, 47.0, 50.0, 25.0, 29.0, 41.0, 32.0, 26.0, 22.0, 13.0, 14.0, 14.0, 13.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.291259765625, -2.22509765625, -2.158935546875, -2.0927734375, -2.026611328125, -1.96044921875, -1.894287109375, -1.828125, -1.761962890625, -1.69580078125, -1.629638671875, -1.5634765625, -1.497314453125, -1.43115234375, -1.364990234375, -1.298828125, -1.232666015625, -1.16650390625, -1.100341796875, -1.0341796875, -0.968017578125, -0.90185546875, -0.835693359375, -0.76953125, -0.703369140625, -0.63720703125, -0.571044921875, -0.5048828125, -0.438720703125, -0.37255859375, -0.306396484375, -0.240234375, -0.174072265625, -0.10791015625, -0.041748046875, 0.0244140625, 0.090576171875, 0.15673828125, 0.222900390625, 0.2890625, 0.355224609375, 0.42138671875, 0.487548828125, 0.5537109375, 0.619873046875, 0.68603515625, 0.752197265625, 0.818359375, 0.884521484375, 0.95068359375, 1.016845703125, 1.0830078125, 1.149169921875, 1.21533203125, 1.281494140625, 1.34765625, 1.413818359375, 1.47998046875, 1.546142578125, 1.6123046875, 1.678466796875, 1.74462890625, 1.810791015625, 1.876953125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 19.0, 21.0, 21.0, 35.0, 72.0, 114.0, 180.0, 348.0, 518.0, 1032.0, 1610.0, 2970.0, 5557.0, 10193.0, 20749.0, 44718.0, 110862.0, 364045.0, 309958.0, 95975.0, 40057.0, 18667.0, 9451.0, 4876.0, 2737.0, 1593.0, 883.0, 510.0, 285.0, 206.0, 108.0, 71.0, 44.0, 34.0, 15.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.628936767578125, -2.53131103515625, -2.433685302734375, -2.3360595703125, -2.238433837890625, -2.14080810546875, -2.043182373046875, -1.945556640625, -1.847930908203125, -1.75030517578125, -1.652679443359375, -1.5550537109375, -1.457427978515625, -1.35980224609375, -1.262176513671875, -1.16455078125, -1.066925048828125, -0.96929931640625, -0.871673583984375, -0.7740478515625, -0.676422119140625, -0.57879638671875, -0.481170654296875, -0.383544921875, -0.285919189453125, -0.18829345703125, -0.090667724609375, 0.0069580078125, 0.104583740234375, 0.20220947265625, 0.299835205078125, 0.3974609375, 0.495086669921875, 0.59271240234375, 0.690338134765625, 0.7879638671875, 0.885589599609375, 0.98321533203125, 1.080841064453125, 1.178466796875, 1.276092529296875, 1.37371826171875, 1.471343994140625, 1.5689697265625, 1.666595458984375, 1.76422119140625, 1.861846923828125, 1.95947265625, 2.057098388671875, 2.15472412109375, 2.252349853515625, 2.3499755859375, 2.447601318359375, 2.54522705078125, 2.642852783203125, 2.740478515625, 2.838104248046875, 2.93572998046875, 3.033355712890625, 3.1309814453125, 3.228607177734375, 3.32623291015625, 3.423858642578125, 3.521484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 1.0, 8.0, 10.0, 11.0, 9.0, 11.0, 11.0, 22.0, 17.0, 23.0, 32.0, 23.0, 42.0, 32.0, 37.0, 46.0, 67.0, 80.0, 109.0, 223.0, 1439.0, 220.0, 126.0, 88.0, 64.0, 47.0, 29.0, 31.0, 22.0, 32.0, 27.0, 21.0, 20.0, 11.0, 11.0, 7.0, 9.0, 7.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.390625, -4.24658203125, -4.1025390625, -3.95849609375, -3.814453125, -3.67041015625, -3.5263671875, -3.38232421875, -3.23828125, -3.09423828125, -2.9501953125, -2.80615234375, -2.662109375, -2.51806640625, -2.3740234375, -2.22998046875, -2.0859375, -1.94189453125, -1.7978515625, -1.65380859375, -1.509765625, -1.36572265625, -1.2216796875, -1.07763671875, -0.93359375, -0.78955078125, -0.6455078125, -0.50146484375, -0.357421875, -0.21337890625, -0.0693359375, 0.07470703125, 0.21875, 0.36279296875, 0.5068359375, 0.65087890625, 0.794921875, 0.93896484375, 1.0830078125, 1.22705078125, 1.37109375, 1.51513671875, 1.6591796875, 1.80322265625, 1.947265625, 2.09130859375, 2.2353515625, 2.37939453125, 2.5234375, 2.66748046875, 2.8115234375, 2.95556640625, 3.099609375, 3.24365234375, 3.3876953125, 3.53173828125, 3.67578125, 3.81982421875, 3.9638671875, 4.10791015625, 4.251953125, 4.39599609375, 4.5400390625, 4.68408203125, 4.828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 4.0, 13.0, 9.0, 20.0, 16.0, 21.0, 31.0, 40.0, 59.0, 63.0, 91.0, 87.0, 103.0, 197.0, 287.0, 583.0, 1996.0, 11029.0, 141644.0, 2898074.0, 80303.0, 7944.0, 1553.0, 558.0, 260.0, 164.0, 94.0, 95.0, 74.0, 68.0, 48.0, 36.0, 30.0, 24.0, 14.0, 19.0, 12.0, 12.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.8902587890625, -8.577392578125, -8.2645263671875, -7.95166015625, -7.6387939453125, -7.325927734375, -7.0130615234375, -6.7001953125, -6.3873291015625, -6.074462890625, -5.7615966796875, -5.44873046875, -5.1358642578125, -4.822998046875, -4.5101318359375, -4.197265625, -3.8843994140625, -3.571533203125, -3.2586669921875, -2.94580078125, -2.6329345703125, -2.320068359375, -2.0072021484375, -1.6943359375, -1.3814697265625, -1.068603515625, -0.7557373046875, -0.44287109375, -0.1300048828125, 0.182861328125, 0.4957275390625, 0.80859375, 1.1214599609375, 1.434326171875, 1.7471923828125, 2.06005859375, 2.3729248046875, 2.685791015625, 2.9986572265625, 3.3115234375, 3.6243896484375, 3.937255859375, 4.2501220703125, 4.56298828125, 4.8758544921875, 5.188720703125, 5.5015869140625, 5.814453125, 6.1273193359375, 6.440185546875, 6.7530517578125, 7.06591796875, 7.3787841796875, 7.691650390625, 8.0045166015625, 8.3173828125, 8.6302490234375, 8.943115234375, 9.2559814453125, 9.56884765625, 9.8817138671875, 10.194580078125, 10.5074462890625, 10.8203125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 24.0, 66.0, 183.0, 305.0, 249.0, 123.0, 40.0, 15.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.451316833496094, -38.7172737121582, -37.98323059082031, -37.24918746948242, -36.51514434814453, -35.78110122680664, -35.04705810546875, -34.313011169433594, -33.5789680480957, -32.84492492675781, -32.11088180541992, -31.37683868408203, -30.642793655395508, -29.908750534057617, -29.174707412719727, -28.440664291381836, -27.706623077392578, -26.972579956054688, -26.238536834716797, -25.504493713378906, -24.770448684692383, -24.036405563354492, -23.3023624420166, -22.56831932067871, -21.834274291992188, -21.100231170654297, -20.366188049316406, -19.632144927978516, -18.898099899291992, -18.1640567779541, -17.43001365661621, -16.69597053527832, -15.96192741394043, -15.227884292602539, -14.493840217590332, -13.759797096252441, -13.02575397491455, -12.291709899902344, -11.557666778564453, -10.823623657226562, -10.089580535888672, -9.355537414550781, -8.621493339538574, -7.887450218200684, -7.153407096862793, -6.419363498687744, -5.685319900512695, -4.951276779174805, -4.217233180999756, -3.483189821243286, -2.7491464614868164, -2.0151028633117676, -1.2810595035552979, -0.5470161437988281, 0.1870274543762207, 0.9210705757141113, 1.6551141738891602, 2.38915753364563, 3.1232008934020996, 3.8572444915771484, 4.591287612915039, 5.325331211090088, 6.059374809265137, 6.793417930603027, 7.527461528778076]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 9.0, 10.0, 7.0, 14.0, 15.0, 12.0, 22.0, 21.0, 29.0, 35.0, 31.0, 49.0, 36.0, 45.0, 50.0, 40.0, 46.0, 42.0, 40.0, 47.0, 33.0, 42.0, 49.0, 35.0, 28.0, 29.0, 26.0, 25.0, 20.0, 16.0, 19.0, 12.0, 15.0, 7.0, 8.0, 5.0, 6.0, 4.0, 6.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.348548889160156, -11.010618209838867, -10.672686576843262, -10.334755897521973, -9.996825218200684, -9.658894538879395, -9.320962905883789, -8.9830322265625, -8.645101547241211, -8.307170867919922, -7.969239711761475, -7.631308555603027, -7.293377876281738, -6.955446720123291, -6.617515563964844, -6.279584884643555, -5.941653728485107, -5.60372257232666, -5.265791893005371, -4.927860736846924, -4.589930057525635, -4.2519989013671875, -3.9140679836273193, -3.576137065887451, -3.238206148147583, -2.900275230407715, -2.5623443126678467, -2.2244133949279785, -1.8864823579788208, -1.5485514402389526, -1.210620403289795, -0.8726894855499268, -0.5347585678100586, -0.19682762026786804, 0.1411033272743225, 0.47903430461883545, 0.8169652223587036, 1.1548961400985718, 1.4928271770477295, 1.8307580947875977, 2.168689012527466, 2.506619930267334, 2.844550848007202, 3.1824817657470703, 3.5204129219055176, 3.8583436012268066, 4.196274757385254, 4.534205436706543, 4.87213659286499, 5.2100677490234375, 5.547998428344727, 5.885929584503174, 6.223860263824463, 6.56179141998291, 6.899722099304199, 7.2376532554626465, 7.575584411621094, 7.913515567779541, 8.251446723937988, 8.589377403259277, 8.927308082580566, 9.265238761901855, 9.603170394897461, 9.94110107421875, 10.279031753540039]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 8.0, 12.0, 13.0, 13.0, 18.0, 20.0, 20.0, 23.0, 31.0, 40.0, 49.0, 57.0, 33.0, 50.0, 55.0, 50.0, 52.0, 47.0, 45.0, 48.0, 46.0, 41.0, 38.0, 43.0, 23.0, 22.0, 23.0, 20.0, 9.0, 16.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.279296875, -2.210357666015625, -2.14141845703125, -2.072479248046875, -2.0035400390625, -1.934600830078125, -1.86566162109375, -1.796722412109375, -1.727783203125, -1.658843994140625, -1.58990478515625, -1.520965576171875, -1.4520263671875, -1.383087158203125, -1.31414794921875, -1.245208740234375, -1.17626953125, -1.107330322265625, -1.03839111328125, -0.969451904296875, -0.9005126953125, -0.831573486328125, -0.76263427734375, -0.693695068359375, -0.624755859375, -0.555816650390625, -0.48687744140625, -0.417938232421875, -0.3489990234375, -0.280059814453125, -0.21112060546875, -0.142181396484375, -0.0732421875, -0.004302978515625, 0.06463623046875, 0.133575439453125, 0.2025146484375, 0.271453857421875, 0.34039306640625, 0.409332275390625, 0.478271484375, 0.547210693359375, 0.61614990234375, 0.685089111328125, 0.7540283203125, 0.822967529296875, 0.89190673828125, 0.960845947265625, 1.02978515625, 1.098724365234375, 1.16766357421875, 1.236602783203125, 1.3055419921875, 1.374481201171875, 1.44342041015625, 1.512359619140625, 1.581298828125, 1.650238037109375, 1.71917724609375, 1.788116455078125, 1.8570556640625, 1.925994873046875, 1.99493408203125, 2.063873291015625, 2.1328125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 12.0, 23.0, 12.0, 35.0, 28.0, 42.0, 62.0, 73.0, 98.0, 135.0, 189.0, 363.0, 656.0, 2452.0, 132907.0, 4046534.0, 8171.0, 1070.0, 502.0, 239.0, 153.0, 112.0, 84.0, 66.0, 50.0, 38.0, 25.0, 19.0, 26.0, 20.0, 12.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.994873046875, -19.33349609375, -18.672119140625, -18.0107421875, -17.349365234375, -16.68798828125, -16.026611328125, -15.365234375, -14.703857421875, -14.04248046875, -13.381103515625, -12.7197265625, -12.058349609375, -11.39697265625, -10.735595703125, -10.07421875, -9.412841796875, -8.75146484375, -8.090087890625, -7.4287109375, -6.767333984375, -6.10595703125, -5.444580078125, -4.783203125, -4.121826171875, -3.46044921875, -2.799072265625, -2.1376953125, -1.476318359375, -0.81494140625, -0.153564453125, 0.5078125, 1.169189453125, 1.83056640625, 2.491943359375, 3.1533203125, 3.814697265625, 4.47607421875, 5.137451171875, 5.798828125, 6.460205078125, 7.12158203125, 7.782958984375, 8.4443359375, 9.105712890625, 9.76708984375, 10.428466796875, 11.08984375, 11.751220703125, 12.41259765625, 13.073974609375, 13.7353515625, 14.396728515625, 15.05810546875, 15.719482421875, 16.380859375, 17.042236328125, 17.70361328125, 18.364990234375, 19.0263671875, 19.687744140625, 20.34912109375, 21.010498046875, 21.671875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 12.0, 8.0, 16.0, 11.0, 19.0, 24.0, 46.0, 52.0, 70.0, 115.0, 130.0, 295.0, 501.0, 921.0, 763.0, 412.0, 218.0, 141.0, 85.0, 50.0, 30.0, 31.0, 24.0, 15.0, 16.0, 7.0, 8.0, 11.0, 11.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.8984375, -3.795257568359375, -3.69207763671875, -3.588897705078125, -3.4857177734375, -3.382537841796875, -3.27935791015625, -3.176177978515625, -3.072998046875, -2.969818115234375, -2.86663818359375, -2.763458251953125, -2.6602783203125, -2.557098388671875, -2.45391845703125, -2.350738525390625, -2.24755859375, -2.144378662109375, -2.04119873046875, -1.938018798828125, -1.8348388671875, -1.731658935546875, -1.62847900390625, -1.525299072265625, -1.422119140625, -1.318939208984375, -1.21575927734375, -1.112579345703125, -1.0093994140625, -0.906219482421875, -0.80303955078125, -0.699859619140625, -0.5966796875, -0.493499755859375, -0.39031982421875, -0.287139892578125, -0.1839599609375, -0.080780029296875, 0.02239990234375, 0.125579833984375, 0.228759765625, 0.331939697265625, 0.43511962890625, 0.538299560546875, 0.6414794921875, 0.744659423828125, 0.84783935546875, 0.951019287109375, 1.05419921875, 1.157379150390625, 1.26055908203125, 1.363739013671875, 1.4669189453125, 1.570098876953125, 1.67327880859375, 1.776458740234375, 1.879638671875, 1.982818603515625, 2.08599853515625, 2.189178466796875, 2.2923583984375, 2.395538330078125, 2.49871826171875, 2.601898193359375, 2.705078125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 12.0, 13.0, 31.0, 30.0, 54.0, 61.0, 128.0, 242.0, 562.0, 1589.0, 7336.0, 84745.0, 3908677.0, 176431.0, 11085.0, 1964.0, 625.0, 251.0, 143.0, 79.0, 59.0, 34.0, 41.0, 23.0, 10.0, 12.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4765625, -13.12744140625, -12.7783203125, -12.42919921875, -12.080078125, -11.73095703125, -11.3818359375, -11.03271484375, -10.68359375, -10.33447265625, -9.9853515625, -9.63623046875, -9.287109375, -8.93798828125, -8.5888671875, -8.23974609375, -7.890625, -7.54150390625, -7.1923828125, -6.84326171875, -6.494140625, -6.14501953125, -5.7958984375, -5.44677734375, -5.09765625, -4.74853515625, -4.3994140625, -4.05029296875, -3.701171875, -3.35205078125, -3.0029296875, -2.65380859375, -2.3046875, -1.95556640625, -1.6064453125, -1.25732421875, -0.908203125, -0.55908203125, -0.2099609375, 0.13916015625, 0.48828125, 0.83740234375, 1.1865234375, 1.53564453125, 1.884765625, 2.23388671875, 2.5830078125, 2.93212890625, 3.28125, 3.63037109375, 3.9794921875, 4.32861328125, 4.677734375, 5.02685546875, 5.3759765625, 5.72509765625, 6.07421875, 6.42333984375, 6.7724609375, 7.12158203125, 7.470703125, 7.81982421875, 8.1689453125, 8.51806640625, 8.8671875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 10.0, 34.0, 171.0, 434.0, 277.0, 79.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.537708282470703, -9.175249099731445, -7.8127899169921875, -6.45033073425293, -5.087871551513672, -3.725412368774414, -2.3629531860351562, -1.0004940032958984, 0.3619651794433594, 1.7244243621826172, 3.086883544921875, 4.449342727661133, 5.811801910400391, 7.174261093139648, 8.536720275878906, 9.899179458618164, 11.261638641357422, 12.62409782409668, 13.986557006835938, 15.349016189575195, 16.711475372314453, 18.07393455505371, 19.43639373779297, 20.798852920532227, 22.161312103271484, 23.523771286010742, 24.88623046875, 26.248689651489258, 27.611148834228516, 28.973608016967773, 30.33606719970703, 31.69852638244629, 33.06098937988281, 34.42344665527344, 35.78590774536133, 37.14836883544922, 38.510826110839844, 39.87328338623047, 41.23574447631836, 42.59820556640625, 43.960662841796875, 45.3231201171875, 46.68558120727539, 48.04804229736328, 49.410499572753906, 50.77295684814453, 52.13541793823242, 53.49787902832031, 54.86033630371094, 56.22279357910156, 57.58525466918945, 58.947715759277344, 60.31017303466797, 61.672630310058594, 63.035091400146484, 64.39755249023438, 65.760009765625, 67.12246704101562, 68.48492431640625, 69.8473892211914, 71.20984649658203, 72.57230377197266, 73.93476867675781, 75.29722595214844, 76.65968322753906]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 9.0, 5.0, 10.0, 5.0, 11.0, 13.0, 16.0, 19.0, 20.0, 24.0, 34.0, 22.0, 25.0, 25.0, 28.0, 35.0, 41.0, 38.0, 43.0, 34.0, 42.0, 53.0, 46.0, 34.0, 43.0, 40.0, 33.0, 28.0, 27.0, 27.0, 28.0, 24.0, 18.0, 9.0, 15.0, 15.0, 9.0, 11.0, 4.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.944438934326172, -8.672908782958984, -8.401378631591797, -8.12984848022461, -7.85831880569458, -7.586789131164551, -7.315258979797363, -7.043728828430176, -6.772198677062988, -6.500668525695801, -6.2291388511657715, -5.957608699798584, -5.6860785484313965, -5.414548873901367, -5.14301872253418, -4.871488571166992, -4.599958896636963, -4.328428745269775, -4.056899070739746, -3.7853689193725586, -3.513838768005371, -3.2423088550567627, -2.9707789421081543, -2.699248790740967, -2.4277188777923584, -2.15618896484375, -1.8846588134765625, -1.613128900527954, -1.3415988683700562, -1.0700688362121582, -0.7985389232635498, -0.5270088911056519, -0.2554788589477539, 0.016051143407821655, 0.2875811457633972, 0.5591111183166504, 0.8306411504745483, 1.1021711826324463, 1.3737010955810547, 1.6452311277389526, 1.9167611598968506, 2.188291072845459, 2.4598212242126465, 2.731351137161255, 3.0028810501098633, 3.274411201477051, 3.545941114425659, 3.8174710273742676, 4.089001178741455, 4.360531330108643, 4.632061004638672, 4.903591156005859, 5.175121307373047, 5.446651458740234, 5.718181133270264, 5.989711284637451, 6.2612409591674805, 6.532771110534668, 6.804300785064697, 7.075830936431885, 7.347361087799072, 7.618890762329102, 7.890420913696289, 8.161951065063477, 8.433481216430664]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 8.0, 11.0, 15.0, 10.0, 5.0, 12.0, 13.0, 21.0, 22.0, 21.0, 25.0, 23.0, 27.0, 34.0, 30.0, 41.0, 44.0, 35.0, 38.0, 49.0, 33.0, 29.0, 36.0, 43.0, 49.0, 38.0, 31.0, 27.0, 24.0, 31.0, 24.0, 19.0, 29.0, 14.0, 14.0, 15.0, 12.0, 4.0, 8.0, 7.0, 6.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.8251953125, -1.772003173828125, -1.71881103515625, -1.665618896484375, -1.6124267578125, -1.559234619140625, -1.50604248046875, -1.452850341796875, -1.399658203125, -1.346466064453125, -1.29327392578125, -1.240081787109375, -1.1868896484375, -1.133697509765625, -1.08050537109375, -1.027313232421875, -0.97412109375, -0.920928955078125, -0.86773681640625, -0.814544677734375, -0.7613525390625, -0.708160400390625, -0.65496826171875, -0.601776123046875, -0.548583984375, -0.495391845703125, -0.44219970703125, -0.389007568359375, -0.3358154296875, -0.282623291015625, -0.22943115234375, -0.176239013671875, -0.123046875, -0.069854736328125, -0.01666259765625, 0.036529541015625, 0.0897216796875, 0.142913818359375, 0.19610595703125, 0.249298095703125, 0.302490234375, 0.355682373046875, 0.40887451171875, 0.462066650390625, 0.5152587890625, 0.568450927734375, 0.62164306640625, 0.674835205078125, 0.72802734375, 0.781219482421875, 0.83441162109375, 0.887603759765625, 0.9407958984375, 0.993988037109375, 1.04718017578125, 1.100372314453125, 1.153564453125, 1.206756591796875, 1.25994873046875, 1.313140869140625, 1.3663330078125, 1.419525146484375, 1.47271728515625, 1.525909423828125, 1.5791015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 10.0, 10.0, 22.0, 41.0, 51.0, 61.0, 90.0, 125.0, 179.0, 282.0, 388.0, 571.0, 836.0, 1250.0, 1746.0, 2570.0, 3919.0, 5900.0, 8888.0, 13846.0, 21675.0, 34860.0, 57934.0, 106959.0, 207750.0, 250811.0, 138530.0, 72843.0, 42126.0, 26126.0, 16627.0, 10399.0, 6957.0, 4555.0, 3126.0, 2054.0, 1312.0, 907.0, 707.0, 460.0, 307.0, 232.0, 135.0, 130.0, 94.0, 46.0, 33.0, 24.0, 18.0, 7.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.15380859375, -0.1488780975341797, -0.14394760131835938, -0.13901710510253906, -0.13408660888671875, -0.12915611267089844, -0.12422561645507812, -0.11929512023925781, -0.1143646240234375, -0.10943412780761719, -0.10450363159179688, -0.09957313537597656, -0.09464263916015625, -0.08971214294433594, -0.08478164672851562, -0.07985115051269531, -0.074920654296875, -0.06999015808105469, -0.06505966186523438, -0.06012916564941406, -0.05519866943359375, -0.05026817321777344, -0.045337677001953125, -0.04040718078613281, -0.0354766845703125, -0.030546188354492188, -0.025615692138671875, -0.020685195922851562, -0.01575469970703125, -0.010824203491210938, -0.005893707275390625, -0.0009632110595703125, 0.00396728515625, 0.008897781372070312, 0.013828277587890625, 0.018758773803710938, 0.02368927001953125, 0.028619766235351562, 0.033550262451171875, 0.03848075866699219, 0.0434112548828125, 0.04834175109863281, 0.053272247314453125, 0.05820274353027344, 0.06313323974609375, 0.06806373596191406, 0.07299423217773438, 0.07792472839355469, 0.082855224609375, 0.08778572082519531, 0.09271621704101562, 0.09764671325683594, 0.10257720947265625, 0.10750770568847656, 0.11243820190429688, 0.11736869812011719, 0.1222991943359375, 0.1272296905517578, 0.13216018676757812, 0.13709068298339844, 0.14202117919921875, 0.14695167541503906, 0.15188217163085938, 0.1568126678466797, 0.1617431640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 2.0, 7.0, 3.0, 4.0, 5.0, 9.0, 11.0, 10.0, 18.0, 21.0, 13.0, 13.0, 20.0, 21.0, 26.0, 30.0, 30.0, 31.0, 24.0, 33.0, 36.0, 25.0, 32.0, 34.0, 29.0, 1061.0, 41.0, 43.0, 38.0, 26.0, 30.0, 28.0, 22.0, 24.0, 21.0, 22.0, 23.0, 23.0, 15.0, 21.0, 19.0, 12.0, 13.0, 8.0, 7.0, 9.0, 4.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.0966796875, -1.063812255859375, -1.03094482421875, -0.998077392578125, -0.9652099609375, -0.932342529296875, -0.89947509765625, -0.866607666015625, -0.833740234375, -0.800872802734375, -0.76800537109375, -0.735137939453125, -0.7022705078125, -0.669403076171875, -0.63653564453125, -0.603668212890625, -0.57080078125, -0.537933349609375, -0.50506591796875, -0.472198486328125, -0.4393310546875, -0.406463623046875, -0.37359619140625, -0.340728759765625, -0.307861328125, -0.274993896484375, -0.24212646484375, -0.209259033203125, -0.1763916015625, -0.143524169921875, -0.11065673828125, -0.077789306640625, -0.044921875, -0.012054443359375, 0.02081298828125, 0.053680419921875, 0.0865478515625, 0.119415283203125, 0.15228271484375, 0.185150146484375, 0.218017578125, 0.250885009765625, 0.28375244140625, 0.316619873046875, 0.3494873046875, 0.382354736328125, 0.41522216796875, 0.448089599609375, 0.48095703125, 0.513824462890625, 0.54669189453125, 0.579559326171875, 0.6124267578125, 0.645294189453125, 0.67816162109375, 0.711029052734375, 0.743896484375, 0.776763916015625, 0.80963134765625, 0.842498779296875, 0.8753662109375, 0.908233642578125, 0.94110107421875, 0.973968505859375, 1.0068359375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 11.0, 14.0, 20.0, 22.0, 33.0, 53.0, 72.0, 96.0, 120.0, 163.0, 208.0, 286.0, 358.0, 553.0, 664.0, 910.0, 1189.0, 1665.0, 2291.0, 3397.0, 4830.0, 7280.0, 11635.0, 23245.0, 69972.0, 1522934.0, 345785.0, 48839.0, 18616.0, 10273.0, 6282.0, 4284.0, 2922.0, 2159.0, 1567.0, 1132.0, 785.0, 647.0, 457.0, 356.0, 273.0, 178.0, 150.0, 102.0, 76.0, 55.0, 52.0, 38.0, 28.0, 20.0, 11.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0], "bins": [-0.200927734375, -0.19481468200683594, -0.18870162963867188, -0.1825885772705078, -0.17647552490234375, -0.1703624725341797, -0.16424942016601562, -0.15813636779785156, -0.1520233154296875, -0.14591026306152344, -0.13979721069335938, -0.1336841583251953, -0.12757110595703125, -0.12145805358886719, -0.11534500122070312, -0.10923194885253906, -0.103118896484375, -0.09700584411621094, -0.09089279174804688, -0.08477973937988281, -0.07866668701171875, -0.07255363464355469, -0.06644058227539062, -0.06032752990722656, -0.0542144775390625, -0.04810142517089844, -0.041988372802734375, -0.03587532043457031, -0.02976226806640625, -0.023649215698242188, -0.017536163330078125, -0.011423110961914062, -0.00531005859375, 0.0008029937744140625, 0.006916046142578125, 0.013029098510742188, 0.01914215087890625, 0.025255203247070312, 0.031368255615234375, 0.03748130798339844, 0.0435943603515625, 0.04970741271972656, 0.055820465087890625, 0.06193351745605469, 0.06804656982421875, 0.07415962219238281, 0.08027267456054688, 0.08638572692871094, 0.092498779296875, 0.09861183166503906, 0.10472488403320312, 0.11083793640136719, 0.11695098876953125, 0.12306404113769531, 0.12917709350585938, 0.13529014587402344, 0.1414031982421875, 0.14751625061035156, 0.15362930297851562, 0.1597423553466797, 0.16585540771484375, 0.1719684600830078, 0.17808151245117188, 0.18419456481933594, 0.1903076171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 0.0, 3.0, 3.0, 7.0, 7.0, 8.0, 13.0, 20.0, 17.0, 29.0, 41.0, 49.0, 51.0, 47.0, 68.0, 71.0, 70.0, 63.0, 71.0, 59.0, 40.0, 55.0, 37.0, 31.0, 18.0, 30.0, 18.0, 12.0, 18.0, 11.0, 11.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.011749267578125, -0.011391997337341309, -0.011034727096557617, -0.010677456855773926, -0.010320186614990234, -0.009962916374206543, -0.009605646133422852, -0.00924837589263916, -0.008891105651855469, -0.008533835411071777, -0.008176565170288086, -0.007819294929504395, -0.007462024688720703, -0.007104754447937012, -0.00674748420715332, -0.006390213966369629, -0.0060329437255859375, -0.005675673484802246, -0.005318403244018555, -0.004961133003234863, -0.004603862762451172, -0.0042465925216674805, -0.003889322280883789, -0.0035320520401000977, -0.0031747817993164062, -0.002817511558532715, -0.0024602413177490234, -0.002102971076965332, -0.0017457008361816406, -0.0013884305953979492, -0.0010311603546142578, -0.0006738901138305664, -0.000316619873046875, 4.0650367736816406e-05, 0.0003979206085205078, 0.0007551908493041992, 0.0011124610900878906, 0.001469731330871582, 0.0018270015716552734, 0.002184271812438965, 0.0025415420532226562, 0.0028988122940063477, 0.003256082534790039, 0.0036133527755737305, 0.003970623016357422, 0.004327893257141113, 0.004685163497924805, 0.005042433738708496, 0.0053997039794921875, 0.005756974220275879, 0.00611424446105957, 0.006471514701843262, 0.006828784942626953, 0.0071860551834106445, 0.007543325424194336, 0.007900595664978027, 0.008257865905761719, 0.00861513614654541, 0.008972406387329102, 0.009329676628112793, 0.009686946868896484, 0.010044217109680176, 0.010401487350463867, 0.010758757591247559, 0.01111602783203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 15.0, 17.0, 26.0, 28.0, 33.0, 52.0, 64.0, 78.0, 102.0, 180.0, 270.0, 523.0, 1264.0, 95691.0, 943908.0, 4485.0, 703.0, 339.0, 241.0, 151.0, 105.0, 64.0, 49.0, 41.0, 27.0, 20.0, 12.0, 10.0, 10.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2095947265625, -0.20288467407226562, -0.19617462158203125, -0.18946456909179688, -0.1827545166015625, -0.17604446411132812, -0.16933441162109375, -0.16262435913085938, -0.155914306640625, -0.14920425415039062, -0.14249420166015625, -0.13578414916992188, -0.1290740966796875, -0.12236404418945312, -0.11565399169921875, -0.10894393920898438, -0.10223388671875, -0.09552383422851562, -0.08881378173828125, -0.08210372924804688, -0.0753936767578125, -0.06868362426757812, -0.06197357177734375, -0.055263519287109375, -0.048553466796875, -0.041843414306640625, -0.03513336181640625, -0.028423309326171875, -0.0217132568359375, -0.015003204345703125, -0.00829315185546875, -0.001583099365234375, 0.005126953125, 0.011837005615234375, 0.01854705810546875, 0.025257110595703125, 0.0319671630859375, 0.038677215576171875, 0.04538726806640625, 0.052097320556640625, 0.058807373046875, 0.06551742553710938, 0.07222747802734375, 0.07893753051757812, 0.0856475830078125, 0.09235763549804688, 0.09906768798828125, 0.10577774047851562, 0.11248779296875, 0.11919784545898438, 0.12590789794921875, 0.13261795043945312, 0.1393280029296875, 0.14603805541992188, 0.15274810791015625, 0.15945816040039062, 0.166168212890625, 0.17287826538085938, 0.17958831787109375, 0.18629837036132812, 0.1930084228515625, 0.19971847534179688, 0.20642852783203125, 0.21313858032226562, 0.2198486328125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 57.0, 558.0, 363.0, 28.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20869532227516174, -0.20502619445323944, -0.20135706663131714, -0.19768792390823364, -0.19401879608631134, -0.19034966826438904, -0.18668054044246674, -0.18301141262054443, -0.17934226989746094, -0.17567314207553864, -0.17200401425361633, -0.16833487153053284, -0.16466574370861053, -0.16099661588668823, -0.15732748806476593, -0.15365836024284363, -0.14998921751976013, -0.14632008969783783, -0.14265096187591553, -0.13898181915283203, -0.13531269133090973, -0.13164356350898743, -0.12797443568706512, -0.12430530041456223, -0.12063618004322052, -0.11696705222129822, -0.11329791694879532, -0.10962878912687302, -0.10595965385437012, -0.10229052603244781, -0.09862139821052551, -0.09495226293802261, -0.09128312766551971, -0.08761399984359741, -0.08394486457109451, -0.08027573674917221, -0.07660660147666931, -0.07293747365474701, -0.06926834583282471, -0.06559921056032181, -0.06193007901310921, -0.058260947465896606, -0.054591815918684006, -0.050922684371471405, -0.0472535565495491, -0.043584421277046204, -0.0399152934551239, -0.0362461619079113, -0.0325770303606987, -0.0289078988134861, -0.0252387672662735, -0.021569637581706047, -0.017900506034493446, -0.014231374487280846, -0.010562244802713394, -0.0068931132555007935, -0.0032239817082881927, 0.00044514937326312065, 0.004114280454814434, 0.00778341107070446, 0.01145254261791706, 0.015121674165129662, 0.018790803849697113, 0.022459935396909714, 0.026129066944122314]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 4.0, 8.0, 12.0, 12.0, 20.0, 17.0, 19.0, 27.0, 25.0, 38.0, 41.0, 38.0, 47.0, 38.0, 39.0, 51.0, 41.0, 47.0, 37.0, 44.0, 49.0, 45.0, 40.0, 26.0, 34.0, 27.0, 28.0, 31.0, 13.0, 12.0, 16.0, 12.0, 13.0, 10.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.014222204685211182, -0.01380304154008627, -0.013383878394961357, -0.012964715249836445, -0.012545552104711533, -0.01212638895958662, -0.011707225814461708, -0.011288062669336796, -0.010868899524211884, -0.010449736379086971, -0.010030573233962059, -0.009611410088837147, -0.009192246943712234, -0.008773083798587322, -0.00835392065346241, -0.007934757508337498, -0.0075155943632125854, -0.007096431218087673, -0.006677268072962761, -0.006258104927837849, -0.005838941782712936, -0.005419778637588024, -0.005000615492463112, -0.0045814523473382, -0.004162289202213287, -0.003743126057088375, -0.003323962911963463, -0.0029047997668385506, -0.0024856366217136383, -0.002066473476588726, -0.0016473103314638138, -0.0012281471863389015, -0.0008089840412139893, -0.000389820896089077, 2.9342249035835266e-05, 0.00044850539416074753, 0.0008676685392856598, 0.001286831684410572, 0.0017059948295354843, 0.0021251579746603966, 0.002544321119785309, 0.002963484264910221, 0.0033826474100351334, 0.0038018105551600456, 0.004220973700284958, 0.00464013684540987, 0.005059299990534782, 0.005478463135659695, 0.005897626280784607, 0.006316789425909519, 0.0067359525710344315, 0.007155115716159344, 0.007574278861284256, 0.007993442006409168, 0.00841260515153408, 0.008831768296658993, 0.009250931441783905, 0.009670094586908817, 0.01008925773203373, 0.010508420877158642, 0.010927584022283554, 0.011346747167408466, 0.011765910312533379, 0.01218507345765829, 0.012604236602783203]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 8.0, 11.0, 14.0, 11.0, 5.0, 12.0, 13.0, 19.0, 24.0, 21.0, 25.0, 23.0, 26.0, 35.0, 30.0, 41.0, 44.0, 35.0, 38.0, 50.0, 32.0, 29.0, 36.0, 43.0, 47.0, 39.0, 32.0, 27.0, 24.0, 30.0, 25.0, 19.0, 29.0, 13.0, 15.0, 15.0, 12.0, 4.0, 8.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.8251953125, -1.7720184326171875, -1.718841552734375, -1.6656646728515625, -1.61248779296875, -1.5593109130859375, -1.506134033203125, -1.4529571533203125, -1.3997802734375, -1.3466033935546875, -1.293426513671875, -1.2402496337890625, -1.18707275390625, -1.1338958740234375, -1.080718994140625, -1.0275421142578125, -0.974365234375, -0.9211883544921875, -0.868011474609375, -0.8148345947265625, -0.76165771484375, -0.7084808349609375, -0.655303955078125, -0.6021270751953125, -0.5489501953125, -0.4957733154296875, -0.442596435546875, -0.3894195556640625, -0.33624267578125, -0.2830657958984375, -0.229888916015625, -0.1767120361328125, -0.12353515625, -0.0703582763671875, -0.017181396484375, 0.0359954833984375, 0.08917236328125, 0.1423492431640625, 0.195526123046875, 0.2487030029296875, 0.3018798828125, 0.3550567626953125, 0.408233642578125, 0.4614105224609375, 0.51458740234375, 0.5677642822265625, 0.620941162109375, 0.6741180419921875, 0.727294921875, 0.7804718017578125, 0.833648681640625, 0.8868255615234375, 0.94000244140625, 0.9931793212890625, 1.046356201171875, 1.0995330810546875, 1.1527099609375, 1.2058868408203125, 1.259063720703125, 1.3122406005859375, 1.36541748046875, 1.4185943603515625, 1.471771240234375, 1.5249481201171875, 1.578125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 8.0, 9.0, 11.0, 11.0, 28.0, 33.0, 35.0, 56.0, 59.0, 97.0, 137.0, 175.0, 247.0, 390.0, 564.0, 911.0, 1560.0, 2836.0, 5781.0, 11918.0, 26555.0, 63210.0, 167882.0, 414188.0, 212706.0, 77683.0, 32421.0, 14318.0, 6612.0, 3259.0, 1853.0, 1019.0, 610.0, 399.0, 270.0, 189.0, 122.0, 88.0, 92.0, 64.0, 43.0, 27.0, 19.0, 21.0, 16.0, 5.0, 5.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.73046875, -2.64923095703125, -2.5679931640625, -2.48675537109375, -2.405517578125, -2.32427978515625, -2.2430419921875, -2.16180419921875, -2.08056640625, -1.99932861328125, -1.9180908203125, -1.83685302734375, -1.755615234375, -1.67437744140625, -1.5931396484375, -1.51190185546875, -1.4306640625, -1.34942626953125, -1.2681884765625, -1.18695068359375, -1.105712890625, -1.02447509765625, -0.9432373046875, -0.86199951171875, -0.78076171875, -0.69952392578125, -0.6182861328125, -0.53704833984375, -0.455810546875, -0.37457275390625, -0.2933349609375, -0.21209716796875, -0.130859375, -0.04962158203125, 0.0316162109375, 0.11285400390625, 0.194091796875, 0.27532958984375, 0.3565673828125, 0.43780517578125, 0.51904296875, 0.60028076171875, 0.6815185546875, 0.76275634765625, 0.843994140625, 0.92523193359375, 1.0064697265625, 1.08770751953125, 1.1689453125, 1.25018310546875, 1.3314208984375, 1.41265869140625, 1.493896484375, 1.57513427734375, 1.6563720703125, 1.73760986328125, 1.81884765625, 1.90008544921875, 1.9813232421875, 2.06256103515625, 2.143798828125, 2.22503662109375, 2.3062744140625, 2.38751220703125, 2.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 8.0, 10.0, 9.0, 22.0, 22.0, 15.0, 21.0, 18.0, 21.0, 37.0, 39.0, 44.0, 55.0, 34.0, 71.0, 97.0, 147.0, 289.0, 1363.0, 175.0, 99.0, 84.0, 46.0, 44.0, 43.0, 29.0, 23.0, 28.0, 23.0, 30.0, 17.0, 10.0, 13.0, 14.0, 7.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.90924072265625, -3.7794189453125, -3.64959716796875, -3.519775390625, -3.38995361328125, -3.2601318359375, -3.13031005859375, -3.00048828125, -2.87066650390625, -2.7408447265625, -2.61102294921875, -2.481201171875, -2.35137939453125, -2.2215576171875, -2.09173583984375, -1.9619140625, -1.83209228515625, -1.7022705078125, -1.57244873046875, -1.442626953125, -1.31280517578125, -1.1829833984375, -1.05316162109375, -0.92333984375, -0.79351806640625, -0.6636962890625, -0.53387451171875, -0.404052734375, -0.27423095703125, -0.1444091796875, -0.01458740234375, 0.115234375, 0.24505615234375, 0.3748779296875, 0.50469970703125, 0.634521484375, 0.76434326171875, 0.8941650390625, 1.02398681640625, 1.15380859375, 1.28363037109375, 1.4134521484375, 1.54327392578125, 1.673095703125, 1.80291748046875, 1.9327392578125, 2.06256103515625, 2.1923828125, 2.32220458984375, 2.4520263671875, 2.58184814453125, 2.711669921875, 2.84149169921875, 2.9713134765625, 3.10113525390625, 3.23095703125, 3.36077880859375, 3.4906005859375, 3.62042236328125, 3.750244140625, 3.88006591796875, 4.0098876953125, 4.13970947265625, 4.26953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 8.0, 9.0, 8.0, 21.0, 19.0, 41.0, 40.0, 52.0, 62.0, 79.0, 133.0, 164.0, 221.0, 302.0, 427.0, 847.0, 2577.0, 602750.0, 2531923.0, 3455.0, 894.0, 472.0, 308.0, 229.0, 136.0, 117.0, 96.0, 70.0, 57.0, 44.0, 27.0, 23.0, 19.0, 18.0, 13.0, 13.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.375, -16.8330078125, -16.291015625, -15.7490234375, -15.20703125, -14.6650390625, -14.123046875, -13.5810546875, -13.0390625, -12.4970703125, -11.955078125, -11.4130859375, -10.87109375, -10.3291015625, -9.787109375, -9.2451171875, -8.703125, -8.1611328125, -7.619140625, -7.0771484375, -6.53515625, -5.9931640625, -5.451171875, -4.9091796875, -4.3671875, -3.8251953125, -3.283203125, -2.7412109375, -2.19921875, -1.6572265625, -1.115234375, -0.5732421875, -0.03125, 0.5107421875, 1.052734375, 1.5947265625, 2.13671875, 2.6787109375, 3.220703125, 3.7626953125, 4.3046875, 4.8466796875, 5.388671875, 5.9306640625, 6.47265625, 7.0146484375, 7.556640625, 8.0986328125, 8.640625, 9.1826171875, 9.724609375, 10.2666015625, 10.80859375, 11.3505859375, 11.892578125, 12.4345703125, 12.9765625, 13.5185546875, 14.060546875, 14.6025390625, 15.14453125, 15.6865234375, 16.228515625, 16.7705078125, 17.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 15.0, 24.0, 44.0, 85.0, 122.0, 172.0, 207.0, 140.0, 99.0, 47.0, 28.0, 13.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.176000595092773, -27.605493545532227, -27.034988403320312, -26.464481353759766, -25.89397621154785, -25.323469161987305, -24.75296401977539, -24.182456970214844, -23.611949920654297, -23.04144287109375, -22.470937728881836, -21.90043067932129, -21.329925537109375, -20.759418487548828, -20.188913345336914, -19.618406295776367, -19.047901153564453, -18.477394104003906, -17.906888961791992, -17.336381912231445, -16.76587677001953, -16.195369720458984, -15.624863624572754, -15.054357528686523, -14.483851432800293, -13.913345336914062, -13.342839241027832, -12.772333145141602, -12.201826095581055, -11.63132095336914, -11.060813903808594, -10.490307807922363, -9.919803619384766, -9.349297523498535, -8.778791427612305, -8.208285331726074, -7.6377787590026855, -7.067272663116455, -6.496766090393066, -5.926259994506836, -5.3557538986206055, -4.785247802734375, -4.2147417068481445, -3.644235134124756, -3.0737290382385254, -2.503222942352295, -1.9327166080474854, -1.3622102737426758, -0.7917041778564453, -0.2211979627609253, 0.3493082523345947, 0.9198144674301147, 1.4903206825256348, 2.0608267784118652, 2.631333112716675, 3.2018394470214844, 3.772345542907715, 4.342851638793945, 4.913357734680176, 5.4838643074035645, 6.054370403289795, 6.624876499176025, 7.195383071899414, 7.7658891677856445, 8.336395263671875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 7.0, 15.0, 12.0, 17.0, 14.0, 14.0, 22.0, 18.0, 24.0, 25.0, 27.0, 37.0, 37.0, 45.0, 37.0, 45.0, 44.0, 34.0, 30.0, 40.0, 41.0, 44.0, 35.0, 48.0, 26.0, 31.0, 28.0, 29.0, 26.0, 24.0, 24.0, 7.0, 7.0, 16.0, 11.0, 8.0, 3.0, 7.0, 5.0, 5.0, 5.0, 5.0, 8.0, 0.0, 2.0, 2.0], "bins": [-13.696267127990723, -13.317237854003906, -12.938209533691406, -12.55918025970459, -12.18015193939209, -11.801122665405273, -11.422094345092773, -11.043065071105957, -10.66403579711914, -10.285006523132324, -9.905978202819824, -9.526948928833008, -9.147920608520508, -8.768891334533691, -8.389862060546875, -8.010833740234375, -7.631804943084717, -7.252776145935059, -6.8737473487854, -6.494718551635742, -6.115689277648926, -5.736660480499268, -5.357631683349609, -4.978602409362793, -4.599574089050293, -4.220545291900635, -3.8415162563323975, -3.4624874591827393, -3.083458423614502, -2.7044296264648438, -2.3254008293151855, -1.9463717937469482, -1.567342758178711, -1.1883138418197632, -0.8092849850654602, -0.4302561283111572, -0.05122721195220947, 0.3278017044067383, 0.7068305015563965, 1.0858595371246338, 1.464888334274292, 1.8439172506332397, 2.2229461669921875, 2.6019749641418457, 2.981003761291504, 3.360032796859741, 3.7390615940093994, 4.118090629577637, 4.497119426727295, 4.876148223876953, 5.255177021026611, 5.6342058181762695, 6.013235092163086, 6.392263889312744, 6.771292686462402, 7.150321960449219, 7.529350280761719, 7.908379077911377, 8.287407875061035, 8.666437149047852, 9.045465469360352, 9.424494743347168, 9.803524017333984, 10.182552337646484, 10.5615816116333]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 7.0, 11.0, 14.0, 19.0, 19.0, 25.0, 17.0, 24.0, 33.0, 20.0, 40.0, 29.0, 42.0, 30.0, 35.0, 54.0, 41.0, 40.0, 40.0, 42.0, 43.0, 37.0, 35.0, 24.0, 33.0, 27.0, 35.0, 30.0, 17.0, 23.0, 16.0, 17.0, 15.0, 10.0, 10.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5463409423828125, -1.490142822265625, -1.4339447021484375, -1.37774658203125, -1.3215484619140625, -1.265350341796875, -1.2091522216796875, -1.1529541015625, -1.0967559814453125, -1.040557861328125, -0.9843597412109375, -0.92816162109375, -0.8719635009765625, -0.815765380859375, -0.7595672607421875, -0.703369140625, -0.6471710205078125, -0.590972900390625, -0.5347747802734375, -0.47857666015625, -0.4223785400390625, -0.366180419921875, -0.3099822998046875, -0.2537841796875, -0.1975860595703125, -0.141387939453125, -0.0851898193359375, -0.02899169921875, 0.0272064208984375, 0.083404541015625, 0.1396026611328125, 0.19580078125, 0.2519989013671875, 0.308197021484375, 0.3643951416015625, 0.42059326171875, 0.4767913818359375, 0.532989501953125, 0.5891876220703125, 0.6453857421875, 0.7015838623046875, 0.757781982421875, 0.8139801025390625, 0.87017822265625, 0.9263763427734375, 0.982574462890625, 1.0387725830078125, 1.094970703125, 1.1511688232421875, 1.207366943359375, 1.2635650634765625, 1.31976318359375, 1.3759613037109375, 1.432159423828125, 1.4883575439453125, 1.5445556640625, 1.6007537841796875, 1.656951904296875, 1.7131500244140625, 1.76934814453125, 1.8255462646484375, 1.881744384765625, 1.9379425048828125, 1.994140625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 9.0, 16.0, 28.0, 48.0, 87.0, 170.0, 316.0, 656.0, 1509.0, 6857.0, 388237.0, 3761730.0, 29757.0, 2887.0, 1001.0, 452.0, 252.0, 129.0, 67.0, 27.0, 24.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.379150390625, -9.04736328125, -8.715576171875, -8.3837890625, -8.052001953125, -7.72021484375, -7.388427734375, -7.056640625, -6.724853515625, -6.39306640625, -6.061279296875, -5.7294921875, -5.397705078125, -5.06591796875, -4.734130859375, -4.40234375, -4.070556640625, -3.73876953125, -3.406982421875, -3.0751953125, -2.743408203125, -2.41162109375, -2.079833984375, -1.748046875, -1.416259765625, -1.08447265625, -0.752685546875, -0.4208984375, -0.089111328125, 0.24267578125, 0.574462890625, 0.90625, 1.238037109375, 1.56982421875, 1.901611328125, 2.2333984375, 2.565185546875, 2.89697265625, 3.228759765625, 3.560546875, 3.892333984375, 4.22412109375, 4.555908203125, 4.8876953125, 5.219482421875, 5.55126953125, 5.883056640625, 6.21484375, 6.546630859375, 6.87841796875, 7.210205078125, 7.5419921875, 7.873779296875, 8.20556640625, 8.537353515625, 8.869140625, 9.200927734375, 9.53271484375, 9.864501953125, 10.1962890625, 10.528076171875, 10.85986328125, 11.191650390625, 11.5234375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 4.0, 11.0, 17.0, 13.0, 14.0, 19.0, 38.0, 51.0, 57.0, 85.0, 136.0, 180.0, 246.0, 424.0, 590.0, 724.0, 462.0, 313.0, 171.0, 125.0, 99.0, 81.0, 66.0, 28.0, 32.0, 22.0, 15.0, 14.0, 9.0, 7.0, 10.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.28643798828125, -3.1842041015625, -3.08197021484375, -2.979736328125, -2.87750244140625, -2.7752685546875, -2.67303466796875, -2.57080078125, -2.46856689453125, -2.3663330078125, -2.26409912109375, -2.161865234375, -2.05963134765625, -1.9573974609375, -1.85516357421875, -1.7529296875, -1.65069580078125, -1.5484619140625, -1.44622802734375, -1.343994140625, -1.24176025390625, -1.1395263671875, -1.03729248046875, -0.93505859375, -0.83282470703125, -0.7305908203125, -0.62835693359375, -0.526123046875, -0.42388916015625, -0.3216552734375, -0.21942138671875, -0.1171875, -0.01495361328125, 0.0872802734375, 0.18951416015625, 0.291748046875, 0.39398193359375, 0.4962158203125, 0.59844970703125, 0.70068359375, 0.80291748046875, 0.9051513671875, 1.00738525390625, 1.109619140625, 1.21185302734375, 1.3140869140625, 1.41632080078125, 1.5185546875, 1.62078857421875, 1.7230224609375, 1.82525634765625, 1.927490234375, 2.02972412109375, 2.1319580078125, 2.23419189453125, 2.33642578125, 2.43865966796875, 2.5408935546875, 2.64312744140625, 2.745361328125, 2.84759521484375, 2.9498291015625, 3.05206298828125, 3.154296875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 9.0, 27.0, 25.0, 35.0, 51.0, 85.0, 126.0, 274.0, 484.0, 1270.0, 4126.0, 22020.0, 300962.0, 3603504.0, 236125.0, 19194.0, 3719.0, 1109.0, 454.0, 249.0, 122.0, 95.0, 43.0, 48.0, 21.0, 23.0, 13.0, 10.0, 10.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98828125, -5.7850341796875, -5.581787109375, -5.3785400390625, -5.17529296875, -4.9720458984375, -4.768798828125, -4.5655517578125, -4.3623046875, -4.1590576171875, -3.955810546875, -3.7525634765625, -3.54931640625, -3.3460693359375, -3.142822265625, -2.9395751953125, -2.736328125, -2.5330810546875, -2.329833984375, -2.1265869140625, -1.92333984375, -1.7200927734375, -1.516845703125, -1.3135986328125, -1.1103515625, -0.9071044921875, -0.703857421875, -0.5006103515625, -0.29736328125, -0.0941162109375, 0.109130859375, 0.3123779296875, 0.515625, 0.7188720703125, 0.922119140625, 1.1253662109375, 1.32861328125, 1.5318603515625, 1.735107421875, 1.9383544921875, 2.1416015625, 2.3448486328125, 2.548095703125, 2.7513427734375, 2.95458984375, 3.1578369140625, 3.361083984375, 3.5643310546875, 3.767578125, 3.9708251953125, 4.174072265625, 4.3773193359375, 4.58056640625, 4.7838134765625, 4.987060546875, 5.1903076171875, 5.3935546875, 5.5968017578125, 5.800048828125, 6.0032958984375, 6.20654296875, 6.4097900390625, 6.613037109375, 6.8162841796875, 7.01953125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 482.0, 522.0, 9.0, 1.0, 1.0, 0.0, 1.0], "bins": [-218.6971893310547, -214.9259033203125, -211.1546173095703, -207.3833465576172, -203.612060546875, -199.8407745361328, -196.06948852539062, -192.2982177734375, -188.5269317626953, -184.75564575195312, -180.98435974121094, -177.2130889892578, -173.44180297851562, -169.67051696777344, -165.89923095703125, -162.12796020507812, -158.35667419433594, -154.58538818359375, -150.81410217285156, -147.04283142089844, -143.27154541015625, -139.50025939941406, -135.72897338867188, -131.95770263671875, -128.18641662597656, -124.41513061523438, -120.64385223388672, -116.87256622314453, -113.10128784179688, -109.33000183105469, -105.55872344970703, -101.78743743896484, -98.01615905761719, -94.244873046875, -90.47359466552734, -86.70230865478516, -82.9310302734375, -79.15974426269531, -75.38846588134766, -71.61717987060547, -67.84590148925781, -64.07461547851562, -60.30333709716797, -56.53205490112305, -52.760772705078125, -48.98948669433594, -45.21820831298828, -41.446922302246094, -37.675636291503906, -33.904354095458984, -30.133071899414062, -26.36178970336914, -22.59050750732422, -18.819223403930664, -15.047941207885742, -11.27665901184082, -7.505378723144531, -3.7340962886810303, 0.0371861457824707, 3.808468818664551, 7.579751014709473, 11.351034164428711, 15.122316360473633, 18.893598556518555, 22.664880752563477]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 10.0, 13.0, 14.0, 17.0, 21.0, 25.0, 33.0, 19.0, 32.0, 37.0, 27.0, 41.0, 43.0, 50.0, 43.0, 51.0, 57.0, 48.0, 38.0, 44.0, 45.0, 46.0, 39.0, 24.0, 26.0, 27.0, 25.0, 17.0, 17.0, 13.0, 8.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.71467113494873, -12.359393119812012, -12.004115104675293, -11.64883804321289, -11.293560028076172, -10.938282012939453, -10.583003997802734, -10.227725982666016, -9.872448921203613, -9.517170906066895, -9.161892890930176, -8.806615829467773, -8.451337814331055, -8.096059799194336, -7.740781784057617, -7.385504245758057, -7.030226230621338, -6.674948215484619, -6.319670677185059, -5.96439266204834, -5.609115123748779, -5.2538371086120605, -4.8985595703125, -4.543281555175781, -4.1880035400390625, -3.832725763320923, -3.477447986602783, -3.1221699714660645, -2.766892433166504, -2.411614418029785, -2.0563366413116455, -1.7010588645935059, -1.3457813262939453, -0.9905035495758057, -0.6352257132530212, -0.2799478769302368, 0.07532989978790283, 0.4306076765060425, 0.7858855724334717, 1.1411633491516113, 1.496441125869751, 1.8517189025878906, 2.2069966793060303, 2.56227445602417, 2.9175524711608887, 3.272830009460449, 3.628108024597168, 3.9833858013153076, 4.338663578033447, 4.693941593170166, 5.049219131469727, 5.404497146606445, 5.759774684906006, 6.115052700042725, 6.470330238342285, 6.825608253479004, 7.180886268615723, 7.536164283752441, 7.891441822052002, 8.246719360351562, 8.601997375488281, 8.957275390625, 9.312553405761719, 9.667831420898438, 10.02310848236084]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 10.0, 10.0, 13.0, 16.0, 19.0, 15.0, 26.0, 27.0, 36.0, 23.0, 32.0, 36.0, 39.0, 46.0, 48.0, 35.0, 43.0, 44.0, 45.0, 45.0, 43.0, 41.0, 34.0, 36.0, 37.0, 21.0, 20.0, 27.0, 25.0, 21.0, 16.0, 13.0, 9.0, 6.0, 4.0, 5.0, 3.0, 9.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3955078125, -1.347381591796875, -1.29925537109375, -1.251129150390625, -1.2030029296875, -1.154876708984375, -1.10675048828125, -1.058624267578125, -1.010498046875, -0.962371826171875, -0.91424560546875, -0.866119384765625, -0.8179931640625, -0.769866943359375, -0.72174072265625, -0.673614501953125, -0.62548828125, -0.577362060546875, -0.52923583984375, -0.481109619140625, -0.4329833984375, -0.384857177734375, -0.33673095703125, -0.288604736328125, -0.240478515625, -0.192352294921875, -0.14422607421875, -0.096099853515625, -0.0479736328125, 0.000152587890625, 0.04827880859375, 0.096405029296875, 0.14453125, 0.192657470703125, 0.24078369140625, 0.288909912109375, 0.3370361328125, 0.385162353515625, 0.43328857421875, 0.481414794921875, 0.529541015625, 0.577667236328125, 0.62579345703125, 0.673919677734375, 0.7220458984375, 0.770172119140625, 0.81829833984375, 0.866424560546875, 0.91455078125, 0.962677001953125, 1.01080322265625, 1.058929443359375, 1.1070556640625, 1.155181884765625, 1.20330810546875, 1.251434326171875, 1.299560546875, 1.347686767578125, 1.39581298828125, 1.443939208984375, 1.4920654296875, 1.540191650390625, 1.58831787109375, 1.636444091796875, 1.6845703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 12.0, 11.0, 29.0, 23.0, 48.0, 67.0, 121.0, 197.0, 239.0, 436.0, 661.0, 1041.0, 1566.0, 2391.0, 3880.0, 5764.0, 9285.0, 14642.0, 23809.0, 38864.0, 68092.0, 133123.0, 249582.0, 225386.0, 115440.0, 60615.0, 35244.0, 21341.0, 13315.0, 8307.0, 5289.0, 3419.0, 2199.0, 1428.0, 939.0, 597.0, 419.0, 237.0, 168.0, 125.0, 69.0, 41.0, 23.0, 26.0, 15.0, 12.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.1478595733642578, -0.14349746704101562, -0.13913536071777344, -0.13477325439453125, -0.13041114807128906, -0.12604904174804688, -0.12168693542480469, -0.1173248291015625, -0.11296272277832031, -0.10860061645507812, -0.10423851013183594, -0.09987640380859375, -0.09551429748535156, -0.09115219116210938, -0.08679008483886719, -0.082427978515625, -0.07806587219238281, -0.07370376586914062, -0.06934165954589844, -0.06497955322265625, -0.06061744689941406, -0.056255340576171875, -0.05189323425292969, -0.0475311279296875, -0.04316902160644531, -0.038806915283203125, -0.03444480895996094, -0.03008270263671875, -0.025720596313476562, -0.021358489990234375, -0.016996383666992188, -0.01263427734375, -0.008272171020507812, -0.003910064697265625, 0.0004520416259765625, 0.00481414794921875, 0.009176254272460938, 0.013538360595703125, 0.017900466918945312, 0.0222625732421875, 0.026624679565429688, 0.030986785888671875, 0.03534889221191406, 0.03971099853515625, 0.04407310485839844, 0.048435211181640625, 0.05279731750488281, 0.057159423828125, 0.06152153015136719, 0.06588363647460938, 0.07024574279785156, 0.07460784912109375, 0.07896995544433594, 0.08333206176757812, 0.08769416809082031, 0.0920562744140625, 0.09641838073730469, 0.10078048706054688, 0.10514259338378906, 0.10950469970703125, 0.11386680603027344, 0.11822891235351562, 0.12259101867675781, 0.126953125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 9.0, 8.0, 11.0, 8.0, 15.0, 19.0, 22.0, 21.0, 25.0, 29.0, 36.0, 35.0, 31.0, 32.0, 46.0, 39.0, 32.0, 1063.0, 52.0, 47.0, 25.0, 38.0, 36.0, 39.0, 34.0, 43.0, 23.0, 20.0, 26.0, 21.0, 18.0, 18.0, 19.0, 12.0, 8.0, 9.0, 5.0, 3.0, 8.0, 3.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0], "bins": [-1.1416015625, -1.1098556518554688, -1.0781097412109375, -1.0463638305664062, -1.014617919921875, -0.9828720092773438, -0.9511260986328125, -0.9193801879882812, -0.88763427734375, -0.8558883666992188, -0.8241424560546875, -0.7923965454101562, -0.760650634765625, -0.7289047241210938, -0.6971588134765625, -0.6654129028320312, -0.6336669921875, -0.6019210815429688, -0.5701751708984375, -0.5384292602539062, -0.506683349609375, -0.47493743896484375, -0.4431915283203125, -0.41144561767578125, -0.37969970703125, -0.34795379638671875, -0.3162078857421875, -0.28446197509765625, -0.252716064453125, -0.22097015380859375, -0.1892242431640625, -0.15747833251953125, -0.125732421875, -0.09398651123046875, -0.0622406005859375, -0.03049468994140625, 0.001251220703125, 0.03299713134765625, 0.0647430419921875, 0.09648895263671875, 0.12823486328125, 0.15998077392578125, 0.1917266845703125, 0.22347259521484375, 0.255218505859375, 0.28696441650390625, 0.3187103271484375, 0.35045623779296875, 0.3822021484375, 0.41394805908203125, 0.4456939697265625, 0.47743988037109375, 0.509185791015625, 0.5409317016601562, 0.5726776123046875, 0.6044235229492188, 0.63616943359375, 0.6679153442382812, 0.6996612548828125, 0.7314071655273438, 0.763153076171875, 0.7948989868164062, 0.8266448974609375, 0.8583908081054688, 0.89013671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 8.0, 5.0, 7.0, 15.0, 12.0, 32.0, 27.0, 48.0, 67.0, 64.0, 111.0, 162.0, 220.0, 322.0, 432.0, 608.0, 852.0, 1273.0, 1823.0, 2619.0, 4136.0, 6451.0, 11097.0, 22361.0, 71810.0, 1631167.0, 260453.0, 39734.0, 16174.0, 8704.0, 5370.0, 3464.0, 2290.0, 1544.0, 1067.0, 746.0, 531.0, 367.0, 279.0, 191.0, 130.0, 116.0, 54.0, 68.0, 42.0, 21.0, 24.0, 13.0, 11.0, 9.0, 2.0, 1.0, 6.0, 1.0], "bins": [-0.20068359375, -0.19507598876953125, -0.1894683837890625, -0.18386077880859375, -0.178253173828125, -0.17264556884765625, -0.1670379638671875, -0.16143035888671875, -0.15582275390625, -0.15021514892578125, -0.1446075439453125, -0.13899993896484375, -0.133392333984375, -0.12778472900390625, -0.1221771240234375, -0.11656951904296875, -0.1109619140625, -0.10535430908203125, -0.0997467041015625, -0.09413909912109375, -0.088531494140625, -0.08292388916015625, -0.0773162841796875, -0.07170867919921875, -0.06610107421875, -0.06049346923828125, -0.0548858642578125, -0.04927825927734375, -0.043670654296875, -0.03806304931640625, -0.0324554443359375, -0.02684783935546875, -0.021240234375, -0.01563262939453125, -0.0100250244140625, -0.00441741943359375, 0.001190185546875, 0.00679779052734375, 0.0124053955078125, 0.01801300048828125, 0.02362060546875, 0.02922821044921875, 0.0348358154296875, 0.04044342041015625, 0.046051025390625, 0.05165863037109375, 0.0572662353515625, 0.06287384033203125, 0.0684814453125, 0.07408905029296875, 0.0796966552734375, 0.08530426025390625, 0.090911865234375, 0.09651947021484375, 0.1021270751953125, 0.10773468017578125, 0.11334228515625, 0.11894989013671875, 0.1245574951171875, 0.13016510009765625, 0.135772705078125, 0.14138031005859375, 0.1469879150390625, 0.15259552001953125, 0.158203125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 8.0, 13.0, 7.0, 15.0, 23.0, 14.0, 28.0, 34.0, 36.0, 50.0, 55.0, 66.0, 64.0, 71.0, 88.0, 77.0, 63.0, 50.0, 55.0, 34.0, 28.0, 28.0, 18.0, 10.0, 8.0, 13.0, 8.0, 10.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.008972764015197754, -0.008599519729614258, -0.008226275444030762, -0.007853031158447266, -0.0074797868728637695, -0.0071065425872802734, -0.006733298301696777, -0.006360054016113281, -0.005986809730529785, -0.005613565444946289, -0.005240321159362793, -0.004867076873779297, -0.004493832588195801, -0.004120588302612305, -0.0037473440170288086, -0.0033740997314453125, -0.0030008554458618164, -0.0026276111602783203, -0.0022543668746948242, -0.0018811225891113281, -0.001507878303527832, -0.001134634017944336, -0.0007613897323608398, -0.00038814544677734375, -1.4901161193847656e-05, 0.00035834312438964844, 0.0007315874099731445, 0.0011048316955566406, 0.0014780759811401367, 0.0018513202667236328, 0.002224564552307129, 0.002597808837890625, 0.002971053123474121, 0.003344297409057617, 0.0037175416946411133, 0.004090785980224609, 0.0044640302658081055, 0.0048372745513916016, 0.005210518836975098, 0.005583763122558594, 0.00595700740814209, 0.006330251693725586, 0.006703495979309082, 0.007076740264892578, 0.007449984550476074, 0.00782322883605957, 0.008196473121643066, 0.008569717407226562, 0.008942961692810059, 0.009316205978393555, 0.00968945026397705, 0.010062694549560547, 0.010435938835144043, 0.010809183120727539, 0.011182427406311035, 0.011555671691894531, 0.011928915977478027, 0.012302160263061523, 0.01267540454864502, 0.013048648834228516, 0.013421893119812012, 0.013795137405395508, 0.014168381690979004, 0.0145416259765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 12.0, 8.0, 24.0, 16.0, 29.0, 33.0, 54.0, 72.0, 102.0, 152.0, 277.0, 522.0, 1379.0, 225286.0, 817200.0, 1849.0, 636.0, 299.0, 164.0, 123.0, 82.0, 59.0, 44.0, 30.0, 18.0, 15.0, 20.0, 13.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.29541015625, -0.2878532409667969, -0.28029632568359375, -0.2727394104003906, -0.2651824951171875, -0.2576255798339844, -0.25006866455078125, -0.24251174926757812, -0.234954833984375, -0.22739791870117188, -0.21984100341796875, -0.21228408813476562, -0.2047271728515625, -0.19717025756835938, -0.18961334228515625, -0.18205642700195312, -0.17449951171875, -0.16694259643554688, -0.15938568115234375, -0.15182876586914062, -0.1442718505859375, -0.13671493530273438, -0.12915802001953125, -0.12160110473632812, -0.114044189453125, -0.10648727416992188, -0.09893035888671875, -0.09137344360351562, -0.0838165283203125, -0.07625961303710938, -0.06870269775390625, -0.061145782470703125, -0.0535888671875, -0.046031951904296875, -0.03847503662109375, -0.030918121337890625, -0.0233612060546875, -0.015804290771484375, -0.00824737548828125, -0.000690460205078125, 0.006866455078125, 0.014423370361328125, 0.02198028564453125, 0.029537200927734375, 0.0370941162109375, 0.044651031494140625, 0.05220794677734375, 0.059764862060546875, 0.06732177734375, 0.07487869262695312, 0.08243560791015625, 0.08999252319335938, 0.0975494384765625, 0.10510635375976562, 0.11266326904296875, 0.12022018432617188, 0.127777099609375, 0.13533401489257812, 0.14289093017578125, 0.15044784545898438, 0.1580047607421875, 0.16556167602539062, 0.17311859130859375, 0.18067550659179688, 0.188232421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 52.0, 517.0, 407.0, 31.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16921992599964142, -0.16608023643493652, -0.16294054687023163, -0.15980085730552673, -0.15666116774082184, -0.15352147817611694, -0.15038178861141205, -0.14724209904670715, -0.14410240948200226, -0.14096271991729736, -0.13782303035259247, -0.13468334078788757, -0.13154365122318268, -0.12840396165847778, -0.1252642720937729, -0.122124582529068, -0.1189848929643631, -0.1158452033996582, -0.11270551383495331, -0.10956582427024841, -0.10642613470554352, -0.10328644514083862, -0.10014675557613373, -0.09700706601142883, -0.09386737644672394, -0.09072768688201904, -0.08758799731731415, -0.08444830775260925, -0.08130861818790436, -0.07816892862319946, -0.07502923905849457, -0.07188954949378967, -0.06874985992908478, -0.06561017036437988, -0.06247048079967499, -0.05933079123497009, -0.0561911016702652, -0.0530514121055603, -0.04991172254085541, -0.04677203297615051, -0.043632347136735916, -0.04049265757203102, -0.037352968007326126, -0.03421327844262123, -0.031073588877916336, -0.02793389931321144, -0.024794209748506546, -0.02165452018380165, -0.018514830619096756, -0.015375141054391861, -0.012235451489686966, -0.009095761924982071, -0.005956072360277176, -0.002816382795572281, 0.00032330676913261414, 0.003462996333837509, 0.006602685898542404, 0.0097423754632473, 0.012882065027952194, 0.01602175459265709, 0.019161444157361984, 0.02230113372206688, 0.025440823286771774, 0.02858051285147667, 0.031720202416181564]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 13.0, 19.0, 9.0, 19.0, 22.0, 13.0, 26.0, 24.0, 38.0, 40.0, 38.0, 39.0, 36.0, 51.0, 48.0, 42.0, 39.0, 44.0, 32.0, 32.0, 30.0, 40.0, 30.0, 18.0, 37.0, 28.0, 21.0, 28.0, 19.0, 21.0, 14.0, 17.0, 12.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.012069642543792725, -0.011717116460204124, -0.011364590376615524, -0.011012064293026924, -0.010659538209438324, -0.010307012125849724, -0.009954486042261124, -0.009601959958672523, -0.009249433875083923, -0.008896907791495323, -0.008544381707906723, -0.008191855624318123, -0.007839329540729523, -0.0074868034571409225, -0.007134277373552322, -0.006781751289963722, -0.006429225206375122, -0.006076699122786522, -0.005724173039197922, -0.005371646955609322, -0.0050191208720207214, -0.004666594788432121, -0.004314068704843521, -0.003961542621254921, -0.003609016537666321, -0.0032564904540777206, -0.0029039643704891205, -0.0025514382869005203, -0.00219891220331192, -0.00184638611972332, -0.0014938600361347198, -0.0011413339525461197, -0.0007888078689575195, -0.00043628178536891937, -8.375570178031921e-05, 0.00026877038180828094, 0.0006212964653968811, 0.0009738225489854813, 0.0013263486325740814, 0.0016788747161626816, 0.0020314007997512817, 0.002383926883339882, 0.002736452966928482, 0.003088979050517082, 0.0034415051341056824, 0.0037940312176942825, 0.004146557301282883, 0.004499083384871483, 0.004851609468460083, 0.005204135552048683, 0.005556661635637283, 0.0059091877192258835, 0.006261713802814484, 0.006614239886403084, 0.006966765969991684, 0.007319292053580284, 0.007671818137168884, 0.008024344220757484, 0.008376870304346085, 0.008729396387934685, 0.009081922471523285, 0.009434448555111885, 0.009786974638700485, 0.010139500722289085, 0.010492026805877686]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 10.0, 10.0, 13.0, 16.0, 19.0, 15.0, 26.0, 29.0, 34.0, 23.0, 32.0, 36.0, 39.0, 45.0, 48.0, 34.0, 45.0, 44.0, 44.0, 46.0, 43.0, 40.0, 36.0, 34.0, 38.0, 21.0, 20.0, 27.0, 25.0, 20.0, 17.0, 14.0, 8.0, 6.0, 4.0, 5.0, 3.0, 11.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3955078125, -1.347381591796875, -1.29925537109375, -1.251129150390625, -1.2030029296875, -1.154876708984375, -1.10675048828125, -1.058624267578125, -1.010498046875, -0.962371826171875, -0.91424560546875, -0.866119384765625, -0.8179931640625, -0.769866943359375, -0.72174072265625, -0.673614501953125, -0.62548828125, -0.577362060546875, -0.52923583984375, -0.481109619140625, -0.4329833984375, -0.384857177734375, -0.33673095703125, -0.288604736328125, -0.240478515625, -0.192352294921875, -0.14422607421875, -0.096099853515625, -0.0479736328125, 0.000152587890625, 0.04827880859375, 0.096405029296875, 0.14453125, 0.192657470703125, 0.24078369140625, 0.288909912109375, 0.3370361328125, 0.385162353515625, 0.43328857421875, 0.481414794921875, 0.529541015625, 0.577667236328125, 0.62579345703125, 0.673919677734375, 0.7220458984375, 0.770172119140625, 0.81829833984375, 0.866424560546875, 0.91455078125, 0.962677001953125, 1.01080322265625, 1.058929443359375, 1.1070556640625, 1.155181884765625, 1.20330810546875, 1.251434326171875, 1.299560546875, 1.347686767578125, 1.39581298828125, 1.443939208984375, 1.4920654296875, 1.540191650390625, 1.58831787109375, 1.636444091796875, 1.6845703125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 14.0, 26.0, 61.0, 85.0, 150.0, 310.0, 576.0, 1058.0, 2290.0, 7292.0, 34768.0, 406487.0, 541452.0, 41038.0, 8032.0, 2454.0, 1108.0, 565.0, 331.0, 207.0, 106.0, 51.0, 33.0, 15.0, 10.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.80712890625, -4.6416015625, -4.47607421875, -4.310546875, -4.14501953125, -3.9794921875, -3.81396484375, -3.6484375, -3.48291015625, -3.3173828125, -3.15185546875, -2.986328125, -2.82080078125, -2.6552734375, -2.48974609375, -2.32421875, -2.15869140625, -1.9931640625, -1.82763671875, -1.662109375, -1.49658203125, -1.3310546875, -1.16552734375, -1.0, -0.83447265625, -0.6689453125, -0.50341796875, -0.337890625, -0.17236328125, -0.0068359375, 0.15869140625, 0.32421875, 0.48974609375, 0.6552734375, 0.82080078125, 0.986328125, 1.15185546875, 1.3173828125, 1.48291015625, 1.6484375, 1.81396484375, 1.9794921875, 2.14501953125, 2.310546875, 2.47607421875, 2.6416015625, 2.80712890625, 2.97265625, 3.13818359375, 3.3037109375, 3.46923828125, 3.634765625, 3.80029296875, 3.9658203125, 4.13134765625, 4.296875, 4.46240234375, 4.6279296875, 4.79345703125, 4.958984375, 5.12451171875, 5.2900390625, 5.45556640625, 5.62109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 11.0, 12.0, 13.0, 15.0, 23.0, 20.0, 35.0, 33.0, 32.0, 44.0, 57.0, 75.0, 74.0, 130.0, 228.0, 1375.0, 263.0, 153.0, 88.0, 55.0, 55.0, 38.0, 31.0, 22.0, 27.0, 13.0, 23.0, 14.0, 12.0, 15.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.97265625, -3.858306884765625, -3.74395751953125, -3.629608154296875, -3.5152587890625, -3.400909423828125, -3.28656005859375, -3.172210693359375, -3.057861328125, -2.943511962890625, -2.82916259765625, -2.714813232421875, -2.6004638671875, -2.486114501953125, -2.37176513671875, -2.257415771484375, -2.14306640625, -2.028717041015625, -1.91436767578125, -1.800018310546875, -1.6856689453125, -1.571319580078125, -1.45697021484375, -1.342620849609375, -1.228271484375, -1.113922119140625, -0.99957275390625, -0.885223388671875, -0.7708740234375, -0.656524658203125, -0.54217529296875, -0.427825927734375, -0.3134765625, -0.199127197265625, -0.08477783203125, 0.029571533203125, 0.1439208984375, 0.258270263671875, 0.37261962890625, 0.486968994140625, 0.601318359375, 0.715667724609375, 0.83001708984375, 0.944366455078125, 1.0587158203125, 1.173065185546875, 1.28741455078125, 1.401763916015625, 1.51611328125, 1.630462646484375, 1.74481201171875, 1.859161376953125, 1.9735107421875, 2.087860107421875, 2.20220947265625, 2.316558837890625, 2.430908203125, 2.545257568359375, 2.65960693359375, 2.773956298828125, 2.8883056640625, 3.002655029296875, 3.11700439453125, 3.231353759765625, 3.345703125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 9.0, 15.0, 19.0, 23.0, 39.0, 51.0, 70.0, 123.0, 176.0, 308.0, 487.0, 905.0, 1789.0, 6774.0, 2846417.0, 280370.0, 4591.0, 1567.0, 776.0, 395.0, 244.0, 179.0, 133.0, 60.0, 57.0, 32.0, 31.0, 19.0, 13.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0, -14.5439453125, -14.087890625, -13.6318359375, -13.17578125, -12.7197265625, -12.263671875, -11.8076171875, -11.3515625, -10.8955078125, -10.439453125, -9.9833984375, -9.52734375, -9.0712890625, -8.615234375, -8.1591796875, -7.703125, -7.2470703125, -6.791015625, -6.3349609375, -5.87890625, -5.4228515625, -4.966796875, -4.5107421875, -4.0546875, -3.5986328125, -3.142578125, -2.6865234375, -2.23046875, -1.7744140625, -1.318359375, -0.8623046875, -0.40625, 0.0498046875, 0.505859375, 0.9619140625, 1.41796875, 1.8740234375, 2.330078125, 2.7861328125, 3.2421875, 3.6982421875, 4.154296875, 4.6103515625, 5.06640625, 5.5224609375, 5.978515625, 6.4345703125, 6.890625, 7.3466796875, 7.802734375, 8.2587890625, 8.71484375, 9.1708984375, 9.626953125, 10.0830078125, 10.5390625, 10.9951171875, 11.451171875, 11.9072265625, 12.36328125, 12.8193359375, 13.275390625, 13.7314453125, 14.1875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 15.0, 24.0, 48.0, 84.0, 136.0, 207.0, 187.0, 134.0, 85.0, 46.0, 26.0, 6.0, 2.0, 1.0, 1.0], "bins": [-39.56413269042969, -38.84489440917969, -38.12565231323242, -37.40641403198242, -36.687171936035156, -35.967933654785156, -35.24869155883789, -34.52945327758789, -33.810211181640625, -33.090972900390625, -32.37173080444336, -31.652490615844727, -30.933250427246094, -30.21401023864746, -29.494770050048828, -28.775529861450195, -28.056289672851562, -27.33704948425293, -26.617809295654297, -25.898569107055664, -25.17932891845703, -24.4600887298584, -23.740848541259766, -23.021608352661133, -22.302370071411133, -21.5831298828125, -20.863889694213867, -20.144649505615234, -19.4254093170166, -18.70616912841797, -17.986928939819336, -17.267688751220703, -16.54844856262207, -15.829208374023438, -15.109968185424805, -14.390727996826172, -13.671487808227539, -12.952247619628906, -12.233007431030273, -11.51376724243164, -10.794527053833008, -10.075286865234375, -9.356046676635742, -8.63680648803711, -7.917566299438477, -7.198326110839844, -6.479086399078369, -5.759846210479736, -5.0406060218811035, -4.321365833282471, -3.602125644683838, -2.882885694503784, -2.1636455059051514, -1.4444053173065186, -0.7251653671264648, -0.005925178527832031, 0.7133150100708008, 1.4325551986694336, 2.1517953872680664, 2.87103533744812, 3.590275526046753, 4.309515953063965, 5.0287556648254395, 5.747995853424072, 6.467236042022705]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 17.0, 10.0, 9.0, 18.0, 20.0, 25.0, 28.0, 31.0, 39.0, 36.0, 35.0, 51.0, 34.0, 46.0, 52.0, 41.0, 42.0, 42.0, 45.0, 50.0, 50.0, 44.0, 33.0, 33.0, 29.0, 19.0, 22.0, 18.0, 14.0, 10.0, 12.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.327797889709473, -11.908851623535156, -11.48990535736084, -11.070959091186523, -10.652012825012207, -10.23306655883789, -9.814120292663574, -9.395174026489258, -8.976227760314941, -8.557281494140625, -8.138335227966309, -7.719388961791992, -7.300442695617676, -6.881496429443359, -6.462550163269043, -6.043603897094727, -5.62465763092041, -5.205711364746094, -4.786765098571777, -4.367818832397461, -3.9488725662231445, -3.529926300048828, -3.1109800338745117, -2.6920337677001953, -2.273087501525879, -1.8541412353515625, -1.435194969177246, -1.0162487030029297, -0.5973024368286133, -0.17835617065429688, 0.24059009552001953, 0.6595363616943359, 1.078481674194336, 1.4974279403686523, 1.9163742065429688, 2.335320472717285, 2.7542667388916016, 3.173213005065918, 3.5921592712402344, 4.011105537414551, 4.430051803588867, 4.848998069763184, 5.2679443359375, 5.686890602111816, 6.105836868286133, 6.524783134460449, 6.943729400634766, 7.362675666809082, 7.781621932983398, 8.200568199157715, 8.619514465332031, 9.038460731506348, 9.457406997680664, 9.87635326385498, 10.295299530029297, 10.714245796203613, 11.13319206237793, 11.552138328552246, 11.971084594726562, 12.390030860900879, 12.808977127075195, 13.227923393249512, 13.646869659423828, 14.065815925598145, 14.484762191772461]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 13.0, 4.0, 7.0, 2.0, 9.0, 12.0, 15.0, 22.0, 23.0, 16.0, 19.0, 35.0, 34.0, 26.0, 33.0, 55.0, 40.0, 43.0, 47.0, 55.0, 42.0, 47.0, 39.0, 43.0, 49.0, 39.0, 31.0, 34.0, 27.0, 32.0, 17.0, 14.0, 20.0, 12.0, 19.0, 8.0, 5.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.5462646484375, -1.490966796875, -1.4356689453125, -1.38037109375, -1.3250732421875, -1.269775390625, -1.2144775390625, -1.1591796875, -1.1038818359375, -1.048583984375, -0.9932861328125, -0.93798828125, -0.8826904296875, -0.827392578125, -0.7720947265625, -0.716796875, -0.6614990234375, -0.606201171875, -0.5509033203125, -0.49560546875, -0.4403076171875, -0.385009765625, -0.3297119140625, -0.2744140625, -0.2191162109375, -0.163818359375, -0.1085205078125, -0.05322265625, 0.0020751953125, 0.057373046875, 0.1126708984375, 0.16796875, 0.2232666015625, 0.278564453125, 0.3338623046875, 0.38916015625, 0.4444580078125, 0.499755859375, 0.5550537109375, 0.6103515625, 0.6656494140625, 0.720947265625, 0.7762451171875, 0.83154296875, 0.8868408203125, 0.942138671875, 0.9974365234375, 1.052734375, 1.1080322265625, 1.163330078125, 1.2186279296875, 1.27392578125, 1.3292236328125, 1.384521484375, 1.4398193359375, 1.4951171875, 1.5504150390625, 1.605712890625, 1.6610107421875, 1.71630859375, 1.7716064453125, 1.826904296875, 1.8822021484375, 1.9375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 6.0, 13.0, 16.0, 18.0, 20.0, 26.0, 39.0, 49.0, 67.0, 66.0, 94.0, 123.0, 124.0, 185.0, 243.0, 306.0, 472.0, 685.0, 1147.0, 2275.0, 6525.0, 48073.0, 2142429.0, 1934962.0, 43850.0, 6397.0, 2391.0, 1150.0, 704.0, 479.0, 299.0, 245.0, 170.0, 129.0, 110.0, 93.0, 57.0, 54.0, 37.0, 27.0, 22.0, 18.0, 16.0, 11.0, 10.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-5.15234375, -4.99127197265625, -4.8302001953125, -4.66912841796875, -4.508056640625, -4.34698486328125, -4.1859130859375, -4.02484130859375, -3.86376953125, -3.70269775390625, -3.5416259765625, -3.38055419921875, -3.219482421875, -3.05841064453125, -2.8973388671875, -2.73626708984375, -2.5751953125, -2.41412353515625, -2.2530517578125, -2.09197998046875, -1.930908203125, -1.76983642578125, -1.6087646484375, -1.44769287109375, -1.28662109375, -1.12554931640625, -0.9644775390625, -0.80340576171875, -0.642333984375, -0.48126220703125, -0.3201904296875, -0.15911865234375, 0.001953125, 0.16302490234375, 0.3240966796875, 0.48516845703125, 0.646240234375, 0.80731201171875, 0.9683837890625, 1.12945556640625, 1.29052734375, 1.45159912109375, 1.6126708984375, 1.77374267578125, 1.934814453125, 2.09588623046875, 2.2569580078125, 2.41802978515625, 2.5791015625, 2.74017333984375, 2.9012451171875, 3.06231689453125, 3.223388671875, 3.38446044921875, 3.5455322265625, 3.70660400390625, 3.86767578125, 4.02874755859375, 4.1898193359375, 4.35089111328125, 4.511962890625, 4.67303466796875, 4.8341064453125, 4.99517822265625, 5.15625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 8.0, 18.0, 19.0, 29.0, 33.0, 48.0, 80.0, 93.0, 199.0, 290.0, 376.0, 567.0, 635.0, 519.0, 348.0, 247.0, 173.0, 109.0, 68.0, 54.0, 39.0, 23.0, 17.0, 20.0, 13.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.73809814453125, -2.6480712890625, -2.55804443359375, -2.468017578125, -2.37799072265625, -2.2879638671875, -2.19793701171875, -2.10791015625, -2.01788330078125, -1.9278564453125, -1.83782958984375, -1.747802734375, -1.65777587890625, -1.5677490234375, -1.47772216796875, -1.3876953125, -1.29766845703125, -1.2076416015625, -1.11761474609375, -1.027587890625, -0.93756103515625, -0.8475341796875, -0.75750732421875, -0.66748046875, -0.57745361328125, -0.4874267578125, -0.39739990234375, -0.307373046875, -0.21734619140625, -0.1273193359375, -0.03729248046875, 0.052734375, 0.14276123046875, 0.2327880859375, 0.32281494140625, 0.412841796875, 0.50286865234375, 0.5928955078125, 0.68292236328125, 0.77294921875, 0.86297607421875, 0.9530029296875, 1.04302978515625, 1.133056640625, 1.22308349609375, 1.3131103515625, 1.40313720703125, 1.4931640625, 1.58319091796875, 1.6732177734375, 1.76324462890625, 1.853271484375, 1.94329833984375, 2.0333251953125, 2.12335205078125, 2.21337890625, 2.30340576171875, 2.3934326171875, 2.48345947265625, 2.573486328125, 2.66351318359375, 2.7535400390625, 2.84356689453125, 2.93359375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 6.0, 13.0, 13.0, 26.0, 36.0, 48.0, 86.0, 111.0, 207.0, 359.0, 787.0, 1734.0, 5841.0, 42828.0, 2480542.0, 1618785.0, 34470.0, 5179.0, 1580.0, 711.0, 353.0, 198.0, 129.0, 72.0, 50.0, 32.0, 19.0, 13.0, 13.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.83203125, -5.6495361328125, -5.467041015625, -5.2845458984375, -5.10205078125, -4.9195556640625, -4.737060546875, -4.5545654296875, -4.3720703125, -4.1895751953125, -4.007080078125, -3.8245849609375, -3.64208984375, -3.4595947265625, -3.277099609375, -3.0946044921875, -2.912109375, -2.7296142578125, -2.547119140625, -2.3646240234375, -2.18212890625, -1.9996337890625, -1.817138671875, -1.6346435546875, -1.4521484375, -1.2696533203125, -1.087158203125, -0.9046630859375, -0.72216796875, -0.5396728515625, -0.357177734375, -0.1746826171875, 0.0078125, 0.1903076171875, 0.372802734375, 0.5552978515625, 0.73779296875, 0.9202880859375, 1.102783203125, 1.2852783203125, 1.4677734375, 1.6502685546875, 1.832763671875, 2.0152587890625, 2.19775390625, 2.3802490234375, 2.562744140625, 2.7452392578125, 2.927734375, 3.1102294921875, 3.292724609375, 3.4752197265625, 3.65771484375, 3.8402099609375, 4.022705078125, 4.2052001953125, 4.3876953125, 4.5701904296875, 4.752685546875, 4.9351806640625, 5.11767578125, 5.3001708984375, 5.482666015625, 5.6651611328125, 5.84765625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 14.0, 71.0, 377.0, 420.0, 106.0, 20.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.44794464111328, -51.104148864746094, -49.76035690307617, -48.416561126708984, -47.07276916503906, -45.728973388671875, -44.38517761230469, -43.0413818359375, -41.69758987426758, -40.35379409790039, -39.01000213623047, -37.66620635986328, -36.322410583496094, -34.97861862182617, -33.634822845458984, -32.29103088378906, -30.947235107421875, -29.60344123840332, -28.259647369384766, -26.915851593017578, -25.572057723999023, -24.22826385498047, -22.88446807861328, -21.540674209594727, -20.196880340576172, -18.853086471557617, -17.509292602539062, -16.165496826171875, -14.82170295715332, -13.477909088134766, -12.134114265441895, -10.790319442749023, -9.446521759033203, -8.102727890014648, -6.758933067321777, -5.4151387214660645, -4.071344375610352, -2.7275500297546387, -1.3837556838989258, -0.03996086120605469, 1.3038330078125, 2.647627353668213, 3.991421699523926, 5.335216045379639, 6.679010391235352, 8.022804260253906, 9.366599082946777, 10.710393905639648, 12.054187774658203, 13.397981643676758, 14.741776466369629, 16.0855712890625, 17.429365158081055, 18.77315902709961, 20.116954803466797, 21.46074867248535, 22.804542541503906, 24.14833641052246, 25.492130279541016, 26.835926055908203, 28.179719924926758, 29.523513793945312, 30.8673095703125, 32.21110534667969, 33.55489730834961]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 12.0, 12.0, 11.0, 24.0, 24.0, 15.0, 31.0, 18.0, 40.0, 25.0, 29.0, 30.0, 33.0, 31.0, 35.0, 38.0, 31.0, 47.0, 34.0, 39.0, 30.0, 57.0, 29.0, 29.0, 27.0, 28.0, 23.0, 25.0, 31.0, 18.0, 17.0, 17.0, 12.0, 11.0, 8.0, 12.0, 7.0, 10.0, 0.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.559165954589844, -8.305291175842285, -8.05141544342041, -7.797540664672852, -7.543665885925293, -7.289790630340576, -7.035915374755859, -6.782040596008301, -6.528165817260742, -6.274290561676025, -6.020415782928467, -5.76654052734375, -5.512665748596191, -5.258790493011475, -5.004915237426758, -4.751040458679199, -4.497165203094482, -4.243289947509766, -3.989415168762207, -3.7355399131774902, -3.4816651344299316, -3.227789878845215, -2.973914861679077, -2.7200398445129395, -2.4661648273468018, -2.212289810180664, -1.9584147930145264, -1.7045396566390991, -1.4506646394729614, -1.1967896223068237, -0.9429144859313965, -0.6890394687652588, -0.4351649284362793, -0.1812898814678192, 0.07258516550064087, 0.32646024227142334, 0.580335259437561, 0.8342102766036987, 1.088085412979126, 1.3419604301452637, 1.5958354473114014, 1.849710464477539, 2.1035854816436768, 2.3574604988098145, 2.6113357543945312, 2.86521053314209, 3.1190857887268066, 3.3729608058929443, 3.626835823059082, 3.8807108402252197, 4.134585857391357, 4.388461112976074, 4.642335891723633, 4.89621114730835, 5.150086402893066, 5.403961181640625, 5.657835960388184, 5.9117112159729, 6.165585994720459, 6.419461250305176, 6.673336029052734, 6.927211284637451, 7.181086540222168, 7.434961318969727, 7.688836574554443]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 11.0, 5.0, 8.0, 9.0, 11.0, 6.0, 14.0, 13.0, 18.0, 24.0, 26.0, 45.0, 26.0, 32.0, 34.0, 43.0, 37.0, 40.0, 43.0, 46.0, 54.0, 44.0, 44.0, 47.0, 36.0, 38.0, 35.0, 39.0, 22.0, 28.0, 26.0, 20.0, 9.0, 15.0, 11.0, 11.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0050506591796875, -0.965179443359375, -0.9253082275390625, -0.88543701171875, -0.8455657958984375, -0.805694580078125, -0.7658233642578125, -0.7259521484375, -0.6860809326171875, -0.646209716796875, -0.6063385009765625, -0.56646728515625, -0.5265960693359375, -0.486724853515625, -0.4468536376953125, -0.406982421875, -0.3671112060546875, -0.327239990234375, -0.2873687744140625, -0.24749755859375, -0.2076263427734375, -0.167755126953125, -0.1278839111328125, -0.0880126953125, -0.0481414794921875, -0.008270263671875, 0.0316009521484375, 0.07147216796875, 0.1113433837890625, 0.151214599609375, 0.1910858154296875, 0.23095703125, 0.2708282470703125, 0.310699462890625, 0.3505706787109375, 0.39044189453125, 0.4303131103515625, 0.470184326171875, 0.5100555419921875, 0.5499267578125, 0.5897979736328125, 0.629669189453125, 0.6695404052734375, 0.70941162109375, 0.7492828369140625, 0.789154052734375, 0.8290252685546875, 0.868896484375, 0.9087677001953125, 0.948638916015625, 0.9885101318359375, 1.02838134765625, 1.0682525634765625, 1.108123779296875, 1.1479949951171875, 1.1878662109375, 1.2277374267578125, 1.267608642578125, 1.3074798583984375, 1.34735107421875, 1.3872222900390625, 1.427093505859375, 1.4669647216796875, 1.5068359375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 10.0, 19.0, 27.0, 50.0, 43.0, 70.0, 99.0, 176.0, 271.0, 458.0, 715.0, 995.0, 1554.0, 2320.0, 3639.0, 5378.0, 8555.0, 13304.0, 21121.0, 34770.0, 58393.0, 104647.0, 209858.0, 257573.0, 137977.0, 72779.0, 42650.0, 25824.0, 15925.0, 10429.0, 6616.0, 4146.0, 2917.0, 1892.0, 1207.0, 726.0, 506.0, 325.0, 239.0, 138.0, 89.0, 37.0, 33.0, 18.0, 13.0, 13.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.09846782684326172, -0.09531211853027344, -0.09215641021728516, -0.08900070190429688, -0.0858449935913086, -0.08268928527832031, -0.07953357696533203, -0.07637786865234375, -0.07322216033935547, -0.07006645202636719, -0.0669107437133789, -0.06375503540039062, -0.060599327087402344, -0.05744361877441406, -0.05428791046142578, -0.0511322021484375, -0.04797649383544922, -0.04482078552246094, -0.041665077209472656, -0.038509368896484375, -0.035353660583496094, -0.03219795227050781, -0.02904224395751953, -0.02588653564453125, -0.02273082733154297, -0.019575119018554688, -0.016419410705566406, -0.013263702392578125, -0.010107994079589844, -0.0069522857666015625, -0.0037965774536132812, -0.000640869140625, 0.0025148391723632812, 0.0056705474853515625, 0.008826255798339844, 0.011981964111328125, 0.015137672424316406, 0.018293380737304688, 0.02144908905029297, 0.02460479736328125, 0.02776050567626953, 0.030916213989257812, 0.034071922302246094, 0.037227630615234375, 0.040383338928222656, 0.04353904724121094, 0.04669475555419922, 0.0498504638671875, 0.05300617218017578, 0.05616188049316406, 0.059317588806152344, 0.062473297119140625, 0.0656290054321289, 0.06878471374511719, 0.07194042205810547, 0.07509613037109375, 0.07825183868408203, 0.08140754699707031, 0.0845632553100586, 0.08771896362304688, 0.09087467193603516, 0.09403038024902344, 0.09718608856201172, 0.100341796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 18.0, 15.0, 20.0, 20.0, 23.0, 35.0, 25.0, 30.0, 35.0, 49.0, 38.0, 51.0, 49.0, 52.0, 1072.0, 43.0, 45.0, 36.0, 39.0, 28.0, 35.0, 28.0, 28.0, 33.0, 23.0, 19.0, 14.0, 16.0, 13.0, 13.0, 9.0, 11.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.681640625, -0.6547088623046875, -0.627777099609375, -0.6008453369140625, -0.57391357421875, -0.5469818115234375, -0.520050048828125, -0.4931182861328125, -0.4661865234375, -0.4392547607421875, -0.412322998046875, -0.3853912353515625, -0.35845947265625, -0.3315277099609375, -0.304595947265625, -0.2776641845703125, -0.250732421875, -0.2238006591796875, -0.196868896484375, -0.1699371337890625, -0.14300537109375, -0.1160736083984375, -0.089141845703125, -0.0622100830078125, -0.0352783203125, -0.0083465576171875, 0.018585205078125, 0.0455169677734375, 0.07244873046875, 0.0993804931640625, 0.126312255859375, 0.1532440185546875, 0.18017578125, 0.2071075439453125, 0.234039306640625, 0.2609710693359375, 0.28790283203125, 0.3148345947265625, 0.341766357421875, 0.3686981201171875, 0.3956298828125, 0.4225616455078125, 0.449493408203125, 0.4764251708984375, 0.50335693359375, 0.5302886962890625, 0.557220458984375, 0.5841522216796875, 0.611083984375, 0.6380157470703125, 0.664947509765625, 0.6918792724609375, 0.71881103515625, 0.7457427978515625, 0.772674560546875, 0.7996063232421875, 0.8265380859375, 0.8534698486328125, 0.880401611328125, 0.9073333740234375, 0.93426513671875, 0.9611968994140625, 0.988128662109375, 1.0150604248046875, 1.0419921875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 15.0, 13.0, 15.0, 14.0, 30.0, 46.0, 62.0, 57.0, 101.0, 159.0, 250.0, 347.0, 478.0, 739.0, 1103.0, 1745.0, 2671.0, 4288.0, 7049.0, 12890.0, 29694.0, 144124.0, 1739331.0, 97659.0, 25017.0, 11515.0, 6452.0, 3846.0, 2437.0, 1696.0, 1004.0, 693.0, 486.0, 333.0, 231.0, 151.0, 109.0, 87.0, 51.0, 41.0, 32.0, 12.0, 13.0, 19.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15134811401367188, -0.14620208740234375, -0.14105606079101562, -0.1359100341796875, -0.13076400756835938, -0.12561798095703125, -0.12047195434570312, -0.115325927734375, -0.11017990112304688, -0.10503387451171875, -0.09988784790039062, -0.0947418212890625, -0.08959579467773438, -0.08444976806640625, -0.07930374145507812, -0.07415771484375, -0.06901168823242188, -0.06386566162109375, -0.058719635009765625, -0.0535736083984375, -0.048427581787109375, -0.04328155517578125, -0.038135528564453125, -0.032989501953125, -0.027843475341796875, -0.02269744873046875, -0.017551422119140625, -0.0124053955078125, -0.007259368896484375, -0.00211334228515625, 0.003032684326171875, 0.0081787109375, 0.013324737548828125, 0.01847076416015625, 0.023616790771484375, 0.0287628173828125, 0.033908843994140625, 0.03905487060546875, 0.044200897216796875, 0.049346923828125, 0.054492950439453125, 0.05963897705078125, 0.06478500366210938, 0.0699310302734375, 0.07507705688476562, 0.08022308349609375, 0.08536911010742188, 0.09051513671875, 0.09566116333007812, 0.10080718994140625, 0.10595321655273438, 0.1110992431640625, 0.11624526977539062, 0.12139129638671875, 0.12653732299804688, 0.131683349609375, 0.13682937622070312, 0.14197540283203125, 0.14712142944335938, 0.1522674560546875, 0.15741348266601562, 0.16255950927734375, 0.16770553588867188, 0.1728515625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 8.0, 3.0, 11.0, 33.0, 19.0, 26.0, 39.0, 42.0, 58.0, 61.0, 73.0, 76.0, 62.0, 70.0, 59.0, 65.0, 62.0, 38.0, 25.0, 25.0, 12.0, 13.0, 12.0, 18.0, 13.0, 8.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008697509765625, -0.008447468280792236, -0.008197426795959473, -0.007947385311126709, -0.007697343826293945, -0.007447302341461182, -0.007197260856628418, -0.006947219371795654, -0.006697177886962891, -0.006447136402130127, -0.006197094917297363, -0.0059470534324646, -0.005697011947631836, -0.005446970462799072, -0.005196928977966309, -0.004946887493133545, -0.004696846008300781, -0.004446804523468018, -0.004196763038635254, -0.00394672155380249, -0.0036966800689697266, -0.003446638584136963, -0.0031965970993041992, -0.0029465556144714355, -0.002696514129638672, -0.002446472644805908, -0.0021964311599731445, -0.0019463896751403809, -0.0016963481903076172, -0.0014463067054748535, -0.0011962652206420898, -0.0009462237358093262, -0.0006961822509765625, -0.00044614076614379883, -0.00019609928131103516, 5.3942203521728516e-05, 0.0003039836883544922, 0.0005540251731872559, 0.0008040666580200195, 0.0010541081428527832, 0.0013041496276855469, 0.0015541911125183105, 0.0018042325973510742, 0.002054274082183838, 0.0023043155670166016, 0.0025543570518493652, 0.002804398536682129, 0.0030544400215148926, 0.0033044815063476562, 0.00355452299118042, 0.0038045644760131836, 0.004054605960845947, 0.004304647445678711, 0.004554688930511475, 0.004804730415344238, 0.005054771900177002, 0.005304813385009766, 0.005554854869842529, 0.005804896354675293, 0.006054937839508057, 0.00630497932434082, 0.006555020809173584, 0.006805062294006348, 0.007055103778839111, 0.007305145263671875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 7.0, 8.0, 17.0, 17.0, 19.0, 14.0, 31.0, 38.0, 51.0, 46.0, 56.0, 74.0, 126.0, 227.0, 353.0, 593.0, 1203.0, 43131.0, 991507.0, 8568.0, 943.0, 502.0, 296.0, 167.0, 125.0, 123.0, 67.0, 50.0, 37.0, 32.0, 17.0, 24.0, 17.0, 8.0, 11.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12368965148925781, -0.11932754516601562, -0.11496543884277344, -0.11060333251953125, -0.10624122619628906, -0.10187911987304688, -0.09751701354980469, -0.0931549072265625, -0.08879280090332031, -0.08443069458007812, -0.08006858825683594, -0.07570648193359375, -0.07134437561035156, -0.06698226928710938, -0.06262016296386719, -0.058258056640625, -0.05389595031738281, -0.049533843994140625, -0.04517173767089844, -0.04080963134765625, -0.03644752502441406, -0.032085418701171875, -0.027723312377929688, -0.0233612060546875, -0.018999099731445312, -0.014636993408203125, -0.010274887084960938, -0.00591278076171875, -0.0015506744384765625, 0.002811431884765625, 0.0071735382080078125, 0.01153564453125, 0.015897750854492188, 0.020259857177734375, 0.024621963500976562, 0.02898406982421875, 0.03334617614746094, 0.037708282470703125, 0.04207038879394531, 0.0464324951171875, 0.05079460144042969, 0.055156707763671875, 0.05951881408691406, 0.06388092041015625, 0.06824302673339844, 0.07260513305664062, 0.07696723937988281, 0.081329345703125, 0.08569145202636719, 0.09005355834960938, 0.09441566467285156, 0.09877777099609375, 0.10313987731933594, 0.10750198364257812, 0.11186408996582031, 0.1162261962890625, 0.12058830261230469, 0.12495040893554688, 0.12931251525878906, 0.13367462158203125, 0.13803672790527344, 0.14239883422851562, 0.1467609405517578, 0.151123046875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 27.0, 244.0, 627.0, 90.0, 20.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059488002210855484, -0.0571364089846611, -0.05478481575846672, -0.05243322253227234, -0.05008162930607796, -0.047730036079883575, -0.045378439128398895, -0.04302684962749481, -0.04067525267601013, -0.03832365944981575, -0.03597206622362137, -0.03362047299742699, -0.031268879771232605, -0.028917286545038223, -0.026565691456198692, -0.02421409823000431, -0.021862506866455078, -0.019510913640260696, -0.017159320414066315, -0.014807726256549358, -0.012456133030354977, -0.010104539804160595, -0.007752945646643639, -0.005401352420449257, -0.003049759194254875, -0.0006981657352298498, 0.0016534277237951756, 0.004005021415650845, 0.006356614641845226, 0.008708207868039608, 0.011059802025556564, 0.013411395251750946, 0.015762992203235626, 0.018114585429430008, 0.02046617865562439, 0.02281777188181877, 0.025169365108013153, 0.027520958334207535, 0.029872553423047066, 0.0322241485118866, 0.03457573801279068, 0.03692733123898506, 0.03927892446517944, 0.041630517691373825, 0.04398211091756821, 0.04633370414376259, 0.04868529736995697, 0.05103689432144165, 0.05338848754763603, 0.055740080773830414, 0.058091674000024796, 0.06044326722621918, 0.06279486417770386, 0.06514645367860794, 0.06749805063009262, 0.0698496401309967, 0.07220123708248138, 0.07455283403396606, 0.07690442353487015, 0.07925602048635483, 0.08160760998725891, 0.08395920693874359, 0.08631079643964767, 0.08866239339113235, 0.09101398289203644]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 6.0, 16.0, 13.0, 21.0, 30.0, 14.0, 35.0, 42.0, 45.0, 28.0, 49.0, 51.0, 42.0, 60.0, 52.0, 48.0, 50.0, 49.0, 36.0, 40.0, 33.0, 25.0, 32.0, 27.0, 19.0, 21.0, 22.0, 13.0, 19.0, 11.0, 5.0, 10.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008009612560272217, -0.007697757333517075, -0.007385902106761932, -0.00707404688000679, -0.006762191653251648, -0.006450336426496506, -0.0061384811997413635, -0.005826625972986221, -0.005514770746231079, -0.005202915519475937, -0.004891060292720795, -0.0045792050659656525, -0.00426734983921051, -0.003955494612455368, -0.003643639385700226, -0.0033317841589450836, -0.0030199289321899414, -0.002708073705434799, -0.002396218478679657, -0.0020843632519245148, -0.0017725080251693726, -0.0014606527984142303, -0.0011487975716590881, -0.0008369423449039459, -0.0005250871181488037, -0.0002132318913936615, 9.862333536148071e-05, 0.0004104785621166229, 0.0007223337888717651, 0.0010341890156269073, 0.0013460442423820496, 0.0016578994691371918, 0.001969754695892334, 0.002281609922647476, 0.0025934651494026184, 0.0029053203761577606, 0.003217175602912903, 0.003529030829668045, 0.0038408860564231873, 0.0041527412831783295, 0.004464596509933472, 0.004776451736688614, 0.005088306963443756, 0.005400162190198898, 0.0057120174169540405, 0.006023872643709183, 0.006335727870464325, 0.006647583097219467, 0.006959438323974609, 0.007271293550729752, 0.007583148777484894, 0.007895004004240036, 0.008206859230995178, 0.00851871445775032, 0.008830569684505463, 0.009142424911260605, 0.009454280138015747, 0.00976613536477089, 0.010077990591526031, 0.010389845818281174, 0.010701701045036316, 0.011013556271791458, 0.0113254114985466, 0.011637266725301743, 0.011949121952056885]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 12.0, 4.0, 8.0, 9.0, 11.0, 6.0, 14.0, 12.0, 19.0, 24.0, 27.0, 43.0, 27.0, 33.0, 32.0, 44.0, 37.0, 40.0, 45.0, 43.0, 56.0, 43.0, 44.0, 46.0, 37.0, 38.0, 35.0, 39.0, 22.0, 28.0, 27.0, 19.0, 9.0, 15.0, 11.0, 11.0, 8.0, 9.0, 4.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0050506591796875, -0.965179443359375, -0.9253082275390625, -0.88543701171875, -0.8455657958984375, -0.805694580078125, -0.7658233642578125, -0.7259521484375, -0.6860809326171875, -0.646209716796875, -0.6063385009765625, -0.56646728515625, -0.5265960693359375, -0.486724853515625, -0.4468536376953125, -0.406982421875, -0.3671112060546875, -0.327239990234375, -0.2873687744140625, -0.24749755859375, -0.2076263427734375, -0.167755126953125, -0.1278839111328125, -0.0880126953125, -0.0481414794921875, -0.008270263671875, 0.0316009521484375, 0.07147216796875, 0.1113433837890625, 0.151214599609375, 0.1910858154296875, 0.23095703125, 0.2708282470703125, 0.310699462890625, 0.3505706787109375, 0.39044189453125, 0.4303131103515625, 0.470184326171875, 0.5100555419921875, 0.5499267578125, 0.5897979736328125, 0.629669189453125, 0.6695404052734375, 0.70941162109375, 0.7492828369140625, 0.789154052734375, 0.8290252685546875, 0.868896484375, 0.9087677001953125, 0.948638916015625, 0.9885101318359375, 1.02838134765625, 1.0682525634765625, 1.108123779296875, 1.1479949951171875, 1.1878662109375, 1.2277374267578125, 1.267608642578125, 1.3074798583984375, 1.34735107421875, 1.3872222900390625, 1.427093505859375, 1.4669647216796875, 1.5068359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 4.0, 16.0, 23.0, 26.0, 43.0, 41.0, 53.0, 82.0, 105.0, 139.0, 185.0, 271.0, 402.0, 492.0, 746.0, 1146.0, 1919.0, 3526.0, 7648.0, 19278.0, 64403.0, 323602.0, 486632.0, 91752.0, 25728.0, 9530.0, 4367.0, 2291.0, 1308.0, 813.0, 558.0, 371.0, 263.0, 204.0, 131.0, 135.0, 82.0, 72.0, 46.0, 33.0, 25.0, 21.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.30828857421875, -1.2562255859375, -1.20416259765625, -1.152099609375, -1.10003662109375, -1.0479736328125, -0.99591064453125, -0.94384765625, -0.89178466796875, -0.8397216796875, -0.78765869140625, -0.735595703125, -0.68353271484375, -0.6314697265625, -0.57940673828125, -0.52734375, -0.47528076171875, -0.4232177734375, -0.37115478515625, -0.319091796875, -0.26702880859375, -0.2149658203125, -0.16290283203125, -0.11083984375, -0.05877685546875, -0.0067138671875, 0.04534912109375, 0.097412109375, 0.14947509765625, 0.2015380859375, 0.25360107421875, 0.3056640625, 0.35772705078125, 0.4097900390625, 0.46185302734375, 0.513916015625, 0.56597900390625, 0.6180419921875, 0.67010498046875, 0.72216796875, 0.77423095703125, 0.8262939453125, 0.87835693359375, 0.930419921875, 0.98248291015625, 1.0345458984375, 1.08660888671875, 1.138671875, 1.19073486328125, 1.2427978515625, 1.29486083984375, 1.346923828125, 1.39898681640625, 1.4510498046875, 1.50311279296875, 1.55517578125, 1.60723876953125, 1.6593017578125, 1.71136474609375, 1.763427734375, 1.81549072265625, 1.8675537109375, 1.91961669921875, 1.9716796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 2.0, 12.0, 9.0, 11.0, 16.0, 12.0, 23.0, 24.0, 35.0, 28.0, 40.0, 44.0, 74.0, 120.0, 246.0, 1478.0, 291.0, 152.0, 93.0, 42.0, 59.0, 41.0, 34.0, 26.0, 25.0, 24.0, 17.0, 16.0, 11.0, 9.0, 10.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.46875, -3.362548828125, -3.25634765625, -3.150146484375, -3.0439453125, -2.937744140625, -2.83154296875, -2.725341796875, -2.619140625, -2.512939453125, -2.40673828125, -2.300537109375, -2.1943359375, -2.088134765625, -1.98193359375, -1.875732421875, -1.76953125, -1.663330078125, -1.55712890625, -1.450927734375, -1.3447265625, -1.238525390625, -1.13232421875, -1.026123046875, -0.919921875, -0.813720703125, -0.70751953125, -0.601318359375, -0.4951171875, -0.388916015625, -0.28271484375, -0.176513671875, -0.0703125, 0.035888671875, 0.14208984375, 0.248291015625, 0.3544921875, 0.460693359375, 0.56689453125, 0.673095703125, 0.779296875, 0.885498046875, 0.99169921875, 1.097900390625, 1.2041015625, 1.310302734375, 1.41650390625, 1.522705078125, 1.62890625, 1.735107421875, 1.84130859375, 1.947509765625, 2.0537109375, 2.159912109375, 2.26611328125, 2.372314453125, 2.478515625, 2.584716796875, 2.69091796875, 2.797119140625, 2.9033203125, 3.009521484375, 3.11572265625, 3.221923828125, 3.328125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 5.0, 3.0, 7.0, 8.0, 14.0, 10.0, 18.0, 33.0, 36.0, 44.0, 52.0, 92.0, 141.0, 228.0, 357.0, 654.0, 1669.0, 7275.0, 1286083.0, 1837764.0, 7903.0, 1689.0, 653.0, 346.0, 191.0, 123.0, 91.0, 52.0, 41.0, 24.0, 20.0, 21.0, 13.0, 15.0, 10.0, 11.0, 2.0, 6.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.3409423828125, -6.154541015625, -5.9681396484375, -5.78173828125, -5.5953369140625, -5.408935546875, -5.2225341796875, -5.0361328125, -4.8497314453125, -4.663330078125, -4.4769287109375, -4.29052734375, -4.1041259765625, -3.917724609375, -3.7313232421875, -3.544921875, -3.3585205078125, -3.172119140625, -2.9857177734375, -2.79931640625, -2.6129150390625, -2.426513671875, -2.2401123046875, -2.0537109375, -1.8673095703125, -1.680908203125, -1.4945068359375, -1.30810546875, -1.1217041015625, -0.935302734375, -0.7489013671875, -0.5625, -0.3760986328125, -0.189697265625, -0.0032958984375, 0.18310546875, 0.3695068359375, 0.555908203125, 0.7423095703125, 0.9287109375, 1.1151123046875, 1.301513671875, 1.4879150390625, 1.67431640625, 1.8607177734375, 2.047119140625, 2.2335205078125, 2.419921875, 2.6063232421875, 2.792724609375, 2.9791259765625, 3.16552734375, 3.3519287109375, 3.538330078125, 3.7247314453125, 3.9111328125, 4.0975341796875, 4.283935546875, 4.4703369140625, 4.65673828125, 4.8431396484375, 5.029541015625, 5.2159423828125, 5.40234375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 61.0, 339.0, 506.0, 86.0, 16.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.33470916748047, -25.090354919433594, -23.84600257873535, -22.601648330688477, -21.357295989990234, -20.11294174194336, -18.868587493896484, -17.62423324584961, -16.379880905151367, -15.135527610778809, -13.89117431640625, -12.646820068359375, -11.402466773986816, -10.158113479614258, -8.913759231567383, -7.669405937194824, -6.425052642822266, -5.180699348449707, -3.9363455772399902, -2.6919920444488525, -1.4476385116577148, -0.20328521728515625, 1.0410685539245605, 2.2854223251342773, 3.529775619506836, 4.7741289138793945, 6.018482685089111, 7.262836456298828, 8.507189750671387, 9.751543045043945, 10.99589729309082, 12.240250587463379, 13.484603881835938, 14.728957176208496, 15.973310470581055, 17.21766471862793, 18.462017059326172, 19.706371307373047, 20.950725555419922, 22.195079803466797, 23.43943214416504, 24.683786392211914, 25.928138732910156, 27.17249298095703, 28.416847229003906, 29.66119956970215, 30.905553817749023, 32.149906158447266, 33.39426040649414, 34.638614654541016, 35.88296890258789, 37.1273193359375, 38.371673583984375, 39.61602783203125, 40.860382080078125, 42.104736328125, 43.349090576171875, 44.59344482421875, 45.837799072265625, 47.082149505615234, 48.32650375366211, 49.570858001708984, 50.81521224975586, 52.059566497802734, 53.303916931152344]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 12.0, 17.0, 16.0, 19.0, 21.0, 18.0, 27.0, 36.0, 24.0, 38.0, 42.0, 42.0, 34.0, 40.0, 38.0, 38.0, 40.0, 48.0, 49.0, 34.0, 37.0, 38.0, 29.0, 32.0, 33.0, 32.0, 22.0, 21.0, 18.0, 15.0, 19.0, 11.0, 5.0, 8.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.742064476013184, -5.535009860992432, -5.32795524597168, -5.120900630950928, -4.913846015930176, -4.706790924072266, -4.499736309051514, -4.292681694030762, -4.08562707901001, -3.878572463989258, -3.671517848968506, -3.464462995529175, -3.257408380508423, -3.050353765487671, -2.84329891204834, -2.636244297027588, -2.429189682006836, -2.222135066986084, -2.015080451965332, -1.808025598526001, -1.600970983505249, -1.393916368484497, -1.1868616342544556, -0.9798069000244141, -0.7727522850036621, -0.5656976103782654, -0.35864293575286865, -0.15158826112747192, 0.055466413497924805, 0.26252102851867676, 0.46957576274871826, 0.6766304969787598, 0.8836846351623535, 1.0907392501831055, 1.297793984413147, 1.5048487186431885, 1.7119033336639404, 1.9189579486846924, 2.1260128021240234, 2.3330674171447754, 2.5401220321655273, 2.7471766471862793, 2.9542312622070312, 3.1612861156463623, 3.3683407306671143, 3.575395345687866, 3.7824501991271973, 3.989504814147949, 4.196559429168701, 4.403614044189453, 4.610668659210205, 4.817723274230957, 5.024778366088867, 5.231832504272461, 5.438887596130371, 5.645942211151123, 5.852996826171875, 6.060051441192627, 6.267106056213379, 6.474160671234131, 6.681215286254883, 6.888270378112793, 7.095324993133545, 7.302379608154297, 7.509434223175049]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 4.0, 8.0, 12.0, 7.0, 13.0, 15.0, 20.0, 23.0, 28.0, 30.0, 27.0, 40.0, 42.0, 35.0, 40.0, 50.0, 56.0, 40.0, 41.0, 57.0, 53.0, 42.0, 32.0, 32.0, 32.0, 30.0, 35.0, 30.0, 27.0, 15.0, 14.0, 11.0, 10.0, 6.0, 9.0, 6.0, 11.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2308197021484375, -1.185272216796875, -1.1397247314453125, -1.09417724609375, -1.0486297607421875, -1.003082275390625, -0.9575347900390625, -0.9119873046875, -0.8664398193359375, -0.820892333984375, -0.7753448486328125, -0.72979736328125, -0.6842498779296875, -0.638702392578125, -0.5931549072265625, -0.547607421875, -0.5020599365234375, -0.456512451171875, -0.4109649658203125, -0.36541748046875, -0.3198699951171875, -0.274322509765625, -0.2287750244140625, -0.1832275390625, -0.1376800537109375, -0.092132568359375, -0.0465850830078125, -0.00103759765625, 0.0445098876953125, 0.090057373046875, 0.1356048583984375, 0.18115234375, 0.2266998291015625, 0.272247314453125, 0.3177947998046875, 0.36334228515625, 0.4088897705078125, 0.454437255859375, 0.4999847412109375, 0.5455322265625, 0.5910797119140625, 0.636627197265625, 0.6821746826171875, 0.72772216796875, 0.7732696533203125, 0.818817138671875, 0.8643646240234375, 0.909912109375, 0.9554595947265625, 1.001007080078125, 1.0465545654296875, 1.09210205078125, 1.1376495361328125, 1.183197021484375, 1.2287445068359375, 1.2742919921875, 1.3198394775390625, 1.365386962890625, 1.4109344482421875, 1.45648193359375, 1.5020294189453125, 1.547576904296875, 1.5931243896484375, 1.638671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 13.0, 9.0, 11.0, 10.0, 17.0, 30.0, 32.0, 50.0, 66.0, 97.0, 132.0, 199.0, 270.0, 463.0, 744.0, 1172.0, 1970.0, 3462.0, 7797.0, 36322.0, 2588616.0, 1511160.0, 26879.0, 7054.0, 3139.0, 1679.0, 1017.0, 624.0, 389.0, 248.0, 169.0, 138.0, 87.0, 68.0, 29.0, 29.0, 28.0, 23.0, 11.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.72113037109375, -5.5086669921875, -5.29620361328125, -5.083740234375, -4.87127685546875, -4.6588134765625, -4.44635009765625, -4.23388671875, -4.02142333984375, -3.8089599609375, -3.59649658203125, -3.384033203125, -3.17156982421875, -2.9591064453125, -2.74664306640625, -2.5341796875, -2.32171630859375, -2.1092529296875, -1.89678955078125, -1.684326171875, -1.47186279296875, -1.2593994140625, -1.04693603515625, -0.83447265625, -0.62200927734375, -0.4095458984375, -0.19708251953125, 0.015380859375, 0.22784423828125, 0.4403076171875, 0.65277099609375, 0.865234375, 1.07769775390625, 1.2901611328125, 1.50262451171875, 1.715087890625, 1.92755126953125, 2.1400146484375, 2.35247802734375, 2.56494140625, 2.77740478515625, 2.9898681640625, 3.20233154296875, 3.414794921875, 3.62725830078125, 3.8397216796875, 4.05218505859375, 4.2646484375, 4.47711181640625, 4.6895751953125, 4.90203857421875, 5.114501953125, 5.32696533203125, 5.5394287109375, 5.75189208984375, 5.96435546875, 6.17681884765625, 6.3892822265625, 6.60174560546875, 6.814208984375, 7.02667236328125, 7.2391357421875, 7.45159912109375, 7.6640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 14.0, 29.0, 42.0, 63.0, 105.0, 153.0, 231.0, 371.0, 520.0, 701.0, 595.0, 426.0, 281.0, 192.0, 114.0, 73.0, 44.0, 29.0, 23.0, 6.0, 12.0, 8.0, 5.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.9814453125, -1.904296875, -1.8271484375, -1.75, -1.6728515625, -1.595703125, -1.5185546875, -1.44140625, -1.3642578125, -1.287109375, -1.2099609375, -1.1328125, -1.0556640625, -0.978515625, -0.9013671875, -0.82421875, -0.7470703125, -0.669921875, -0.5927734375, -0.515625, -0.4384765625, -0.361328125, -0.2841796875, -0.20703125, -0.1298828125, -0.052734375, 0.0244140625, 0.1015625, 0.1787109375, 0.255859375, 0.3330078125, 0.41015625, 0.4873046875, 0.564453125, 0.6416015625, 0.71875, 0.7958984375, 0.873046875, 0.9501953125, 1.02734375, 1.1044921875, 1.181640625, 1.2587890625, 1.3359375, 1.4130859375, 1.490234375, 1.5673828125, 1.64453125, 1.7216796875, 1.798828125, 1.8759765625, 1.953125, 2.0302734375, 2.107421875, 2.1845703125, 2.26171875, 2.3388671875, 2.416015625, 2.4931640625, 2.5703125, 2.6474609375, 2.724609375, 2.8017578125, 2.87890625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 10.0, 18.0, 23.0, 49.0, 75.0, 157.0, 315.0, 616.0, 1324.0, 3205.0, 11865.0, 96865.0, 2642497.0, 1367936.0, 56053.0, 8421.0, 2680.0, 1057.0, 536.0, 276.0, 142.0, 67.0, 33.0, 15.0, 14.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.05859375, -3.9388427734375, -3.819091796875, -3.6993408203125, -3.57958984375, -3.4598388671875, -3.340087890625, -3.2203369140625, -3.1005859375, -2.9808349609375, -2.861083984375, -2.7413330078125, -2.62158203125, -2.5018310546875, -2.382080078125, -2.2623291015625, -2.142578125, -2.0228271484375, -1.903076171875, -1.7833251953125, -1.66357421875, -1.5438232421875, -1.424072265625, -1.3043212890625, -1.1845703125, -1.0648193359375, -0.945068359375, -0.8253173828125, -0.70556640625, -0.5858154296875, -0.466064453125, -0.3463134765625, -0.2265625, -0.1068115234375, 0.012939453125, 0.1326904296875, 0.25244140625, 0.3721923828125, 0.491943359375, 0.6116943359375, 0.7314453125, 0.8511962890625, 0.970947265625, 1.0906982421875, 1.21044921875, 1.3302001953125, 1.449951171875, 1.5697021484375, 1.689453125, 1.8092041015625, 1.928955078125, 2.0487060546875, 2.16845703125, 2.2882080078125, 2.407958984375, 2.5277099609375, 2.6474609375, 2.7672119140625, 2.886962890625, 3.0067138671875, 3.12646484375, 3.2462158203125, 3.365966796875, 3.4857177734375, 3.60546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 11.0, 14.0, 18.0, 15.0, 20.0, 19.0, 35.0, 36.0, 37.0, 49.0, 50.0, 41.0, 66.0, 57.0, 59.0, 57.0, 47.0, 57.0, 37.0, 38.0, 23.0, 34.0, 35.0, 20.0, 25.0, 19.0, 5.0, 9.0, 8.0, 7.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.285243511199951, -7.0404839515686035, -6.795724868774414, -6.550965309143066, -6.306205749511719, -6.061446189880371, -5.816686630249023, -5.571927547454834, -5.327167987823486, -5.082408428192139, -4.837649345397949, -4.592889785766602, -4.348130226135254, -4.103370666503906, -3.8586113452911377, -3.613852024078369, -3.3690924644470215, -3.124332904815674, -2.8795735836029053, -2.6348142623901367, -2.390054702758789, -2.1452951431274414, -1.9005358219146729, -1.6557763814926147, -1.4110169410705566, -1.1662575006484985, -0.9214980602264404, -0.6767386198043823, -0.4319791793823242, -0.1872197389602661, 0.05753970146179199, 0.3022991418838501, 0.5470590591430664, 0.7918184995651245, 1.0365779399871826, 1.2813373804092407, 1.5260968208312988, 1.770856261253357, 2.015615701675415, 2.2603750228881836, 2.5051345825195312, 2.749894142150879, 2.9946534633636475, 3.239412784576416, 3.4841723442077637, 3.7289319038391113, 3.97369122505188, 4.218450546264648, 4.463210105895996, 4.707969665527344, 4.952729225158691, 5.197488307952881, 5.4422478675842285, 5.687007427215576, 5.931766510009766, 6.176526069641113, 6.421285629272461, 6.666045188903809, 6.910804748535156, 7.155563831329346, 7.400323390960693, 7.645082950592041, 7.8898420333862305, 8.134601593017578, 8.379361152648926]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 7.0, 8.0, 17.0, 10.0, 19.0, 26.0, 30.0, 22.0, 24.0, 35.0, 35.0, 25.0, 43.0, 34.0, 33.0, 27.0, 35.0, 40.0, 34.0, 39.0, 46.0, 45.0, 26.0, 39.0, 24.0, 32.0, 19.0, 25.0, 13.0, 28.0, 16.0, 24.0, 8.0, 4.0, 15.0, 10.0, 12.0, 8.0, 9.0, 3.0, 6.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-6.252314567565918, -6.062999725341797, -5.873684883117676, -5.684370040893555, -5.495055675506592, -5.305740833282471, -5.11642599105835, -4.9271111488342285, -4.737796783447266, -4.5484819412231445, -4.359167098999023, -4.169852256774902, -3.9805378913879395, -3.7912230491638184, -3.6019082069396973, -3.412593364715576, -3.223278522491455, -3.033963680267334, -2.844649076461792, -2.655334234237671, -2.466019630432129, -2.276704788208008, -2.0873899459838867, -1.8980752229690552, -1.7087604999542236, -1.519445776939392, -1.3301310539245605, -1.1408162117004395, -0.9515014886856079, -0.7621867656707764, -0.5728719234466553, -0.38355720043182373, -0.19424200057983398, -0.004927247762680054, 0.18438750505447388, 0.3737022876739502, 0.5630170106887817, 0.7523317337036133, 0.9416465759277344, 1.130961298942566, 1.3202760219573975, 1.509590744972229, 1.6989054679870605, 1.8882203102111816, 2.0775351524353027, 2.2668497562408447, 2.456164598464966, 2.645479202270508, 2.834794044494629, 3.02410888671875, 3.213423490524292, 3.402738332748413, 3.592052936553955, 3.781367778778076, 3.9706826210021973, 4.159997463226318, 4.349311828613281, 4.538626670837402, 4.727941513061523, 4.9172563552856445, 5.106570720672607, 5.2958855628967285, 5.48520040512085, 5.674515247344971, 5.863830089569092]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 7.0, 4.0, 7.0, 9.0, 11.0, 16.0, 14.0, 19.0, 15.0, 17.0, 28.0, 30.0, 38.0, 29.0, 26.0, 36.0, 37.0, 33.0, 36.0, 44.0, 38.0, 56.0, 36.0, 45.0, 35.0, 35.0, 36.0, 33.0, 36.0, 17.0, 26.0, 14.0, 22.0, 10.0, 14.0, 19.0, 11.0, 13.0, 10.0, 7.0, 7.0, 4.0, 3.0, 5.0, 5.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-14.6328125, -14.1890869140625, -13.745361328125, -13.3016357421875, -12.85791015625, -12.4141845703125, -11.970458984375, -11.5267333984375, -11.0830078125, -10.6392822265625, -10.195556640625, -9.7518310546875, -9.30810546875, -8.8643798828125, -8.420654296875, -7.9769287109375, -7.533203125, -7.0894775390625, -6.645751953125, -6.2020263671875, -5.75830078125, -5.3145751953125, -4.870849609375, -4.4271240234375, -3.9833984375, -3.5396728515625, -3.095947265625, -2.6522216796875, -2.20849609375, -1.7647705078125, -1.321044921875, -0.8773193359375, -0.43359375, 0.0101318359375, 0.453857421875, 0.8975830078125, 1.34130859375, 1.7850341796875, 2.228759765625, 2.6724853515625, 3.1162109375, 3.5599365234375, 4.003662109375, 4.4473876953125, 4.89111328125, 5.3348388671875, 5.778564453125, 6.2222900390625, 6.666015625, 7.1097412109375, 7.553466796875, 7.9971923828125, 8.44091796875, 8.8846435546875, 9.328369140625, 9.7720947265625, 10.2158203125, 10.6595458984375, 11.103271484375, 11.5469970703125, 11.99072265625, 12.4344482421875, 12.878173828125, 13.3218994140625, 13.765625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 12.0, 10.0, 26.0, 27.0, 50.0, 76.0, 104.0, 158.0, 234.0, 304.0, 463.0, 649.0, 915.0, 1363.0, 2034.0, 2994.0, 4537.0, 6704.0, 10108.0, 15658.0, 24967.0, 41321.0, 70473.0, 122831.0, 196888.0, 207911.0, 136353.0, 77970.0, 45447.0, 27656.0, 17244.0, 11159.0, 7100.0, 4683.0, 3216.0, 2194.0, 1497.0, 1025.0, 670.0, 440.0, 344.0, 232.0, 143.0, 113.0, 83.0, 56.0, 37.0, 31.0, 21.0, 8.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5629501342773438, -0.5448455810546875, -0.5267410278320312, -0.508636474609375, -0.49053192138671875, -0.4724273681640625, -0.45432281494140625, -0.43621826171875, -0.41811370849609375, -0.4000091552734375, -0.38190460205078125, -0.363800048828125, -0.34569549560546875, -0.3275909423828125, -0.30948638916015625, -0.2913818359375, -0.27327728271484375, -0.2551727294921875, -0.23706817626953125, -0.218963623046875, -0.20085906982421875, -0.1827545166015625, -0.16464996337890625, -0.14654541015625, -0.12844085693359375, -0.1103363037109375, -0.09223175048828125, -0.074127197265625, -0.05602264404296875, -0.0379180908203125, -0.01981353759765625, -0.001708984375, 0.01639556884765625, 0.0345001220703125, 0.05260467529296875, 0.070709228515625, 0.08881378173828125, 0.1069183349609375, 0.12502288818359375, 0.14312744140625, 0.16123199462890625, 0.1793365478515625, 0.19744110107421875, 0.215545654296875, 0.23365020751953125, 0.2517547607421875, 0.26985931396484375, 0.2879638671875, 0.30606842041015625, 0.3241729736328125, 0.34227752685546875, 0.360382080078125, 0.37848663330078125, 0.3965911865234375, 0.41469573974609375, 0.43280029296875, 0.45090484619140625, 0.4690093994140625, 0.48711395263671875, 0.505218505859375, 0.5233230590820312, 0.5414276123046875, 0.5595321655273438, 0.57763671875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 9.0, 6.0, 12.0, 7.0, 12.0, 18.0, 20.0, 17.0, 21.0, 17.0, 19.0, 21.0, 28.0, 28.0, 31.0, 33.0, 44.0, 37.0, 31.0, 49.0, 1065.0, 39.0, 26.0, 48.0, 29.0, 38.0, 37.0, 34.0, 30.0, 28.0, 24.0, 32.0, 17.0, 17.0, 10.0, 10.0, 12.0, 14.0, 14.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.296875, -9.0224609375, -8.748046875, -8.4736328125, -8.19921875, -7.9248046875, -7.650390625, -7.3759765625, -7.1015625, -6.8271484375, -6.552734375, -6.2783203125, -6.00390625, -5.7294921875, -5.455078125, -5.1806640625, -4.90625, -4.6318359375, -4.357421875, -4.0830078125, -3.80859375, -3.5341796875, -3.259765625, -2.9853515625, -2.7109375, -2.4365234375, -2.162109375, -1.8876953125, -1.61328125, -1.3388671875, -1.064453125, -0.7900390625, -0.515625, -0.2412109375, 0.033203125, 0.3076171875, 0.58203125, 0.8564453125, 1.130859375, 1.4052734375, 1.6796875, 1.9541015625, 2.228515625, 2.5029296875, 2.77734375, 3.0517578125, 3.326171875, 3.6005859375, 3.875, 4.1494140625, 4.423828125, 4.6982421875, 4.97265625, 5.2470703125, 5.521484375, 5.7958984375, 6.0703125, 6.3447265625, 6.619140625, 6.8935546875, 7.16796875, 7.4423828125, 7.716796875, 7.9912109375, 8.265625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 8.0, 5.0, 12.0, 18.0, 24.0, 23.0, 41.0, 47.0, 79.0, 99.0, 146.0, 188.0, 261.0, 347.0, 551.0, 776.0, 1036.0, 1513.0, 2233.0, 3355.0, 5261.0, 8657.0, 16106.0, 37689.0, 181983.0, 1656953.0, 113762.0, 29852.0, 13843.0, 7779.0, 4766.0, 2992.0, 2060.0, 1392.0, 962.0, 645.0, 432.0, 326.0, 225.0, 213.0, 122.0, 95.0, 63.0, 54.0, 37.0, 27.0, 14.0, 10.0, 16.0, 2.0, 5.0, 3.0, 7.0, 5.0, 3.0, 1.0], "bins": [-1.3486328125, -1.3082427978515625, -1.267852783203125, -1.2274627685546875, -1.18707275390625, -1.1466827392578125, -1.106292724609375, -1.0659027099609375, -1.0255126953125, -0.9851226806640625, -0.944732666015625, -0.9043426513671875, -0.86395263671875, -0.8235626220703125, -0.783172607421875, -0.7427825927734375, -0.702392578125, -0.6620025634765625, -0.621612548828125, -0.5812225341796875, -0.54083251953125, -0.5004425048828125, -0.460052490234375, -0.4196624755859375, -0.3792724609375, -0.3388824462890625, -0.298492431640625, -0.2581024169921875, -0.21771240234375, -0.1773223876953125, -0.136932373046875, -0.0965423583984375, -0.05615234375, -0.0157623291015625, 0.024627685546875, 0.0650177001953125, 0.10540771484375, 0.1457977294921875, 0.186187744140625, 0.2265777587890625, 0.2669677734375, 0.3073577880859375, 0.347747802734375, 0.3881378173828125, 0.42852783203125, 0.4689178466796875, 0.509307861328125, 0.5496978759765625, 0.590087890625, 0.6304779052734375, 0.670867919921875, 0.7112579345703125, 0.75164794921875, 0.7920379638671875, 0.832427978515625, 0.8728179931640625, 0.9132080078125, 0.9535980224609375, 0.993988037109375, 1.0343780517578125, 1.07476806640625, 1.1151580810546875, 1.155548095703125, 1.1959381103515625, 1.236328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 12.0, 2.0, 10.0, 12.0, 11.0, 16.0, 16.0, 17.0, 24.0, 24.0, 37.0, 39.0, 54.0, 57.0, 58.0, 59.0, 81.0, 64.0, 53.0, 35.0, 47.0, 48.0, 38.0, 31.0, 32.0, 30.0, 16.0, 9.0, 23.0, 7.0, 9.0, 3.0, 8.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039764404296875, -0.0384368896484375, -0.037109375, -0.0357818603515625, -0.034454345703125, -0.0331268310546875, -0.03179931640625, -0.0304718017578125, -0.029144287109375, -0.0278167724609375, -0.0264892578125, -0.0251617431640625, -0.023834228515625, -0.0225067138671875, -0.02117919921875, -0.0198516845703125, -0.018524169921875, -0.0171966552734375, -0.015869140625, -0.0145416259765625, -0.013214111328125, -0.0118865966796875, -0.01055908203125, -0.0092315673828125, -0.007904052734375, -0.0065765380859375, -0.0052490234375, -0.0039215087890625, -0.002593994140625, -0.0012664794921875, 6.103515625e-05, 0.0013885498046875, 0.002716064453125, 0.0040435791015625, 0.00537109375, 0.0066986083984375, 0.008026123046875, 0.0093536376953125, 0.01068115234375, 0.0120086669921875, 0.013336181640625, 0.0146636962890625, 0.0159912109375, 0.0173187255859375, 0.018646240234375, 0.0199737548828125, 0.02130126953125, 0.0226287841796875, 0.023956298828125, 0.0252838134765625, 0.026611328125, 0.0279388427734375, 0.029266357421875, 0.0305938720703125, 0.03192138671875, 0.0332489013671875, 0.034576416015625, 0.0359039306640625, 0.0372314453125, 0.0385589599609375, 0.039886474609375, 0.0412139892578125, 0.04254150390625, 0.0438690185546875, 0.045196533203125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 11.0, 7.0, 21.0, 21.0, 45.0, 49.0, 80.0, 124.0, 214.0, 317.0, 520.0, 1008.0, 1835.0, 3610.0, 7792.0, 19784.0, 54055.0, 157055.0, 347495.0, 283407.0, 107701.0, 37179.0, 13911.0, 5937.0, 2930.0, 1438.0, 779.0, 459.0, 249.0, 174.0, 113.0, 71.0, 47.0, 29.0, 25.0, 17.0, 11.0, 11.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2078857421875, -0.20191574096679688, -0.19594573974609375, -0.18997573852539062, -0.1840057373046875, -0.17803573608398438, -0.17206573486328125, -0.16609573364257812, -0.160125732421875, -0.15415573120117188, -0.14818572998046875, -0.14221572875976562, -0.1362457275390625, -0.13027572631835938, -0.12430572509765625, -0.11833572387695312, -0.11236572265625, -0.10639572143554688, -0.10042572021484375, -0.09445571899414062, -0.0884857177734375, -0.08251571655273438, -0.07654571533203125, -0.07057571411132812, -0.064605712890625, -0.058635711669921875, -0.05266571044921875, -0.046695709228515625, -0.0407257080078125, -0.034755706787109375, -0.02878570556640625, -0.022815704345703125, -0.016845703125, -0.010875701904296875, -0.00490570068359375, 0.001064300537109375, 0.0070343017578125, 0.013004302978515625, 0.01897430419921875, 0.024944305419921875, 0.030914306640625, 0.036884307861328125, 0.04285430908203125, 0.048824310302734375, 0.0547943115234375, 0.060764312744140625, 0.06673431396484375, 0.07270431518554688, 0.07867431640625, 0.08464431762695312, 0.09061431884765625, 0.09658432006835938, 0.1025543212890625, 0.10852432250976562, 0.11449432373046875, 0.12046432495117188, 0.126434326171875, 0.13240432739257812, 0.13837432861328125, 0.14434432983398438, 0.1503143310546875, 0.15628433227539062, 0.16225433349609375, 0.16822433471679688, 0.1741943359375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 24.0, 27.0, 29.0, 52.0, 69.0, 123.0, 114.0, 140.0, 88.0, 101.0, 61.0, 49.0, 31.0, 23.0, 19.0, 11.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04608623683452606, -0.04316399618983269, -0.04024175554513931, -0.03731951117515564, -0.034397274255752563, -0.03147502988576889, -0.028552789241075516, -0.02563054859638214, -0.022708307951688766, -0.019786067306995392, -0.016863826662302017, -0.013941584154963493, -0.011019343510270119, -0.008097102865576744, -0.00517486035823822, -0.0022526197135448456, 0.000669620931148529, 0.003591862041503191, 0.006514103151857853, 0.009436344727873802, 0.012358585372567177, 0.015280826017260551, 0.018203068524599075, 0.02112530916929245, 0.024047549813985825, 0.0269697904586792, 0.029892031103372574, 0.03281427174806595, 0.03573651611804962, 0.0386587530374527, 0.04158099740743637, 0.044503238052129745, 0.04742547869682312, 0.050347719341516495, 0.05326995998620987, 0.05619220435619354, 0.05911444127559662, 0.06203668564558029, 0.06495893001556396, 0.06788116693496704, 0.07080340385437012, 0.07372564822435379, 0.07664788514375687, 0.07957012951374054, 0.08249236643314362, 0.08541461080312729, 0.08833685517311096, 0.09125909209251404, 0.09418133646249771, 0.09710358083248138, 0.10002581775188446, 0.10294806212186813, 0.10587029904127121, 0.10879254341125488, 0.11171478033065796, 0.11463702470064163, 0.1175592690706253, 0.12048151344060898, 0.12340375036001205, 0.12632599472999573, 0.1292482316493988, 0.13217046856880188, 0.13509272038936615, 0.13801495730876923, 0.1409371942281723]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 1.0, 7.0, 12.0, 13.0, 18.0, 20.0, 22.0, 20.0, 37.0, 34.0, 15.0, 37.0, 30.0, 40.0, 33.0, 30.0, 40.0, 44.0, 42.0, 43.0, 40.0, 38.0, 41.0, 37.0, 34.0, 35.0, 26.0, 34.0, 18.0, 25.0, 17.0, 10.0, 16.0, 10.0, 11.0, 10.0, 5.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.04232919216156006, -0.04095478728413582, -0.03958038240671158, -0.03820597380399704, -0.0368315689265728, -0.03545716404914856, -0.03408275544643402, -0.03270835056900978, -0.03133394569158554, -0.0299595408141613, -0.02858513407409191, -0.027210727334022522, -0.025836322456598282, -0.024461917579174042, -0.023087510839104652, -0.021713104099035263, -0.020338699221611023, -0.018964294344186783, -0.017589887604117393, -0.016215480864048004, -0.014841075986623764, -0.01346667017787695, -0.012092264369130135, -0.01071785856038332, -0.009343452751636505, -0.00796904694288969, -0.006594641134142876, -0.005220235325396061, -0.003845829516649246, -0.0024714237079024315, -0.0010970178991556168, 0.00027738790959119797, 0.0016517937183380127, 0.0030261995270848274, 0.004400605335831642, 0.005775011144578457, 0.007149416953325272, 0.008523822762072086, 0.009898228570818901, 0.011272634379565716, 0.01264704018831253, 0.014021445997059345, 0.01539585180580616, 0.01677025854587555, 0.01814466342329979, 0.01951906830072403, 0.02089347504079342, 0.022267881780862808, 0.02364228665828705, 0.02501669153571129, 0.026391098275780678, 0.027765505015850067, 0.029139909893274307, 0.030514314770698547, 0.031888723373413086, 0.033263128250837326, 0.034637533128261566, 0.036011938005685806, 0.037386342883110046, 0.038760751485824585, 0.040135156363248825, 0.041509561240673065, 0.042883969843387604, 0.044258374720811844, 0.045632779598236084]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 13.0, 15.0, 16.0, 16.0, 18.0, 19.0, 29.0, 34.0, 33.0, 26.0, 27.0, 34.0, 33.0, 39.0, 40.0, 40.0, 41.0, 50.0, 39.0, 40.0, 37.0, 38.0, 31.0, 37.0, 32.0, 18.0, 24.0, 19.0, 16.0, 12.0, 16.0, 17.0, 11.0, 12.0, 12.0, 8.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-14.484375, -14.0438232421875, -13.603271484375, -13.1627197265625, -12.72216796875, -12.2816162109375, -11.841064453125, -11.4005126953125, -10.9599609375, -10.5194091796875, -10.078857421875, -9.6383056640625, -9.19775390625, -8.7572021484375, -8.316650390625, -7.8760986328125, -7.435546875, -6.9949951171875, -6.554443359375, -6.1138916015625, -5.67333984375, -5.2327880859375, -4.792236328125, -4.3516845703125, -3.9111328125, -3.4705810546875, -3.030029296875, -2.5894775390625, -2.14892578125, -1.7083740234375, -1.267822265625, -0.8272705078125, -0.38671875, 0.0538330078125, 0.494384765625, 0.9349365234375, 1.37548828125, 1.8160400390625, 2.256591796875, 2.6971435546875, 3.1376953125, 3.5782470703125, 4.018798828125, 4.4593505859375, 4.89990234375, 5.3404541015625, 5.781005859375, 6.2215576171875, 6.662109375, 7.1026611328125, 7.543212890625, 7.9837646484375, 8.42431640625, 8.8648681640625, 9.305419921875, 9.7459716796875, 10.1865234375, 10.6270751953125, 11.067626953125, 11.5081787109375, 11.94873046875, 12.3892822265625, 12.829833984375, 13.2703857421875, 13.7109375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 13.0, 14.0, 15.0, 19.0, 26.0, 22.0, 45.0, 43.0, 59.0, 96.0, 115.0, 172.0, 260.0, 582.0, 1702.0, 7519.0, 53164.0, 616768.0, 333319.0, 27500.0, 4680.0, 1140.0, 428.0, 230.0, 160.0, 105.0, 82.0, 56.0, 38.0, 33.0, 17.0, 26.0, 16.0, 14.0, 12.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.392578125, -3.289306640625, -3.18603515625, -3.082763671875, -2.9794921875, -2.876220703125, -2.77294921875, -2.669677734375, -2.56640625, -2.463134765625, -2.35986328125, -2.256591796875, -2.1533203125, -2.050048828125, -1.94677734375, -1.843505859375, -1.740234375, -1.636962890625, -1.53369140625, -1.430419921875, -1.3271484375, -1.223876953125, -1.12060546875, -1.017333984375, -0.9140625, -0.810791015625, -0.70751953125, -0.604248046875, -0.5009765625, -0.397705078125, -0.29443359375, -0.191162109375, -0.087890625, 0.015380859375, 0.11865234375, 0.221923828125, 0.3251953125, 0.428466796875, 0.53173828125, 0.635009765625, 0.73828125, 0.841552734375, 0.94482421875, 1.048095703125, 1.1513671875, 1.254638671875, 1.35791015625, 1.461181640625, 1.564453125, 1.667724609375, 1.77099609375, 1.874267578125, 1.9775390625, 2.080810546875, 2.18408203125, 2.287353515625, 2.390625, 2.493896484375, 2.59716796875, 2.700439453125, 2.8037109375, 2.906982421875, 3.01025390625, 3.113525390625, 3.216796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 10.0, 13.0, 20.0, 22.0, 40.0, 39.0, 45.0, 57.0, 72.0, 82.0, 2067.0, 159.0, 75.0, 50.0, 69.0, 52.0, 44.0, 36.0, 26.0, 19.0, 15.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34375, -38.21484375, -37.0859375, -35.95703125, -34.828125, -33.69921875, -32.5703125, -31.44140625, -30.3125, -29.18359375, -28.0546875, -26.92578125, -25.796875, -24.66796875, -23.5390625, -22.41015625, -21.28125, -20.15234375, -19.0234375, -17.89453125, -16.765625, -15.63671875, -14.5078125, -13.37890625, -12.25, -11.12109375, -9.9921875, -8.86328125, -7.734375, -6.60546875, -5.4765625, -4.34765625, -3.21875, -2.08984375, -0.9609375, 0.16796875, 1.296875, 2.42578125, 3.5546875, 4.68359375, 5.8125, 6.94140625, 8.0703125, 9.19921875, 10.328125, 11.45703125, 12.5859375, 13.71484375, 14.84375, 15.97265625, 17.1015625, 18.23046875, 19.359375, 20.48828125, 21.6171875, 22.74609375, 23.875, 25.00390625, 26.1328125, 27.26171875, 28.390625, 29.51953125, 30.6484375, 31.77734375, 32.90625]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 7.0, 13.0, 12.0, 21.0, 18.0, 24.0, 42.0, 84.0, 116.0, 201.0, 421.0, 875.0, 1956.0, 5500.0, 24228.0, 262415.0, 2759887.0, 73102.0, 10930.0, 3230.0, 1260.0, 593.0, 277.0, 176.0, 105.0, 49.0, 31.0, 25.0, 24.0, 10.0, 11.0, 10.0, 11.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.806640625, -2.719635009765625, -2.63262939453125, -2.545623779296875, -2.4586181640625, -2.371612548828125, -2.28460693359375, -2.197601318359375, -2.110595703125, -2.023590087890625, -1.93658447265625, -1.849578857421875, -1.7625732421875, -1.675567626953125, -1.58856201171875, -1.501556396484375, -1.41455078125, -1.327545166015625, -1.24053955078125, -1.153533935546875, -1.0665283203125, -0.979522705078125, -0.89251708984375, -0.805511474609375, -0.718505859375, -0.631500244140625, -0.54449462890625, -0.457489013671875, -0.3704833984375, -0.283477783203125, -0.19647216796875, -0.109466552734375, -0.0224609375, 0.064544677734375, 0.15155029296875, 0.238555908203125, 0.3255615234375, 0.412567138671875, 0.49957275390625, 0.586578369140625, 0.673583984375, 0.760589599609375, 0.84759521484375, 0.934600830078125, 1.0216064453125, 1.108612060546875, 1.19561767578125, 1.282623291015625, 1.36962890625, 1.456634521484375, 1.54364013671875, 1.630645751953125, 1.7176513671875, 1.804656982421875, 1.89166259765625, 1.978668212890625, 2.065673828125, 2.152679443359375, 2.23968505859375, 2.326690673828125, 2.4136962890625, 2.500701904296875, 2.58770751953125, 2.674713134765625, 2.76171875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 14.0, 32.0, 73.0, 179.0, 285.0, 213.0, 112.0, 41.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.817657470703125, -21.578218460083008, -19.338781356811523, -17.099342346191406, -14.859904289245605, -12.620466232299805, -10.381027221679688, -8.141589164733887, -5.902151107788086, -3.662712812423706, -1.4232745170593262, 0.8161640167236328, 3.0556020736694336, 5.295040130615234, 7.534479141235352, 9.773917198181152, 12.013355255126953, 14.252793312072754, 16.492231369018555, 18.731670379638672, 20.971107482910156, 23.210546493530273, 25.44998550415039, 27.689422607421875, 29.928861618041992, 32.16830062866211, 34.407737731933594, 36.647178649902344, 38.88661575317383, 41.12605285644531, 43.36549377441406, 45.60493087768555, 47.84436798095703, 50.083805084228516, 52.323246002197266, 54.56268310546875, 56.802120208740234, 59.04155731201172, 61.28099822998047, 63.52043533325195, 65.75987243652344, 67.99931335449219, 70.2387466430664, 72.47818756103516, 74.7176284790039, 76.95706176757812, 79.19650268554688, 81.43594360351562, 83.67538452148438, 85.91482543945312, 88.15425872802734, 90.3936996459961, 92.63314056396484, 94.87257385253906, 97.11201477050781, 99.35145568847656, 101.59088897705078, 103.83032989501953, 106.06976318359375, 108.3092041015625, 110.54864501953125, 112.78807830810547, 115.02751922607422, 117.26696014404297, 119.50639343261719]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 9.0, 6.0, 15.0, 8.0, 8.0, 9.0, 20.0, 25.0, 37.0, 20.0, 26.0, 22.0, 38.0, 52.0, 50.0, 51.0, 56.0, 57.0, 41.0, 47.0, 38.0, 48.0, 45.0, 43.0, 33.0, 33.0, 20.0, 30.0, 19.0, 17.0, 19.0, 15.0, 9.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.07651901245117, -35.96726989746094, -34.85801696777344, -33.7487678527832, -32.63951873779297, -31.53026580810547, -30.421016693115234, -29.311765670776367, -28.2025146484375, -27.093263626098633, -25.9840145111084, -24.87476348876953, -23.765512466430664, -22.656261444091797, -21.547012329101562, -20.437761306762695, -19.32851219177246, -18.219261169433594, -17.11001205444336, -16.000761032104492, -14.891510009765625, -13.782259941101074, -12.673009872436523, -11.563758850097656, -10.454508781433105, -9.345258712768555, -8.236007690429688, -7.126757621765137, -6.017507076263428, -4.908256530761719, -3.799006462097168, -2.689755916595459, -1.58050537109375, -0.47125494480133057, 0.6379954814910889, 1.7472457885742188, 2.8564963340759277, 3.9657468795776367, 5.0749969482421875, 6.1842474937438965, 7.2934980392456055, 8.402748107910156, 9.511999130249023, 10.621249198913574, 11.730499267578125, 12.839750289916992, 13.949000358581543, 15.058250427246094, 16.16750144958496, 17.276752471923828, 18.386001586914062, 19.49525260925293, 20.604503631591797, 21.71375274658203, 22.8230037689209, 23.932254791259766, 25.04150390625, 26.150754928588867, 27.2600040435791, 28.36925506591797, 29.478506088256836, 30.587757110595703, 31.697006225585938, 32.80625534057617, 33.91550827026367]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 16.0, 14.0, 17.0, 24.0, 48.0, 73.0, 97.0, 161.0, 242.0, 469.0, 891.0, 2237.0, 6869.0, 1022408.0, 9579.0, 2926.0, 1162.0, 519.0, 269.0, 174.0, 110.0, 85.0, 56.0, 40.0, 24.0, 15.0, 12.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-16.94603729248047, -16.557693481445312, -16.169349670410156, -15.781004905700684, -15.392660140991211, -15.004316329956055, -14.615972518920898, -14.227627754211426, -13.83928394317627, -13.450940132141113, -13.06259536743164, -12.674251556396484, -12.285906791687012, -11.897562980651855, -11.509218215942383, -11.120874404907227, -10.73253059387207, -10.344186782836914, -9.955842018127441, -9.567498207092285, -9.179153442382812, -8.790809631347656, -8.4024658203125, -8.014121055603027, -7.625776290893555, -7.23743200302124, -6.849087715148926, -6.4607439041137695, -6.072399616241455, -5.684055328369141, -5.295711040496826, -4.907366752624512, -4.5190229415893555, -4.130678653717041, -3.7423346042633057, -3.353990316390991, -2.965646266937256, -2.5773019790649414, -2.188957691192627, -1.8006136417388916, -1.4122693538665771, -1.0239251852035522, -0.6355809569358826, -0.2472367286682129, 0.141107439994812, 0.5294516086578369, 0.9177958965301514, 1.3061399459838867, 1.6944842338562012, 2.0828285217285156, 2.471172571182251, 2.8595168590545654, 3.247860908508301, 3.6362051963806152, 4.02454948425293, 4.412893295288086, 4.801238059997559, 5.189582347869873, 5.5779266357421875, 5.966270446777344, 6.354614734649658, 6.742959022521973, 7.131303310394287, 7.519647598266602, 7.907991409301758]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 15.0, 163.0, 51457128.0, 5711.0, 140.0, 12.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1335.0008544921875, -1293.2445068359375, -1251.4881591796875, -1209.7318115234375, -1167.9754638671875, -1126.2191162109375, -1084.4627685546875, -1042.70654296875, -1000.9501342773438, -959.1937866210938, -917.4374389648438, -875.6810913085938, -833.9248046875, -792.16845703125, -750.412109375, -708.65576171875, -666.8994140625, -625.14306640625, -583.38671875, -541.63037109375, -499.8740539550781, -458.1177062988281, -416.36138916015625, -374.60504150390625, -332.84869384765625, -291.09234619140625, -249.3360137939453, -207.57968139648438, -165.82333374023438, -124.06698608398438, -82.31065368652344, -40.5543212890625, 1.2020263671875, 42.95836639404297, 84.71470642089844, 126.4710464477539, 168.22738647460938, 209.98373413085938, 251.7400665283203, 293.49639892578125, 335.25274658203125, 377.00909423828125, 418.76544189453125, 460.5217590332031, 502.2781066894531, 544.034423828125, 585.790771484375, 627.547119140625, 669.303466796875, 711.059814453125, 752.816162109375, 794.572509765625, 836.328857421875, 878.085205078125, 919.8414916992188, 961.5978393554688, 1003.3541870117188, 1045.1104736328125, 1086.8668212890625, 1128.6231689453125, 1170.3795166015625, 1212.1358642578125, 1253.8922119140625, 1295.6485595703125, 1337.4049072265625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 16.0, 21.0, 30.0, 71.0, 152.0, 323.0, 193.0, 71.0, 41.0, 22.0, 16.0, 10.0, 7.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.30596923828125, -122.39356231689453, -115.48114776611328, -108.56874084472656, -101.65632629394531, -94.7439193725586, -87.83151245117188, -80.91909790039062, -74.00668334960938, -67.09427642822266, -60.181861877441406, -53.26945495605469, -46.35704040527344, -39.44463348388672, -32.532222747802734, -25.61981201171875, -18.70740509033203, -11.794994354248047, -4.882584571838379, 2.029825210571289, 8.942235946655273, 15.854644775390625, 22.76705551147461, 29.679466247558594, 36.59187698364258, 43.50428771972656, 50.41669845581055, 57.32910919189453, 64.24151611328125, 71.1539306640625, 78.06633758544922, 84.97874450683594, 91.89115905761719, 98.8035659790039, 105.71598052978516, 112.62838745117188, 119.54080200195312, 126.45320892333984, 133.36561584472656, 140.2780303955078, 147.19044494628906, 154.1028594970703, 161.0152587890625, 167.92767333984375, 174.840087890625, 181.75250244140625, 188.66490173339844, 195.5773162841797, 202.48971557617188, 209.40213012695312, 216.3145294189453, 223.22694396972656, 230.1393585205078, 237.0517578125, 243.96417236328125, 250.8765869140625, 257.78900146484375, 264.701416015625, 271.61383056640625, 278.5262451171875, 285.4386291503906, 292.3510437011719, 299.2634582519531, 306.1758728027344, 313.0882873535156]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 8.0, 4.0, 7.0, 6.0, 9.0, 7.0, 11.0, 11.0, 22.0, 15.0, 20.0, 21.0, 33.0, 32.0, 25.0, 37.0, 39.0, 55.0, 44.0, 50.0, 48.0, 48.0, 58.0, 48.0, 42.0, 48.0, 27.0, 35.0, 39.0, 24.0, 19.0, 18.0, 19.0, 18.0, 11.0, 5.0, 9.0, 11.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-43.378883361816406, -42.14045715332031, -40.90203094482422, -39.663604736328125, -38.42517852783203, -37.18675231933594, -35.948326110839844, -34.709896087646484, -33.47146987915039, -32.2330436706543, -30.994617462158203, -29.75619125366211, -28.517763137817383, -27.27933692932129, -26.040910720825195, -24.80248260498047, -23.564058303833008, -22.325632095336914, -21.08720588684082, -19.848777770996094, -18.6103515625, -17.371925354003906, -16.133499145507812, -14.895071983337402, -13.656645774841309, -12.418219566345215, -11.179792404174805, -9.941366195678711, -8.702939987182617, -7.464512825012207, -6.226086616516113, -4.987659454345703, -3.7492332458496094, -2.5108065605163574, -1.2723801136016846, -0.03395366668701172, 1.2044730186462402, 2.442899703979492, 3.681325912475586, 4.919753074645996, 6.15817928314209, 7.396605968475342, 8.635032653808594, 9.873458862304688, 11.111885070800781, 12.350312232971191, 13.588738441467285, 14.827165603637695, 16.06559181213379, 17.304018020629883, 18.542444229125977, 19.780872344970703, 21.019298553466797, 22.25772476196289, 23.496150970458984, 24.734577178955078, 25.973003387451172, 27.211429595947266, 28.44985580444336, 29.688282012939453, 30.92671012878418, 32.165138244628906, 33.403564453125, 34.641990661621094, 35.88041687011719]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 19.0, 28.0, 33.0, 47.0, 65.0, 94.0, 145.0, 187.0, 285.0, 443.0, 660.0, 1080.0, 1762.0, 2942.0, 5169.0, 10136.0, 21747.0, 58355.0, 210279.0, 3433526.0, 316341.0, 79537.0, 27090.0, 11205.0, 5431.0, 2906.0, 1692.0, 1022.0, 646.0, 423.0, 305.0, 186.0, 145.0, 85.0, 61.0, 45.0, 39.0, 27.0, 16.0, 13.0, 10.0, 5.0, 6.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6678466796875, -4.515380859375, -4.3629150390625, -4.21044921875, -4.0579833984375, -3.905517578125, -3.7530517578125, -3.6005859375, -3.4481201171875, -3.295654296875, -3.1431884765625, -2.99072265625, -2.8382568359375, -2.685791015625, -2.5333251953125, -2.380859375, -2.2283935546875, -2.075927734375, -1.9234619140625, -1.77099609375, -1.6185302734375, -1.466064453125, -1.3135986328125, -1.1611328125, -1.0086669921875, -0.856201171875, -0.7037353515625, -0.55126953125, -0.3988037109375, -0.246337890625, -0.0938720703125, 0.05859375, 0.2110595703125, 0.363525390625, 0.5159912109375, 0.66845703125, 0.8209228515625, 0.973388671875, 1.1258544921875, 1.2783203125, 1.4307861328125, 1.583251953125, 1.7357177734375, 1.88818359375, 2.0406494140625, 2.193115234375, 2.3455810546875, 2.498046875, 2.6505126953125, 2.802978515625, 2.9554443359375, 3.10791015625, 3.2603759765625, 3.412841796875, 3.5653076171875, 3.7177734375, 3.8702392578125, 4.022705078125, 4.1751708984375, 4.32763671875, 4.4801025390625, 4.632568359375, 4.7850341796875, 4.9375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 19.0, 31.0, 28.0, 46.0, 46.0, 69.0, 75.0, 77.0, 92.0, 68.0, 72.0, 69.0, 59.0, 42.0, 41.0, 34.0, 28.0, 17.0, 13.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820068359375, -0.1751880645751953, -0.16836929321289062, -0.16155052185058594, -0.15473175048828125, -0.14791297912597656, -0.14109420776367188, -0.1342754364013672, -0.1274566650390625, -0.12063789367675781, -0.11381912231445312, -0.10700035095214844, -0.10018157958984375, -0.09336280822753906, -0.08654403686523438, -0.07972526550292969, -0.072906494140625, -0.06608772277832031, -0.059268951416015625, -0.05245018005371094, -0.04563140869140625, -0.03881263732910156, -0.031993865966796875, -0.025175094604492188, -0.0183563232421875, -0.011537551879882812, -0.004718780517578125, 0.0020999908447265625, 0.00891876220703125, 0.015737533569335938, 0.022556304931640625, 0.029375076293945312, 0.03619384765625, 0.04301261901855469, 0.049831390380859375, 0.05665016174316406, 0.06346893310546875, 0.07028770446777344, 0.07710647583007812, 0.08392524719238281, 0.0907440185546875, 0.09756278991699219, 0.10438156127929688, 0.11120033264160156, 0.11801910400390625, 0.12483787536621094, 0.13165664672851562, 0.1384754180908203, 0.145294189453125, 0.1521129608154297, 0.15893173217773438, 0.16575050354003906, 0.17256927490234375, 0.17938804626464844, 0.18620681762695312, 0.1930255889892578, 0.1998443603515625, 0.2066631317138672, 0.21348190307617188, 0.22030067443847656, 0.22711944580078125, 0.23393821716308594, 0.24075698852539062, 0.2475757598876953, 0.25439453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 11.0, 22.0, 27.0, 46.0, 70.0, 142.0, 322.0, 714.0, 1696.0, 4517.0, 14614.0, 58356.0, 375598.0, 3510526.0, 177006.0, 35031.0, 9609.0, 3460.0, 1319.0, 557.0, 263.0, 132.0, 93.0, 38.0, 24.0, 14.0, 14.0, 10.0, 10.0, 7.0, 5.0, 0.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.73828125, -7.5128173828125, -7.287353515625, -7.0618896484375, -6.83642578125, -6.6109619140625, -6.385498046875, -6.1600341796875, -5.9345703125, -5.7091064453125, -5.483642578125, -5.2581787109375, -5.03271484375, -4.8072509765625, -4.581787109375, -4.3563232421875, -4.130859375, -3.9053955078125, -3.679931640625, -3.4544677734375, -3.22900390625, -3.0035400390625, -2.778076171875, -2.5526123046875, -2.3271484375, -2.1016845703125, -1.876220703125, -1.6507568359375, -1.42529296875, -1.1998291015625, -0.974365234375, -0.7489013671875, -0.5234375, -0.2979736328125, -0.072509765625, 0.1529541015625, 0.37841796875, 0.6038818359375, 0.829345703125, 1.0548095703125, 1.2802734375, 1.5057373046875, 1.731201171875, 1.9566650390625, 2.18212890625, 2.4075927734375, 2.633056640625, 2.8585205078125, 3.083984375, 3.3094482421875, 3.534912109375, 3.7603759765625, 3.98583984375, 4.2113037109375, 4.436767578125, 4.6622314453125, 4.8876953125, 5.1131591796875, 5.338623046875, 5.5640869140625, 5.78955078125, 6.0150146484375, 6.240478515625, 6.4659423828125, 6.69140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 5.0, 6.0, 15.0, 12.0, 30.0, 31.0, 44.0, 55.0, 80.0, 91.0, 120.0, 200.0, 554.0, 1736.0, 366.0, 177.0, 122.0, 108.0, 62.0, 65.0, 31.0, 29.0, 22.0, 14.0, 13.0, 12.0, 14.0, 7.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.029296875, -1.0002059936523438, -0.9711151123046875, -0.9420242309570312, -0.912933349609375, -0.8838424682617188, -0.8547515869140625, -0.8256607055664062, -0.79656982421875, -0.7674789428710938, -0.7383880615234375, -0.7092971801757812, -0.680206298828125, -0.6511154174804688, -0.6220245361328125, -0.5929336547851562, -0.5638427734375, -0.5347518920898438, -0.5056610107421875, -0.47657012939453125, -0.447479248046875, -0.41838836669921875, -0.3892974853515625, -0.36020660400390625, -0.33111572265625, -0.30202484130859375, -0.2729339599609375, -0.24384307861328125, -0.214752197265625, -0.18566131591796875, -0.1565704345703125, -0.12747955322265625, -0.098388671875, -0.06929779052734375, -0.0402069091796875, -0.01111602783203125, 0.017974853515625, 0.04706573486328125, 0.0761566162109375, 0.10524749755859375, 0.13433837890625, 0.16342926025390625, 0.1925201416015625, 0.22161102294921875, 0.250701904296875, 0.27979278564453125, 0.3088836669921875, 0.33797454833984375, 0.3670654296875, 0.39615631103515625, 0.4252471923828125, 0.45433807373046875, 0.483428955078125, 0.5125198364257812, 0.5416107177734375, 0.5707015991210938, 0.59979248046875, 0.6288833618164062, 0.6579742431640625, 0.6870651245117188, 0.716156005859375, 0.7452468872070312, 0.7743377685546875, 0.8034286499023438, 0.83251953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 10.0, 10.0, 20.0, 20.0, 28.0, 34.0, 51.0, 51.0, 74.0, 117.0, 113.0, 100.0, 94.0, 56.0, 59.0, 39.0, 31.0, 18.0, 14.0, 10.0, 12.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.692089080810547, -9.432366371154785, -9.172643661499023, -8.912920951843262, -8.6531982421875, -8.393475532531738, -8.133752822875977, -7.874029636383057, -7.614306926727295, -7.354584217071533, -7.0948615074157715, -6.83513879776001, -6.57541561126709, -6.315692901611328, -6.055970191955566, -5.796247482299805, -5.536524772644043, -5.276802062988281, -5.0170793533325195, -4.757356643676758, -4.497633934020996, -4.237911224365234, -3.9781880378723145, -3.7184653282165527, -3.458742618560791, -3.1990199089050293, -2.9392971992492676, -2.6795742511749268, -2.419851541519165, -2.1601288318634033, -1.900406002998352, -1.6406831741333008, -1.3809595108032227, -1.121236801147461, -0.8615139722824097, -0.6017912030220032, -0.3420684337615967, -0.08234572410583496, 0.1773771047592163, 0.4370999336242676, 0.6968226432800293, 0.9565454125404358, 1.2162681818008423, 1.4759910106658936, 1.7357137203216553, 1.995436429977417, 2.255159378051758, 2.5148820877075195, 2.7746047973632812, 3.034327507019043, 3.2940502166748047, 3.5537731647491455, 3.8134958744049072, 4.07321834564209, 4.33294153213501, 4.5926642417907715, 4.852386951446533, 5.112109661102295, 5.371832370758057, 5.631555080413818, 5.891278266906738, 6.1510009765625, 6.410723686218262, 6.670446395874023, 6.930169105529785]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 4.0, 6.0, 13.0, 6.0, 13.0, 20.0, 20.0, 25.0, 35.0, 28.0, 49.0, 37.0, 50.0, 55.0, 43.0, 41.0, 52.0, 41.0, 47.0, 54.0, 47.0, 46.0, 36.0, 35.0, 35.0, 29.0, 18.0, 13.0, 23.0, 14.0, 8.0, 10.0, 7.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8015806674957275, -3.682335376739502, -3.5630898475646973, -3.4438445568084717, -3.324599266052246, -3.2053537368774414, -3.086108446121216, -2.9668631553649902, -2.8476176261901855, -2.72837233543396, -2.6091268062591553, -2.4898815155029297, -2.370635986328125, -2.2513906955718994, -2.132145404815674, -2.012899875640869, -1.8936545848846436, -1.7744091749191284, -1.6551637649536133, -1.5359184741973877, -1.4166730642318726, -1.2974276542663574, -1.1781823635101318, -1.0589369535446167, -0.9396915435791016, -0.8204461336135864, -0.7012007832527161, -0.5819554328918457, -0.46271002292633057, -0.34346461296081543, -0.22421926259994507, -0.10497391223907471, 0.014271259307861328, 0.13351663947105408, 0.2527620196342468, 0.3720073997974396, 0.4912527799606323, 0.6104981899261475, 0.7297435402870178, 0.8489888906478882, 0.9682343006134033, 1.0874797105789185, 1.2067251205444336, 1.3259704113006592, 1.4452158212661743, 1.5644612312316895, 1.683706521987915, 1.8029519319534302, 1.9221973419189453, 2.041442632675171, 2.1606881618499756, 2.279933452606201, 2.399178981781006, 2.5184242725372314, 2.637669563293457, 2.7569150924682617, 2.8761603832244873, 2.995405673980713, 3.1146512031555176, 3.233896493911743, 3.3531417846679688, 3.4723873138427734, 3.591632604598999, 3.7108778953552246, 3.8301234245300293]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 7.0, 15.0, 14.0, 34.0, 36.0, 38.0, 64.0, 88.0, 116.0, 163.0, 236.0, 400.0, 548.0, 797.0, 1232.0, 1950.0, 3154.0, 5485.0, 10324.0, 20257.0, 45821.0, 124875.0, 423724.0, 261732.0, 80482.0, 32093.0, 15081.0, 7845.0, 4438.0, 2547.0, 1616.0, 1050.0, 641.0, 488.0, 308.0, 259.0, 167.0, 108.0, 89.0, 58.0, 31.0, 21.0, 33.0, 18.0, 13.0, 12.0, 6.0, 3.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.5732421875, -1.52215576171875, -1.4710693359375, -1.41998291015625, -1.368896484375, -1.31781005859375, -1.2667236328125, -1.21563720703125, -1.16455078125, -1.11346435546875, -1.0623779296875, -1.01129150390625, -0.960205078125, -0.90911865234375, -0.8580322265625, -0.80694580078125, -0.755859375, -0.70477294921875, -0.6536865234375, -0.60260009765625, -0.551513671875, -0.50042724609375, -0.4493408203125, -0.39825439453125, -0.34716796875, -0.29608154296875, -0.2449951171875, -0.19390869140625, -0.142822265625, -0.09173583984375, -0.0406494140625, 0.01043701171875, 0.0615234375, 0.11260986328125, 0.1636962890625, 0.21478271484375, 0.265869140625, 0.31695556640625, 0.3680419921875, 0.41912841796875, 0.47021484375, 0.52130126953125, 0.5723876953125, 0.62347412109375, 0.674560546875, 0.72564697265625, 0.7767333984375, 0.82781982421875, 0.87890625, 0.92999267578125, 0.9810791015625, 1.03216552734375, 1.083251953125, 1.13433837890625, 1.1854248046875, 1.23651123046875, 1.28759765625, 1.33868408203125, 1.3897705078125, 1.44085693359375, 1.491943359375, 1.54302978515625, 1.5941162109375, 1.64520263671875, 1.6962890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 8.0, 13.0, 9.0, 16.0, 13.0, 31.0, 33.0, 35.0, 48.0, 58.0, 51.0, 53.0, 62.0, 69.0, 59.0, 65.0, 65.0, 52.0, 52.0, 33.0, 30.0, 36.0, 22.0, 15.0, 7.0, 12.0, 4.0, 7.0, 4.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.192626953125, -0.1867084503173828, -0.18078994750976562, -0.17487144470214844, -0.16895294189453125, -0.16303443908691406, -0.15711593627929688, -0.1511974334716797, -0.1452789306640625, -0.1393604278564453, -0.13344192504882812, -0.12752342224121094, -0.12160491943359375, -0.11568641662597656, -0.10976791381835938, -0.10384941101074219, -0.097930908203125, -0.09201240539550781, -0.08609390258789062, -0.08017539978027344, -0.07425689697265625, -0.06833839416503906, -0.062419891357421875, -0.05650138854980469, -0.0505828857421875, -0.04466438293457031, -0.038745880126953125, -0.03282737731933594, -0.02690887451171875, -0.020990371704101562, -0.015071868896484375, -0.009153366088867188, -0.00323486328125, 0.0026836395263671875, 0.008602142333984375, 0.014520645141601562, 0.02043914794921875, 0.026357650756835938, 0.032276153564453125, 0.03819465637207031, 0.0441131591796875, 0.05003166198730469, 0.055950164794921875, 0.06186866760253906, 0.06778717041015625, 0.07370567321777344, 0.07962417602539062, 0.08554267883300781, 0.091461181640625, 0.09737968444824219, 0.10329818725585938, 0.10921669006347656, 0.11513519287109375, 0.12105369567871094, 0.12697219848632812, 0.1328907012939453, 0.1388092041015625, 0.1447277069091797, 0.15064620971679688, 0.15656471252441406, 0.16248321533203125, 0.16840171813964844, 0.17432022094726562, 0.1802387237548828, 0.1861572265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 16.0, 18.0, 19.0, 42.0, 52.0, 62.0, 120.0, 187.0, 271.0, 349.0, 511.0, 834.0, 1299.0, 2101.0, 3628.0, 6680.0, 14131.0, 36105.0, 122282.0, 546766.0, 219109.0, 53789.0, 19504.0, 8879.0, 4650.0, 2570.0, 1528.0, 1017.0, 676.0, 446.0, 280.0, 198.0, 136.0, 98.0, 51.0, 41.0, 21.0, 25.0, 21.0, 11.0, 11.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4892578125, -1.4390869140625, -1.388916015625, -1.3387451171875, -1.28857421875, -1.2384033203125, -1.188232421875, -1.1380615234375, -1.087890625, -1.0377197265625, -0.987548828125, -0.9373779296875, -0.88720703125, -0.8370361328125, -0.786865234375, -0.7366943359375, -0.6865234375, -0.6363525390625, -0.586181640625, -0.5360107421875, -0.48583984375, -0.4356689453125, -0.385498046875, -0.3353271484375, -0.28515625, -0.2349853515625, -0.184814453125, -0.1346435546875, -0.08447265625, -0.0343017578125, 0.015869140625, 0.0660400390625, 0.1162109375, 0.1663818359375, 0.216552734375, 0.2667236328125, 0.31689453125, 0.3670654296875, 0.417236328125, 0.4674072265625, 0.517578125, 0.5677490234375, 0.617919921875, 0.6680908203125, 0.71826171875, 0.7684326171875, 0.818603515625, 0.8687744140625, 0.9189453125, 0.9691162109375, 1.019287109375, 1.0694580078125, 1.11962890625, 1.1697998046875, 1.219970703125, 1.2701416015625, 1.3203125, 1.3704833984375, 1.420654296875, 1.4708251953125, 1.52099609375, 1.5711669921875, 1.621337890625, 1.6715087890625, 1.7216796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 8.0, 4.0, 10.0, 6.0, 7.0, 12.0, 12.0, 10.0, 10.0, 15.0, 23.0, 29.0, 24.0, 18.0, 32.0, 38.0, 41.0, 41.0, 41.0, 47.0, 35.0, 44.0, 45.0, 45.0, 46.0, 29.0, 35.0, 42.0, 29.0, 33.0, 33.0, 19.0, 14.0, 29.0, 17.0, 12.0, 9.0, 14.0, 10.0, 12.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7783203125, -0.7527389526367188, -0.7271575927734375, -0.7015762329101562, -0.675994873046875, -0.6504135131835938, -0.6248321533203125, -0.5992507934570312, -0.57366943359375, -0.5480880737304688, -0.5225067138671875, -0.49692535400390625, -0.471343994140625, -0.44576263427734375, -0.4201812744140625, -0.39459991455078125, -0.3690185546875, -0.34343719482421875, -0.3178558349609375, -0.29227447509765625, -0.266693115234375, -0.24111175537109375, -0.2155303955078125, -0.18994903564453125, -0.16436767578125, -0.13878631591796875, -0.1132049560546875, -0.08762359619140625, -0.062042236328125, -0.03646087646484375, -0.0108795166015625, 0.01470184326171875, 0.040283203125, 0.06586456298828125, 0.0914459228515625, 0.11702728271484375, 0.142608642578125, 0.16819000244140625, 0.1937713623046875, 0.21935272216796875, 0.24493408203125, 0.27051544189453125, 0.2960968017578125, 0.32167816162109375, 0.347259521484375, 0.37284088134765625, 0.3984222412109375, 0.42400360107421875, 0.4495849609375, 0.47516632080078125, 0.5007476806640625, 0.5263290405273438, 0.551910400390625, 0.5774917602539062, 0.6030731201171875, 0.6286544799804688, 0.65423583984375, 0.6798171997070312, 0.7053985595703125, 0.7309799194335938, 0.756561279296875, 0.7821426391601562, 0.8077239990234375, 0.8333053588867188, 0.85888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 11.0, 11.0, 13.0, 13.0, 28.0, 27.0, 34.0, 49.0, 68.0, 76.0, 126.0, 172.0, 232.0, 387.0, 619.0, 998.0, 1840.0, 3336.0, 7420.0, 19062.0, 78044.0, 712762.0, 173186.0, 29849.0, 10172.0, 4529.0, 2171.0, 1238.0, 669.0, 450.0, 266.0, 203.0, 138.0, 79.0, 65.0, 46.0, 39.0, 27.0, 20.0, 18.0, 12.0, 4.0, 8.0, 9.0, 8.0, 1.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.31640625, -4.18017578125, -4.0439453125, -3.90771484375, -3.771484375, -3.63525390625, -3.4990234375, -3.36279296875, -3.2265625, -3.09033203125, -2.9541015625, -2.81787109375, -2.681640625, -2.54541015625, -2.4091796875, -2.27294921875, -2.13671875, -2.00048828125, -1.8642578125, -1.72802734375, -1.591796875, -1.45556640625, -1.3193359375, -1.18310546875, -1.046875, -0.91064453125, -0.7744140625, -0.63818359375, -0.501953125, -0.36572265625, -0.2294921875, -0.09326171875, 0.04296875, 0.17919921875, 0.3154296875, 0.45166015625, 0.587890625, 0.72412109375, 0.8603515625, 0.99658203125, 1.1328125, 1.26904296875, 1.4052734375, 1.54150390625, 1.677734375, 1.81396484375, 1.9501953125, 2.08642578125, 2.22265625, 2.35888671875, 2.4951171875, 2.63134765625, 2.767578125, 2.90380859375, 3.0400390625, 3.17626953125, 3.3125, 3.44873046875, 3.5849609375, 3.72119140625, 3.857421875, 3.99365234375, 4.1298828125, 4.26611328125, 4.40234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 7.0, 16.0, 16.0, 18.0, 22.0, 34.0, 44.0, 56.0, 95.0, 118.0, 121.0, 100.0, 89.0, 53.0, 51.0, 31.0, 23.0, 21.0, 15.0, 12.0, 11.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008158683776855469, -0.000792182981967926, -0.0007684975862503052, -0.0007448121905326843, -0.0007211267948150635, -0.0006974413990974426, -0.0006737560033798218, -0.0006500706076622009, -0.0006263852119445801, -0.0006026998162269592, -0.0005790144205093384, -0.0005553290247917175, -0.0005316436290740967, -0.0005079582333564758, -0.000484272837638855, -0.00046058744192123413, -0.0004369020462036133, -0.00041321665048599243, -0.0003895312547683716, -0.00036584585905075073, -0.0003421604633331299, -0.00031847506761550903, -0.0002947896718978882, -0.00027110427618026733, -0.0002474188804626465, -0.00022373348474502563, -0.00020004808902740479, -0.00017636269330978394, -0.00015267729759216309, -0.00012899190187454224, -0.00010530650615692139, -8.162111043930054e-05, -5.793571472167969e-05, -3.425031900405884e-05, -1.0564923286437988e-05, 1.3120472431182861e-05, 3.680586814880371e-05, 6.049126386642456e-05, 8.417665958404541e-05, 0.00010786205530166626, 0.0001315474510192871, 0.00015523284673690796, 0.0001789182424545288, 0.00020260363817214966, 0.0002262890338897705, 0.00024997442960739136, 0.0002736598253250122, 0.00029734522104263306, 0.0003210306167602539, 0.00034471601247787476, 0.0003684014081954956, 0.00039208680391311646, 0.0004157721996307373, 0.00043945759534835815, 0.000463142991065979, 0.00048682838678359985, 0.0005105137825012207, 0.0005341991782188416, 0.0005578845739364624, 0.0005815699696540833, 0.0006052553653717041, 0.000628940761089325, 0.0006526261568069458, 0.0006763115525245667, 0.0006999969482421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 6.0, 5.0, 9.0, 12.0, 10.0, 19.0, 25.0, 27.0, 45.0, 59.0, 86.0, 128.0, 180.0, 277.0, 435.0, 748.0, 1332.0, 2554.0, 5485.0, 13982.0, 52745.0, 536002.0, 367940.0, 43387.0, 12434.0, 4863.0, 2425.0, 1248.0, 729.0, 455.0, 291.0, 156.0, 120.0, 82.0, 60.0, 44.0, 44.0, 30.0, 22.0, 9.0, 10.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2890625, -5.12347412109375, -4.9578857421875, -4.79229736328125, -4.626708984375, -4.46112060546875, -4.2955322265625, -4.12994384765625, -3.96435546875, -3.79876708984375, -3.6331787109375, -3.46759033203125, -3.302001953125, -3.13641357421875, -2.9708251953125, -2.80523681640625, -2.6396484375, -2.47406005859375, -2.3084716796875, -2.14288330078125, -1.977294921875, -1.81170654296875, -1.6461181640625, -1.48052978515625, -1.31494140625, -1.14935302734375, -0.9837646484375, -0.81817626953125, -0.652587890625, -0.48699951171875, -0.3214111328125, -0.15582275390625, 0.009765625, 0.17535400390625, 0.3409423828125, 0.50653076171875, 0.672119140625, 0.83770751953125, 1.0032958984375, 1.16888427734375, 1.33447265625, 1.50006103515625, 1.6656494140625, 1.83123779296875, 1.996826171875, 2.16241455078125, 2.3280029296875, 2.49359130859375, 2.6591796875, 2.82476806640625, 2.9903564453125, 3.15594482421875, 3.321533203125, 3.48712158203125, 3.6527099609375, 3.81829833984375, 3.98388671875, 4.14947509765625, 4.3150634765625, 4.48065185546875, 4.646240234375, 4.81182861328125, 4.9774169921875, 5.14300537109375, 5.30859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 20.0, 23.0, 33.0, 47.0, 87.0, 99.0, 112.0, 128.0, 132.0, 92.0, 59.0, 48.0, 25.0, 18.0, 21.0, 9.0, 8.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.051788330078125, -1.98443603515625, -1.917083740234375, -1.8497314453125, -1.782379150390625, -1.71502685546875, -1.647674560546875, -1.580322265625, -1.512969970703125, -1.44561767578125, -1.378265380859375, -1.3109130859375, -1.243560791015625, -1.17620849609375, -1.108856201171875, -1.04150390625, -0.974151611328125, -0.90679931640625, -0.839447021484375, -0.7720947265625, -0.704742431640625, -0.63739013671875, -0.570037841796875, -0.502685546875, -0.435333251953125, -0.36798095703125, -0.300628662109375, -0.2332763671875, -0.165924072265625, -0.09857177734375, -0.031219482421875, 0.0361328125, 0.103485107421875, 0.17083740234375, 0.238189697265625, 0.3055419921875, 0.372894287109375, 0.44024658203125, 0.507598876953125, 0.574951171875, 0.642303466796875, 0.70965576171875, 0.777008056640625, 0.8443603515625, 0.911712646484375, 0.97906494140625, 1.046417236328125, 1.11376953125, 1.181121826171875, 1.24847412109375, 1.315826416015625, 1.3831787109375, 1.450531005859375, 1.51788330078125, 1.585235595703125, 1.652587890625, 1.719940185546875, 1.78729248046875, 1.854644775390625, 1.9219970703125, 1.989349365234375, 2.05670166015625, 2.124053955078125, 2.19140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 12.0, 18.0, 32.0, 113.0, 293.0, 336.0, 112.0, 40.0, 17.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.60757446289062, -76.93553161621094, -75.26348114013672, -73.59143829345703, -71.91939544677734, -70.24734497070312, -68.57530212402344, -66.90325927734375, -65.23120880126953, -63.55916213989258, -61.88711929321289, -60.21507263183594, -58.543025970458984, -56.8709831237793, -55.198936462402344, -53.526893615722656, -51.85485076904297, -50.182804107666016, -48.51076126098633, -46.838714599609375, -45.16666793823242, -43.494625091552734, -41.82257843017578, -40.150535583496094, -38.478485107421875, -36.80643844604492, -35.134395599365234, -33.46234893798828, -31.79030418395996, -30.11825942993164, -28.446212768554688, -26.774168014526367, -25.102121353149414, -23.430076599121094, -21.75802993774414, -20.08598518371582, -18.4139404296875, -16.741893768310547, -15.069849014282227, -13.397804260253906, -11.72575855255127, -10.053712844848633, -8.381668090820312, -6.709622383117676, -5.037577152252197, -3.3655319213867188, -1.693486213684082, -0.02144145965576172, 1.650604248046875, 3.3226494789123535, 4.994694709777832, 6.666740417480469, 8.338785171508789, 10.010830879211426, 11.682876586914062, 13.354921340942383, 15.02696704864502, 16.699012756347656, 18.371057510375977, 20.043102264404297, 21.71514892578125, 23.38719367980957, 25.05923843383789, 26.731285095214844, 28.403329849243164]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 7.0, 10.0, 19.0, 16.0, 39.0, 48.0, 64.0, 90.0, 118.0, 113.0, 107.0, 82.0, 72.0, 53.0, 42.0, 25.0, 12.0, 10.0, 10.0, 9.0, 2.0, 10.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.521688461303711, -13.0650053024292, -12.608321189880371, -12.15163803100586, -11.694954872131348, -11.238271713256836, -10.781587600708008, -10.324904441833496, -9.868221282958984, -9.411538124084473, -8.954854011535645, -8.498170852661133, -8.041487693786621, -7.584804058074951, -7.128120422363281, -6.6714372634887695, -6.2147536277771, -5.75806999206543, -5.301386833190918, -4.844703197479248, -4.388020038604736, -3.9313364028930664, -3.4746530055999756, -3.0179696083068848, -2.561286211013794, -2.104602813720703, -1.6479194164276123, -1.191235899925232, -0.7345525026321411, -0.27786898612976074, 0.17881441116333008, 0.6354978084564209, 1.0921812057495117, 1.5488646030426025, 2.0055480003356934, 2.4622316360473633, 2.918914794921875, 3.375598430633545, 3.8322818279266357, 4.288965225219727, 4.745648384094238, 5.202332019805908, 5.65901517868042, 6.11569881439209, 6.572381973266602, 7.0290656089782715, 7.485749244689941, 7.942432403564453, 8.399116516113281, 8.855799674987793, 9.312483787536621, 9.769166946411133, 10.225850105285645, 10.682533264160156, 11.139217376708984, 11.595900535583496, 12.052583694458008, 12.50926685333252, 12.965950965881348, 13.42263412475586, 13.879317283630371, 14.336000442504883, 14.792684555053711, 15.249367713928223, 15.706050872802734]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 15.0, 20.0, 27.0, 26.0, 52.0, 61.0, 73.0, 104.0, 203.0, 308.0, 489.0, 824.0, 1530.0, 2809.0, 6051.0, 15342.0, 47592.0, 3733664.0, 325315.0, 37033.0, 11783.0, 4978.0, 2506.0, 1422.0, 754.0, 426.0, 257.0, 186.0, 128.0, 89.0, 46.0, 57.0, 28.0, 22.0, 9.0, 14.0, 4.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.46875, -7.2547607421875, -7.040771484375, -6.8267822265625, -6.61279296875, -6.3988037109375, -6.184814453125, -5.9708251953125, -5.7568359375, -5.5428466796875, -5.328857421875, -5.1148681640625, -4.90087890625, -4.6868896484375, -4.472900390625, -4.2589111328125, -4.044921875, -3.8309326171875, -3.616943359375, -3.4029541015625, -3.18896484375, -2.9749755859375, -2.760986328125, -2.5469970703125, -2.3330078125, -2.1190185546875, -1.905029296875, -1.6910400390625, -1.47705078125, -1.2630615234375, -1.049072265625, -0.8350830078125, -0.62109375, -0.4071044921875, -0.193115234375, 0.0208740234375, 0.23486328125, 0.4488525390625, 0.662841796875, 0.8768310546875, 1.0908203125, 1.3048095703125, 1.518798828125, 1.7327880859375, 1.94677734375, 2.1607666015625, 2.374755859375, 2.5887451171875, 2.802734375, 3.0167236328125, 3.230712890625, 3.4447021484375, 3.65869140625, 3.8726806640625, 4.086669921875, 4.3006591796875, 4.5146484375, 4.7286376953125, 4.942626953125, 5.1566162109375, 5.37060546875, 5.5845947265625, 5.798583984375, 6.0125732421875, 6.2265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 14.0, 11.0, 16.0, 20.0, 44.0, 40.0, 53.0, 61.0, 55.0, 85.0, 82.0, 66.0, 77.0, 70.0, 55.0, 51.0, 33.0, 36.0, 28.0, 19.0, 12.0, 9.0, 8.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.1995086669921875, -0.192840576171875, -0.1861724853515625, -0.17950439453125, -0.1728363037109375, -0.166168212890625, -0.1595001220703125, -0.15283203125, -0.1461639404296875, -0.139495849609375, -0.1328277587890625, -0.12615966796875, -0.1194915771484375, -0.112823486328125, -0.1061553955078125, -0.0994873046875, -0.0928192138671875, -0.086151123046875, -0.0794830322265625, -0.07281494140625, -0.0661468505859375, -0.059478759765625, -0.0528106689453125, -0.046142578125, -0.0394744873046875, -0.032806396484375, -0.0261383056640625, -0.01947021484375, -0.0128021240234375, -0.006134033203125, 0.0005340576171875, 0.0072021484375, 0.0138702392578125, 0.020538330078125, 0.0272064208984375, 0.03387451171875, 0.0405426025390625, 0.047210693359375, 0.0538787841796875, 0.060546875, 0.0672149658203125, 0.073883056640625, 0.0805511474609375, 0.08721923828125, 0.0938873291015625, 0.100555419921875, 0.1072235107421875, 0.1138916015625, 0.1205596923828125, 0.127227783203125, 0.1338958740234375, 0.14056396484375, 0.1472320556640625, 0.153900146484375, 0.1605682373046875, 0.167236328125, 0.1739044189453125, 0.180572509765625, 0.1872406005859375, 0.19390869140625, 0.2005767822265625, 0.207244873046875, 0.2139129638671875, 0.2205810546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 7.0, 18.0, 23.0, 23.0, 46.0, 70.0, 110.0, 186.0, 296.0, 481.0, 936.0, 2081.0, 4859.0, 12702.0, 39031.0, 190675.0, 3822993.0, 82100.0, 23121.0, 8287.0, 3173.0, 1454.0, 668.0, 370.0, 200.0, 122.0, 78.0, 57.0, 30.0, 22.0, 16.0, 8.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.25689697265625, -5.0489501953125, -4.84100341796875, -4.633056640625, -4.42510986328125, -4.2171630859375, -4.00921630859375, -3.80126953125, -3.59332275390625, -3.3853759765625, -3.17742919921875, -2.969482421875, -2.76153564453125, -2.5535888671875, -2.34564208984375, -2.1376953125, -1.92974853515625, -1.7218017578125, -1.51385498046875, -1.305908203125, -1.09796142578125, -0.8900146484375, -0.68206787109375, -0.47412109375, -0.26617431640625, -0.0582275390625, 0.14971923828125, 0.357666015625, 0.56561279296875, 0.7735595703125, 0.98150634765625, 1.189453125, 1.39739990234375, 1.6053466796875, 1.81329345703125, 2.021240234375, 2.22918701171875, 2.4371337890625, 2.64508056640625, 2.85302734375, 3.06097412109375, 3.2689208984375, 3.47686767578125, 3.684814453125, 3.89276123046875, 4.1007080078125, 4.30865478515625, 4.5166015625, 4.72454833984375, 4.9324951171875, 5.14044189453125, 5.348388671875, 5.55633544921875, 5.7642822265625, 5.97222900390625, 6.18017578125, 6.38812255859375, 6.5960693359375, 6.80401611328125, 7.011962890625, 7.21990966796875, 7.4278564453125, 7.63580322265625, 7.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 8.0, 12.0, 14.0, 9.0, 11.0, 15.0, 25.0, 20.0, 23.0, 41.0, 39.0, 71.0, 117.0, 362.0, 2575.0, 365.0, 112.0, 48.0, 36.0, 30.0, 22.0, 12.0, 16.0, 16.0, 18.0, 14.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6073455810546875, -0.589202880859375, -0.5710601806640625, -0.55291748046875, -0.5347747802734375, -0.516632080078125, -0.4984893798828125, -0.4803466796875, -0.4622039794921875, -0.444061279296875, -0.4259185791015625, -0.40777587890625, -0.3896331787109375, -0.371490478515625, -0.3533477783203125, -0.335205078125, -0.3170623779296875, -0.298919677734375, -0.2807769775390625, -0.26263427734375, -0.2444915771484375, -0.226348876953125, -0.2082061767578125, -0.1900634765625, -0.1719207763671875, -0.153778076171875, -0.1356353759765625, -0.11749267578125, -0.0993499755859375, -0.081207275390625, -0.0630645751953125, -0.044921875, -0.0267791748046875, -0.008636474609375, 0.0095062255859375, 0.02764892578125, 0.0457916259765625, 0.063934326171875, 0.0820770263671875, 0.1002197265625, 0.1183624267578125, 0.136505126953125, 0.1546478271484375, 0.17279052734375, 0.1909332275390625, 0.209075927734375, 0.2272186279296875, 0.245361328125, 0.2635040283203125, 0.281646728515625, 0.2997894287109375, 0.31793212890625, 0.3360748291015625, 0.354217529296875, 0.3723602294921875, 0.3905029296875, 0.4086456298828125, 0.426788330078125, 0.4449310302734375, 0.46307373046875, 0.4812164306640625, 0.499359130859375, 0.5175018310546875, 0.53564453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 8.0, 18.0, 16.0, 49.0, 138.0, 296.0, 259.0, 129.0, 44.0, 25.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.516450881958008, -11.248242378234863, -10.980032920837402, -10.711824417114258, -10.443615913391113, -10.175406455993652, -9.907197952270508, -9.638989448547363, -9.370779991149902, -9.102571487426758, -8.834362030029297, -8.566153526306152, -8.297945022583008, -8.029735565185547, -7.761527061462402, -7.4933180809021, -7.225109577178955, -6.956900596618652, -6.688692092895508, -6.420483112335205, -6.152274131774902, -5.884065628051758, -5.615856647491455, -5.347647666931152, -5.079439163208008, -4.811230182647705, -4.5430216789245605, -4.274812698364258, -4.006603717803955, -3.7383949756622314, -3.470186233520508, -3.201977252960205, -2.9337682723999023, -2.6655595302581787, -2.397350549697876, -2.1291418075561523, -1.8609329462051392, -1.592724084854126, -1.3245153427124023, -1.0563064813613892, -0.788097620010376, -0.5198887586593628, -0.2516799569129944, 0.016528844833374023, 0.2847377061843872, 0.5529465675354004, 0.821155309677124, 1.0893641710281372, 1.3575730323791504, 1.6257818937301636, 1.8939907550811768, 2.1621994972229004, 2.430408477783203, 2.6986172199249268, 2.9668259620666504, 3.235034942626953, 3.5032436847686768, 3.7714524269104004, 4.039661407470703, 4.307869911193848, 4.57607889175415, 4.844287872314453, 5.112496376037598, 5.3807053565979, 5.648914337158203]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 11.0, 11.0, 19.0, 25.0, 28.0, 39.0, 43.0, 63.0, 52.0, 60.0, 71.0, 61.0, 68.0, 47.0, 64.0, 50.0, 56.0, 45.0, 41.0, 33.0, 22.0, 12.0, 17.0, 10.0, 14.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6449379920959473, -2.5576741695404053, -2.4704103469848633, -2.383146286010742, -2.2958824634552, -2.208618640899658, -2.121354818344116, -2.034090995788574, -1.9468270540237427, -1.8595632314682007, -1.7722992897033691, -1.6850354671478271, -1.5977716445922852, -1.5105077028274536, -1.4232438802719116, -1.33597993850708, -1.248716115951538, -1.161452293395996, -1.0741883516311646, -0.9869245290756226, -0.8996606469154358, -0.812396764755249, -0.725132942199707, -0.6378690600395203, -0.5506051778793335, -0.46334129571914673, -0.37607744336128235, -0.28881359100341797, -0.2015497088432312, -0.11428582668304443, -0.02702200412750244, 0.060241878032684326, 0.147505521774292, 0.23476938903331757, 0.32203325629234314, 0.4092971086502075, 0.4965609908103943, 0.583824872970581, 0.671088695526123, 0.7583525776863098, 0.8456164598464966, 0.9328803420066833, 1.0201442241668701, 1.107408046722412, 1.194671869277954, 1.2819358110427856, 1.3691996335983276, 1.4564635753631592, 1.5437273979187012, 1.6309912204742432, 1.7182551622390747, 1.8055189847946167, 1.8927829265594482, 1.9800467491149902, 2.0673105716705322, 2.154574394226074, 2.2418384552001953, 2.3291022777557373, 2.4163661003112793, 2.5036301612854004, 2.5908939838409424, 2.6781578063964844, 2.7654216289520264, 2.8526854515075684, 2.9399492740631104]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 15.0, 7.0, 13.0, 34.0, 42.0, 56.0, 114.0, 176.0, 319.0, 575.0, 1241.0, 2998.0, 7751.0, 26230.0, 125581.0, 646768.0, 185584.0, 34548.0, 9985.0, 3453.0, 1515.0, 682.0, 366.0, 167.0, 113.0, 83.0, 48.0, 23.0, 27.0, 13.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.49609375, -3.38885498046875, -3.2816162109375, -3.17437744140625, -3.067138671875, -2.95989990234375, -2.8526611328125, -2.74542236328125, -2.63818359375, -2.53094482421875, -2.4237060546875, -2.31646728515625, -2.209228515625, -2.10198974609375, -1.9947509765625, -1.88751220703125, -1.7802734375, -1.67303466796875, -1.5657958984375, -1.45855712890625, -1.351318359375, -1.24407958984375, -1.1368408203125, -1.02960205078125, -0.92236328125, -0.81512451171875, -0.7078857421875, -0.60064697265625, -0.493408203125, -0.38616943359375, -0.2789306640625, -0.17169189453125, -0.064453125, 0.04278564453125, 0.1500244140625, 0.25726318359375, 0.364501953125, 0.47174072265625, 0.5789794921875, 0.68621826171875, 0.79345703125, 0.90069580078125, 1.0079345703125, 1.11517333984375, 1.222412109375, 1.32965087890625, 1.4368896484375, 1.54412841796875, 1.6513671875, 1.75860595703125, 1.8658447265625, 1.97308349609375, 2.080322265625, 2.18756103515625, 2.2947998046875, 2.40203857421875, 2.50927734375, 2.61651611328125, 2.7237548828125, 2.83099365234375, 2.938232421875, 3.04547119140625, 3.1527099609375, 3.25994873046875, 3.3671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 10.0, 24.0, 33.0, 47.0, 55.0, 70.0, 92.0, 103.0, 88.0, 112.0, 89.0, 81.0, 61.0, 36.0, 28.0, 21.0, 5.0, 9.0, 5.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24125289916992188, -0.23177337646484375, -0.22229385375976562, -0.2128143310546875, -0.20333480834960938, -0.19385528564453125, -0.18437576293945312, -0.174896240234375, -0.16541671752929688, -0.15593719482421875, -0.14645767211914062, -0.1369781494140625, -0.12749862670898438, -0.11801910400390625, -0.10853958129882812, -0.09906005859375, -0.08958053588867188, -0.08010101318359375, -0.07062149047851562, -0.0611419677734375, -0.051662445068359375, -0.04218292236328125, -0.032703399658203125, -0.023223876953125, -0.013744354248046875, -0.00426483154296875, 0.005214691162109375, 0.0146942138671875, 0.024173736572265625, 0.03365325927734375, 0.043132781982421875, 0.0526123046875, 0.062091827392578125, 0.07157135009765625, 0.08105087280273438, 0.0905303955078125, 0.10000991821289062, 0.10948944091796875, 0.11896896362304688, 0.128448486328125, 0.13792800903320312, 0.14740753173828125, 0.15688705444335938, 0.1663665771484375, 0.17584609985351562, 0.18532562255859375, 0.19480514526367188, 0.20428466796875, 0.21376419067382812, 0.22324371337890625, 0.23272323608398438, 0.2422027587890625, 0.2516822814941406, 0.26116180419921875, 0.2706413269042969, 0.280120849609375, 0.2896003723144531, 0.29907989501953125, 0.3085594177246094, 0.3180389404296875, 0.3275184631347656, 0.33699798583984375, 0.3464775085449219, 0.35595703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 9.0, 19.0, 17.0, 12.0, 33.0, 47.0, 71.0, 125.0, 163.0, 207.0, 351.0, 523.0, 888.0, 1440.0, 2411.0, 4303.0, 8193.0, 17012.0, 38966.0, 105126.0, 349828.0, 340759.0, 102413.0, 39197.0, 17430.0, 8284.0, 4418.0, 2373.0, 1494.0, 852.0, 513.0, 361.0, 238.0, 145.0, 94.0, 67.0, 39.0, 30.0, 38.0, 16.0, 6.0, 9.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4677734375, -1.42041015625, -1.373046875, -1.32568359375, -1.2783203125, -1.23095703125, -1.18359375, -1.13623046875, -1.0888671875, -1.04150390625, -0.994140625, -0.94677734375, -0.8994140625, -0.85205078125, -0.8046875, -0.75732421875, -0.7099609375, -0.66259765625, -0.615234375, -0.56787109375, -0.5205078125, -0.47314453125, -0.42578125, -0.37841796875, -0.3310546875, -0.28369140625, -0.236328125, -0.18896484375, -0.1416015625, -0.09423828125, -0.046875, 0.00048828125, 0.0478515625, 0.09521484375, 0.142578125, 0.18994140625, 0.2373046875, 0.28466796875, 0.33203125, 0.37939453125, 0.4267578125, 0.47412109375, 0.521484375, 0.56884765625, 0.6162109375, 0.66357421875, 0.7109375, 0.75830078125, 0.8056640625, 0.85302734375, 0.900390625, 0.94775390625, 0.9951171875, 1.04248046875, 1.08984375, 1.13720703125, 1.1845703125, 1.23193359375, 1.279296875, 1.32666015625, 1.3740234375, 1.42138671875, 1.46875, 1.51611328125, 1.5634765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 11.0, 13.0, 14.0, 14.0, 16.0, 36.0, 28.0, 29.0, 34.0, 29.0, 51.0, 38.0, 37.0, 54.0, 50.0, 44.0, 44.0, 51.0, 37.0, 42.0, 36.0, 41.0, 39.0, 29.0, 32.0, 20.0, 23.0, 20.0, 17.0, 17.0, 11.0, 8.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8907394409179688, -0.8639984130859375, -0.8372573852539062, -0.810516357421875, -0.7837753295898438, -0.7570343017578125, -0.7302932739257812, -0.70355224609375, -0.6768112182617188, -0.6500701904296875, -0.6233291625976562, -0.596588134765625, -0.5698471069335938, -0.5431060791015625, -0.5163650512695312, -0.4896240234375, -0.46288299560546875, -0.4361419677734375, -0.40940093994140625, -0.382659912109375, -0.35591888427734375, -0.3291778564453125, -0.30243682861328125, -0.27569580078125, -0.24895477294921875, -0.2222137451171875, -0.19547271728515625, -0.168731689453125, -0.14199066162109375, -0.1152496337890625, -0.08850860595703125, -0.061767578125, -0.03502655029296875, -0.0082855224609375, 0.01845550537109375, 0.045196533203125, 0.07193756103515625, 0.0986785888671875, 0.12541961669921875, 0.15216064453125, 0.17890167236328125, 0.2056427001953125, 0.23238372802734375, 0.259124755859375, 0.28586578369140625, 0.3126068115234375, 0.33934783935546875, 0.3660888671875, 0.39282989501953125, 0.4195709228515625, 0.44631195068359375, 0.473052978515625, 0.49979400634765625, 0.5265350341796875, 0.5532760620117188, 0.58001708984375, 0.6067581176757812, 0.6334991455078125, 0.6602401733398438, 0.686981201171875, 0.7137222290039062, 0.7404632568359375, 0.7672042846679688, 0.7939453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 4.0, 9.0, 9.0, 11.0, 19.0, 29.0, 42.0, 68.0, 90.0, 116.0, 190.0, 334.0, 509.0, 961.0, 1816.0, 3897.0, 9638.0, 30093.0, 157059.0, 680464.0, 121610.0, 25536.0, 8536.0, 3558.0, 1732.0, 831.0, 502.0, 319.0, 173.0, 136.0, 79.0, 51.0, 37.0, 22.0, 18.0, 13.0, 14.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.336639404296875, -2.25726318359375, -2.177886962890625, -2.0985107421875, -2.019134521484375, -1.93975830078125, -1.860382080078125, -1.781005859375, -1.701629638671875, -1.62225341796875, -1.542877197265625, -1.4635009765625, -1.384124755859375, -1.30474853515625, -1.225372314453125, -1.14599609375, -1.066619873046875, -0.98724365234375, -0.907867431640625, -0.8284912109375, -0.749114990234375, -0.66973876953125, -0.590362548828125, -0.510986328125, -0.431610107421875, -0.35223388671875, -0.272857666015625, -0.1934814453125, -0.114105224609375, -0.03472900390625, 0.044647216796875, 0.1240234375, 0.203399658203125, 0.28277587890625, 0.362152099609375, 0.4415283203125, 0.520904541015625, 0.60028076171875, 0.679656982421875, 0.759033203125, 0.838409423828125, 0.91778564453125, 0.997161865234375, 1.0765380859375, 1.155914306640625, 1.23529052734375, 1.314666748046875, 1.39404296875, 1.473419189453125, 1.55279541015625, 1.632171630859375, 1.7115478515625, 1.790924072265625, 1.87030029296875, 1.949676513671875, 2.029052734375, 2.108428955078125, 2.18780517578125, 2.267181396484375, 2.3465576171875, 2.425933837890625, 2.50531005859375, 2.584686279296875, 2.6640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 3.0, 6.0, 7.0, 10.0, 12.0, 13.0, 21.0, 31.0, 34.0, 45.0, 56.0, 72.0, 90.0, 106.0, 98.0, 92.0, 86.0, 45.0, 41.0, 23.0, 28.0, 17.0, 9.0, 11.0, 8.0, 8.0, 6.0, 2.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00045871734619140625, -0.0004468858242034912, -0.00043505430221557617, -0.00042322278022766113, -0.0004113912582397461, -0.00039955973625183105, -0.000387728214263916, -0.000375896692276001, -0.00036406517028808594, -0.0003522336483001709, -0.00034040212631225586, -0.0003285706043243408, -0.0003167390823364258, -0.00030490756034851074, -0.0002930760383605957, -0.00028124451637268066, -0.0002694129943847656, -0.0002575814723968506, -0.00024574995040893555, -0.0002339184284210205, -0.00022208690643310547, -0.00021025538444519043, -0.0001984238624572754, -0.00018659234046936035, -0.0001747608184814453, -0.00016292929649353027, -0.00015109777450561523, -0.0001392662525177002, -0.00012743473052978516, -0.00011560320854187012, -0.00010377168655395508, -9.194016456604004e-05, -8.0108642578125e-05, -6.827712059020996e-05, -5.644559860229492e-05, -4.461407661437988e-05, -3.2782554626464844e-05, -2.0951032638549805e-05, -9.119510650634766e-06, 2.7120113372802734e-06, 1.4543533325195312e-05, 2.637505531311035e-05, 3.820657730102539e-05, 5.003809928894043e-05, 6.186962127685547e-05, 7.370114326477051e-05, 8.553266525268555e-05, 9.736418724060059e-05, 0.00010919570922851562, 0.00012102723121643066, 0.0001328587532043457, 0.00014469027519226074, 0.00015652179718017578, 0.00016835331916809082, 0.00018018484115600586, 0.0001920163631439209, 0.00020384788513183594, 0.00021567940711975098, 0.00022751092910766602, 0.00023934245109558105, 0.0002511739730834961, 0.00026300549507141113, 0.00027483701705932617, 0.0002866685390472412, 0.00029850006103515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 4.0, 8.0, 9.0, 20.0, 25.0, 35.0, 69.0, 91.0, 179.0, 323.0, 515.0, 961.0, 2027.0, 4991.0, 14870.0, 63497.0, 610107.0, 295707.0, 37855.0, 10115.0, 3779.0, 1574.0, 736.0, 382.0, 244.0, 136.0, 100.0, 62.0, 38.0, 31.0, 15.0, 11.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.29296875, -2.207550048828125, -2.12213134765625, -2.036712646484375, -1.9512939453125, -1.865875244140625, -1.78045654296875, -1.695037841796875, -1.609619140625, -1.524200439453125, -1.43878173828125, -1.353363037109375, -1.2679443359375, -1.182525634765625, -1.09710693359375, -1.011688232421875, -0.92626953125, -0.840850830078125, -0.75543212890625, -0.670013427734375, -0.5845947265625, -0.499176025390625, -0.41375732421875, -0.328338623046875, -0.242919921875, -0.157501220703125, -0.07208251953125, 0.013336181640625, 0.0987548828125, 0.184173583984375, 0.26959228515625, 0.355010986328125, 0.4404296875, 0.525848388671875, 0.61126708984375, 0.696685791015625, 0.7821044921875, 0.867523193359375, 0.95294189453125, 1.038360595703125, 1.123779296875, 1.209197998046875, 1.29461669921875, 1.380035400390625, 1.4654541015625, 1.550872802734375, 1.63629150390625, 1.721710205078125, 1.80712890625, 1.892547607421875, 1.97796630859375, 2.063385009765625, 2.1488037109375, 2.234222412109375, 2.31964111328125, 2.405059814453125, 2.490478515625, 2.575897216796875, 2.66131591796875, 2.746734619140625, 2.8321533203125, 2.917572021484375, 3.00299072265625, 3.088409423828125, 3.173828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 7.0, 12.0, 7.0, 14.0, 30.0, 35.0, 45.0, 50.0, 71.0, 90.0, 115.0, 119.0, 113.0, 83.0, 62.0, 45.0, 34.0, 15.0, 16.0, 10.0, 4.0, 4.0, 8.0, 3.0, 0.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9453125, -0.911468505859375, -0.87762451171875, -0.843780517578125, -0.8099365234375, -0.776092529296875, -0.74224853515625, -0.708404541015625, -0.674560546875, -0.640716552734375, -0.60687255859375, -0.573028564453125, -0.5391845703125, -0.505340576171875, -0.47149658203125, -0.437652587890625, -0.40380859375, -0.369964599609375, -0.33612060546875, -0.302276611328125, -0.2684326171875, -0.234588623046875, -0.20074462890625, -0.166900634765625, -0.133056640625, -0.099212646484375, -0.06536865234375, -0.031524658203125, 0.0023193359375, 0.036163330078125, 0.07000732421875, 0.103851318359375, 0.1376953125, 0.171539306640625, 0.20538330078125, 0.239227294921875, 0.2730712890625, 0.306915283203125, 0.34075927734375, 0.374603271484375, 0.408447265625, 0.442291259765625, 0.47613525390625, 0.509979248046875, 0.5438232421875, 0.577667236328125, 0.61151123046875, 0.645355224609375, 0.67919921875, 0.713043212890625, 0.74688720703125, 0.780731201171875, 0.8145751953125, 0.848419189453125, 0.88226318359375, 0.916107177734375, 0.949951171875, 0.983795166015625, 1.01763916015625, 1.051483154296875, 1.0853271484375, 1.119171142578125, 1.15301513671875, 1.186859130859375, 1.220703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 15.0, 33.0, 56.0, 117.0, 240.0, 252.0, 129.0, 74.0, 28.0, 17.0, 7.0, 8.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.47842788696289, -13.900054931640625, -13.321681022644043, -12.743308067321777, -12.164934158325195, -11.58656120300293, -11.008188247680664, -10.429815292358398, -9.851441383361816, -9.27306842803955, -8.694694519042969, -8.116321563720703, -7.537948131561279, -6.9595746994018555, -6.38120174407959, -5.802828311920166, -5.224454879760742, -4.646081447601318, -4.0677080154418945, -3.489335060119629, -2.910961627960205, -2.3325881958007812, -1.7542150020599365, -1.1758418083190918, -0.597468376159668, -0.01909506320953369, 0.5592782497406006, 1.1376515626907349, 1.7160248756408691, 2.294398307800293, 2.8727715015411377, 3.4511446952819824, 4.029516220092773, 4.607889652252197, 5.186263084411621, 5.764636039733887, 6.3430094718933105, 6.921382904052734, 7.499755859375, 8.078128814697266, 8.656502723693848, 9.234875679016113, 9.813249588012695, 10.391622543334961, 10.969995498657227, 11.548369407653809, 12.126742362976074, 12.705116271972656, 13.283489227294922, 13.861862182617188, 14.44023609161377, 15.018609046936035, 15.596982955932617, 16.175355911254883, 16.75372886657715, 17.332101821899414, 17.910476684570312, 18.488849639892578, 19.067222595214844, 19.645597457885742, 20.223970413208008, 20.802343368530273, 21.38071632385254, 21.959089279174805, 22.53746223449707]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 9.0, 3.0, 9.0, 10.0, 12.0, 9.0, 22.0, 22.0, 35.0, 41.0, 62.0, 63.0, 67.0, 83.0, 87.0, 74.0, 71.0, 52.0, 43.0, 54.0, 34.0, 27.0, 25.0, 18.0, 16.0, 7.0, 8.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.06308364868164, -9.800085067749023, -9.53708553314209, -9.274085998535156, -9.011087417602539, -8.748088836669922, -8.485089302062988, -8.222089767456055, -7.9590911865234375, -7.696092128753662, -7.433093070983887, -7.170094013214111, -6.907094955444336, -6.6440958976745605, -6.381096839904785, -6.11809778213501, -5.855098724365234, -5.592099666595459, -5.329100608825684, -5.066101551055908, -4.803102493286133, -4.540103435516357, -4.277104377746582, -4.014105319976807, -3.7511062622070312, -3.488107204437256, -3.2251081466674805, -2.962109088897705, -2.6991100311279297, -2.4361109733581543, -2.173111915588379, -1.9101128578186035, -1.6471138000488281, -1.3841147422790527, -1.1211156845092773, -0.858116626739502, -0.5951175689697266, -0.33211851119995117, -0.06911945343017578, 0.1938796043395996, 0.456878662109375, 0.7198777198791504, 0.9828767776489258, 1.2458758354187012, 1.5088748931884766, 1.771873950958252, 2.0348730087280273, 2.2978720664978027, 2.560871124267578, 2.8238701820373535, 3.086869239807129, 3.3498682975769043, 3.6128673553466797, 3.875866413116455, 4.1388654708862305, 4.401864528656006, 4.664863586425781, 4.927862644195557, 5.190861701965332, 5.453860759735107, 5.716859817504883, 5.979858875274658, 6.242857933044434, 6.505856990814209, 6.768856048583984]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 2.0, 9.0, 8.0, 9.0, 18.0, 28.0, 52.0, 60.0, 113.0, 157.0, 303.0, 555.0, 1186.0, 2491.0, 5970.0, 16869.0, 63807.0, 3967419.0, 101231.0, 21293.0, 7295.0, 2842.0, 1224.0, 617.0, 317.0, 161.0, 80.0, 43.0, 34.0, 26.0, 21.0, 9.0, 18.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.1129150390625, -3.913330078125, -3.7137451171875, -3.51416015625, -3.3145751953125, -3.114990234375, -2.9154052734375, -2.7158203125, -2.5162353515625, -2.316650390625, -2.1170654296875, -1.91748046875, -1.7178955078125, -1.518310546875, -1.3187255859375, -1.119140625, -0.9195556640625, -0.719970703125, -0.5203857421875, -0.32080078125, -0.1212158203125, 0.078369140625, 0.2779541015625, 0.4775390625, 0.6771240234375, 0.876708984375, 1.0762939453125, 1.27587890625, 1.4754638671875, 1.675048828125, 1.8746337890625, 2.07421875, 2.2738037109375, 2.473388671875, 2.6729736328125, 2.87255859375, 3.0721435546875, 3.271728515625, 3.4713134765625, 3.6708984375, 3.8704833984375, 4.070068359375, 4.2696533203125, 4.46923828125, 4.6688232421875, 4.868408203125, 5.0679931640625, 5.267578125, 5.4671630859375, 5.666748046875, 5.8663330078125, 6.06591796875, 6.2655029296875, 6.465087890625, 6.6646728515625, 6.8642578125, 7.0638427734375, 7.263427734375, 7.4630126953125, 7.66259765625, 7.8621826171875, 8.061767578125, 8.2613525390625, 8.4609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 19.0, 36.0, 42.0, 44.0, 67.0, 84.0, 83.0, 98.0, 105.0, 95.0, 86.0, 62.0, 47.0, 38.0, 18.0, 12.0, 13.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2900390625, -0.2809181213378906, -0.27179718017578125, -0.2626762390136719, -0.2535552978515625, -0.24443435668945312, -0.23531341552734375, -0.22619247436523438, -0.217071533203125, -0.20795059204101562, -0.19882965087890625, -0.18970870971679688, -0.1805877685546875, -0.17146682739257812, -0.16234588623046875, -0.15322494506835938, -0.14410400390625, -0.13498306274414062, -0.12586212158203125, -0.11674118041992188, -0.1076202392578125, -0.09849929809570312, -0.08937835693359375, -0.08025741577148438, -0.071136474609375, -0.062015533447265625, -0.05289459228515625, -0.043773651123046875, -0.0346527099609375, -0.025531768798828125, -0.01641082763671875, -0.007289886474609375, 0.0018310546875, 0.010951995849609375, 0.02007293701171875, 0.029193878173828125, 0.0383148193359375, 0.047435760498046875, 0.05655670166015625, 0.06567764282226562, 0.074798583984375, 0.08391952514648438, 0.09304046630859375, 0.10216140747070312, 0.1112823486328125, 0.12040328979492188, 0.12952423095703125, 0.13864517211914062, 0.14776611328125, 0.15688705444335938, 0.16600799560546875, 0.17512893676757812, 0.1842498779296875, 0.19337081909179688, 0.20249176025390625, 0.21161270141601562, 0.220733642578125, 0.22985458374023438, 0.23897552490234375, 0.24809646606445312, 0.2572174072265625, 0.2663383483886719, 0.27545928955078125, 0.2845802307128906, 0.293701171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 9.0, 14.0, 20.0, 25.0, 37.0, 38.0, 55.0, 78.0, 137.0, 219.0, 287.0, 477.0, 785.0, 1426.0, 2519.0, 4535.0, 9096.0, 18761.0, 44092.0, 198914.0, 3772927.0, 81301.0, 29872.0, 13477.0, 6705.0, 3673.0, 1964.0, 1059.0, 678.0, 390.0, 221.0, 161.0, 118.0, 69.0, 45.0, 33.0, 18.0, 12.0, 12.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.13726806640625, -4.0050048828125, -3.87274169921875, -3.740478515625, -3.60821533203125, -3.4759521484375, -3.34368896484375, -3.21142578125, -3.07916259765625, -2.9468994140625, -2.81463623046875, -2.682373046875, -2.55010986328125, -2.4178466796875, -2.28558349609375, -2.1533203125, -2.02105712890625, -1.8887939453125, -1.75653076171875, -1.624267578125, -1.49200439453125, -1.3597412109375, -1.22747802734375, -1.09521484375, -0.96295166015625, -0.8306884765625, -0.69842529296875, -0.566162109375, -0.43389892578125, -0.3016357421875, -0.16937255859375, -0.037109375, 0.09515380859375, 0.2274169921875, 0.35968017578125, 0.491943359375, 0.62420654296875, 0.7564697265625, 0.88873291015625, 1.02099609375, 1.15325927734375, 1.2855224609375, 1.41778564453125, 1.550048828125, 1.68231201171875, 1.8145751953125, 1.94683837890625, 2.0791015625, 2.21136474609375, 2.3436279296875, 2.47589111328125, 2.608154296875, 2.74041748046875, 2.8726806640625, 3.00494384765625, 3.13720703125, 3.26947021484375, 3.4017333984375, 3.53399658203125, 3.666259765625, 3.79852294921875, 3.9307861328125, 4.06304931640625, 4.1953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 8.0, 8.0, 20.0, 12.0, 20.0, 17.0, 22.0, 33.0, 49.0, 140.0, 485.0, 2635.0, 304.0, 83.0, 51.0, 27.0, 26.0, 22.0, 10.0, 15.0, 8.0, 12.0, 4.0, 6.0, 2.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6435546875, -0.6242599487304688, -0.6049652099609375, -0.5856704711914062, -0.566375732421875, -0.5470809936523438, -0.5277862548828125, -0.5084915161132812, -0.48919677734375, -0.46990203857421875, -0.4506072998046875, -0.43131256103515625, -0.412017822265625, -0.39272308349609375, -0.3734283447265625, -0.35413360595703125, -0.3348388671875, -0.31554412841796875, -0.2962493896484375, -0.27695465087890625, -0.257659912109375, -0.23836517333984375, -0.2190704345703125, -0.19977569580078125, -0.18048095703125, -0.16118621826171875, -0.1418914794921875, -0.12259674072265625, -0.103302001953125, -0.08400726318359375, -0.0647125244140625, -0.04541778564453125, -0.026123046875, -0.00682830810546875, 0.0124664306640625, 0.03176116943359375, 0.051055908203125, 0.07035064697265625, 0.0896453857421875, 0.10894012451171875, 0.12823486328125, 0.14752960205078125, 0.1668243408203125, 0.18611907958984375, 0.205413818359375, 0.22470855712890625, 0.2440032958984375, 0.26329803466796875, 0.2825927734375, 0.30188751220703125, 0.3211822509765625, 0.34047698974609375, 0.359771728515625, 0.37906646728515625, 0.3983612060546875, 0.41765594482421875, 0.43695068359375, 0.45624542236328125, 0.4755401611328125, 0.49483489990234375, 0.514129638671875, 0.5334243774414062, 0.5527191162109375, 0.5720138549804688, 0.59130859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 9.0, 15.0, 37.0, 59.0, 92.0, 170.0, 220.0, 168.0, 91.0, 50.0, 23.0, 18.0, 11.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.041604042053223, -4.895073413848877, -4.7485432624816895, -4.602012634277344, -4.455482006072998, -4.308951377868652, -4.162421226501465, -4.015890598297119, -3.8693602085113525, -3.722829818725586, -3.5762991905212402, -3.4297688007354736, -3.283238410949707, -3.1367077827453613, -2.9901773929595947, -2.843647003173828, -2.6971163749694824, -2.550585985183716, -2.40405535697937, -2.2575249671936035, -2.110994338989258, -1.9644639492034912, -1.8179335594177246, -1.6714030504226685, -1.5248725414276123, -1.3783420324325562, -1.2318115234375, -1.0852811336517334, -0.9387506246566772, -0.7922201156616211, -0.6456896662712097, -0.49915921688079834, -0.3526287078857422, -0.20609822869300842, -0.05956774950027466, 0.0869627296924591, 0.23349320888519287, 0.380023717880249, 0.5265541672706604, 0.6730846166610718, 0.8196151256561279, 0.9661456346511841, 1.1126761436462402, 1.2592065334320068, 1.405737042427063, 1.5522675514221191, 1.6987979412078857, 1.845328450202942, 1.991858959197998, 2.1383893489837646, 2.2849199771881104, 2.431450366973877, 2.5779809951782227, 2.7245113849639893, 2.871041774749756, 3.0175724029541016, 3.164102792739868, 3.3106331825256348, 3.4571638107299805, 3.603694200515747, 3.7502245903015137, 3.8967552185058594, 4.043285846710205, 4.189815998077393, 4.336346626281738]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 10.0, 13.0, 10.0, 20.0, 26.0, 26.0, 40.0, 43.0, 47.0, 54.0, 79.0, 70.0, 77.0, 72.0, 75.0, 64.0, 51.0, 48.0, 53.0, 26.0, 30.0, 19.0, 13.0, 16.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1183671951293945, -3.0369200706481934, -2.955472946166992, -2.87402606010437, -2.792578935623169, -2.7111318111419678, -2.6296846866607666, -2.5482375621795654, -2.4667906761169434, -2.385343551635742, -2.303896427154541, -2.222449541091919, -2.1410024166107178, -2.0595552921295166, -1.9781081676483154, -1.8966610431671143, -1.815213918685913, -1.733766794204712, -1.6523197889328003, -1.5708726644515991, -1.4894256591796875, -1.4079785346984863, -1.3265314102172852, -1.245084285736084, -1.1636372804641724, -1.0821901559829712, -1.0007431507110596, -0.9192960262298584, -0.837848961353302, -0.7564018964767456, -0.6749547719955444, -0.593507707118988, -0.5120606422424316, -0.43061357736587524, -0.34916648268699646, -0.2677193880081177, -0.18627232313156128, -0.10482525825500488, -0.0233781635761261, 0.058068931102752686, 0.13951599597930908, 0.22096307575702667, 0.30241015553474426, 0.38385725021362305, 0.46530431509017944, 0.5467513799667358, 0.628198504447937, 0.7096455693244934, 0.7910926342010498, 0.8725396990776062, 0.9539867639541626, 1.0354338884353638, 1.1168808937072754, 1.1983280181884766, 1.2797751426696777, 1.361222267150879, 1.4426692724227905, 1.5241163969039917, 1.6055634021759033, 1.6870105266571045, 1.7684576511383057, 1.8499046564102173, 1.9313517808914185, 2.01279878616333, 2.0942459106445312]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 9.0, 22.0, 17.0, 41.0, 61.0, 99.0, 150.0, 307.0, 560.0, 1114.0, 2448.0, 5655.0, 15538.0, 51926.0, 248802.0, 554176.0, 120170.0, 29964.0, 10124.0, 3920.0, 1654.0, 815.0, 398.0, 221.0, 123.0, 77.0, 50.0, 30.0, 28.0, 10.0, 3.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.527862548828125, -3.41510009765625, -3.302337646484375, -3.1895751953125, -3.076812744140625, -2.96405029296875, -2.851287841796875, -2.738525390625, -2.625762939453125, -2.51300048828125, -2.400238037109375, -2.2874755859375, -2.174713134765625, -2.06195068359375, -1.949188232421875, -1.83642578125, -1.723663330078125, -1.61090087890625, -1.498138427734375, -1.3853759765625, -1.272613525390625, -1.15985107421875, -1.047088623046875, -0.934326171875, -0.821563720703125, -0.70880126953125, -0.596038818359375, -0.4832763671875, -0.370513916015625, -0.25775146484375, -0.144989013671875, -0.0322265625, 0.080535888671875, 0.19329833984375, 0.306060791015625, 0.4188232421875, 0.531585693359375, 0.64434814453125, 0.757110595703125, 0.869873046875, 0.982635498046875, 1.09539794921875, 1.208160400390625, 1.3209228515625, 1.433685302734375, 1.54644775390625, 1.659210205078125, 1.77197265625, 1.884735107421875, 1.99749755859375, 2.110260009765625, 2.2230224609375, 2.335784912109375, 2.44854736328125, 2.561309814453125, 2.674072265625, 2.786834716796875, 2.89959716796875, 3.012359619140625, 3.1251220703125, 3.237884521484375, 3.35064697265625, 3.463409423828125, 3.576171875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 8.0, 15.0, 23.0, 33.0, 39.0, 57.0, 53.0, 61.0, 69.0, 80.0, 75.0, 93.0, 76.0, 76.0, 55.0, 53.0, 30.0, 29.0, 17.0, 9.0, 9.0, 8.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296630859375, -0.28887939453125, -0.2811279296875, -0.27337646484375, -0.265625, -0.25787353515625, -0.2501220703125, -0.24237060546875, -0.234619140625, -0.22686767578125, -0.2191162109375, -0.21136474609375, -0.20361328125, -0.19586181640625, -0.1881103515625, -0.18035888671875, -0.172607421875, -0.16485595703125, -0.1571044921875, -0.14935302734375, -0.1416015625, -0.13385009765625, -0.1260986328125, -0.11834716796875, -0.110595703125, -0.10284423828125, -0.0950927734375, -0.08734130859375, -0.07958984375, -0.07183837890625, -0.0640869140625, -0.05633544921875, -0.048583984375, -0.04083251953125, -0.0330810546875, -0.02532958984375, -0.017578125, -0.00982666015625, -0.0020751953125, 0.00567626953125, 0.013427734375, 0.02117919921875, 0.0289306640625, 0.03668212890625, 0.04443359375, 0.05218505859375, 0.0599365234375, 0.06768798828125, 0.075439453125, 0.08319091796875, 0.0909423828125, 0.09869384765625, 0.1064453125, 0.11419677734375, 0.1219482421875, 0.12969970703125, 0.137451171875, 0.14520263671875, 0.1529541015625, 0.16070556640625, 0.16845703125, 0.17620849609375, 0.1839599609375, 0.19171142578125, 0.199462890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 9.0, 3.0, 6.0, 14.0, 16.0, 14.0, 26.0, 34.0, 55.0, 84.0, 104.0, 191.0, 263.0, 420.0, 636.0, 1247.0, 2171.0, 4452.0, 9924.0, 23629.0, 65545.0, 223958.0, 467631.0, 162729.0, 50380.0, 18975.0, 7918.0, 3602.0, 1832.0, 1023.0, 588.0, 370.0, 231.0, 153.0, 109.0, 71.0, 56.0, 26.0, 22.0, 17.0, 11.0, 2.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.350860595703125, -2.27593994140625, -2.201019287109375, -2.1260986328125, -2.051177978515625, -1.97625732421875, -1.901336669921875, -1.826416015625, -1.751495361328125, -1.67657470703125, -1.601654052734375, -1.5267333984375, -1.451812744140625, -1.37689208984375, -1.301971435546875, -1.22705078125, -1.152130126953125, -1.07720947265625, -1.002288818359375, -0.9273681640625, -0.852447509765625, -0.77752685546875, -0.702606201171875, -0.627685546875, -0.552764892578125, -0.47784423828125, -0.402923583984375, -0.3280029296875, -0.253082275390625, -0.17816162109375, -0.103240966796875, -0.0283203125, 0.046600341796875, 0.12152099609375, 0.196441650390625, 0.2713623046875, 0.346282958984375, 0.42120361328125, 0.496124267578125, 0.571044921875, 0.645965576171875, 0.72088623046875, 0.795806884765625, 0.8707275390625, 0.945648193359375, 1.02056884765625, 1.095489501953125, 1.17041015625, 1.245330810546875, 1.32025146484375, 1.395172119140625, 1.4700927734375, 1.545013427734375, 1.61993408203125, 1.694854736328125, 1.769775390625, 1.844696044921875, 1.91961669921875, 1.994537353515625, 2.0694580078125, 2.144378662109375, 2.21929931640625, 2.294219970703125, 2.369140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 5.0, 10.0, 12.0, 16.0, 20.0, 27.0, 26.0, 31.0, 32.0, 48.0, 42.0, 43.0, 48.0, 45.0, 43.0, 52.0, 43.0, 43.0, 49.0, 50.0, 35.0, 33.0, 40.0, 29.0, 22.0, 27.0, 23.0, 15.0, 5.0, 15.0, 11.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92236328125, -0.8897933959960938, -0.8572235107421875, -0.8246536254882812, -0.792083740234375, -0.7595138549804688, -0.7269439697265625, -0.6943740844726562, -0.66180419921875, -0.6292343139648438, -0.5966644287109375, -0.5640945434570312, -0.531524658203125, -0.49895477294921875, -0.4663848876953125, -0.43381500244140625, -0.4012451171875, -0.36867523193359375, -0.3361053466796875, -0.30353546142578125, -0.270965576171875, -0.23839569091796875, -0.2058258056640625, -0.17325592041015625, -0.14068603515625, -0.10811614990234375, -0.0755462646484375, -0.04297637939453125, -0.010406494140625, 0.02216339111328125, 0.0547332763671875, 0.08730316162109375, 0.119873046875, 0.15244293212890625, 0.1850128173828125, 0.21758270263671875, 0.250152587890625, 0.28272247314453125, 0.3152923583984375, 0.34786224365234375, 0.38043212890625, 0.41300201416015625, 0.4455718994140625, 0.47814178466796875, 0.510711669921875, 0.5432815551757812, 0.5758514404296875, 0.6084213256835938, 0.6409912109375, 0.6735610961914062, 0.7061309814453125, 0.7387008666992188, 0.771270751953125, 0.8038406372070312, 0.8364105224609375, 0.8689804077148438, 0.90155029296875, 0.9341201782226562, 0.9666900634765625, 0.9992599487304688, 1.031829833984375, 1.0643997192382812, 1.0969696044921875, 1.1295394897460938, 1.162109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 5.0, 7.0, 4.0, 2.0, 8.0, 4.0, 11.0, 16.0, 11.0, 31.0, 34.0, 18.0, 54.0, 84.0, 131.0, 291.0, 527.0, 1076.0, 2669.0, 7872.0, 32956.0, 335976.0, 602949.0, 47668.0, 10137.0, 3258.0, 1362.0, 644.0, 304.0, 154.0, 101.0, 51.0, 37.0, 27.0, 14.0, 16.0, 10.0, 6.0, 10.0, 3.0, 5.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.310546875, -2.218505859375, -2.12646484375, -2.034423828125, -1.9423828125, -1.850341796875, -1.75830078125, -1.666259765625, -1.57421875, -1.482177734375, -1.39013671875, -1.298095703125, -1.2060546875, -1.114013671875, -1.02197265625, -0.929931640625, -0.837890625, -0.745849609375, -0.65380859375, -0.561767578125, -0.4697265625, -0.377685546875, -0.28564453125, -0.193603515625, -0.1015625, -0.009521484375, 0.08251953125, 0.174560546875, 0.2666015625, 0.358642578125, 0.45068359375, 0.542724609375, 0.634765625, 0.726806640625, 0.81884765625, 0.910888671875, 1.0029296875, 1.094970703125, 1.18701171875, 1.279052734375, 1.37109375, 1.463134765625, 1.55517578125, 1.647216796875, 1.7392578125, 1.831298828125, 1.92333984375, 2.015380859375, 2.107421875, 2.199462890625, 2.29150390625, 2.383544921875, 2.4755859375, 2.567626953125, 2.65966796875, 2.751708984375, 2.84375, 2.935791015625, 3.02783203125, 3.119873046875, 3.2119140625, 3.303955078125, 3.39599609375, 3.488037109375, 3.580078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 10.0, 9.0, 16.0, 14.0, 34.0, 47.0, 52.0, 60.0, 81.0, 87.0, 114.0, 101.0, 84.0, 65.0, 58.0, 25.0, 33.0, 29.0, 14.0, 13.0, 16.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00035071372985839844, -0.0003422833979129791, -0.0003338530659675598, -0.0003254227340221405, -0.0003169924020767212, -0.0003085620701313019, -0.00030013173818588257, -0.00029170140624046326, -0.00028327107429504395, -0.00027484074234962463, -0.0002664104104042053, -0.000257980078458786, -0.0002495497465133667, -0.0002411194145679474, -0.00023268908262252808, -0.00022425875067710876, -0.00021582841873168945, -0.00020739808678627014, -0.00019896775484085083, -0.00019053742289543152, -0.0001821070909500122, -0.0001736767590045929, -0.00016524642705917358, -0.00015681609511375427, -0.00014838576316833496, -0.00013995543122291565, -0.00013152509927749634, -0.00012309476733207703, -0.00011466443538665771, -0.0001062341034412384, -9.780377149581909e-05, -8.937343955039978e-05, -8.094310760498047e-05, -7.251277565956116e-05, -6.408244371414185e-05, -5.5652111768722534e-05, -4.722177982330322e-05, -3.879144787788391e-05, -3.03611159324646e-05, -2.1930783987045288e-05, -1.3500452041625977e-05, -5.070120096206665e-06, 3.3602118492126465e-06, 1.1790543794631958e-05, 2.022087574005127e-05, 2.865120768547058e-05, 3.708153963088989e-05, 4.5511871576309204e-05, 5.3942203521728516e-05, 6.237253546714783e-05, 7.080286741256714e-05, 7.923319935798645e-05, 8.766353130340576e-05, 9.609386324882507e-05, 0.00010452419519424438, 0.0001129545271396637, 0.00012138485908508301, 0.00012981519103050232, 0.00013824552297592163, 0.00014667585492134094, 0.00015510618686676025, 0.00016353651881217957, 0.00017196685075759888, 0.0001803971827030182, 0.0001888275146484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 12.0, 17.0, 27.0, 38.0, 42.0, 53.0, 84.0, 88.0, 166.0, 234.0, 367.0, 511.0, 922.0, 1623.0, 3132.0, 6379.0, 15015.0, 42035.0, 157762.0, 586104.0, 161742.0, 43024.0, 15304.0, 6534.0, 3102.0, 1611.0, 958.0, 537.0, 339.0, 228.0, 143.0, 97.0, 73.0, 54.0, 39.0, 32.0, 19.0, 28.0, 16.0, 8.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7021484375, -1.64813232421875, -1.5941162109375, -1.54010009765625, -1.486083984375, -1.43206787109375, -1.3780517578125, -1.32403564453125, -1.27001953125, -1.21600341796875, -1.1619873046875, -1.10797119140625, -1.053955078125, -0.99993896484375, -0.9459228515625, -0.89190673828125, -0.837890625, -0.78387451171875, -0.7298583984375, -0.67584228515625, -0.621826171875, -0.56781005859375, -0.5137939453125, -0.45977783203125, -0.40576171875, -0.35174560546875, -0.2977294921875, -0.24371337890625, -0.189697265625, -0.13568115234375, -0.0816650390625, -0.02764892578125, 0.0263671875, 0.08038330078125, 0.1343994140625, 0.18841552734375, 0.242431640625, 0.29644775390625, 0.3504638671875, 0.40447998046875, 0.45849609375, 0.51251220703125, 0.5665283203125, 0.62054443359375, 0.674560546875, 0.72857666015625, 0.7825927734375, 0.83660888671875, 0.890625, 0.94464111328125, 0.9986572265625, 1.05267333984375, 1.106689453125, 1.16070556640625, 1.2147216796875, 1.26873779296875, 1.32275390625, 1.37677001953125, 1.4307861328125, 1.48480224609375, 1.538818359375, 1.59283447265625, 1.6468505859375, 1.70086669921875, 1.7548828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 11.0, 13.0, 21.0, 28.0, 40.0, 29.0, 32.0, 56.0, 64.0, 80.0, 97.0, 75.0, 83.0, 76.0, 45.0, 47.0, 39.0, 29.0, 19.0, 19.0, 16.0, 6.0, 11.0, 9.0, 7.0, 5.0, 5.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7958984375, -0.7705612182617188, -0.7452239990234375, -0.7198867797851562, -0.694549560546875, -0.6692123413085938, -0.6438751220703125, -0.6185379028320312, -0.59320068359375, -0.5678634643554688, -0.5425262451171875, -0.5171890258789062, -0.491851806640625, -0.46651458740234375, -0.4411773681640625, -0.41584014892578125, -0.3905029296875, -0.36516571044921875, -0.3398284912109375, -0.31449127197265625, -0.289154052734375, -0.26381683349609375, -0.2384796142578125, -0.21314239501953125, -0.18780517578125, -0.16246795654296875, -0.1371307373046875, -0.11179351806640625, -0.086456298828125, -0.06111907958984375, -0.0357818603515625, -0.01044464111328125, 0.014892578125, 0.04022979736328125, 0.0655670166015625, 0.09090423583984375, 0.116241455078125, 0.14157867431640625, 0.1669158935546875, 0.19225311279296875, 0.21759033203125, 0.24292755126953125, 0.2682647705078125, 0.29360198974609375, 0.318939208984375, 0.34427642822265625, 0.3696136474609375, 0.39495086669921875, 0.4202880859375, 0.44562530517578125, 0.4709625244140625, 0.49629974365234375, 0.521636962890625, 0.5469741821289062, 0.5723114013671875, 0.5976486206054688, 0.62298583984375, 0.6483230590820312, 0.6736602783203125, 0.6989974975585938, 0.724334716796875, 0.7496719360351562, 0.7750091552734375, 0.8003463745117188, 0.82568359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 17.0, 22.0, 28.0, 55.0, 106.0, 169.0, 220.0, 165.0, 97.0, 37.0, 29.0, 18.0, 12.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.644939422607422, -21.984752655029297, -21.324565887451172, -20.664377212524414, -20.00419044494629, -19.344003677368164, -18.68381690979004, -18.023630142211914, -17.363441467285156, -16.70325469970703, -16.043067932128906, -15.382880210876465, -14.722692489624023, -14.062505722045898, -13.402318954467773, -12.742132186889648, -12.081945419311523, -11.421758651733398, -10.761570930480957, -10.101384162902832, -9.44119644165039, -8.781009674072266, -8.12082290649414, -7.460635662078857, -6.800448417663574, -6.140261173248291, -5.480073928833008, -4.819887161254883, -4.1596999168396, -3.4995126724243164, -2.8393256664276123, -2.179138660430908, -1.5189533233642578, -0.8587661981582642, -0.1985790729522705, 0.46160805225372314, 1.1217951774597168, 1.781982421875, 2.442169427871704, 3.102356433868408, 3.7625436782836914, 4.422730922698975, 5.082918167114258, 5.743104934692383, 6.403292179107666, 7.063479423522949, 7.723666191101074, 8.383853912353516, 9.04404067993164, 9.704227447509766, 10.364415168762207, 11.024601936340332, 11.684789657592773, 12.344976425170898, 13.005163192749023, 13.665349960327148, 14.32553768157959, 14.985724449157715, 15.645912170410156, 16.30609893798828, 16.966285705566406, 17.62647247314453, 18.28666114807129, 18.946847915649414, 19.60703468322754]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 14.0, 21.0, 26.0, 23.0, 33.0, 43.0, 45.0, 55.0, 65.0, 48.0, 63.0, 60.0, 54.0, 59.0, 77.0, 55.0, 48.0, 35.0, 42.0, 25.0, 26.0, 17.0, 8.0, 8.0, 15.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.728199005126953, -7.396625995635986, -7.0650529861450195, -6.7334794998168945, -6.401906490325928, -6.070333480834961, -5.738759994506836, -5.407186985015869, -5.075613975524902, -4.7440409660339355, -4.412467956542969, -4.080894470214844, -3.749321460723877, -3.41774845123291, -3.0861752033233643, -2.7546019554138184, -2.4230289459228516, -2.0914559364318848, -1.7598826885223389, -1.4283095598220825, -1.0967364311218262, -0.7651633024215698, -0.4335901737213135, -0.10201692581176758, 0.22955608367919922, 0.5611292123794556, 0.8927023410797119, 1.2242754697799683, 1.5558485984802246, 1.887421727180481, 2.2189948558807373, 2.550568103790283, 2.88214111328125, 3.213714122772217, 3.5452873706817627, 3.8768606185913086, 4.208433628082275, 4.540006637573242, 4.871580123901367, 5.203153133392334, 5.534726142883301, 5.866299152374268, 6.197872161865234, 6.529445648193359, 6.861018657684326, 7.192591667175293, 7.524165153503418, 7.855738162994385, 8.187311172485352, 8.518884658813477, 8.850457191467285, 9.18203067779541, 9.513603210449219, 9.845176696777344, 10.176750183105469, 10.508323669433594, 10.839896202087402, 11.171469688415527, 11.503042221069336, 11.834615707397461, 12.166189193725586, 12.497761726379395, 12.82933521270752, 13.160907745361328, 13.492481231689453]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 10.0, 6.0, 17.0, 24.0, 41.0, 73.0, 116.0, 197.0, 575.0, 2545.0, 23802.0, 4114681.0, 47723.0, 3288.0, 683.0, 210.0, 127.0, 44.0, 34.0, 26.0, 18.0, 10.0, 6.0, 4.0, 4.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.384521484375, -13.95654296875, -13.528564453125, -13.1005859375, -12.672607421875, -12.24462890625, -11.816650390625, -11.388671875, -10.960693359375, -10.53271484375, -10.104736328125, -9.6767578125, -9.248779296875, -8.82080078125, -8.392822265625, -7.96484375, -7.536865234375, -7.10888671875, -6.680908203125, -6.2529296875, -5.824951171875, -5.39697265625, -4.968994140625, -4.541015625, -4.113037109375, -3.68505859375, -3.257080078125, -2.8291015625, -2.401123046875, -1.97314453125, -1.545166015625, -1.1171875, -0.689208984375, -0.26123046875, 0.166748046875, 0.5947265625, 1.022705078125, 1.45068359375, 1.878662109375, 2.306640625, 2.734619140625, 3.16259765625, 3.590576171875, 4.0185546875, 4.446533203125, 4.87451171875, 5.302490234375, 5.73046875, 6.158447265625, 6.58642578125, 7.014404296875, 7.4423828125, 7.870361328125, 8.29833984375, 8.726318359375, 9.154296875, 9.582275390625, 10.01025390625, 10.438232421875, 10.8662109375, 11.294189453125, 11.72216796875, 12.150146484375, 12.578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 15.0, 25.0, 33.0, 45.0, 49.0, 57.0, 69.0, 72.0, 78.0, 92.0, 77.0, 78.0, 81.0, 56.0, 36.0, 30.0, 22.0, 25.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.32115936279296875, -0.3117523193359375, -0.30234527587890625, -0.292938232421875, -0.28353118896484375, -0.2741241455078125, -0.26471710205078125, -0.25531005859375, -0.24590301513671875, -0.2364959716796875, -0.22708892822265625, -0.217681884765625, -0.20827484130859375, -0.1988677978515625, -0.18946075439453125, -0.1800537109375, -0.17064666748046875, -0.1612396240234375, -0.15183258056640625, -0.142425537109375, -0.13301849365234375, -0.1236114501953125, -0.11420440673828125, -0.10479736328125, -0.09539031982421875, -0.0859832763671875, -0.07657623291015625, -0.067169189453125, -0.05776214599609375, -0.0483551025390625, -0.03894805908203125, -0.029541015625, -0.02013397216796875, -0.0107269287109375, -0.00131988525390625, 0.008087158203125, 0.01749420166015625, 0.0269012451171875, 0.03630828857421875, 0.04571533203125, 0.05512237548828125, 0.0645294189453125, 0.07393646240234375, 0.083343505859375, 0.09275054931640625, 0.1021575927734375, 0.11156463623046875, 0.1209716796875, 0.13037872314453125, 0.1397857666015625, 0.14919281005859375, 0.158599853515625, 0.16800689697265625, 0.1774139404296875, 0.18682098388671875, 0.19622802734375, 0.20563507080078125, 0.2150421142578125, 0.22444915771484375, 0.233856201171875, 0.24326324462890625, 0.2526702880859375, 0.26207733154296875, 0.271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 7.0, 8.0, 15.0, 23.0, 40.0, 49.0, 61.0, 85.0, 132.0, 180.0, 330.0, 563.0, 1044.0, 2010.0, 4151.0, 9121.0, 20918.0, 58030.0, 2592529.0, 1409893.0, 57334.0, 20546.0, 8695.0, 4063.0, 1990.0, 1029.0, 566.0, 304.0, 191.0, 123.0, 75.0, 48.0, 25.0, 28.0, 14.0, 14.0, 6.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.9375, -4.800323486328125, -4.66314697265625, -4.525970458984375, -4.3887939453125, -4.251617431640625, -4.11444091796875, -3.977264404296875, -3.840087890625, -3.702911376953125, -3.56573486328125, -3.428558349609375, -3.2913818359375, -3.154205322265625, -3.01702880859375, -2.879852294921875, -2.74267578125, -2.605499267578125, -2.46832275390625, -2.331146240234375, -2.1939697265625, -2.056793212890625, -1.91961669921875, -1.782440185546875, -1.645263671875, -1.508087158203125, -1.37091064453125, -1.233734130859375, -1.0965576171875, -0.959381103515625, -0.82220458984375, -0.685028076171875, -0.5478515625, -0.410675048828125, -0.27349853515625, -0.136322021484375, 0.0008544921875, 0.138031005859375, 0.27520751953125, 0.412384033203125, 0.549560546875, 0.686737060546875, 0.82391357421875, 0.961090087890625, 1.0982666015625, 1.235443115234375, 1.37261962890625, 1.509796142578125, 1.64697265625, 1.784149169921875, 1.92132568359375, 2.058502197265625, 2.1956787109375, 2.332855224609375, 2.47003173828125, 2.607208251953125, 2.744384765625, 2.881561279296875, 3.01873779296875, 3.155914306640625, 3.2930908203125, 3.430267333984375, 3.56744384765625, 3.704620361328125, 3.841796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 7.0, 11.0, 16.0, 35.0, 36.0, 49.0, 105.0, 469.0, 2891.0, 195.0, 72.0, 40.0, 24.0, 24.0, 16.0, 17.0, 6.0, 11.0, 7.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26171875, -1.2318649291992188, -1.2020111083984375, -1.1721572875976562, -1.142303466796875, -1.1124496459960938, -1.0825958251953125, -1.0527420043945312, -1.02288818359375, -0.9930343627929688, -0.9631805419921875, -0.9333267211914062, -0.903472900390625, -0.8736190795898438, -0.8437652587890625, -0.8139114379882812, -0.7840576171875, -0.7542037963867188, -0.7243499755859375, -0.6944961547851562, -0.664642333984375, -0.6347885131835938, -0.6049346923828125, -0.5750808715820312, -0.54522705078125, -0.5153732299804688, -0.4855194091796875, -0.45566558837890625, -0.425811767578125, -0.39595794677734375, -0.3661041259765625, -0.33625030517578125, -0.306396484375, -0.27654266357421875, -0.2466888427734375, -0.21683502197265625, -0.186981201171875, -0.15712738037109375, -0.1272735595703125, -0.09741973876953125, -0.06756591796875, -0.03771209716796875, -0.0078582763671875, 0.02199554443359375, 0.051849365234375, 0.08170318603515625, 0.1115570068359375, 0.14141082763671875, 0.1712646484375, 0.20111846923828125, 0.2309722900390625, 0.26082611083984375, 0.290679931640625, 0.32053375244140625, 0.3503875732421875, 0.38024139404296875, 0.41009521484375, 0.43994903564453125, 0.4698028564453125, 0.49965667724609375, 0.529510498046875, 0.5593643188476562, 0.5892181396484375, 0.6190719604492188, 0.64892578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 11.0, 9.0, 17.0, 34.0, 57.0, 65.0, 126.0, 157.0, 201.0, 118.0, 67.0, 41.0, 34.0, 25.0, 9.0, 8.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.483750343322754, -4.317582607269287, -4.151414394378662, -3.9852466583251953, -3.8190789222717285, -3.6529109477996826, -3.4867429733276367, -3.32057523727417, -3.154407262802124, -2.988239288330078, -2.8220715522766113, -2.6559035778045654, -2.4897356033325195, -2.3235678672790527, -2.157399892807007, -1.9912320375442505, -1.8250641822814941, -1.6588963270187378, -1.4927284717559814, -1.3265604972839355, -1.1603926420211792, -0.9942247867584229, -0.8280568718910217, -0.6618889570236206, -0.49572110176086426, -0.3295532166957855, -0.1633853316307068, 0.0027825534343719482, 0.16895043849945068, 0.33511829376220703, 0.5012862086296082, 0.6674541234970093, 0.8336219787597656, 0.999789834022522, 1.1659576892852783, 1.3321256637573242, 1.4982935190200806, 1.664461374282837, 1.8306293487548828, 1.9967972040176392, 2.1629650592803955, 2.3291330337524414, 2.495300769805908, 2.661468744277954, 2.82763671875, 2.993804454803467, 3.1599724292755127, 3.3261404037475586, 3.4923081398010254, 3.6584761142730713, 3.824643850326538, 3.990811824798584, 4.156979560852051, 4.323147773742676, 4.489315509796143, 4.655483245849609, 4.821651458740234, 4.987819194793701, 5.153987407684326, 5.320155143737793, 5.48632287979126, 5.652490615844727, 5.818658828735352, 5.984826564788818, 6.150994300842285]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 8.0, 2.0, 6.0, 6.0, 4.0, 10.0, 11.0, 17.0, 22.0, 19.0, 22.0, 22.0, 26.0, 26.0, 31.0, 30.0, 40.0, 23.0, 31.0, 34.0, 23.0, 31.0, 22.0, 37.0, 35.0, 39.0, 31.0, 34.0, 29.0, 37.0, 33.0, 25.0, 30.0, 21.0, 31.0, 19.0, 16.0, 12.0, 21.0, 18.0, 7.0, 7.0, 11.0, 10.0, 6.0, 10.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.7520215511322021, -1.6974339485168457, -1.6428463459014893, -1.5882586240768433, -1.5336710214614868, -1.4790834188461304, -1.4244956970214844, -1.369908094406128, -1.3153204917907715, -1.260732889175415, -1.2061452865600586, -1.1515575647354126, -1.0969699621200562, -1.0423823595046997, -0.9877946972846985, -0.9332070350646973, -0.8786194324493408, -0.8240318298339844, -0.7694441676139832, -0.7148565053939819, -0.6602689027786255, -0.605681300163269, -0.5510936379432678, -0.496506005525589, -0.44191837310791016, -0.3873307406902313, -0.3327431082725525, -0.27815547585487366, -0.22356784343719482, -0.168980211019516, -0.11439257860183716, -0.059804946184158325, -0.005217194557189941, 0.04937043786048889, 0.10395807027816772, 0.15854570269584656, 0.2131333351135254, 0.2677209675312042, 0.32230859994888306, 0.3768962323665619, 0.4314838647842407, 0.48607149720191956, 0.5406591296195984, 0.5952467918395996, 0.649834394454956, 0.7044219970703125, 0.7590096592903137, 0.8135973215103149, 0.8681849241256714, 0.9227725267410278, 0.977360188961029, 1.0319478511810303, 1.0865354537963867, 1.1411230564117432, 1.1957106590270996, 1.2502983808517456, 1.304885983467102, 1.3594735860824585, 1.4140613079071045, 1.468648910522461, 1.5232365131378174, 1.5778241157531738, 1.6324117183685303, 1.6869994401931763, 1.7415870428085327]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 8.0, 14.0, 11.0, 11.0, 20.0, 28.0, 45.0, 91.0, 119.0, 139.0, 222.0, 345.0, 575.0, 973.0, 1841.0, 3592.0, 7515.0, 17608.0, 47954.0, 153032.0, 449882.0, 245805.0, 73246.0, 25493.0, 10001.0, 4506.0, 2305.0, 1231.0, 730.0, 395.0, 275.0, 170.0, 103.0, 67.0, 46.0, 39.0, 28.0, 16.0, 11.0, 8.0, 11.0, 5.0, 3.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.291015625, -2.211151123046875, -2.13128662109375, -2.051422119140625, -1.9715576171875, -1.891693115234375, -1.81182861328125, -1.731964111328125, -1.652099609375, -1.572235107421875, -1.49237060546875, -1.412506103515625, -1.3326416015625, -1.252777099609375, -1.17291259765625, -1.093048095703125, -1.01318359375, -0.933319091796875, -0.85345458984375, -0.773590087890625, -0.6937255859375, -0.613861083984375, -0.53399658203125, -0.454132080078125, -0.374267578125, -0.294403076171875, -0.21453857421875, -0.134674072265625, -0.0548095703125, 0.025054931640625, 0.10491943359375, 0.184783935546875, 0.2646484375, 0.344512939453125, 0.42437744140625, 0.504241943359375, 0.5841064453125, 0.663970947265625, 0.74383544921875, 0.823699951171875, 0.903564453125, 0.983428955078125, 1.06329345703125, 1.143157958984375, 1.2230224609375, 1.302886962890625, 1.38275146484375, 1.462615966796875, 1.54248046875, 1.622344970703125, 1.70220947265625, 1.782073974609375, 1.8619384765625, 1.941802978515625, 2.02166748046875, 2.101531982421875, 2.181396484375, 2.261260986328125, 2.34112548828125, 2.420989990234375, 2.5008544921875, 2.580718994140625, 2.66058349609375, 2.740447998046875, 2.8203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 13.0, 17.0, 30.0, 35.0, 46.0, 57.0, 60.0, 79.0, 93.0, 72.0, 95.0, 77.0, 70.0, 66.0, 48.0, 40.0, 29.0, 22.0, 11.0, 9.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.34259796142578125, -0.3324127197265625, -0.32222747802734375, -0.312042236328125, -0.30185699462890625, -0.2916717529296875, -0.28148651123046875, -0.27130126953125, -0.26111602783203125, -0.2509307861328125, -0.24074554443359375, -0.230560302734375, -0.22037506103515625, -0.2101898193359375, -0.20000457763671875, -0.1898193359375, -0.17963409423828125, -0.1694488525390625, -0.15926361083984375, -0.149078369140625, -0.13889312744140625, -0.1287078857421875, -0.11852264404296875, -0.10833740234375, -0.09815216064453125, -0.0879669189453125, -0.07778167724609375, -0.067596435546875, -0.05741119384765625, -0.0472259521484375, -0.03704071044921875, -0.02685546875, -0.01667022705078125, -0.0064849853515625, 0.00370025634765625, 0.013885498046875, 0.02407073974609375, 0.0342559814453125, 0.04444122314453125, 0.05462646484375, 0.06481170654296875, 0.0749969482421875, 0.08518218994140625, 0.095367431640625, 0.10555267333984375, 0.1157379150390625, 0.12592315673828125, 0.1361083984375, 0.14629364013671875, 0.1564788818359375, 0.16666412353515625, 0.176849365234375, 0.18703460693359375, 0.1972198486328125, 0.20740509033203125, 0.21759033203125, 0.22777557373046875, 0.2379608154296875, 0.24814605712890625, 0.258331298828125, 0.26851654052734375, 0.2787017822265625, 0.28888702392578125, 0.299072265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 17.0, 19.0, 22.0, 23.0, 31.0, 42.0, 56.0, 69.0, 90.0, 148.0, 211.0, 317.0, 434.0, 691.0, 1171.0, 1969.0, 3645.0, 7260.0, 15425.0, 35353.0, 89824.0, 273039.0, 389053.0, 136141.0, 50989.0, 21215.0, 9784.0, 4931.0, 2587.0, 1445.0, 837.0, 545.0, 354.0, 244.0, 146.0, 107.0, 102.0, 45.0, 51.0, 37.0, 28.0, 15.0, 15.0, 9.0, 3.0, 5.0, 2.0, 7.0, 3.0, 1.0, 0.0, 3.0], "bins": [-2.1953125, -2.1311187744140625, -2.066925048828125, -2.0027313232421875, -1.93853759765625, -1.8743438720703125, -1.810150146484375, -1.7459564208984375, -1.6817626953125, -1.6175689697265625, -1.553375244140625, -1.4891815185546875, -1.42498779296875, -1.3607940673828125, -1.296600341796875, -1.2324066162109375, -1.168212890625, -1.1040191650390625, -1.039825439453125, -0.9756317138671875, -0.91143798828125, -0.8472442626953125, -0.783050537109375, -0.7188568115234375, -0.6546630859375, -0.5904693603515625, -0.526275634765625, -0.4620819091796875, -0.39788818359375, -0.3336944580078125, -0.269500732421875, -0.2053070068359375, -0.14111328125, -0.0769195556640625, -0.012725830078125, 0.0514678955078125, 0.11566162109375, 0.1798553466796875, 0.244049072265625, 0.3082427978515625, 0.3724365234375, 0.4366302490234375, 0.500823974609375, 0.5650177001953125, 0.62921142578125, 0.6934051513671875, 0.757598876953125, 0.8217926025390625, 0.885986328125, 0.9501800537109375, 1.014373779296875, 1.0785675048828125, 1.14276123046875, 1.2069549560546875, 1.271148681640625, 1.3353424072265625, 1.3995361328125, 1.4637298583984375, 1.527923583984375, 1.5921173095703125, 1.65631103515625, 1.7205047607421875, 1.784698486328125, 1.8488922119140625, 1.9130859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 11.0, 17.0, 11.0, 12.0, 30.0, 26.0, 28.0, 31.0, 22.0, 45.0, 32.0, 43.0, 50.0, 39.0, 48.0, 40.0, 53.0, 54.0, 33.0, 41.0, 38.0, 35.0, 20.0, 28.0, 28.0, 23.0, 26.0, 20.0, 17.0, 11.0, 8.0, 11.0, 8.0, 7.0, 8.0, 2.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1494140625, -1.1139373779296875, -1.078460693359375, -1.0429840087890625, -1.00750732421875, -0.9720306396484375, -0.936553955078125, -0.9010772705078125, -0.8656005859375, -0.8301239013671875, -0.794647216796875, -0.7591705322265625, -0.72369384765625, -0.6882171630859375, -0.652740478515625, -0.6172637939453125, -0.581787109375, -0.5463104248046875, -0.510833740234375, -0.4753570556640625, -0.43988037109375, -0.4044036865234375, -0.368927001953125, -0.3334503173828125, -0.2979736328125, -0.2624969482421875, -0.227020263671875, -0.1915435791015625, -0.15606689453125, -0.1205902099609375, -0.085113525390625, -0.0496368408203125, -0.01416015625, 0.0213165283203125, 0.056793212890625, 0.0922698974609375, 0.12774658203125, 0.1632232666015625, 0.198699951171875, 0.2341766357421875, 0.2696533203125, 0.3051300048828125, 0.340606689453125, 0.3760833740234375, 0.41156005859375, 0.4470367431640625, 0.482513427734375, 0.5179901123046875, 0.553466796875, 0.5889434814453125, 0.624420166015625, 0.6598968505859375, 0.69537353515625, 0.7308502197265625, 0.766326904296875, 0.8018035888671875, 0.8372802734375, 0.8727569580078125, 0.908233642578125, 0.9437103271484375, 0.97918701171875, 1.0146636962890625, 1.050140380859375, 1.0856170654296875, 1.12109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 12.0, 14.0, 23.0, 28.0, 39.0, 61.0, 90.0, 120.0, 196.0, 344.0, 612.0, 1168.0, 2358.0, 5097.0, 12708.0, 39660.0, 188183.0, 595317.0, 148638.0, 33645.0, 11104.0, 4564.0, 2064.0, 1022.0, 591.0, 302.0, 203.0, 114.0, 84.0, 51.0, 42.0, 26.0, 13.0, 21.0, 10.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2040863037109375, -1.166961669921875, -1.1298370361328125, -1.09271240234375, -1.0555877685546875, -1.018463134765625, -0.9813385009765625, -0.9442138671875, -0.9070892333984375, -0.869964599609375, -0.8328399658203125, -0.79571533203125, -0.7585906982421875, -0.721466064453125, -0.6843414306640625, -0.647216796875, -0.6100921630859375, -0.572967529296875, -0.5358428955078125, -0.49871826171875, -0.4615936279296875, -0.424468994140625, -0.3873443603515625, -0.3502197265625, -0.3130950927734375, -0.275970458984375, -0.2388458251953125, -0.20172119140625, -0.1645965576171875, -0.127471923828125, -0.0903472900390625, -0.05322265625, -0.0160980224609375, 0.021026611328125, 0.0581512451171875, 0.09527587890625, 0.1324005126953125, 0.169525146484375, 0.2066497802734375, 0.2437744140625, 0.2808990478515625, 0.318023681640625, 0.3551483154296875, 0.39227294921875, 0.4293975830078125, 0.466522216796875, 0.5036468505859375, 0.540771484375, 0.5778961181640625, 0.615020751953125, 0.6521453857421875, 0.68927001953125, 0.7263946533203125, 0.763519287109375, 0.8006439208984375, 0.8377685546875, 0.8748931884765625, 0.912017822265625, 0.9491424560546875, 0.98626708984375, 1.0233917236328125, 1.060516357421875, 1.0976409912109375, 1.134765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 6.0, 13.0, 10.0, 10.0, 14.0, 21.0, 23.0, 36.0, 48.0, 63.0, 56.0, 73.0, 96.0, 84.0, 79.0, 74.0, 66.0, 49.0, 32.0, 26.0, 29.0, 21.0, 20.0, 17.0, 10.0, 7.0, 7.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015997886657714844, -0.00015471875667572021, -0.000149458646774292, -0.00014419853687286377, -0.00013893842697143555, -0.00013367831707000732, -0.0001284182071685791, -0.00012315809726715088, -0.00011789798736572266, -0.00011263787746429443, -0.00010737776756286621, -0.00010211765766143799, -9.685754776000977e-05, -9.159743785858154e-05, -8.633732795715332e-05, -8.10772180557251e-05, -7.581710815429688e-05, -7.055699825286865e-05, -6.529688835144043e-05, -6.003677845001221e-05, -5.4776668548583984e-05, -4.951655864715576e-05, -4.425644874572754e-05, -3.8996338844299316e-05, -3.3736228942871094e-05, -2.847611904144287e-05, -2.321600914001465e-05, -1.7955899238586426e-05, -1.2695789337158203e-05, -7.4356794357299805e-06, -2.175569534301758e-06, 3.084540367126465e-06, 8.344650268554688e-06, 1.360476016998291e-05, 1.8864870071411133e-05, 2.4124979972839355e-05, 2.9385089874267578e-05, 3.46451997756958e-05, 3.9905309677124023e-05, 4.5165419578552246e-05, 5.042552947998047e-05, 5.568563938140869e-05, 6.0945749282836914e-05, 6.620585918426514e-05, 7.146596908569336e-05, 7.672607898712158e-05, 8.19861888885498e-05, 8.724629878997803e-05, 9.250640869140625e-05, 9.776651859283447e-05, 0.0001030266284942627, 0.00010828673839569092, 0.00011354684829711914, 0.00011880695819854736, 0.00012406706809997559, 0.0001293271780014038, 0.00013458728790283203, 0.00013984739780426025, 0.00014510750770568848, 0.0001503676176071167, 0.00015562772750854492, 0.00016088783740997314, 0.00016614794731140137, 0.0001714080572128296, 0.0001766681671142578]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 11.0, 19.0, 19.0, 31.0, 35.0, 69.0, 80.0, 118.0, 172.0, 227.0, 379.0, 590.0, 1025.0, 1874.0, 3588.0, 7305.0, 16812.0, 43985.0, 154659.0, 521237.0, 205002.0, 54203.0, 19722.0, 8396.0, 3839.0, 2081.0, 1143.0, 680.0, 393.0, 245.0, 168.0, 134.0, 80.0, 51.0, 26.0, 31.0, 20.0, 26.0, 18.0, 12.0, 11.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9230880737304688, -0.8896331787109375, -0.8561782836914062, -0.822723388671875, -0.7892684936523438, -0.7558135986328125, -0.7223587036132812, -0.68890380859375, -0.6554489135742188, -0.6219940185546875, -0.5885391235351562, -0.555084228515625, -0.5216293334960938, -0.4881744384765625, -0.45471954345703125, -0.4212646484375, -0.38780975341796875, -0.3543548583984375, -0.32089996337890625, -0.287445068359375, -0.25399017333984375, -0.2205352783203125, -0.18708038330078125, -0.15362548828125, -0.12017059326171875, -0.0867156982421875, -0.05326080322265625, -0.019805908203125, 0.01364898681640625, 0.0471038818359375, 0.08055877685546875, 0.114013671875, 0.14746856689453125, 0.1809234619140625, 0.21437835693359375, 0.247833251953125, 0.28128814697265625, 0.3147430419921875, 0.34819793701171875, 0.38165283203125, 0.41510772705078125, 0.4485626220703125, 0.48201751708984375, 0.515472412109375, 0.5489273071289062, 0.5823822021484375, 0.6158370971679688, 0.6492919921875, 0.6827468872070312, 0.7162017822265625, 0.7496566772460938, 0.783111572265625, 0.8165664672851562, 0.8500213623046875, 0.8834762573242188, 0.91693115234375, 0.9503860473632812, 0.9838409423828125, 1.0172958374023438, 1.050750732421875, 1.0842056274414062, 1.1176605224609375, 1.1511154174804688, 1.1845703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 10.0, 7.0, 8.0, 12.0, 14.0, 13.0, 23.0, 27.0, 33.0, 23.0, 41.0, 42.0, 43.0, 59.0, 78.0, 75.0, 81.0, 69.0, 54.0, 57.0, 30.0, 29.0, 31.0, 27.0, 29.0, 15.0, 18.0, 4.0, 11.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5869522094726562, -0.5694122314453125, -0.5518722534179688, -0.534332275390625, -0.5167922973632812, -0.4992523193359375, -0.48171234130859375, -0.46417236328125, -0.44663238525390625, -0.4290924072265625, -0.41155242919921875, -0.394012451171875, -0.37647247314453125, -0.3589324951171875, -0.34139251708984375, -0.3238525390625, -0.30631256103515625, -0.2887725830078125, -0.27123260498046875, -0.253692626953125, -0.23615264892578125, -0.2186126708984375, -0.20107269287109375, -0.18353271484375, -0.16599273681640625, -0.1484527587890625, -0.13091278076171875, -0.113372802734375, -0.09583282470703125, -0.0782928466796875, -0.06075286865234375, -0.043212890625, -0.02567291259765625, -0.0081329345703125, 0.00940704345703125, 0.026947021484375, 0.04448699951171875, 0.0620269775390625, 0.07956695556640625, 0.09710693359375, 0.11464691162109375, 0.1321868896484375, 0.14972686767578125, 0.167266845703125, 0.18480682373046875, 0.2023468017578125, 0.21988677978515625, 0.2374267578125, 0.25496673583984375, 0.2725067138671875, 0.29004669189453125, 0.307586669921875, 0.32512664794921875, 0.3426666259765625, 0.36020660400390625, 0.37774658203125, 0.39528656005859375, 0.4128265380859375, 0.43036651611328125, 0.447906494140625, 0.46544647216796875, 0.4829864501953125, 0.5005264282226562, 0.51806640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 17.0, 28.0, 39.0, 87.0, 159.0, 208.0, 197.0, 125.0, 70.0, 23.0, 15.0, 8.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.055179595947266, -14.33144760131836, -13.607715606689453, -12.883984565734863, -12.160252571105957, -11.43652057647705, -10.712789535522461, -9.989057540893555, -9.265325546264648, -8.541593551635742, -7.817862033843994, -7.094130516052246, -6.37039852142334, -5.646666526794434, -4.9229350090026855, -4.1992034912109375, -3.4754714965820312, -2.751739740371704, -2.028007984161377, -1.3042762279510498, -0.5805444717407227, 0.1431872844696045, 0.8669190406799316, 1.5906505584716797, 2.314382553100586, 3.038114309310913, 3.7618460655212402, 4.485577583312988, 5.2093095779418945, 5.933041572570801, 6.656773090362549, 7.380504608154297, 8.10423469543457, 8.827966690063477, 9.551698684692383, 10.275429725646973, 10.999161720275879, 11.722893714904785, 12.446624755859375, 13.170356750488281, 13.894088745117188, 14.617820739746094, 15.341552734375, 16.065284729003906, 16.789016723632812, 17.512746810913086, 18.236478805541992, 18.9602108001709, 19.683942794799805, 20.40767478942871, 21.131406784057617, 21.855138778686523, 22.578868865966797, 23.302600860595703, 24.02633285522461, 24.750064849853516, 25.473796844482422, 26.197528839111328, 26.921260833740234, 27.64499282836914, 28.368724822998047, 29.09245491027832, 29.816186904907227, 30.539918899536133, 31.26365089416504]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 10.0, 11.0, 23.0, 24.0, 19.0, 27.0, 31.0, 26.0, 18.0, 37.0, 35.0, 42.0, 36.0, 42.0, 38.0, 52.0, 45.0, 44.0, 50.0, 54.0, 40.0, 33.0, 24.0, 28.0, 30.0, 21.0, 20.0, 18.0, 20.0, 24.0, 18.0, 10.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.034990310668945, -7.789400100708008, -7.54380989074707, -7.298219680786133, -7.052629470825195, -6.807039260864258, -6.5614495277404785, -6.315859317779541, -6.0702691078186035, -5.824678897857666, -5.5790886878967285, -5.333498477935791, -5.087908744812012, -4.842318534851074, -4.596728324890137, -4.351138114929199, -4.105547904968262, -3.859957695007324, -3.6143674850463867, -3.3687775135040283, -3.123187303543091, -2.8775970935821533, -2.632007122039795, -2.3864169120788574, -2.14082670211792, -1.8952364921569824, -1.6496464014053345, -1.4040563106536865, -1.158466100692749, -0.9128758907318115, -0.6672857999801636, -0.4216957092285156, -0.17610549926757812, 0.0694846510887146, 0.3150748014450073, 0.5606649518013, 0.8062551021575928, 1.0518453121185303, 1.2974354028701782, 1.5430254936218262, 1.7886157035827637, 2.034205913543701, 2.2797961235046387, 2.525386095046997, 2.7709763050079346, 3.016566514968872, 3.2621564865112305, 3.507746696472168, 3.7533369064331055, 3.998927116394043, 4.2445173263549805, 4.490107536315918, 4.7356977462768555, 4.981287956237793, 5.226877689361572, 5.47246789932251, 5.718058109283447, 5.963648319244385, 6.209238529205322, 6.45482873916626, 6.700418472290039, 6.946008682250977, 7.191598892211914, 7.437189102172852, 7.682779312133789]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 27.0, 36.0, 42.0, 88.0, 124.0, 165.0, 305.0, 628.0, 1261.0, 2960.0, 8960.0, 37597.0, 3932093.0, 177758.0, 22188.0, 6096.0, 2072.0, 827.0, 422.0, 226.0, 127.0, 89.0, 51.0, 33.0, 29.0, 12.0, 13.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.12664794921875, -4.9603271484375, -4.79400634765625, -4.627685546875, -4.46136474609375, -4.2950439453125, -4.12872314453125, -3.96240234375, -3.79608154296875, -3.6297607421875, -3.46343994140625, -3.297119140625, -3.13079833984375, -2.9644775390625, -2.79815673828125, -2.6318359375, -2.46551513671875, -2.2991943359375, -2.13287353515625, -1.966552734375, -1.80023193359375, -1.6339111328125, -1.46759033203125, -1.30126953125, -1.13494873046875, -0.9686279296875, -0.80230712890625, -0.635986328125, -0.46966552734375, -0.3033447265625, -0.13702392578125, 0.029296875, 0.19561767578125, 0.3619384765625, 0.52825927734375, 0.694580078125, 0.86090087890625, 1.0272216796875, 1.19354248046875, 1.35986328125, 1.52618408203125, 1.6925048828125, 1.85882568359375, 2.025146484375, 2.19146728515625, 2.3577880859375, 2.52410888671875, 2.6904296875, 2.85675048828125, 3.0230712890625, 3.18939208984375, 3.355712890625, 3.52203369140625, 3.6883544921875, 3.85467529296875, 4.02099609375, 4.18731689453125, 4.3536376953125, 4.51995849609375, 4.686279296875, 4.85260009765625, 5.0189208984375, 5.18524169921875, 5.3515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 19.0, 13.0, 19.0, 34.0, 29.0, 37.0, 50.0, 55.0, 58.0, 84.0, 77.0, 88.0, 67.0, 69.0, 52.0, 49.0, 43.0, 37.0, 31.0, 24.0, 19.0, 10.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.40478515625, -0.39469337463378906, -0.3846015930175781, -0.3745098114013672, -0.36441802978515625, -0.3543262481689453, -0.3442344665527344, -0.33414268493652344, -0.3240509033203125, -0.31395912170410156, -0.3038673400878906, -0.2937755584716797, -0.28368377685546875, -0.2735919952392578, -0.2635002136230469, -0.25340843200683594, -0.243316650390625, -0.23322486877441406, -0.22313308715820312, -0.2130413055419922, -0.20294952392578125, -0.1928577423095703, -0.18276596069335938, -0.17267417907714844, -0.1625823974609375, -0.15249061584472656, -0.14239883422851562, -0.1323070526123047, -0.12221527099609375, -0.11212348937988281, -0.10203170776367188, -0.09193992614746094, -0.08184814453125, -0.07175636291503906, -0.061664581298828125, -0.05157279968261719, -0.04148101806640625, -0.03138923645019531, -0.021297454833984375, -0.011205673217773438, -0.0011138916015625, 0.008977890014648438, 0.019069671630859375, 0.029161453247070312, 0.03925323486328125, 0.04934501647949219, 0.059436798095703125, 0.06952857971191406, 0.079620361328125, 0.08971214294433594, 0.09980392456054688, 0.10989570617675781, 0.11998748779296875, 0.1300792694091797, 0.14017105102539062, 0.15026283264160156, 0.1603546142578125, 0.17044639587402344, 0.18053817749023438, 0.1906299591064453, 0.20072174072265625, 0.2108135223388672, 0.22090530395507812, 0.23099708557128906, 0.2410888671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 11.0, 8.0, 16.0, 29.0, 45.0, 53.0, 87.0, 151.0, 200.0, 378.0, 565.0, 1074.0, 2031.0, 3893.0, 8082.0, 18664.0, 51987.0, 914404.0, 3096617.0, 56990.0, 20338.0, 8989.0, 4316.0, 2257.0, 1258.0, 659.0, 429.0, 263.0, 160.0, 96.0, 72.0, 52.0, 31.0, 21.0, 9.0, 12.0, 12.0, 5.0, 7.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26953125, -3.160675048828125, -3.05181884765625, -2.942962646484375, -2.8341064453125, -2.725250244140625, -2.61639404296875, -2.507537841796875, -2.398681640625, -2.289825439453125, -2.18096923828125, -2.072113037109375, -1.9632568359375, -1.854400634765625, -1.74554443359375, -1.636688232421875, -1.52783203125, -1.418975830078125, -1.31011962890625, -1.201263427734375, -1.0924072265625, -0.983551025390625, -0.87469482421875, -0.765838623046875, -0.656982421875, -0.548126220703125, -0.43927001953125, -0.330413818359375, -0.2215576171875, -0.112701416015625, -0.00384521484375, 0.105010986328125, 0.2138671875, 0.322723388671875, 0.43157958984375, 0.540435791015625, 0.6492919921875, 0.758148193359375, 0.86700439453125, 0.975860595703125, 1.084716796875, 1.193572998046875, 1.30242919921875, 1.411285400390625, 1.5201416015625, 1.628997802734375, 1.73785400390625, 1.846710205078125, 1.95556640625, 2.064422607421875, 2.17327880859375, 2.282135009765625, 2.3909912109375, 2.499847412109375, 2.60870361328125, 2.717559814453125, 2.826416015625, 2.935272216796875, 3.04412841796875, 3.152984619140625, 3.2618408203125, 3.370697021484375, 3.47955322265625, 3.588409423828125, 3.697265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 10.0, 8.0, 9.0, 10.0, 15.0, 19.0, 21.0, 31.0, 46.0, 84.0, 204.0, 2401.0, 801.0, 154.0, 76.0, 40.0, 28.0, 20.0, 21.0, 8.0, 6.0, 9.0, 10.0, 6.0, 6.0, 2.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.58251953125, -0.55908203125, -0.53564453125, -0.51220703125, -0.48876953125, -0.46533203125, -0.44189453125, -0.41845703125, -0.39501953125, -0.37158203125, -0.34814453125, -0.32470703125, -0.30126953125, -0.27783203125, -0.25439453125, -0.23095703125, -0.20751953125, -0.18408203125, -0.16064453125, -0.13720703125, -0.11376953125, -0.09033203125, -0.06689453125, -0.04345703125, -0.02001953125, 0.00341796875, 0.02685546875, 0.05029296875, 0.07373046875, 0.09716796875, 0.12060546875, 0.14404296875, 0.16748046875, 0.19091796875, 0.21435546875, 0.23779296875, 0.26123046875, 0.28466796875, 0.30810546875, 0.33154296875, 0.35498046875, 0.37841796875, 0.40185546875, 0.42529296875, 0.44873046875, 0.47216796875, 0.49560546875, 0.51904296875, 0.54248046875, 0.56591796875, 0.58935546875, 0.61279296875, 0.63623046875, 0.65966796875, 0.68310546875, 0.70654296875, 0.72998046875, 0.75341796875, 0.77685546875, 0.80029296875, 0.82373046875, 0.84716796875, 0.87060546875, 0.89404296875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 11.0, 17.0, 21.0, 43.0, 76.0, 107.0, 144.0, 167.0, 125.0, 104.0, 66.0, 35.0, 28.0, 19.0, 9.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.987713813781738, -4.824145793914795, -4.660577774047852, -4.497009754180908, -4.333441734313965, -4.1698737144470215, -4.006305694580078, -3.8427376747131348, -3.6791696548461914, -3.515601634979248, -3.3520336151123047, -3.1884655952453613, -3.024897575378418, -2.8613295555114746, -2.6977615356445312, -2.534193515777588, -2.3706257343292236, -2.2070577144622803, -2.043489694595337, -1.8799216747283936, -1.7163536548614502, -1.5527856349945068, -1.389217734336853, -1.2256497144699097, -1.0620816946029663, -0.898513674736023, -0.7349456548690796, -0.571377694606781, -0.40780967473983765, -0.2442416548728943, -0.0806736946105957, 0.08289432525634766, 0.24646234512329102, 0.4100303649902344, 0.5735983848571777, 0.7371663451194763, 0.9007343649864197, 1.0643024444580078, 1.2278703451156616, 1.391438364982605, 1.5550063848495483, 1.7185744047164917, 1.882142424583435, 2.045710325241089, 2.2092783451080322, 2.3728463649749756, 2.536414384841919, 2.6999824047088623, 2.8635504245758057, 3.027118444442749, 3.1906864643096924, 3.3542544841766357, 3.517822504043579, 3.6813905239105225, 3.8449583053588867, 4.00852632522583, 4.172094345092773, 4.335662364959717, 4.49923038482666, 4.6627984046936035, 4.826366424560547, 4.98993444442749, 5.153502464294434, 5.317070484161377, 5.48063850402832]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 8.0, 9.0, 13.0, 11.0, 15.0, 24.0, 17.0, 24.0, 27.0, 38.0, 43.0, 41.0, 54.0, 34.0, 31.0, 47.0, 44.0, 42.0, 46.0, 43.0, 36.0, 47.0, 29.0, 48.0, 28.0, 27.0, 25.0, 18.0, 24.0, 22.0, 11.0, 11.0, 14.0, 5.0, 6.0, 4.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.025444507598877, -1.9613349437713623, -1.8972253799438477, -1.833115816116333, -1.769006371498108, -1.7048968076705933, -1.6407872438430786, -1.576677680015564, -1.5125682353973389, -1.4484586715698242, -1.3843491077423096, -1.320239543914795, -1.2561300992965698, -1.1920205354690552, -1.1279109716415405, -1.0638014078140259, -0.9996918439865112, -0.9355822801589966, -0.8714727759361267, -0.8073632121086121, -0.7432537078857422, -0.6791441440582275, -0.6150345802307129, -0.5509250164031982, -0.48681551218032837, -0.4227059781551361, -0.35859644412994385, -0.2944868803024292, -0.23037734627723694, -0.16626781225204468, -0.10215824842453003, -0.03804871439933777, 0.026060819625854492, 0.09017036110162735, 0.1542799025774002, 0.21838945150375366, 0.2824989855289459, 0.3466085195541382, 0.41071808338165283, 0.4748276174068451, 0.5389371514320374, 0.603046715259552, 0.6671562194824219, 0.7312657833099365, 0.7953753471374512, 0.859484851360321, 0.9235944151878357, 0.9877039194107056, 1.0518134832382202, 1.1159230470657349, 1.1800326108932495, 1.2441420555114746, 1.3082516193389893, 1.372361183166504, 1.4364707469940186, 1.5005803108215332, 1.5646898746490479, 1.6287994384765625, 1.6929090023040771, 1.7570185661315918, 1.821128010749817, 1.8852375745773315, 1.9493471384048462, 2.0134565830230713, 2.077566146850586]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 3.0, 11.0, 15.0, 20.0, 20.0, 33.0, 39.0, 54.0, 112.0, 161.0, 242.0, 426.0, 614.0, 1307.0, 2575.0, 5088.0, 10885.0, 26077.0, 68675.0, 216133.0, 455931.0, 165338.0, 54878.0, 21554.0, 9260.0, 4292.0, 2093.0, 1071.0, 620.0, 347.0, 214.0, 134.0, 93.0, 66.0, 48.0, 43.0, 23.0, 18.0, 10.0, 13.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.837860107421875, -1.77532958984375, -1.712799072265625, -1.6502685546875, -1.587738037109375, -1.52520751953125, -1.462677001953125, -1.400146484375, -1.337615966796875, -1.27508544921875, -1.212554931640625, -1.1500244140625, -1.087493896484375, -1.02496337890625, -0.962432861328125, -0.89990234375, -0.837371826171875, -0.77484130859375, -0.712310791015625, -0.6497802734375, -0.587249755859375, -0.52471923828125, -0.462188720703125, -0.399658203125, -0.337127685546875, -0.27459716796875, -0.212066650390625, -0.1495361328125, -0.087005615234375, -0.02447509765625, 0.038055419921875, 0.1005859375, 0.163116455078125, 0.22564697265625, 0.288177490234375, 0.3507080078125, 0.413238525390625, 0.47576904296875, 0.538299560546875, 0.600830078125, 0.663360595703125, 0.72589111328125, 0.788421630859375, 0.8509521484375, 0.913482666015625, 0.97601318359375, 1.038543701171875, 1.10107421875, 1.163604736328125, 1.22613525390625, 1.288665771484375, 1.3511962890625, 1.413726806640625, 1.47625732421875, 1.538787841796875, 1.601318359375, 1.663848876953125, 1.72637939453125, 1.788909912109375, 1.8514404296875, 1.913970947265625, 1.97650146484375, 2.039031982421875, 2.1015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 14.0, 12.0, 8.0, 18.0, 23.0, 29.0, 34.0, 45.0, 39.0, 63.0, 78.0, 75.0, 76.0, 71.0, 65.0, 75.0, 50.0, 43.0, 44.0, 40.0, 27.0, 23.0, 19.0, 8.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3795928955078125, -0.369293212890625, -0.3589935302734375, -0.34869384765625, -0.3383941650390625, -0.328094482421875, -0.3177947998046875, -0.3074951171875, -0.2971954345703125, -0.286895751953125, -0.2765960693359375, -0.26629638671875, -0.2559967041015625, -0.245697021484375, -0.2353973388671875, -0.22509765625, -0.2147979736328125, -0.204498291015625, -0.1941986083984375, -0.18389892578125, -0.1735992431640625, -0.163299560546875, -0.1529998779296875, -0.1427001953125, -0.1324005126953125, -0.122100830078125, -0.1118011474609375, -0.10150146484375, -0.0912017822265625, -0.080902099609375, -0.0706024169921875, -0.060302734375, -0.0500030517578125, -0.039703369140625, -0.0294036865234375, -0.01910400390625, -0.0088043212890625, 0.001495361328125, 0.0117950439453125, 0.0220947265625, 0.0323944091796875, 0.042694091796875, 0.0529937744140625, 0.06329345703125, 0.0735931396484375, 0.083892822265625, 0.0941925048828125, 0.1044921875, 0.1147918701171875, 0.125091552734375, 0.1353912353515625, 0.14569091796875, 0.1559906005859375, 0.166290283203125, 0.1765899658203125, 0.1868896484375, 0.1971893310546875, 0.207489013671875, 0.2177886962890625, 0.22808837890625, 0.2383880615234375, 0.248687744140625, 0.2589874267578125, 0.269287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 16.0, 10.0, 16.0, 20.0, 28.0, 47.0, 76.0, 107.0, 169.0, 263.0, 446.0, 805.0, 1525.0, 3671.0, 9421.0, 28158.0, 100315.0, 428170.0, 353616.0, 83131.0, 23898.0, 8147.0, 3174.0, 1493.0, 730.0, 430.0, 220.0, 130.0, 97.0, 66.0, 47.0, 38.0, 21.0, 17.0, 13.0, 7.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.943359375, -1.873779296875, -1.80419921875, -1.734619140625, -1.6650390625, -1.595458984375, -1.52587890625, -1.456298828125, -1.38671875, -1.317138671875, -1.24755859375, -1.177978515625, -1.1083984375, -1.038818359375, -0.96923828125, -0.899658203125, -0.830078125, -0.760498046875, -0.69091796875, -0.621337890625, -0.5517578125, -0.482177734375, -0.41259765625, -0.343017578125, -0.2734375, -0.203857421875, -0.13427734375, -0.064697265625, 0.0048828125, 0.074462890625, 0.14404296875, 0.213623046875, 0.283203125, 0.352783203125, 0.42236328125, 0.491943359375, 0.5615234375, 0.631103515625, 0.70068359375, 0.770263671875, 0.83984375, 0.909423828125, 0.97900390625, 1.048583984375, 1.1181640625, 1.187744140625, 1.25732421875, 1.326904296875, 1.396484375, 1.466064453125, 1.53564453125, 1.605224609375, 1.6748046875, 1.744384765625, 1.81396484375, 1.883544921875, 1.953125, 2.022705078125, 2.09228515625, 2.161865234375, 2.2314453125, 2.301025390625, 2.37060546875, 2.440185546875, 2.509765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 10.0, 9.0, 13.0, 12.0, 17.0, 21.0, 23.0, 23.0, 40.0, 48.0, 41.0, 42.0, 51.0, 38.0, 58.0, 43.0, 46.0, 50.0, 51.0, 35.0, 39.0, 48.0, 31.0, 43.0, 34.0, 20.0, 26.0, 20.0, 14.0, 12.0, 9.0, 2.0, 9.0, 9.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3222503662109375, -1.281219482421875, -1.2401885986328125, -1.19915771484375, -1.1581268310546875, -1.117095947265625, -1.0760650634765625, -1.0350341796875, -0.9940032958984375, -0.952972412109375, -0.9119415283203125, -0.87091064453125, -0.8298797607421875, -0.788848876953125, -0.7478179931640625, -0.706787109375, -0.6657562255859375, -0.624725341796875, -0.5836944580078125, -0.54266357421875, -0.5016326904296875, -0.460601806640625, -0.4195709228515625, -0.3785400390625, -0.3375091552734375, -0.296478271484375, -0.2554473876953125, -0.21441650390625, -0.1733856201171875, -0.132354736328125, -0.0913238525390625, -0.05029296875, -0.0092620849609375, 0.031768798828125, 0.0727996826171875, 0.11383056640625, 0.1548614501953125, 0.195892333984375, 0.2369232177734375, 0.2779541015625, 0.3189849853515625, 0.360015869140625, 0.4010467529296875, 0.44207763671875, 0.4831085205078125, 0.524139404296875, 0.5651702880859375, 0.606201171875, 0.6472320556640625, 0.688262939453125, 0.7292938232421875, 0.77032470703125, 0.8113555908203125, 0.852386474609375, 0.8934173583984375, 0.9344482421875, 0.9754791259765625, 1.016510009765625, 1.0575408935546875, 1.09857177734375, 1.1396026611328125, 1.180633544921875, 1.2216644287109375, 1.2626953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 12.0, 11.0, 24.0, 25.0, 39.0, 93.0, 102.0, 183.0, 323.0, 738.0, 1520.0, 3991.0, 12724.0, 56715.0, 513227.0, 394984.0, 46461.0, 10944.0, 3582.0, 1386.0, 678.0, 345.0, 171.0, 96.0, 52.0, 44.0, 23.0, 18.0, 15.0, 8.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8955078125, -1.83966064453125, -1.7838134765625, -1.72796630859375, -1.672119140625, -1.61627197265625, -1.5604248046875, -1.50457763671875, -1.44873046875, -1.39288330078125, -1.3370361328125, -1.28118896484375, -1.225341796875, -1.16949462890625, -1.1136474609375, -1.05780029296875, -1.001953125, -0.94610595703125, -0.8902587890625, -0.83441162109375, -0.778564453125, -0.72271728515625, -0.6668701171875, -0.61102294921875, -0.55517578125, -0.49932861328125, -0.4434814453125, -0.38763427734375, -0.331787109375, -0.27593994140625, -0.2200927734375, -0.16424560546875, -0.1083984375, -0.05255126953125, 0.0032958984375, 0.05914306640625, 0.114990234375, 0.17083740234375, 0.2266845703125, 0.28253173828125, 0.33837890625, 0.39422607421875, 0.4500732421875, 0.50592041015625, 0.561767578125, 0.61761474609375, 0.6734619140625, 0.72930908203125, 0.78515625, 0.84100341796875, 0.8968505859375, 0.95269775390625, 1.008544921875, 1.06439208984375, 1.1202392578125, 1.17608642578125, 1.23193359375, 1.28778076171875, 1.3436279296875, 1.39947509765625, 1.455322265625, 1.51116943359375, 1.5670166015625, 1.62286376953125, 1.6787109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 13.0, 20.0, 15.0, 24.0, 40.0, 34.0, 60.0, 68.0, 91.0, 80.0, 78.0, 95.0, 74.0, 68.0, 59.0, 45.0, 32.0, 21.0, 16.0, 7.0, 9.0, 12.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001666545867919922, -0.0001606084406375885, -0.00015456229448318481, -0.00014851614832878113, -0.00014247000217437744, -0.00013642385601997375, -0.00013037770986557007, -0.00012433156371116638, -0.0001182854175567627, -0.00011223927140235901, -0.00010619312524795532, -0.00010014697909355164, -9.410083293914795e-05, -8.805468678474426e-05, -8.200854063034058e-05, -7.596239447593689e-05, -6.99162483215332e-05, -6.387010216712952e-05, -5.782395601272583e-05, -5.1777809858322144e-05, -4.573166370391846e-05, -3.968551754951477e-05, -3.3639371395111084e-05, -2.7593225240707397e-05, -2.154707908630371e-05, -1.5500932931900024e-05, -9.454786777496338e-06, -3.4086406230926514e-06, 2.637505531311035e-06, 8.683651685714722e-06, 1.4729797840118408e-05, 2.0775943994522095e-05, 2.682209014892578e-05, 3.286823630332947e-05, 3.8914382457733154e-05, 4.496052861213684e-05, 5.100667476654053e-05, 5.7052820920944214e-05, 6.30989670753479e-05, 6.914511322975159e-05, 7.519125938415527e-05, 8.123740553855896e-05, 8.728355169296265e-05, 9.332969784736633e-05, 9.937584400177002e-05, 0.0001054219901561737, 0.00011146813631057739, 0.00011751428246498108, 0.00012356042861938477, 0.00012960657477378845, 0.00013565272092819214, 0.00014169886708259583, 0.0001477450132369995, 0.0001537911593914032, 0.00015983730554580688, 0.00016588345170021057, 0.00017192959785461426, 0.00017797574400901794, 0.00018402189016342163, 0.00019006803631782532, 0.000196114182472229, 0.0002021603286266327, 0.00020820647478103638, 0.00021425262093544006, 0.00022029876708984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 9.0, 13.0, 18.0, 27.0, 38.0, 79.0, 131.0, 210.0, 355.0, 714.0, 1465.0, 3154.0, 8483.0, 30435.0, 279060.0, 651660.0, 52565.0, 12013.0, 4260.0, 1888.0, 892.0, 465.0, 215.0, 141.0, 79.0, 53.0, 32.0, 29.0, 12.0, 11.0, 9.0, 6.0, 7.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.138671875, -2.070037841796875, -2.00140380859375, -1.932769775390625, -1.8641357421875, -1.795501708984375, -1.72686767578125, -1.658233642578125, -1.589599609375, -1.520965576171875, -1.45233154296875, -1.383697509765625, -1.3150634765625, -1.246429443359375, -1.17779541015625, -1.109161376953125, -1.04052734375, -0.971893310546875, -0.90325927734375, -0.834625244140625, -0.7659912109375, -0.697357177734375, -0.62872314453125, -0.560089111328125, -0.491455078125, -0.422821044921875, -0.35418701171875, -0.285552978515625, -0.2169189453125, -0.148284912109375, -0.07965087890625, -0.011016845703125, 0.0576171875, 0.126251220703125, 0.19488525390625, 0.263519287109375, 0.3321533203125, 0.400787353515625, 0.46942138671875, 0.538055419921875, 0.606689453125, 0.675323486328125, 0.74395751953125, 0.812591552734375, 0.8812255859375, 0.949859619140625, 1.01849365234375, 1.087127685546875, 1.15576171875, 1.224395751953125, 1.29302978515625, 1.361663818359375, 1.4302978515625, 1.498931884765625, 1.56756591796875, 1.636199951171875, 1.704833984375, 1.773468017578125, 1.84210205078125, 1.910736083984375, 1.9793701171875, 2.048004150390625, 2.11663818359375, 2.185272216796875, 2.25390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 7.0, 11.0, 6.0, 8.0, 17.0, 20.0, 33.0, 35.0, 52.0, 87.0, 68.0, 125.0, 100.0, 104.0, 80.0, 52.0, 49.0, 31.0, 19.0, 22.0, 18.0, 11.0, 8.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.042694091796875, -1.01019287109375, -0.977691650390625, -0.9451904296875, -0.912689208984375, -0.88018798828125, -0.847686767578125, -0.815185546875, -0.782684326171875, -0.75018310546875, -0.717681884765625, -0.6851806640625, -0.652679443359375, -0.62017822265625, -0.587677001953125, -0.55517578125, -0.522674560546875, -0.49017333984375, -0.457672119140625, -0.4251708984375, -0.392669677734375, -0.36016845703125, -0.327667236328125, -0.295166015625, -0.262664794921875, -0.23016357421875, -0.197662353515625, -0.1651611328125, -0.132659912109375, -0.10015869140625, -0.067657470703125, -0.03515625, -0.002655029296875, 0.02984619140625, 0.062347412109375, 0.0948486328125, 0.127349853515625, 0.15985107421875, 0.192352294921875, 0.224853515625, 0.257354736328125, 0.28985595703125, 0.322357177734375, 0.3548583984375, 0.387359619140625, 0.41986083984375, 0.452362060546875, 0.48486328125, 0.517364501953125, 0.54986572265625, 0.582366943359375, 0.6148681640625, 0.647369384765625, 0.67987060546875, 0.712371826171875, 0.744873046875, 0.777374267578125, 0.80987548828125, 0.842376708984375, 0.8748779296875, 0.907379150390625, 0.93988037109375, 0.972381591796875, 1.0048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 9.0, 21.0, 47.0, 117.0, 236.0, 257.0, 186.0, 76.0, 28.0, 11.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.09490203857422, -30.283344268798828, -29.471784591674805, -28.660226821899414, -27.848669052124023, -27.037109375, -26.22555160522461, -25.41399383544922, -24.602434158325195, -23.790876388549805, -22.97931671142578, -22.16775894165039, -21.356201171875, -20.544641494750977, -19.733083724975586, -18.921524047851562, -18.109966278076172, -17.29840850830078, -16.486848831176758, -15.675291061401367, -14.86373233795166, -14.052173614501953, -13.240615844726562, -12.429057121276855, -11.617500305175781, -10.805941581726074, -9.994383811950684, -9.182825088500977, -8.37126636505127, -7.559708118438721, -6.748149871826172, -5.936591148376465, -5.125032424926758, -4.313474178314209, -3.501915454864502, -2.690357208251953, -1.8787987232208252, -1.0672402381896973, -0.25568199157714844, 0.5558767318725586, 1.3674349784851074, 2.1789934635162354, 2.9905519485473633, 3.802110195159912, 4.613668441772461, 5.425227165222168, 6.236785411834717, 7.048344135284424, 7.859902381896973, 8.67146110534668, 9.48301887512207, 10.294577598571777, 11.106136322021484, 11.917694091796875, 12.729252815246582, 13.540811538696289, 14.35236930847168, 15.163928031921387, 15.975485801696777, 16.787044525146484, 17.598602294921875, 18.4101619720459, 19.22171974182129, 20.033279418945312, 20.844837188720703]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 4.0, 9.0, 6.0, 10.0, 4.0, 20.0, 20.0, 11.0, 25.0, 20.0, 18.0, 24.0, 28.0, 33.0, 39.0, 31.0, 35.0, 46.0, 33.0, 38.0, 47.0, 34.0, 30.0, 46.0, 37.0, 38.0, 34.0, 32.0, 22.0, 24.0, 24.0, 31.0, 17.0, 25.0, 14.0, 18.0, 10.0, 15.0, 11.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 1.0], "bins": [-6.982834339141846, -6.787529945373535, -6.592225551605225, -6.396921157836914, -6.201617240905762, -6.006312847137451, -5.811008453369141, -5.61570405960083, -5.4203996658325195, -5.225095272064209, -5.029790878295898, -4.834486961364746, -4.6391825675964355, -4.443878173828125, -4.2485737800598145, -4.053269386291504, -3.8579654693603516, -3.662661075592041, -3.4673569202423096, -3.272052526473999, -3.0767483711242676, -2.881443977355957, -2.6861395835876465, -2.490835189819336, -2.2955310344696045, -2.100226640701294, -1.9049224853515625, -1.709618091583252, -1.514313817024231, -1.31900954246521, -1.1237051486968994, -0.9284008741378784, -0.7330961227416992, -0.5377918481826782, -0.34248751401901245, -0.14718317985534668, 0.048121094703674316, 0.2434253692626953, 0.43872976303100586, 0.6340340375900269, 0.8293383121490479, 1.0246425867080688, 1.2199468612670898, 1.4152512550354004, 1.6105555295944214, 1.8058598041534424, 2.001164197921753, 2.1964683532714844, 2.391772747039795, 2.5870771408081055, 2.782381296157837, 2.9776856899261475, 3.172989845275879, 3.3682942390441895, 3.5635986328125, 3.7589030265808105, 3.954207181930542, 4.149511337280273, 4.344815731048584, 4.5401201248168945, 4.735424518585205, 4.930728912353516, 5.126032829284668, 5.3213372230529785, 5.516641616821289]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 8.0, 5.0, 14.0, 7.0, 24.0, 41.0, 56.0, 89.0, 140.0, 283.0, 484.0, 1003.0, 2719.0, 9033.0, 44166.0, 4056795.0, 62882.0, 11144.0, 3159.0, 1133.0, 461.0, 259.0, 128.0, 98.0, 53.0, 27.0, 29.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.734375, -5.57318115234375, -5.4119873046875, -5.25079345703125, -5.089599609375, -4.92840576171875, -4.7672119140625, -4.60601806640625, -4.44482421875, -4.28363037109375, -4.1224365234375, -3.96124267578125, -3.800048828125, -3.63885498046875, -3.4776611328125, -3.31646728515625, -3.1552734375, -2.99407958984375, -2.8328857421875, -2.67169189453125, -2.510498046875, -2.34930419921875, -2.1881103515625, -2.02691650390625, -1.86572265625, -1.70452880859375, -1.5433349609375, -1.38214111328125, -1.220947265625, -1.05975341796875, -0.8985595703125, -0.73736572265625, -0.576171875, -0.41497802734375, -0.2537841796875, -0.09259033203125, 0.068603515625, 0.22979736328125, 0.3909912109375, 0.55218505859375, 0.71337890625, 0.87457275390625, 1.0357666015625, 1.19696044921875, 1.358154296875, 1.51934814453125, 1.6805419921875, 1.84173583984375, 2.0029296875, 2.16412353515625, 2.3253173828125, 2.48651123046875, 2.647705078125, 2.80889892578125, 2.9700927734375, 3.13128662109375, 3.29248046875, 3.45367431640625, 3.6148681640625, 3.77606201171875, 3.937255859375, 4.09844970703125, 4.2596435546875, 4.42083740234375, 4.58203125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 7.0, 7.0, 13.0, 18.0, 16.0, 27.0, 43.0, 55.0, 50.0, 55.0, 70.0, 66.0, 74.0, 87.0, 58.0, 63.0, 65.0, 48.0, 44.0, 35.0, 20.0, 24.0, 18.0, 9.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.43896484375, -0.4281768798828125, -0.417388916015625, -0.4066009521484375, -0.39581298828125, -0.3850250244140625, -0.374237060546875, -0.3634490966796875, -0.3526611328125, -0.3418731689453125, -0.331085205078125, -0.3202972412109375, -0.30950927734375, -0.2987213134765625, -0.287933349609375, -0.2771453857421875, -0.266357421875, -0.2555694580078125, -0.244781494140625, -0.2339935302734375, -0.22320556640625, -0.2124176025390625, -0.201629638671875, -0.1908416748046875, -0.1800537109375, -0.1692657470703125, -0.158477783203125, -0.1476898193359375, -0.13690185546875, -0.1261138916015625, -0.115325927734375, -0.1045379638671875, -0.09375, -0.0829620361328125, -0.072174072265625, -0.0613861083984375, -0.05059814453125, -0.0398101806640625, -0.029022216796875, -0.0182342529296875, -0.0074462890625, 0.0033416748046875, 0.014129638671875, 0.0249176025390625, 0.03570556640625, 0.0464935302734375, 0.057281494140625, 0.0680694580078125, 0.078857421875, 0.0896453857421875, 0.100433349609375, 0.1112213134765625, 0.12200927734375, 0.1327972412109375, 0.143585205078125, 0.1543731689453125, 0.1651611328125, 0.1759490966796875, 0.186737060546875, 0.1975250244140625, 0.20831298828125, 0.2191009521484375, 0.229888916015625, 0.2406768798828125, 0.25146484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 11.0, 11.0, 12.0, 26.0, 40.0, 49.0, 80.0, 113.0, 215.0, 309.0, 495.0, 836.0, 1514.0, 2567.0, 4701.0, 9001.0, 19393.0, 54830.0, 3461733.0, 555636.0, 45493.0, 17804.0, 8578.0, 4564.0, 2524.0, 1395.0, 833.0, 516.0, 351.0, 207.0, 148.0, 79.0, 58.0, 46.0, 36.0, 30.0, 13.0, 13.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.193359375, -2.114776611328125, -2.03619384765625, -1.957611083984375, -1.8790283203125, -1.800445556640625, -1.72186279296875, -1.643280029296875, -1.564697265625, -1.486114501953125, -1.40753173828125, -1.328948974609375, -1.2503662109375, -1.171783447265625, -1.09320068359375, -1.014617919921875, -0.93603515625, -0.857452392578125, -0.77886962890625, -0.700286865234375, -0.6217041015625, -0.543121337890625, -0.46453857421875, -0.385955810546875, -0.307373046875, -0.228790283203125, -0.15020751953125, -0.071624755859375, 0.0069580078125, 0.085540771484375, 0.16412353515625, 0.242706298828125, 0.3212890625, 0.399871826171875, 0.47845458984375, 0.557037353515625, 0.6356201171875, 0.714202880859375, 0.79278564453125, 0.871368408203125, 0.949951171875, 1.028533935546875, 1.10711669921875, 1.185699462890625, 1.2642822265625, 1.342864990234375, 1.42144775390625, 1.500030517578125, 1.57861328125, 1.657196044921875, 1.73577880859375, 1.814361572265625, 1.8929443359375, 1.971527099609375, 2.05010986328125, 2.128692626953125, 2.207275390625, 2.285858154296875, 2.36444091796875, 2.443023681640625, 2.5216064453125, 2.600189208984375, 2.67877197265625, 2.757354736328125, 2.8359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 10.0, 9.0, 8.0, 18.0, 25.0, 30.0, 56.0, 139.0, 742.0, 2531.0, 215.0, 85.0, 41.0, 30.0, 17.0, 18.0, 18.0, 7.0, 13.0, 4.0, 6.0, 5.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5689010620117188, -0.5479583740234375, -0.5270156860351562, -0.506072998046875, -0.48513031005859375, -0.4641876220703125, -0.44324493408203125, -0.42230224609375, -0.40135955810546875, -0.3804168701171875, -0.35947418212890625, -0.338531494140625, -0.31758880615234375, -0.2966461181640625, -0.27570343017578125, -0.2547607421875, -0.23381805419921875, -0.2128753662109375, -0.19193267822265625, -0.170989990234375, -0.15004730224609375, -0.1291046142578125, -0.10816192626953125, -0.08721923828125, -0.06627655029296875, -0.0453338623046875, -0.02439117431640625, -0.003448486328125, 0.01749420166015625, 0.0384368896484375, 0.05937957763671875, 0.080322265625, 0.10126495361328125, 0.1222076416015625, 0.14315032958984375, 0.164093017578125, 0.18503570556640625, 0.2059783935546875, 0.22692108154296875, 0.24786376953125, 0.26880645751953125, 0.2897491455078125, 0.31069183349609375, 0.331634521484375, 0.35257720947265625, 0.3735198974609375, 0.39446258544921875, 0.4154052734375, 0.43634796142578125, 0.4572906494140625, 0.47823333740234375, 0.499176025390625, 0.5201187133789062, 0.5410614013671875, 0.5620040893554688, 0.58294677734375, 0.6038894653320312, 0.6248321533203125, 0.6457748413085938, 0.666717529296875, 0.6876602172851562, 0.7086029052734375, 0.7295455932617188, 0.75048828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 28.0, 39.0, 94.0, 163.0, 221.0, 190.0, 103.0, 76.0, 34.0, 19.0, 9.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484951972961426, -3.296396017074585, -3.1078402996063232, -2.9192843437194824, -2.7307283878326416, -2.542172431945801, -2.353616714477539, -2.1650607585906982, -1.976504921913147, -1.7879490852355957, -1.5993931293487549, -1.4108372926712036, -1.2222814559936523, -1.0337255001068115, -0.8451696634292603, -0.6566137075424194, -0.46805787086486816, -0.2795019745826721, -0.09094610810279846, 0.0976097583770752, 0.28616565465927124, 0.4747215509414673, 0.6632773876190186, 0.8518333435058594, 1.0403891801834106, 1.228945016860962, 1.4175009727478027, 1.606056809425354, 1.7946126461029053, 1.983168601989746, 2.171724319458008, 2.3602805137634277, 2.5488362312316895, 2.7373921871185303, 2.925947904586792, 3.114503860473633, 3.3030598163604736, 3.4916157722473145, 3.680171489715576, 3.868727445602417, 4.057283401489258, 4.2458391189575195, 4.4343953132629395, 4.622951030731201, 4.811506748199463, 5.000062942504883, 5.1886186599731445, 5.377174377441406, 5.565730094909668, 5.75428581237793, 5.94284200668335, 6.131397724151611, 6.319953441619873, 6.508509635925293, 6.697065353393555, 6.885621070861816, 7.074177265167236, 7.262732982635498, 7.451289176940918, 7.63984489440918, 7.828400611877441, 8.016956329345703, 8.205513000488281, 8.394068717956543, 8.582624435424805]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 13.0, 11.0, 9.0, 14.0, 15.0, 14.0, 27.0, 27.0, 24.0, 41.0, 36.0, 41.0, 40.0, 39.0, 32.0, 39.0, 41.0, 37.0, 43.0, 45.0, 31.0, 43.0, 33.0, 31.0, 43.0, 32.0, 28.0, 23.0, 16.0, 22.0, 11.0, 21.0, 17.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.730224609375, -1.6761236190795898, -1.6220225095748901, -1.56792151927948, -1.5138204097747803, -1.4597194194793701, -1.40561842918396, -1.3515173196792603, -1.2974162101745605, -1.2433152198791504, -1.1892141103744507, -1.1351131200790405, -1.0810120105743408, -1.0269110202789307, -0.9728099703788757, -0.9187089204788208, -0.8646079301834106, -0.8105068802833557, -0.7564058303833008, -0.7023048400878906, -0.6482037305831909, -0.5941027402877808, -0.5400016903877258, -0.4859006404876709, -0.43179959058761597, -0.37769854068756104, -0.3235974907875061, -0.26949647068977356, -0.21539542078971863, -0.1612943708896637, -0.10719335079193115, -0.05309230089187622, 0.0010086297988891602, 0.055109672248363495, 0.10921071469783783, 0.16331174969673157, 0.2174127995967865, 0.27151384949684143, 0.325614869594574, 0.3797159194946289, 0.43381696939468384, 0.48791801929473877, 0.5420190691947937, 0.5961201190948486, 0.6502211093902588, 0.7043222188949585, 0.7584232091903687, 0.8125242590904236, 0.8666253089904785, 0.9207263588905334, 0.9748274087905884, 1.0289283990859985, 1.0830295085906982, 1.1371304988861084, 1.1912314891815186, 1.2453325986862183, 1.299433708190918, 1.3535346984863281, 1.4076358079910278, 1.461736798286438, 1.5158379077911377, 1.5699388980865479, 1.624039888381958, 1.6781409978866577, 1.7322419881820679]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 4.0, 14.0, 19.0, 36.0, 42.0, 50.0, 90.0, 132.0, 242.0, 410.0, 729.0, 1326.0, 2995.0, 7676.0, 22302.0, 79251.0, 347275.0, 440283.0, 101805.0, 27776.0, 9013.0, 3503.0, 1602.0, 793.0, 432.0, 258.0, 172.0, 107.0, 66.0, 46.0, 35.0, 18.0, 19.0, 4.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.427734375, -2.352081298828125, -2.27642822265625, -2.200775146484375, -2.1251220703125, -2.049468994140625, -1.97381591796875, -1.898162841796875, -1.822509765625, -1.746856689453125, -1.67120361328125, -1.595550537109375, -1.5198974609375, -1.444244384765625, -1.36859130859375, -1.292938232421875, -1.21728515625, -1.141632080078125, -1.06597900390625, -0.990325927734375, -0.9146728515625, -0.839019775390625, -0.76336669921875, -0.687713623046875, -0.612060546875, -0.536407470703125, -0.46075439453125, -0.385101318359375, -0.3094482421875, -0.233795166015625, -0.15814208984375, -0.082489013671875, -0.0068359375, 0.068817138671875, 0.14447021484375, 0.220123291015625, 0.2957763671875, 0.371429443359375, 0.44708251953125, 0.522735595703125, 0.598388671875, 0.674041748046875, 0.74969482421875, 0.825347900390625, 0.9010009765625, 0.976654052734375, 1.05230712890625, 1.127960205078125, 1.20361328125, 1.279266357421875, 1.35491943359375, 1.430572509765625, 1.5062255859375, 1.581878662109375, 1.65753173828125, 1.733184814453125, 1.808837890625, 1.884490966796875, 1.96014404296875, 2.035797119140625, 2.1114501953125, 2.187103271484375, 2.26275634765625, 2.338409423828125, 2.4140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 6.0, 8.0, 13.0, 16.0, 16.0, 22.0, 36.0, 35.0, 44.0, 44.0, 54.0, 66.0, 69.0, 74.0, 77.0, 71.0, 68.0, 51.0, 54.0, 28.0, 43.0, 35.0, 23.0, 14.0, 13.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.42236328125, -0.4117279052734375, -0.401092529296875, -0.3904571533203125, -0.37982177734375, -0.3691864013671875, -0.358551025390625, -0.3479156494140625, -0.3372802734375, -0.3266448974609375, -0.316009521484375, -0.3053741455078125, -0.29473876953125, -0.2841033935546875, -0.273468017578125, -0.2628326416015625, -0.252197265625, -0.2415618896484375, -0.230926513671875, -0.2202911376953125, -0.20965576171875, -0.1990203857421875, -0.188385009765625, -0.1777496337890625, -0.1671142578125, -0.1564788818359375, -0.145843505859375, -0.1352081298828125, -0.12457275390625, -0.1139373779296875, -0.103302001953125, -0.0926666259765625, -0.08203125, -0.0713958740234375, -0.060760498046875, -0.0501251220703125, -0.03948974609375, -0.0288543701171875, -0.018218994140625, -0.0075836181640625, 0.0030517578125, 0.0136871337890625, 0.024322509765625, 0.0349578857421875, 0.04559326171875, 0.0562286376953125, 0.066864013671875, 0.0774993896484375, 0.088134765625, 0.0987701416015625, 0.109405517578125, 0.1200408935546875, 0.13067626953125, 0.1413116455078125, 0.151947021484375, 0.1625823974609375, 0.1732177734375, 0.1838531494140625, 0.194488525390625, 0.2051239013671875, 0.21575927734375, 0.2263946533203125, 0.237030029296875, 0.2476654052734375, 0.25830078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 11.0, 15.0, 12.0, 27.0, 40.0, 47.0, 80.0, 100.0, 129.0, 187.0, 364.0, 582.0, 1058.0, 2117.0, 4840.0, 11441.0, 30916.0, 95399.0, 340312.0, 390880.0, 111507.0, 35195.0, 12854.0, 5119.0, 2352.0, 1162.0, 598.0, 385.0, 240.0, 160.0, 111.0, 80.0, 56.0, 50.0, 21.0, 25.0, 23.0, 14.0, 13.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.73046875, -1.6764984130859375, -1.622528076171875, -1.5685577392578125, -1.51458740234375, -1.4606170654296875, -1.406646728515625, -1.3526763916015625, -1.2987060546875, -1.2447357177734375, -1.190765380859375, -1.1367950439453125, -1.08282470703125, -1.0288543701171875, -0.974884033203125, -0.9209136962890625, -0.866943359375, -0.8129730224609375, -0.759002685546875, -0.7050323486328125, -0.65106201171875, -0.5970916748046875, -0.543121337890625, -0.4891510009765625, -0.4351806640625, -0.3812103271484375, -0.327239990234375, -0.2732696533203125, -0.21929931640625, -0.1653289794921875, -0.111358642578125, -0.0573883056640625, -0.00341796875, 0.0505523681640625, 0.104522705078125, 0.1584930419921875, 0.21246337890625, 0.2664337158203125, 0.320404052734375, 0.3743743896484375, 0.4283447265625, 0.4823150634765625, 0.536285400390625, 0.5902557373046875, 0.64422607421875, 0.6981964111328125, 0.752166748046875, 0.8061370849609375, 0.860107421875, 0.9140777587890625, 0.968048095703125, 1.0220184326171875, 1.07598876953125, 1.1299591064453125, 1.183929443359375, 1.2378997802734375, 1.2918701171875, 1.3458404541015625, 1.399810791015625, 1.4537811279296875, 1.50775146484375, 1.5617218017578125, 1.615692138671875, 1.6696624755859375, 1.7236328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 9.0, 10.0, 9.0, 5.0, 10.0, 13.0, 14.0, 14.0, 24.0, 17.0, 21.0, 21.0, 23.0, 29.0, 37.0, 48.0, 32.0, 37.0, 40.0, 37.0, 40.0, 37.0, 32.0, 38.0, 36.0, 32.0, 34.0, 35.0, 30.0, 34.0, 23.0, 30.0, 20.0, 13.0, 9.0, 15.0, 14.0, 11.0, 10.0, 8.0, 4.0, 5.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.94677734375, -0.9182205200195312, -0.8896636962890625, -0.8611068725585938, -0.832550048828125, -0.8039932250976562, -0.7754364013671875, -0.7468795776367188, -0.71832275390625, -0.6897659301757812, -0.6612091064453125, -0.6326522827148438, -0.604095458984375, -0.5755386352539062, -0.5469818115234375, -0.5184249877929688, -0.4898681640625, -0.46131134033203125, -0.4327545166015625, -0.40419769287109375, -0.375640869140625, -0.34708404541015625, -0.3185272216796875, -0.28997039794921875, -0.26141357421875, -0.23285675048828125, -0.2042999267578125, -0.17574310302734375, -0.147186279296875, -0.11862945556640625, -0.0900726318359375, -0.06151580810546875, -0.032958984375, -0.00440216064453125, 0.0241546630859375, 0.05271148681640625, 0.081268310546875, 0.10982513427734375, 0.1383819580078125, 0.16693878173828125, 0.19549560546875, 0.22405242919921875, 0.2526092529296875, 0.28116607666015625, 0.309722900390625, 0.33827972412109375, 0.3668365478515625, 0.39539337158203125, 0.4239501953125, 0.45250701904296875, 0.4810638427734375, 0.5096206665039062, 0.538177490234375, 0.5667343139648438, 0.5952911376953125, 0.6238479614257812, 0.65240478515625, 0.6809616088867188, 0.7095184326171875, 0.7380752563476562, 0.766632080078125, 0.7951889038085938, 0.8237457275390625, 0.8523025512695312, 0.880859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 29.0, 35.0, 67.0, 143.0, 248.0, 505.0, 1120.0, 3107.0, 13125.0, 122277.0, 827899.0, 66379.0, 9330.0, 2425.0, 904.0, 423.0, 227.0, 118.0, 68.0, 30.0, 16.0, 10.0, 7.0, 12.0, 2.0, 5.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.51904296875, -1.4541015625, -1.38916015625, -1.32421875, -1.25927734375, -1.1943359375, -1.12939453125, -1.064453125, -0.99951171875, -0.9345703125, -0.86962890625, -0.8046875, -0.73974609375, -0.6748046875, -0.60986328125, -0.544921875, -0.47998046875, -0.4150390625, -0.35009765625, -0.28515625, -0.22021484375, -0.1552734375, -0.09033203125, -0.025390625, 0.03955078125, 0.1044921875, 0.16943359375, 0.234375, 0.29931640625, 0.3642578125, 0.42919921875, 0.494140625, 0.55908203125, 0.6240234375, 0.68896484375, 0.75390625, 0.81884765625, 0.8837890625, 0.94873046875, 1.013671875, 1.07861328125, 1.1435546875, 1.20849609375, 1.2734375, 1.33837890625, 1.4033203125, 1.46826171875, 1.533203125, 1.59814453125, 1.6630859375, 1.72802734375, 1.79296875, 1.85791015625, 1.9228515625, 1.98779296875, 2.052734375, 2.11767578125, 2.1826171875, 2.24755859375, 2.3125, 2.37744140625, 2.4423828125, 2.50732421875, 2.572265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 9.0, 7.0, 8.0, 20.0, 18.0, 28.0, 33.0, 43.0, 45.0, 45.0, 68.0, 67.0, 66.0, 79.0, 60.0, 62.0, 60.0, 54.0, 49.0, 34.0, 23.0, 19.0, 16.0, 18.0, 12.0, 9.0, 5.0, 10.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001842975616455078, -0.0001787487417459488, -0.00017319992184638977, -0.00016765110194683075, -0.00016210228204727173, -0.0001565534621477127, -0.0001510046422481537, -0.00014545582234859467, -0.00013990700244903564, -0.00013435818254947662, -0.0001288093626499176, -0.00012326054275035858, -0.00011771172285079956, -0.00011216290295124054, -0.00010661408305168152, -0.0001010652631521225, -9.551644325256348e-05, -8.996762335300446e-05, -8.441880345344543e-05, -7.886998355388641e-05, -7.332116365432739e-05, -6.777234375476837e-05, -6.222352385520935e-05, -5.667470395565033e-05, -5.112588405609131e-05, -4.557706415653229e-05, -4.0028244256973267e-05, -3.4479424357414246e-05, -2.8930604457855225e-05, -2.3381784558296204e-05, -1.7832964658737183e-05, -1.2284144759178162e-05, -6.735324859619141e-06, -1.1865049600601196e-06, 4.362314939498901e-06, 9.911134839057922e-06, 1.5459954738616943e-05, 2.1008774638175964e-05, 2.6557594537734985e-05, 3.2106414437294006e-05, 3.765523433685303e-05, 4.320405423641205e-05, 4.875287413597107e-05, 5.430169403553009e-05, 5.985051393508911e-05, 6.539933383464813e-05, 7.094815373420715e-05, 7.649697363376617e-05, 8.20457935333252e-05, 8.759461343288422e-05, 9.314343333244324e-05, 9.869225323200226e-05, 0.00010424107313156128, 0.0001097898930311203, 0.00011533871293067932, 0.00012088753283023834, 0.00012643635272979736, 0.00013198517262935638, 0.0001375339925289154, 0.00014308281242847443, 0.00014863163232803345, 0.00015418045222759247, 0.0001597292721271515, 0.0001652780920267105, 0.00017082691192626953]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 11.0, 6.0, 9.0, 18.0, 19.0, 23.0, 44.0, 56.0, 107.0, 160.0, 278.0, 565.0, 1130.0, 2443.0, 6432.0, 26852.0, 432708.0, 535262.0, 30508.0, 6791.0, 2561.0, 1221.0, 590.0, 300.0, 177.0, 115.0, 54.0, 31.0, 21.0, 18.0, 15.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.951171875, -1.8902587890625, -1.829345703125, -1.7684326171875, -1.70751953125, -1.6466064453125, -1.585693359375, -1.5247802734375, -1.4638671875, -1.4029541015625, -1.342041015625, -1.2811279296875, -1.22021484375, -1.1593017578125, -1.098388671875, -1.0374755859375, -0.9765625, -0.9156494140625, -0.854736328125, -0.7938232421875, -0.73291015625, -0.6719970703125, -0.611083984375, -0.5501708984375, -0.4892578125, -0.4283447265625, -0.367431640625, -0.3065185546875, -0.24560546875, -0.1846923828125, -0.123779296875, -0.0628662109375, -0.001953125, 0.0589599609375, 0.119873046875, 0.1807861328125, 0.24169921875, 0.3026123046875, 0.363525390625, 0.4244384765625, 0.4853515625, 0.5462646484375, 0.607177734375, 0.6680908203125, 0.72900390625, 0.7899169921875, 0.850830078125, 0.9117431640625, 0.97265625, 1.0335693359375, 1.094482421875, 1.1553955078125, 1.21630859375, 1.2772216796875, 1.338134765625, 1.3990478515625, 1.4599609375, 1.5208740234375, 1.581787109375, 1.6427001953125, 1.70361328125, 1.7645263671875, 1.825439453125, 1.8863525390625, 1.947265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 16.0, 18.0, 22.0, 30.0, 37.0, 53.0, 86.0, 100.0, 116.0, 118.0, 85.0, 89.0, 48.0, 46.0, 38.0, 20.0, 15.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.810546875, -0.78594970703125, -0.7613525390625, -0.73675537109375, -0.712158203125, -0.68756103515625, -0.6629638671875, -0.63836669921875, -0.61376953125, -0.58917236328125, -0.5645751953125, -0.53997802734375, -0.515380859375, -0.49078369140625, -0.4661865234375, -0.44158935546875, -0.4169921875, -0.39239501953125, -0.3677978515625, -0.34320068359375, -0.318603515625, -0.29400634765625, -0.2694091796875, -0.24481201171875, -0.22021484375, -0.19561767578125, -0.1710205078125, -0.14642333984375, -0.121826171875, -0.09722900390625, -0.0726318359375, -0.04803466796875, -0.0234375, 0.00115966796875, 0.0257568359375, 0.05035400390625, 0.074951171875, 0.09954833984375, 0.1241455078125, 0.14874267578125, 0.17333984375, 0.19793701171875, 0.2225341796875, 0.24713134765625, 0.271728515625, 0.29632568359375, 0.3209228515625, 0.34552001953125, 0.3701171875, 0.39471435546875, 0.4193115234375, 0.44390869140625, 0.468505859375, 0.49310302734375, 0.5177001953125, 0.54229736328125, 0.56689453125, 0.59149169921875, 0.6160888671875, 0.64068603515625, 0.665283203125, 0.68988037109375, 0.7144775390625, 0.73907470703125, 0.763671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 12.0, 20.0, 33.0, 56.0, 98.0, 119.0, 143.0, 147.0, 109.0, 82.0, 63.0, 40.0, 24.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-16.837818145751953, -16.455625534057617, -16.07343101501465, -15.691238403320312, -15.30904483795166, -14.926852226257324, -14.544658660888672, -14.162466049194336, -13.780272483825684, -13.398078918457031, -13.015886306762695, -12.633692741394043, -12.25149917602539, -11.869306564331055, -11.487112998962402, -11.10491943359375, -10.722726821899414, -10.340533256530762, -9.958340644836426, -9.576147079467773, -9.193953514099121, -8.811760902404785, -8.429567337036133, -8.047374725341797, -7.665180206298828, -7.282987117767334, -6.900793552398682, -6.5186004638671875, -6.136407375335693, -5.754214286804199, -5.372020721435547, -4.989827632904053, -4.607635021209717, -4.225441932678223, -3.8432486057281494, -3.461055278778076, -3.078862190246582, -2.696668863296509, -2.3144755363464355, -1.9322824478149414, -1.5500891208648682, -1.1678959131240845, -0.785702645778656, -0.40350937843322754, -0.021316170692443848, 0.36087703704833984, 0.7430703639984131, 1.1252634525299072, 1.5074567794799805, 1.8896499872207642, 2.271843194961548, 2.654036521911621, 3.0362296104431152, 3.4184229373931885, 3.8006162643432617, 4.182809352874756, 4.56500244140625, 4.947195529937744, 5.3293890953063965, 5.711582183837891, 6.093775272369385, 6.475968360900879, 6.858161926269531, 7.240355014801025, 7.622548580169678]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 11.0, 16.0, 19.0, 21.0, 20.0, 46.0, 45.0, 36.0, 33.0, 54.0, 59.0, 65.0, 56.0, 70.0, 65.0, 58.0, 58.0, 46.0, 40.0, 44.0, 22.0, 18.0, 16.0, 17.0, 12.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4530029296875, -6.208856582641602, -5.964710235595703, -5.720563888549805, -5.476417541503906, -5.232271194458008, -4.988125324249268, -4.743978977203369, -4.499832630157471, -4.255686283111572, -4.011539936065674, -3.7673938274383545, -3.523247480392456, -3.2791011333465576, -3.0349550247192383, -2.79080867767334, -2.5466623306274414, -2.302515983581543, -2.0583696365356445, -1.8142235279083252, -1.5700771808624268, -1.3259308338165283, -1.0817846059799194, -0.8376383781433105, -0.5934920310974121, -0.34934574365615845, -0.10519945621490479, 0.13894683122634888, 0.38309311866760254, 0.627239465713501, 0.8713856935501099, 1.1155319213867188, 1.3596782684326172, 1.6038246154785156, 1.8479708433151245, 2.0921170711517334, 2.336263418197632, 2.5804097652435303, 2.8245558738708496, 3.068702220916748, 3.3128485679626465, 3.556994915008545, 3.8011412620544434, 4.045287609100342, 4.289433479309082, 4.5335798263549805, 4.777726173400879, 5.021872520446777, 5.266018867492676, 5.510165214538574, 5.754311561584473, 5.998457908630371, 6.2426042556762695, 6.486750602722168, 6.730896472930908, 6.975042819976807, 7.219189167022705, 7.4633355140686035, 7.707481861114502, 7.9516282081604, 8.19577407836914, 8.439920425415039, 8.684066772460938, 8.928213119506836, 9.172359466552734]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 7.0, 13.0, 24.0, 28.0, 44.0, 92.0, 137.0, 173.0, 393.0, 637.0, 1340.0, 2884.0, 7201.0, 21208.0, 151557.0, 3929096.0, 56307.0, 13900.0, 5099.0, 2076.0, 948.0, 465.0, 245.0, 118.0, 89.0, 65.0, 40.0, 17.0, 16.0, 13.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.195098876953125, -3.09918212890625, -3.003265380859375, -2.9073486328125, -2.811431884765625, -2.71551513671875, -2.619598388671875, -2.523681640625, -2.427764892578125, -2.33184814453125, -2.235931396484375, -2.1400146484375, -2.044097900390625, -1.94818115234375, -1.852264404296875, -1.75634765625, -1.660430908203125, -1.56451416015625, -1.468597412109375, -1.3726806640625, -1.276763916015625, -1.18084716796875, -1.084930419921875, -0.989013671875, -0.893096923828125, -0.79718017578125, -0.701263427734375, -0.6053466796875, -0.509429931640625, -0.41351318359375, -0.317596435546875, -0.2216796875, -0.125762939453125, -0.02984619140625, 0.066070556640625, 0.1619873046875, 0.257904052734375, 0.35382080078125, 0.449737548828125, 0.545654296875, 0.641571044921875, 0.73748779296875, 0.833404541015625, 0.9293212890625, 1.025238037109375, 1.12115478515625, 1.217071533203125, 1.31298828125, 1.408905029296875, 1.50482177734375, 1.600738525390625, 1.6966552734375, 1.792572021484375, 1.88848876953125, 1.984405517578125, 2.080322265625, 2.176239013671875, 2.27215576171875, 2.368072509765625, 2.4639892578125, 2.559906005859375, 2.65582275390625, 2.751739501953125, 2.84765625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 10.0, 15.0, 11.0, 18.0, 26.0, 33.0, 45.0, 44.0, 58.0, 60.0, 71.0, 81.0, 65.0, 81.0, 77.0, 48.0, 47.0, 50.0, 40.0, 26.0, 21.0, 18.0, 16.0, 16.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.459228515625, -0.4480705261230469, -0.43691253662109375, -0.4257545471191406, -0.4145965576171875, -0.4034385681152344, -0.39228057861328125, -0.3811225891113281, -0.369964599609375, -0.3588066101074219, -0.34764862060546875, -0.3364906311035156, -0.3253326416015625, -0.3141746520996094, -0.30301666259765625, -0.2918586730957031, -0.28070068359375, -0.2695426940917969, -0.25838470458984375, -0.24722671508789062, -0.2360687255859375, -0.22491073608398438, -0.21375274658203125, -0.20259475708007812, -0.191436767578125, -0.18027877807617188, -0.16912078857421875, -0.15796279907226562, -0.1468048095703125, -0.13564682006835938, -0.12448883056640625, -0.11333084106445312, -0.1021728515625, -0.09101486206054688, -0.07985687255859375, -0.06869888305664062, -0.0575408935546875, -0.046382904052734375, -0.03522491455078125, -0.024066925048828125, -0.012908935546875, -0.001750946044921875, 0.00940704345703125, 0.020565032958984375, 0.0317230224609375, 0.042881011962890625, 0.05403900146484375, 0.06519699096679688, 0.07635498046875, 0.08751296997070312, 0.09867095947265625, 0.10982894897460938, 0.1209869384765625, 0.13214492797851562, 0.14330291748046875, 0.15446090698242188, 0.165618896484375, 0.17677688598632812, 0.18793487548828125, 0.19909286499023438, 0.2102508544921875, 0.22140884399414062, 0.23256683349609375, 0.24372482299804688, 0.2548828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 5.0, 18.0, 32.0, 75.0, 108.0, 154.0, 347.0, 848.0, 2156.0, 5447.0, 15175.0, 52476.0, 2937048.0, 1110361.0, 47183.0, 13899.0, 5216.0, 2013.0, 866.0, 351.0, 202.0, 112.0, 72.0, 38.0, 22.0, 10.0, 6.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.315216064453125, -2.21441650390625, -2.113616943359375, -2.0128173828125, -1.912017822265625, -1.81121826171875, -1.710418701171875, -1.609619140625, -1.508819580078125, -1.40802001953125, -1.307220458984375, -1.2064208984375, -1.105621337890625, -1.00482177734375, -0.904022216796875, -0.80322265625, -0.702423095703125, -0.60162353515625, -0.500823974609375, -0.4000244140625, -0.299224853515625, -0.19842529296875, -0.097625732421875, 0.003173828125, 0.103973388671875, 0.20477294921875, 0.305572509765625, 0.4063720703125, 0.507171630859375, 0.60797119140625, 0.708770751953125, 0.8095703125, 0.910369873046875, 1.01116943359375, 1.111968994140625, 1.2127685546875, 1.313568115234375, 1.41436767578125, 1.515167236328125, 1.615966796875, 1.716766357421875, 1.81756591796875, 1.918365478515625, 2.0191650390625, 2.119964599609375, 2.22076416015625, 2.321563720703125, 2.42236328125, 2.523162841796875, 2.62396240234375, 2.724761962890625, 2.8255615234375, 2.926361083984375, 3.02716064453125, 3.127960205078125, 3.228759765625, 3.329559326171875, 3.43035888671875, 3.531158447265625, 3.6319580078125, 3.732757568359375, 3.83355712890625, 3.934356689453125, 4.03515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 11.0, 6.0, 9.0, 6.0, 24.0, 22.0, 28.0, 23.0, 38.0, 72.0, 113.0, 268.0, 1476.0, 1342.0, 266.0, 114.0, 54.0, 46.0, 25.0, 21.0, 13.0, 11.0, 20.0, 14.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.677734375, -0.6535186767578125, -0.629302978515625, -0.6050872802734375, -0.58087158203125, -0.5566558837890625, -0.532440185546875, -0.5082244873046875, -0.4840087890625, -0.4597930908203125, -0.435577392578125, -0.4113616943359375, -0.38714599609375, -0.3629302978515625, -0.338714599609375, -0.3144989013671875, -0.290283203125, -0.2660675048828125, -0.241851806640625, -0.2176361083984375, -0.19342041015625, -0.1692047119140625, -0.144989013671875, -0.1207733154296875, -0.0965576171875, -0.0723419189453125, -0.048126220703125, -0.0239105224609375, 0.00030517578125, 0.0245208740234375, 0.048736572265625, 0.0729522705078125, 0.09716796875, 0.1213836669921875, 0.145599365234375, 0.1698150634765625, 0.19403076171875, 0.2182464599609375, 0.242462158203125, 0.2666778564453125, 0.2908935546875, 0.3151092529296875, 0.339324951171875, 0.3635406494140625, 0.38775634765625, 0.4119720458984375, 0.436187744140625, 0.4604034423828125, 0.484619140625, 0.5088348388671875, 0.533050537109375, 0.5572662353515625, 0.58148193359375, 0.6056976318359375, 0.629913330078125, 0.6541290283203125, 0.6783447265625, 0.7025604248046875, 0.726776123046875, 0.7509918212890625, 0.77520751953125, 0.7994232177734375, 0.823638916015625, 0.8478546142578125, 0.8720703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 10.0, 12.0, 32.0, 46.0, 70.0, 113.0, 153.0, 176.0, 129.0, 95.0, 62.0, 29.0, 22.0, 10.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.775074005126953, -5.571577072143555, -5.368079662322998, -5.1645827293396, -4.961085319519043, -4.7575883865356445, -4.554090976715088, -4.3505940437316895, -4.147096633911133, -3.9435994625091553, -3.7401022911071777, -3.5366051197052, -3.3331079483032227, -3.129611015319824, -2.9261136054992676, -2.722616672515869, -2.5191195011138916, -2.315622329711914, -2.1121251583099365, -1.908627986907959, -1.7051308155059814, -1.5016337633132935, -1.298136591911316, -1.0946394205093384, -0.8911422491073608, -0.6876450777053833, -0.48414793610572815, -0.280650794506073, -0.07715362310409546, 0.1263434886932373, 0.32984066009521484, 0.5333378314971924, 0.7368350028991699, 0.9403321743011475, 1.143829345703125, 1.3473265171051025, 1.55082368850708, 1.754320740699768, 1.9578179121017456, 2.1613149642944336, 2.3648123741149902, 2.5683095455169678, 2.7718067169189453, 2.975303888320923, 3.1788010597229004, 3.382297992706299, 3.5857954025268555, 3.789292335510254, 3.9927895069122314, 4.196286678314209, 4.399783611297607, 4.603281021118164, 4.8067779541015625, 5.010275363922119, 5.213772296905518, 5.417269706726074, 5.620766639709473, 5.824263572692871, 6.027760982513428, 6.231257915496826, 6.434755325317383, 6.638252258300781, 6.841749668121338, 7.045246601104736, 7.248744010925293]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 11.0, 4.0, 7.0, 19.0, 11.0, 12.0, 18.0, 15.0, 31.0, 23.0, 41.0, 26.0, 32.0, 34.0, 41.0, 32.0, 36.0, 45.0, 49.0, 41.0, 44.0, 49.0, 51.0, 36.0, 37.0, 32.0, 30.0, 40.0, 33.0, 21.0, 17.0, 18.0, 14.0, 12.0, 10.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5337789058685303, -2.4517745971679688, -2.3697705268859863, -2.287766456604004, -2.2057621479034424, -2.123757839202881, -2.0417537689208984, -1.9597495794296265, -1.8777453899383545, -1.7957412004470825, -1.7137370109558105, -1.6317328214645386, -1.5497286319732666, -1.4677244424819946, -1.3857202529907227, -1.3037160634994507, -1.2217118740081787, -1.1397076845169067, -1.0577034950256348, -0.9756993055343628, -0.8936951160430908, -0.8116909265518188, -0.7296867370605469, -0.6476825475692749, -0.5656783580780029, -0.48367416858673096, -0.401669979095459, -0.319665789604187, -0.23766160011291504, -0.15565741062164307, -0.0736532211303711, 0.008350968360900879, 0.09035515785217285, 0.17235934734344482, 0.2543635368347168, 0.33636772632598877, 0.41837191581726074, 0.5003761053085327, 0.5823802947998047, 0.6643844842910767, 0.7463886737823486, 0.8283928632736206, 0.9103970527648926, 0.9924012422561646, 1.0744054317474365, 1.1564096212387085, 1.2384138107299805, 1.3204180002212524, 1.4024221897125244, 1.4844263792037964, 1.5664305686950684, 1.6484347581863403, 1.7304389476776123, 1.8124431371688843, 1.8944473266601562, 1.9764515161514282, 2.0584557056427, 2.1404600143432617, 2.222464084625244, 2.3044681549072266, 2.386472463607788, 2.4684767723083496, 2.550480842590332, 2.6324849128723145, 2.714489221572876]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 13.0, 14.0, 13.0, 31.0, 27.0, 46.0, 78.0, 137.0, 205.0, 323.0, 528.0, 936.0, 1895.0, 3887.0, 9965.0, 28183.0, 97435.0, 512675.0, 293024.0, 65065.0, 20001.0, 7294.0, 3175.0, 1523.0, 814.0, 469.0, 304.0, 157.0, 108.0, 61.0, 50.0, 29.0, 17.0, 11.0, 8.0, 11.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.974609375, -2.889251708984375, -2.80389404296875, -2.718536376953125, -2.6331787109375, -2.547821044921875, -2.46246337890625, -2.377105712890625, -2.291748046875, -2.206390380859375, -2.12103271484375, -2.035675048828125, -1.9503173828125, -1.864959716796875, -1.77960205078125, -1.694244384765625, -1.60888671875, -1.523529052734375, -1.43817138671875, -1.352813720703125, -1.2674560546875, -1.182098388671875, -1.09674072265625, -1.011383056640625, -0.926025390625, -0.840667724609375, -0.75531005859375, -0.669952392578125, -0.5845947265625, -0.499237060546875, -0.41387939453125, -0.328521728515625, -0.2431640625, -0.157806396484375, -0.07244873046875, 0.012908935546875, 0.0982666015625, 0.183624267578125, 0.26898193359375, 0.354339599609375, 0.439697265625, 0.525054931640625, 0.61041259765625, 0.695770263671875, 0.7811279296875, 0.866485595703125, 0.95184326171875, 1.037200927734375, 1.12255859375, 1.207916259765625, 1.29327392578125, 1.378631591796875, 1.4639892578125, 1.549346923828125, 1.63470458984375, 1.720062255859375, 1.805419921875, 1.890777587890625, 1.97613525390625, 2.061492919921875, 2.1468505859375, 2.232208251953125, 2.31756591796875, 2.402923583984375, 2.48828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 7.0, 9.0, 11.0, 12.0, 26.0, 32.0, 26.0, 52.0, 64.0, 68.0, 81.0, 73.0, 82.0, 89.0, 66.0, 72.0, 50.0, 46.0, 29.0, 34.0, 20.0, 15.0, 12.0, 9.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43953704833984375, -0.4274139404296875, -0.41529083251953125, -0.403167724609375, -0.39104461669921875, -0.3789215087890625, -0.36679840087890625, -0.35467529296875, -0.34255218505859375, -0.3304290771484375, -0.31830596923828125, -0.306182861328125, -0.29405975341796875, -0.2819366455078125, -0.26981353759765625, -0.2576904296875, -0.24556732177734375, -0.2334442138671875, -0.22132110595703125, -0.209197998046875, -0.19707489013671875, -0.1849517822265625, -0.17282867431640625, -0.16070556640625, -0.14858245849609375, -0.1364593505859375, -0.12433624267578125, -0.112213134765625, -0.10009002685546875, -0.0879669189453125, -0.07584381103515625, -0.063720703125, -0.05159759521484375, -0.0394744873046875, -0.02735137939453125, -0.015228271484375, -0.00310516357421875, 0.0090179443359375, 0.02114105224609375, 0.03326416015625, 0.04538726806640625, 0.0575103759765625, 0.06963348388671875, 0.081756591796875, 0.09387969970703125, 0.1060028076171875, 0.11812591552734375, 0.1302490234375, 0.14237213134765625, 0.1544952392578125, 0.16661834716796875, 0.178741455078125, 0.19086456298828125, 0.2029876708984375, 0.21511077880859375, 0.22723388671875, 0.23935699462890625, 0.2514801025390625, 0.26360321044921875, 0.275726318359375, 0.28784942626953125, 0.2999725341796875, 0.31209564208984375, 0.32421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 15.0, 16.0, 17.0, 25.0, 40.0, 47.0, 64.0, 105.0, 151.0, 250.0, 402.0, 787.0, 1375.0, 2700.0, 5590.0, 12025.0, 28535.0, 73573.0, 238400.0, 474650.0, 128360.0, 45873.0, 18924.0, 8473.0, 3813.0, 1856.0, 1027.0, 540.0, 301.0, 204.0, 107.0, 87.0, 58.0, 43.0, 28.0, 21.0, 20.0, 15.0, 10.0, 5.0, 2.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-2.0078125, -1.9524383544921875, -1.897064208984375, -1.8416900634765625, -1.78631591796875, -1.7309417724609375, -1.675567626953125, -1.6201934814453125, -1.5648193359375, -1.5094451904296875, -1.454071044921875, -1.3986968994140625, -1.34332275390625, -1.2879486083984375, -1.232574462890625, -1.1772003173828125, -1.121826171875, -1.0664520263671875, -1.011077880859375, -0.9557037353515625, -0.90032958984375, -0.8449554443359375, -0.789581298828125, -0.7342071533203125, -0.6788330078125, -0.6234588623046875, -0.568084716796875, -0.5127105712890625, -0.45733642578125, -0.4019622802734375, -0.346588134765625, -0.2912139892578125, -0.23583984375, -0.1804656982421875, -0.125091552734375, -0.0697174072265625, -0.01434326171875, 0.0410308837890625, 0.096405029296875, 0.1517791748046875, 0.2071533203125, 0.2625274658203125, 0.317901611328125, 0.3732757568359375, 0.42864990234375, 0.4840240478515625, 0.539398193359375, 0.5947723388671875, 0.650146484375, 0.7055206298828125, 0.760894775390625, 0.8162689208984375, 0.87164306640625, 0.9270172119140625, 0.982391357421875, 1.0377655029296875, 1.0931396484375, 1.1485137939453125, 1.203887939453125, 1.2592620849609375, 1.31463623046875, 1.3700103759765625, 1.425384521484375, 1.4807586669921875, 1.5361328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 12.0, 5.0, 3.0, 14.0, 4.0, 6.0, 9.0, 18.0, 17.0, 20.0, 24.0, 33.0, 35.0, 43.0, 29.0, 40.0, 49.0, 52.0, 42.0, 53.0, 49.0, 49.0, 44.0, 37.0, 53.0, 33.0, 40.0, 35.0, 33.0, 24.0, 24.0, 19.0, 18.0, 11.0, 6.0, 10.0, 5.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.064453125, -1.0245361328125, -0.984619140625, -0.9447021484375, -0.90478515625, -0.8648681640625, -0.824951171875, -0.7850341796875, -0.7451171875, -0.7052001953125, -0.665283203125, -0.6253662109375, -0.58544921875, -0.5455322265625, -0.505615234375, -0.4656982421875, -0.42578125, -0.3858642578125, -0.345947265625, -0.3060302734375, -0.26611328125, -0.2261962890625, -0.186279296875, -0.1463623046875, -0.1064453125, -0.0665283203125, -0.026611328125, 0.0133056640625, 0.05322265625, 0.0931396484375, 0.133056640625, 0.1729736328125, 0.212890625, 0.2528076171875, 0.292724609375, 0.3326416015625, 0.37255859375, 0.4124755859375, 0.452392578125, 0.4923095703125, 0.5322265625, 0.5721435546875, 0.612060546875, 0.6519775390625, 0.69189453125, 0.7318115234375, 0.771728515625, 0.8116455078125, 0.8515625, 0.8914794921875, 0.931396484375, 0.9713134765625, 1.01123046875, 1.0511474609375, 1.091064453125, 1.1309814453125, 1.1708984375, 1.2108154296875, 1.250732421875, 1.2906494140625, 1.33056640625, 1.3704833984375, 1.410400390625, 1.4503173828125, 1.490234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 14.0, 13.0, 8.0, 19.0, 22.0, 46.0, 74.0, 101.0, 159.0, 212.0, 314.0, 591.0, 887.0, 1403.0, 2658.0, 5118.0, 10697.0, 25276.0, 85157.0, 617941.0, 222446.0, 43447.0, 15985.0, 7191.0, 3680.0, 1914.0, 1168.0, 686.0, 406.0, 279.0, 188.0, 156.0, 90.0, 58.0, 46.0, 19.0, 15.0, 19.0, 9.0, 9.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.359375, -1.3151702880859375, -1.270965576171875, -1.2267608642578125, -1.18255615234375, -1.1383514404296875, -1.094146728515625, -1.0499420166015625, -1.0057373046875, -0.9615325927734375, -0.917327880859375, -0.8731231689453125, -0.82891845703125, -0.7847137451171875, -0.740509033203125, -0.6963043212890625, -0.652099609375, -0.6078948974609375, -0.563690185546875, -0.5194854736328125, -0.47528076171875, -0.4310760498046875, -0.386871337890625, -0.3426666259765625, -0.2984619140625, -0.2542572021484375, -0.210052490234375, -0.1658477783203125, -0.12164306640625, -0.0774383544921875, -0.033233642578125, 0.0109710693359375, 0.05517578125, 0.0993804931640625, 0.143585205078125, 0.1877899169921875, 0.23199462890625, 0.2761993408203125, 0.320404052734375, 0.3646087646484375, 0.4088134765625, 0.4530181884765625, 0.497222900390625, 0.5414276123046875, 0.58563232421875, 0.6298370361328125, 0.674041748046875, 0.7182464599609375, 0.762451171875, 0.8066558837890625, 0.850860595703125, 0.8950653076171875, 0.93927001953125, 0.9834747314453125, 1.027679443359375, 1.0718841552734375, 1.1160888671875, 1.1602935791015625, 1.204498291015625, 1.2487030029296875, 1.29290771484375, 1.3371124267578125, 1.381317138671875, 1.4255218505859375, 1.4697265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 12.0, 15.0, 25.0, 39.0, 48.0, 82.0, 84.0, 97.0, 120.0, 98.0, 96.0, 71.0, 54.0, 33.0, 38.0, 13.0, 22.0, 11.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021922588348388672, -0.00021110661327838898, -0.00020298734307289124, -0.0001948680728673935, -0.00018674880266189575, -0.000178629532456398, -0.00017051026225090027, -0.00016239099204540253, -0.00015427172183990479, -0.00014615245163440704, -0.0001380331814289093, -0.00012991391122341156, -0.00012179464101791382, -0.00011367537081241608, -0.00010555610060691833, -9.74368304014206e-05, -8.931756019592285e-05, -8.119828999042511e-05, -7.307901978492737e-05, -6.495974957942963e-05, -5.6840479373931885e-05, -4.872120916843414e-05, -4.06019389629364e-05, -3.248266875743866e-05, -2.4363398551940918e-05, -1.6244128346443176e-05, -8.124858140945435e-06, -5.587935447692871e-09, 8.113682270050049e-06, 1.623295247554779e-05, 2.4352222681045532e-05, 3.2471492886543274e-05, 4.0590763092041016e-05, 4.871003329753876e-05, 5.68293035030365e-05, 6.494857370853424e-05, 7.306784391403198e-05, 8.118711411952972e-05, 8.930638432502747e-05, 9.742565453052521e-05, 0.00010554492473602295, 0.00011366419494152069, 0.00012178346514701843, 0.00012990273535251617, 0.00013802200555801392, 0.00014614127576351166, 0.0001542605459690094, 0.00016237981617450714, 0.00017049908638000488, 0.00017861835658550262, 0.00018673762679100037, 0.0001948568969964981, 0.00020297616720199585, 0.0002110954374074936, 0.00021921470761299133, 0.00022733397781848907, 0.00023545324802398682, 0.00024357251822948456, 0.0002516917884349823, 0.00025981105864048004, 0.0002679303288459778, 0.0002760495990514755, 0.00028416886925697327, 0.000292288139462471, 0.00030040740966796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 4.0, 3.0, 6.0, 18.0, 17.0, 11.0, 45.0, 52.0, 68.0, 110.0, 202.0, 345.0, 557.0, 1054.0, 2287.0, 4932.0, 12772.0, 44378.0, 538367.0, 384274.0, 38715.0, 11478.0, 4451.0, 2071.0, 977.0, 555.0, 265.0, 142.0, 125.0, 66.0, 59.0, 54.0, 24.0, 13.0, 18.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.816314697265625, -1.75567626953125, -1.695037841796875, -1.6343994140625, -1.573760986328125, -1.51312255859375, -1.452484130859375, -1.391845703125, -1.331207275390625, -1.27056884765625, -1.209930419921875, -1.1492919921875, -1.088653564453125, -1.02801513671875, -0.967376708984375, -0.90673828125, -0.846099853515625, -0.78546142578125, -0.724822998046875, -0.6641845703125, -0.603546142578125, -0.54290771484375, -0.482269287109375, -0.421630859375, -0.360992431640625, -0.30035400390625, -0.239715576171875, -0.1790771484375, -0.118438720703125, -0.05780029296875, 0.002838134765625, 0.0634765625, 0.124114990234375, 0.18475341796875, 0.245391845703125, 0.3060302734375, 0.366668701171875, 0.42730712890625, 0.487945556640625, 0.548583984375, 0.609222412109375, 0.66986083984375, 0.730499267578125, 0.7911376953125, 0.851776123046875, 0.91241455078125, 0.973052978515625, 1.03369140625, 1.094329833984375, 1.15496826171875, 1.215606689453125, 1.2762451171875, 1.336883544921875, 1.39752197265625, 1.458160400390625, 1.518798828125, 1.579437255859375, 1.64007568359375, 1.700714111328125, 1.7613525390625, 1.821990966796875, 1.88262939453125, 1.943267822265625, 2.00390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 6.0, 7.0, 6.0, 7.0, 7.0, 15.0, 11.0, 28.0, 29.0, 54.0, 45.0, 90.0, 114.0, 182.0, 94.0, 78.0, 48.0, 39.0, 29.0, 24.0, 9.0, 14.0, 9.0, 8.0, 5.0, 4.0, 8.0, 1.0, 6.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.845703125, -0.8135986328125, -0.781494140625, -0.7493896484375, -0.71728515625, -0.6851806640625, -0.653076171875, -0.6209716796875, -0.5888671875, -0.5567626953125, -0.524658203125, -0.4925537109375, -0.46044921875, -0.4283447265625, -0.396240234375, -0.3641357421875, -0.33203125, -0.2999267578125, -0.267822265625, -0.2357177734375, -0.20361328125, -0.1715087890625, -0.139404296875, -0.1072998046875, -0.0751953125, -0.0430908203125, -0.010986328125, 0.0211181640625, 0.05322265625, 0.0853271484375, 0.117431640625, 0.1495361328125, 0.181640625, 0.2137451171875, 0.245849609375, 0.2779541015625, 0.31005859375, 0.3421630859375, 0.374267578125, 0.4063720703125, 0.4384765625, 0.4705810546875, 0.502685546875, 0.5347900390625, 0.56689453125, 0.5989990234375, 0.631103515625, 0.6632080078125, 0.6953125, 0.7274169921875, 0.759521484375, 0.7916259765625, 0.82373046875, 0.8558349609375, 0.887939453125, 0.9200439453125, 0.9521484375, 0.9842529296875, 1.016357421875, 1.0484619140625, 1.08056640625, 1.1126708984375, 1.144775390625, 1.1768798828125, 1.208984375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 5.0, 7.0, 20.0, 30.0, 47.0, 78.0, 129.0, 144.0, 150.0, 124.0, 85.0, 63.0, 34.0, 36.0, 16.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.419082641601562, -16.924156188964844, -16.429231643676758, -15.934306144714355, -15.439380645751953, -14.944454193115234, -14.449529647827148, -13.95460319519043, -13.459677696228027, -12.964752197265625, -12.469826698303223, -11.97490119934082, -11.479975700378418, -10.985050201416016, -10.490123748779297, -9.995198249816895, -9.500272750854492, -9.00534725189209, -8.510421752929688, -8.015496253967285, -7.520570278167725, -7.025644779205322, -6.53071928024292, -6.035793304443359, -5.540868759155273, -5.045943260192871, -4.551017761230469, -4.056092262268066, -3.561166286468506, -3.0662407875061035, -2.571315288543701, -2.0763895511627197, -1.5814638137817383, -1.0865381956100464, -0.5916126370429993, -0.09668707847595215, 0.39823853969573975, 0.8931641578674316, 1.388089656829834, 1.8830153942108154, 2.3779408931732178, 2.87286639213562, 3.3677921295166016, 3.862717628479004, 4.357643127441406, 4.852568626403809, 5.347494125366211, 5.8424201011657715, 6.337345600128174, 6.832271099090576, 7.3271965980529785, 7.822122573852539, 8.317048072814941, 8.811973571777344, 9.306899070739746, 9.801824569702148, 10.29675006866455, 10.791675567626953, 11.286601066589355, 11.781526565551758, 12.27645206451416, 12.771377563476562, 13.266304016113281, 13.761229515075684, 14.256155014038086]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 3.0, 6.0, 10.0, 8.0, 14.0, 9.0, 16.0, 8.0, 21.0, 16.0, 19.0, 24.0, 31.0, 27.0, 32.0, 42.0, 38.0, 36.0, 47.0, 44.0, 50.0, 35.0, 53.0, 35.0, 42.0, 37.0, 38.0, 34.0, 31.0, 35.0, 18.0, 18.0, 20.0, 20.0, 22.0, 13.0, 11.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.48574686050415, -6.281883716583252, -6.078021049499512, -5.874157905578613, -5.670294761657715, -5.466431617736816, -5.262568950653076, -5.058705806732178, -4.8548431396484375, -4.650979995727539, -4.447117328643799, -4.2432541847229, -4.039391040802002, -3.8355281352996826, -3.6316652297973633, -3.427802085876465, -3.2239389419555664, -3.020076036453247, -2.8162128925323486, -2.6123499870300293, -2.408486843109131, -2.2046239376068115, -2.000761032104492, -1.7968980073928833, -1.5930349826812744, -1.3891719579696655, -1.1853089332580566, -0.9814460277557373, -0.7775830030441284, -0.5737199783325195, -0.3698570728302002, -0.1659940481185913, 0.03786945343017578, 0.24173244833946228, 0.4455954432487488, 0.6494584083557129, 0.8533214330673218, 1.0571844577789307, 1.26104736328125, 1.4649103879928589, 1.6687734127044678, 1.8726364374160767, 2.0764994621276855, 2.280362367630005, 2.484225273132324, 2.6880884170532227, 2.891951322555542, 3.0958142280578613, 3.2996773719787598, 3.503540277481079, 3.7074034214019775, 3.911266326904297, 4.115129470825195, 4.318992614746094, 4.522855281829834, 4.726718425750732, 4.930581092834473, 5.134444236755371, 5.338306903839111, 5.54217004776001, 5.746033191680908, 5.949895858764648, 6.153759002685547, 6.357622146606445, 6.561485290527344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 10.0, 9.0, 15.0, 19.0, 19.0, 30.0, 36.0, 74.0, 143.0, 220.0, 414.0, 676.0, 1188.0, 2409.0, 5851.0, 17356.0, 140670.0, 3970248.0, 37571.0, 9834.0, 3720.0, 1715.0, 879.0, 449.0, 271.0, 178.0, 106.0, 52.0, 45.0, 29.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.3515625, -3.247650146484375, -3.14373779296875, -3.039825439453125, -2.9359130859375, -2.832000732421875, -2.72808837890625, -2.624176025390625, -2.520263671875, -2.416351318359375, -2.31243896484375, -2.208526611328125, -2.1046142578125, -2.000701904296875, -1.89678955078125, -1.792877197265625, -1.68896484375, -1.585052490234375, -1.48114013671875, -1.377227783203125, -1.2733154296875, -1.169403076171875, -1.06549072265625, -0.961578369140625, -0.857666015625, -0.753753662109375, -0.64984130859375, -0.545928955078125, -0.4420166015625, -0.338104248046875, -0.23419189453125, -0.130279541015625, -0.0263671875, 0.077545166015625, 0.18145751953125, 0.285369873046875, 0.3892822265625, 0.493194580078125, 0.59710693359375, 0.701019287109375, 0.804931640625, 0.908843994140625, 1.01275634765625, 1.116668701171875, 1.2205810546875, 1.324493408203125, 1.42840576171875, 1.532318115234375, 1.63623046875, 1.740142822265625, 1.84405517578125, 1.947967529296875, 2.0518798828125, 2.155792236328125, 2.25970458984375, 2.363616943359375, 2.467529296875, 2.571441650390625, 2.67535400390625, 2.779266357421875, 2.8831787109375, 2.987091064453125, 3.09100341796875, 3.194915771484375, 3.298828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 12.0, 14.0, 18.0, 32.0, 32.0, 39.0, 43.0, 61.0, 75.0, 73.0, 79.0, 80.0, 73.0, 63.0, 63.0, 49.0, 44.0, 36.0, 24.0, 25.0, 10.0, 10.0, 13.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4610137939453125, -0.448883056640625, -0.4367523193359375, -0.42462158203125, -0.4124908447265625, -0.400360107421875, -0.3882293701171875, -0.3760986328125, -0.3639678955078125, -0.351837158203125, -0.3397064208984375, -0.32757568359375, -0.3154449462890625, -0.303314208984375, -0.2911834716796875, -0.279052734375, -0.2669219970703125, -0.254791259765625, -0.2426605224609375, -0.23052978515625, -0.2183990478515625, -0.206268310546875, -0.1941375732421875, -0.1820068359375, -0.1698760986328125, -0.157745361328125, -0.1456146240234375, -0.13348388671875, -0.1213531494140625, -0.109222412109375, -0.0970916748046875, -0.0849609375, -0.0728302001953125, -0.060699462890625, -0.0485687255859375, -0.03643798828125, -0.0243072509765625, -0.012176513671875, -4.57763671875e-05, 0.0120849609375, 0.0242156982421875, 0.036346435546875, 0.0484771728515625, 0.06060791015625, 0.0727386474609375, 0.084869384765625, 0.0970001220703125, 0.109130859375, 0.1212615966796875, 0.133392333984375, 0.1455230712890625, 0.15765380859375, 0.1697845458984375, 0.181915283203125, 0.1940460205078125, 0.2061767578125, 0.2183074951171875, 0.230438232421875, 0.2425689697265625, 0.25469970703125, 0.2668304443359375, 0.278961181640625, 0.2910919189453125, 0.30322265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 9.0, 18.0, 26.0, 38.0, 80.0, 137.0, 230.0, 397.0, 692.0, 1430.0, 2770.0, 5988.0, 13671.0, 35777.0, 200312.0, 3787621.0, 98155.0, 26411.0, 10725.0, 4778.0, 2333.0, 1234.0, 598.0, 354.0, 195.0, 122.0, 67.0, 38.0, 34.0, 9.0, 12.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.3515625, -2.27655029296875, -2.2015380859375, -2.12652587890625, -2.051513671875, -1.97650146484375, -1.9014892578125, -1.82647705078125, -1.75146484375, -1.67645263671875, -1.6014404296875, -1.52642822265625, -1.451416015625, -1.37640380859375, -1.3013916015625, -1.22637939453125, -1.1513671875, -1.07635498046875, -1.0013427734375, -0.92633056640625, -0.851318359375, -0.77630615234375, -0.7012939453125, -0.62628173828125, -0.55126953125, -0.47625732421875, -0.4012451171875, -0.32623291015625, -0.251220703125, -0.17620849609375, -0.1011962890625, -0.02618408203125, 0.048828125, 0.12384033203125, 0.1988525390625, 0.27386474609375, 0.348876953125, 0.42388916015625, 0.4989013671875, 0.57391357421875, 0.64892578125, 0.72393798828125, 0.7989501953125, 0.87396240234375, 0.948974609375, 1.02398681640625, 1.0989990234375, 1.17401123046875, 1.2490234375, 1.32403564453125, 1.3990478515625, 1.47406005859375, 1.549072265625, 1.62408447265625, 1.6990966796875, 1.77410888671875, 1.84912109375, 1.92413330078125, 1.9991455078125, 2.07415771484375, 2.149169921875, 2.22418212890625, 2.2991943359375, 2.37420654296875, 2.44921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 3.0, 9.0, 8.0, 9.0, 15.0, 11.0, 23.0, 23.0, 26.0, 47.0, 115.0, 190.0, 932.0, 2014.0, 283.0, 107.0, 58.0, 43.0, 28.0, 16.0, 14.0, 10.0, 16.0, 10.0, 8.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.677734375, -0.6578750610351562, -0.6380157470703125, -0.6181564331054688, -0.598297119140625, -0.5784378051757812, -0.5585784912109375, -0.5387191772460938, -0.51885986328125, -0.49900054931640625, -0.4791412353515625, -0.45928192138671875, -0.439422607421875, -0.41956329345703125, -0.3997039794921875, -0.37984466552734375, -0.3599853515625, -0.34012603759765625, -0.3202667236328125, -0.30040740966796875, -0.280548095703125, -0.26068878173828125, -0.2408294677734375, -0.22097015380859375, -0.20111083984375, -0.18125152587890625, -0.1613922119140625, -0.14153289794921875, -0.121673583984375, -0.10181427001953125, -0.0819549560546875, -0.06209564208984375, -0.042236328125, -0.02237701416015625, -0.0025177001953125, 0.01734161376953125, 0.037200927734375, 0.05706024169921875, 0.0769195556640625, 0.09677886962890625, 0.11663818359375, 0.13649749755859375, 0.1563568115234375, 0.17621612548828125, 0.196075439453125, 0.21593475341796875, 0.2357940673828125, 0.25565338134765625, 0.2755126953125, 0.29537200927734375, 0.3152313232421875, 0.33509063720703125, 0.354949951171875, 0.37480926513671875, 0.3946685791015625, 0.41452789306640625, 0.43438720703125, 0.45424652099609375, 0.4741058349609375, 0.49396514892578125, 0.513824462890625, 0.5336837768554688, 0.5535430908203125, 0.5734024047851562, 0.59326171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 15.0, 25.0, 30.0, 36.0, 70.0, 111.0, 121.0, 131.0, 135.0, 100.0, 67.0, 56.0, 34.0, 23.0, 13.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5192713737487793, -3.3754820823669434, -3.2316925525665283, -3.0879030227661133, -2.9441137313842773, -2.8003244400024414, -2.6565349102020264, -2.5127453804016113, -2.3689560890197754, -2.2251667976379395, -2.0813772678375244, -1.937587857246399, -1.7937984466552734, -1.650009036064148, -1.5062196254730225, -1.362430214881897, -1.2186408042907715, -1.074851393699646, -0.9310619831085205, -0.787272572517395, -0.6434831619262695, -0.49969375133514404, -0.35590434074401855, -0.21211493015289307, -0.06832551956176758, 0.07546389102935791, 0.2192533016204834, 0.3630427122116089, 0.5068321228027344, 0.6506215333938599, 0.7944109439849854, 0.9382003545761108, 1.0819892883300781, 1.2257786989212036, 1.369568109512329, 1.5133575201034546, 1.65714693069458, 1.8009363412857056, 1.944725751876831, 2.088515281677246, 2.232304573059082, 2.376093864440918, 2.519883394241333, 2.663672924041748, 2.807462215423584, 2.95125150680542, 3.095041036605835, 3.23883056640625, 3.382619857788086, 3.526409149169922, 3.670198678970337, 3.813988208770752, 3.957777500152588, 4.101566791534424, 4.245356559753418, 4.389145851135254, 4.53293514251709, 4.676724433898926, 4.820513725280762, 4.964303493499756, 5.108092784881592, 5.251882076263428, 5.395671844482422, 5.539461135864258, 5.683250427246094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 4.0, 5.0, 9.0, 7.0, 17.0, 18.0, 22.0, 28.0, 16.0, 23.0, 39.0, 37.0, 35.0, 41.0, 46.0, 30.0, 49.0, 45.0, 51.0, 46.0, 40.0, 41.0, 48.0, 50.0, 29.0, 48.0, 30.0, 27.0, 39.0, 15.0, 8.0, 19.0, 11.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0366344451904297, -1.9622552394866943, -1.8878761529922485, -1.8134970664978027, -1.7391178607940674, -1.664738655090332, -1.5903595685958862, -1.5159804821014404, -1.441601276397705, -1.3672220706939697, -1.292842984199524, -1.2184638977050781, -1.1440846920013428, -1.0697054862976074, -0.9953263998031616, -0.920947253704071, -0.8465681076049805, -0.7721889615058899, -0.6978098154067993, -0.6234306693077087, -0.5490515232086182, -0.4746723771095276, -0.400293231010437, -0.32591408491134644, -0.25153493881225586, -0.17715579271316528, -0.10277664661407471, -0.02839750051498413, 0.045981645584106445, 0.12036079168319702, 0.1947399377822876, 0.2691190838813782, 0.34349822998046875, 0.4178773760795593, 0.4922565221786499, 0.5666356682777405, 0.641014814376831, 0.7153939604759216, 0.7897731065750122, 0.8641522526741028, 0.9385313987731934, 1.0129106044769287, 1.0872896909713745, 1.1616687774658203, 1.2360479831695557, 1.310427188873291, 1.3848062753677368, 1.4591853618621826, 1.533564567565918, 1.6079437732696533, 1.6823228597640991, 1.756701946258545, 1.8310811519622803, 1.9054603576660156, 1.9798394441604614, 2.0542185306549072, 2.1285977363586426, 2.202976942062378, 2.2773561477661133, 2.3517351150512695, 2.426114320755005, 2.5004935264587402, 2.5748724937438965, 2.649251699447632, 2.723630905151367]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 9.0, 9.0, 4.0, 9.0, 12.0, 27.0, 34.0, 48.0, 81.0, 129.0, 204.0, 395.0, 722.0, 1447.0, 2909.0, 6865.0, 18217.0, 59773.0, 260965.0, 531093.0, 115126.0, 31179.0, 10684.0, 4317.0, 2011.0, 1017.0, 527.0, 307.0, 165.0, 80.0, 55.0, 40.0, 21.0, 27.0, 11.0, 12.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.442657470703125, -2.36187744140625, -2.281097412109375, -2.2003173828125, -2.119537353515625, -2.03875732421875, -1.957977294921875, -1.877197265625, -1.796417236328125, -1.71563720703125, -1.634857177734375, -1.5540771484375, -1.473297119140625, -1.39251708984375, -1.311737060546875, -1.23095703125, -1.150177001953125, -1.06939697265625, -0.988616943359375, -0.9078369140625, -0.827056884765625, -0.74627685546875, -0.665496826171875, -0.584716796875, -0.503936767578125, -0.42315673828125, -0.342376708984375, -0.2615966796875, -0.180816650390625, -0.10003662109375, -0.019256591796875, 0.0615234375, 0.142303466796875, 0.22308349609375, 0.303863525390625, 0.3846435546875, 0.465423583984375, 0.54620361328125, 0.626983642578125, 0.707763671875, 0.788543701171875, 0.86932373046875, 0.950103759765625, 1.0308837890625, 1.111663818359375, 1.19244384765625, 1.273223876953125, 1.35400390625, 1.434783935546875, 1.51556396484375, 1.596343994140625, 1.6771240234375, 1.757904052734375, 1.83868408203125, 1.919464111328125, 2.000244140625, 2.081024169921875, 2.16180419921875, 2.242584228515625, 2.3233642578125, 2.404144287109375, 2.48492431640625, 2.565704345703125, 2.646484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 7.0, 5.0, 11.0, 19.0, 29.0, 30.0, 27.0, 39.0, 55.0, 50.0, 85.0, 73.0, 77.0, 80.0, 51.0, 68.0, 51.0, 46.0, 42.0, 41.0, 30.0, 16.0, 14.0, 20.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4116172790527344, -0.40013885498046875, -0.3886604309082031, -0.3771820068359375, -0.3657035827636719, -0.35422515869140625, -0.3427467346191406, -0.331268310546875, -0.3197898864746094, -0.30831146240234375, -0.2968330383300781, -0.2853546142578125, -0.2738761901855469, -0.26239776611328125, -0.2509193420410156, -0.23944091796875, -0.22796249389648438, -0.21648406982421875, -0.20500564575195312, -0.1935272216796875, -0.18204879760742188, -0.17057037353515625, -0.15909194946289062, -0.147613525390625, -0.13613510131835938, -0.12465667724609375, -0.11317825317382812, -0.1016998291015625, -0.09022140502929688, -0.07874298095703125, -0.06726455688476562, -0.0557861328125, -0.044307708740234375, -0.03282928466796875, -0.021350860595703125, -0.0098724365234375, 0.001605987548828125, 0.01308441162109375, 0.024562835693359375, 0.036041259765625, 0.047519683837890625, 0.05899810791015625, 0.07047653198242188, 0.0819549560546875, 0.09343338012695312, 0.10491180419921875, 0.11639022827148438, 0.12786865234375, 0.13934707641601562, 0.15082550048828125, 0.16230392456054688, 0.1737823486328125, 0.18526077270507812, 0.19673919677734375, 0.20821762084960938, 0.219696044921875, 0.23117446899414062, 0.24265289306640625, 0.2541313171386719, 0.2656097412109375, 0.2770881652832031, 0.28856658935546875, 0.3000450134277344, 0.3115234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 7.0, 14.0, 8.0, 18.0, 30.0, 36.0, 43.0, 69.0, 71.0, 117.0, 143.0, 233.0, 347.0, 528.0, 1153.0, 2462.0, 6296.0, 18175.0, 60318.0, 248932.0, 526902.0, 128097.0, 35199.0, 11253.0, 4075.0, 1721.0, 840.0, 430.0, 295.0, 206.0, 157.0, 97.0, 78.0, 53.0, 36.0, 28.0, 24.0, 22.0, 9.0, 14.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.80859375, -1.746826171875, -1.68505859375, -1.623291015625, -1.5615234375, -1.499755859375, -1.43798828125, -1.376220703125, -1.314453125, -1.252685546875, -1.19091796875, -1.129150390625, -1.0673828125, -1.005615234375, -0.94384765625, -0.882080078125, -0.8203125, -0.758544921875, -0.69677734375, -0.635009765625, -0.5732421875, -0.511474609375, -0.44970703125, -0.387939453125, -0.326171875, -0.264404296875, -0.20263671875, -0.140869140625, -0.0791015625, -0.017333984375, 0.04443359375, 0.106201171875, 0.16796875, 0.229736328125, 0.29150390625, 0.353271484375, 0.4150390625, 0.476806640625, 0.53857421875, 0.600341796875, 0.662109375, 0.723876953125, 0.78564453125, 0.847412109375, 0.9091796875, 0.970947265625, 1.03271484375, 1.094482421875, 1.15625, 1.218017578125, 1.27978515625, 1.341552734375, 1.4033203125, 1.465087890625, 1.52685546875, 1.588623046875, 1.650390625, 1.712158203125, 1.77392578125, 1.835693359375, 1.8974609375, 1.959228515625, 2.02099609375, 2.082763671875, 2.14453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 6.0, 9.0, 10.0, 7.0, 15.0, 9.0, 19.0, 18.0, 19.0, 21.0, 33.0, 29.0, 30.0, 42.0, 41.0, 36.0, 36.0, 38.0, 42.0, 34.0, 31.0, 29.0, 33.0, 39.0, 30.0, 31.0, 32.0, 33.0, 21.0, 26.0, 20.0, 31.0, 18.0, 17.0, 19.0, 21.0, 12.0, 13.0, 3.0, 8.0, 5.0, 4.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.98974609375, -0.9597091674804688, -0.9296722412109375, -0.8996353149414062, -0.869598388671875, -0.8395614624023438, -0.8095245361328125, -0.7794876098632812, -0.74945068359375, -0.7194137573242188, -0.6893768310546875, -0.6593399047851562, -0.629302978515625, -0.5992660522460938, -0.5692291259765625, -0.5391921997070312, -0.5091552734375, -0.47911834716796875, -0.4490814208984375, -0.41904449462890625, -0.389007568359375, -0.35897064208984375, -0.3289337158203125, -0.29889678955078125, -0.26885986328125, -0.23882293701171875, -0.2087860107421875, -0.17874908447265625, -0.148712158203125, -0.11867523193359375, -0.0886383056640625, -0.05860137939453125, -0.028564453125, 0.00147247314453125, 0.0315093994140625, 0.06154632568359375, 0.091583251953125, 0.12162017822265625, 0.1516571044921875, 0.18169403076171875, 0.21173095703125, 0.24176788330078125, 0.2718048095703125, 0.30184173583984375, 0.331878662109375, 0.36191558837890625, 0.3919525146484375, 0.42198944091796875, 0.4520263671875, 0.48206329345703125, 0.5121002197265625, 0.5421371459960938, 0.572174072265625, 0.6022109985351562, 0.6322479248046875, 0.6622848510742188, 0.69232177734375, 0.7223587036132812, 0.7523956298828125, 0.7824325561523438, 0.812469482421875, 0.8425064086914062, 0.8725433349609375, 0.9025802612304688, 0.9326171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 15.0, 5.0, 11.0, 29.0, 38.0, 28.0, 66.0, 75.0, 151.0, 239.0, 504.0, 785.0, 1461.0, 3102.0, 7218.0, 19824.0, 76949.0, 590859.0, 279532.0, 43976.0, 13220.0, 5267.0, 2407.0, 1167.0, 636.0, 365.0, 233.0, 141.0, 94.0, 41.0, 42.0, 18.0, 17.0, 10.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.650390625, -1.60675048828125, -1.5631103515625, -1.51947021484375, -1.475830078125, -1.43218994140625, -1.3885498046875, -1.34490966796875, -1.30126953125, -1.25762939453125, -1.2139892578125, -1.17034912109375, -1.126708984375, -1.08306884765625, -1.0394287109375, -0.99578857421875, -0.9521484375, -0.90850830078125, -0.8648681640625, -0.82122802734375, -0.777587890625, -0.73394775390625, -0.6903076171875, -0.64666748046875, -0.60302734375, -0.55938720703125, -0.5157470703125, -0.47210693359375, -0.428466796875, -0.38482666015625, -0.3411865234375, -0.29754638671875, -0.25390625, -0.21026611328125, -0.1666259765625, -0.12298583984375, -0.079345703125, -0.03570556640625, 0.0079345703125, 0.05157470703125, 0.09521484375, 0.13885498046875, 0.1824951171875, 0.22613525390625, 0.269775390625, 0.31341552734375, 0.3570556640625, 0.40069580078125, 0.4443359375, 0.48797607421875, 0.5316162109375, 0.57525634765625, 0.618896484375, 0.66253662109375, 0.7061767578125, 0.74981689453125, 0.79345703125, 0.83709716796875, 0.8807373046875, 0.92437744140625, 0.968017578125, 1.01165771484375, 1.0552978515625, 1.09893798828125, 1.142578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 5.0, 7.0, 12.0, 11.0, 17.0, 26.0, 25.0, 39.0, 43.0, 65.0, 76.0, 85.0, 109.0, 92.0, 86.0, 80.0, 58.0, 41.0, 31.0, 27.0, 16.0, 11.0, 8.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001983642578125, -0.00019143149256706238, -0.00018449872732162476, -0.00017756596207618713, -0.0001706331968307495, -0.0001637004315853119, -0.00015676766633987427, -0.00014983490109443665, -0.00014290213584899902, -0.0001359693706035614, -0.00012903660535812378, -0.00012210384011268616, -0.00011517107486724854, -0.00010823830962181091, -0.00010130554437637329, -9.437277913093567e-05, -8.744001388549805e-05, -8.050724864006042e-05, -7.35744833946228e-05, -6.664171814918518e-05, -5.970895290374756e-05, -5.2776187658309937e-05, -4.5843422412872314e-05, -3.891065716743469e-05, -3.197789192199707e-05, -2.5045126676559448e-05, -1.8112361431121826e-05, -1.1179596185684204e-05, -4.246830940246582e-06, 2.68593430519104e-06, 9.618699550628662e-06, 1.6551464796066284e-05, 2.3484230041503906e-05, 3.041699528694153e-05, 3.734976053237915e-05, 4.428252577781677e-05, 5.1215291023254395e-05, 5.8148056268692017e-05, 6.508082151412964e-05, 7.201358675956726e-05, 7.894635200500488e-05, 8.58791172504425e-05, 9.281188249588013e-05, 9.974464774131775e-05, 0.00010667741298675537, 0.00011361017823219299, 0.00012054294347763062, 0.00012747570872306824, 0.00013440847396850586, 0.00014134123921394348, 0.0001482740044593811, 0.00015520676970481873, 0.00016213953495025635, 0.00016907230019569397, 0.0001760050654411316, 0.00018293783068656921, 0.00018987059593200684, 0.00019680336117744446, 0.00020373612642288208, 0.0002106688916683197, 0.00021760165691375732, 0.00022453442215919495, 0.00023146718740463257, 0.0002383999526500702, 0.0002453327178955078]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 0.0, 2.0, 3.0, 6.0, 8.0, 4.0, 7.0, 11.0, 14.0, 9.0, 22.0, 33.0, 59.0, 97.0, 169.0, 356.0, 669.0, 1604.0, 4694.0, 17920.0, 144029.0, 796331.0, 65451.0, 11496.0, 3248.0, 1158.0, 502.0, 256.0, 133.0, 89.0, 54.0, 41.0, 26.0, 9.0, 10.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.038299560546875, -1.97113037109375, -1.903961181640625, -1.8367919921875, -1.769622802734375, -1.70245361328125, -1.635284423828125, -1.568115234375, -1.500946044921875, -1.43377685546875, -1.366607666015625, -1.2994384765625, -1.232269287109375, -1.16510009765625, -1.097930908203125, -1.03076171875, -0.963592529296875, -0.89642333984375, -0.829254150390625, -0.7620849609375, -0.694915771484375, -0.62774658203125, -0.560577392578125, -0.493408203125, -0.426239013671875, -0.35906982421875, -0.291900634765625, -0.2247314453125, -0.157562255859375, -0.09039306640625, -0.023223876953125, 0.0439453125, 0.111114501953125, 0.17828369140625, 0.245452880859375, 0.3126220703125, 0.379791259765625, 0.44696044921875, 0.514129638671875, 0.581298828125, 0.648468017578125, 0.71563720703125, 0.782806396484375, 0.8499755859375, 0.917144775390625, 0.98431396484375, 1.051483154296875, 1.11865234375, 1.185821533203125, 1.25299072265625, 1.320159912109375, 1.3873291015625, 1.454498291015625, 1.52166748046875, 1.588836669921875, 1.656005859375, 1.723175048828125, 1.79034423828125, 1.857513427734375, 1.9246826171875, 1.991851806640625, 2.05902099609375, 2.126190185546875, 2.193359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 7.0, 5.0, 10.0, 19.0, 21.0, 29.0, 27.0, 49.0, 96.0, 159.0, 168.0, 127.0, 99.0, 50.0, 38.0, 16.0, 18.0, 16.0, 10.0, 8.0, 4.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.01953125, -0.98480224609375, -0.9500732421875, -0.91534423828125, -0.880615234375, -0.84588623046875, -0.8111572265625, -0.77642822265625, -0.74169921875, -0.70697021484375, -0.6722412109375, -0.63751220703125, -0.602783203125, -0.56805419921875, -0.5333251953125, -0.49859619140625, -0.4638671875, -0.42913818359375, -0.3944091796875, -0.35968017578125, -0.324951171875, -0.29022216796875, -0.2554931640625, -0.22076416015625, -0.18603515625, -0.15130615234375, -0.1165771484375, -0.08184814453125, -0.047119140625, -0.01239013671875, 0.0223388671875, 0.05706787109375, 0.091796875, 0.12652587890625, 0.1612548828125, 0.19598388671875, 0.230712890625, 0.26544189453125, 0.3001708984375, 0.33489990234375, 0.36962890625, 0.40435791015625, 0.4390869140625, 0.47381591796875, 0.508544921875, 0.54327392578125, 0.5780029296875, 0.61273193359375, 0.6474609375, 0.68218994140625, 0.7169189453125, 0.75164794921875, 0.786376953125, 0.82110595703125, 0.8558349609375, 0.89056396484375, 0.92529296875, 0.96002197265625, 0.9947509765625, 1.02947998046875, 1.064208984375, 1.09893798828125, 1.1336669921875, 1.16839599609375, 1.203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 11.0, 12.0, 12.0, 18.0, 31.0, 35.0, 66.0, 84.0, 111.0, 126.0, 110.0, 95.0, 87.0, 51.0, 48.0, 35.0, 23.0, 20.0, 9.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.93679428100586, -9.577986717224121, -9.219179153442383, -8.860371589660645, -8.501564025878906, -8.142756462097168, -7.783949375152588, -7.42514181137085, -7.066334247589111, -6.707526683807373, -6.348719120025635, -5.989912033081055, -5.631104469299316, -5.272296905517578, -4.91348934173584, -4.554681777954102, -4.195874214172363, -3.837066650390625, -3.4782590866088867, -3.1194517612457275, -2.7606441974639893, -2.401836633682251, -2.043029308319092, -1.6842217445373535, -1.3254141807556152, -0.9666066765785217, -0.6077991724014282, -0.2489917278289795, 0.10981583595275879, 0.46862339973449707, 0.8274307250976562, 1.1862382888793945, 1.5450468063354492, 1.9038543701171875, 2.262661933898926, 2.621469259262085, 2.9802768230438232, 3.3390843868255615, 3.6978917121887207, 4.056699275970459, 4.415506839752197, 4.7743144035339355, 5.133121967315674, 5.491929054260254, 5.850736618041992, 6.2095441818237305, 6.568351745605469, 6.927159309387207, 7.285966873168945, 7.644774436950684, 8.003582000732422, 8.36238956451416, 8.721197128295898, 9.080004692077637, 9.438812255859375, 9.797618865966797, 10.156427383422852, 10.51523494720459, 10.874042510986328, 11.232850074768066, 11.591657638549805, 11.950465202331543, 12.309272766113281, 12.668079376220703, 13.026886940002441]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 7.0, 6.0, 12.0, 9.0, 8.0, 11.0, 21.0, 23.0, 17.0, 24.0, 19.0, 29.0, 32.0, 29.0, 30.0, 33.0, 35.0, 42.0, 34.0, 41.0, 33.0, 38.0, 46.0, 36.0, 48.0, 30.0, 31.0, 39.0, 31.0, 13.0, 18.0, 31.0, 19.0, 21.0, 8.0, 12.0, 18.0, 14.0, 13.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.353793144226074, -5.1721062660217285, -4.990419387817383, -4.808732509613037, -4.627045631408691, -4.445358753204346, -4.263671875, -4.0819854736328125, -3.9002983570098877, -3.718611478805542, -3.5369246006011963, -3.3552379608154297, -3.173551082611084, -2.9918642044067383, -2.8101773262023926, -2.628490447998047, -2.446803569793701, -2.2651166915893555, -2.0834298133850098, -1.9017430543899536, -1.720056176185608, -1.5383692979812622, -1.356682538986206, -1.1749956607818604, -0.9933087825775146, -0.811621904373169, -0.629935085773468, -0.4482482671737671, -0.2665613889694214, -0.08487451076507568, 0.09681224822998047, 0.27849912643432617, 0.46018552780151367, 0.6418724060058594, 0.8235592246055603, 1.0052460432052612, 1.186932921409607, 1.3686197996139526, 1.5503065586090088, 1.7319934368133545, 1.9136803150177002, 2.095367193222046, 2.2770540714263916, 2.458740711212158, 2.640427589416504, 2.8221144676208496, 3.0038013458251953, 3.185488224029541, 3.3671751022338867, 3.5488619804382324, 3.730548858642578, 3.912235736846924, 4.0939226150512695, 4.275609493255615, 4.457296371459961, 4.638982772827148, 4.820670127868652, 5.002357006072998, 5.184043884277344, 5.3657307624816895, 5.547417640686035, 5.729104518890381, 5.910791397094727, 6.092477798461914, 6.27416467666626]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 5.0, 20.0, 27.0, 44.0, 62.0, 101.0, 169.0, 286.0, 525.0, 1146.0, 2919.0, 8531.0, 34401.0, 3620038.0, 487330.0, 26781.0, 7301.0, 2580.0, 989.0, 456.0, 218.0, 128.0, 77.0, 36.0, 29.0, 22.0, 16.0, 9.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.10552978515625, -3.9844970703125, -3.86346435546875, -3.742431640625, -3.62139892578125, -3.5003662109375, -3.37933349609375, -3.25830078125, -3.13726806640625, -3.0162353515625, -2.89520263671875, -2.774169921875, -2.65313720703125, -2.5321044921875, -2.41107177734375, -2.2900390625, -2.16900634765625, -2.0479736328125, -1.92694091796875, -1.805908203125, -1.68487548828125, -1.5638427734375, -1.44281005859375, -1.32177734375, -1.20074462890625, -1.0797119140625, -0.95867919921875, -0.837646484375, -0.71661376953125, -0.5955810546875, -0.47454833984375, -0.353515625, -0.23248291015625, -0.1114501953125, 0.00958251953125, 0.130615234375, 0.25164794921875, 0.3726806640625, 0.49371337890625, 0.61474609375, 0.73577880859375, 0.8568115234375, 0.97784423828125, 1.098876953125, 1.21990966796875, 1.3409423828125, 1.46197509765625, 1.5830078125, 1.70404052734375, 1.8250732421875, 1.94610595703125, 2.067138671875, 2.18817138671875, 2.3092041015625, 2.43023681640625, 2.55126953125, 2.67230224609375, 2.7933349609375, 2.91436767578125, 3.035400390625, 3.15643310546875, 3.2774658203125, 3.39849853515625, 3.51953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 9.0, 9.0, 8.0, 14.0, 17.0, 22.0, 35.0, 43.0, 40.0, 40.0, 68.0, 57.0, 70.0, 66.0, 77.0, 65.0, 73.0, 45.0, 47.0, 34.0, 25.0, 38.0, 21.0, 15.0, 17.0, 15.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.438232421875, -0.4266471862792969, -0.41506195068359375, -0.4034767150878906, -0.3918914794921875, -0.3803062438964844, -0.36872100830078125, -0.3571357727050781, -0.345550537109375, -0.3339653015136719, -0.32238006591796875, -0.3107948303222656, -0.2992095947265625, -0.2876243591308594, -0.27603912353515625, -0.2644538879394531, -0.25286865234375, -0.24128341674804688, -0.22969818115234375, -0.21811294555664062, -0.2065277099609375, -0.19494247436523438, -0.18335723876953125, -0.17177200317382812, -0.160186767578125, -0.14860153198242188, -0.13701629638671875, -0.12543106079101562, -0.1138458251953125, -0.10226058959960938, -0.09067535400390625, -0.07909011840820312, -0.0675048828125, -0.055919647216796875, -0.04433441162109375, -0.032749176025390625, -0.0211639404296875, -0.009578704833984375, 0.00200653076171875, 0.013591766357421875, 0.025177001953125, 0.036762237548828125, 0.04834747314453125, 0.059932708740234375, 0.0715179443359375, 0.08310317993164062, 0.09468841552734375, 0.10627365112304688, 0.11785888671875, 0.12944412231445312, 0.14102935791015625, 0.15261459350585938, 0.1641998291015625, 0.17578506469726562, 0.18737030029296875, 0.19895553588867188, 0.210540771484375, 0.22212600708007812, 0.23371124267578125, 0.24529647827148438, 0.2568817138671875, 0.2684669494628906, 0.28005218505859375, 0.2916374206542969, 0.30322265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 11.0, 24.0, 32.0, 73.0, 122.0, 233.0, 467.0, 825.0, 1629.0, 3514.0, 7867.0, 19400.0, 60628.0, 745224.0, 3235276.0, 78069.0, 23560.0, 9204.0, 4121.0, 1938.0, 1004.0, 527.0, 252.0, 109.0, 73.0, 32.0, 27.0, 15.0, 13.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7125091552734375, -1.634979248046875, -1.5574493408203125, -1.47991943359375, -1.4023895263671875, -1.324859619140625, -1.2473297119140625, -1.1697998046875, -1.0922698974609375, -1.014739990234375, -0.9372100830078125, -0.85968017578125, -0.7821502685546875, -0.704620361328125, -0.6270904541015625, -0.549560546875, -0.4720306396484375, -0.394500732421875, -0.3169708251953125, -0.23944091796875, -0.1619110107421875, -0.084381103515625, -0.0068511962890625, 0.0706787109375, 0.1482086181640625, 0.225738525390625, 0.3032684326171875, 0.38079833984375, 0.4583282470703125, 0.535858154296875, 0.6133880615234375, 0.69091796875, 0.7684478759765625, 0.845977783203125, 0.9235076904296875, 1.00103759765625, 1.0785675048828125, 1.156097412109375, 1.2336273193359375, 1.3111572265625, 1.3886871337890625, 1.466217041015625, 1.5437469482421875, 1.62127685546875, 1.6988067626953125, 1.776336669921875, 1.8538665771484375, 1.931396484375, 2.0089263916015625, 2.086456298828125, 2.1639862060546875, 2.24151611328125, 2.3190460205078125, 2.396575927734375, 2.4741058349609375, 2.5516357421875, 2.6291656494140625, 2.706695556640625, 2.7842254638671875, 2.86175537109375, 2.9392852783203125, 3.016815185546875, 3.0943450927734375, 3.171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 3.0, 7.0, 11.0, 16.0, 3.0, 14.0, 21.0, 22.0, 35.0, 42.0, 46.0, 91.0, 159.0, 419.0, 2008.0, 603.0, 199.0, 99.0, 51.0, 37.0, 34.0, 26.0, 18.0, 13.0, 15.0, 12.0, 9.0, 6.0, 11.0, 2.0, 2.0, 5.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6567230224609375, -0.633758544921875, -0.6107940673828125, -0.58782958984375, -0.5648651123046875, -0.541900634765625, -0.5189361572265625, -0.4959716796875, -0.4730072021484375, -0.450042724609375, -0.4270782470703125, -0.40411376953125, -0.3811492919921875, -0.358184814453125, -0.3352203369140625, -0.312255859375, -0.2892913818359375, -0.266326904296875, -0.2433624267578125, -0.22039794921875, -0.1974334716796875, -0.174468994140625, -0.1515045166015625, -0.1285400390625, -0.1055755615234375, -0.082611083984375, -0.0596466064453125, -0.03668212890625, -0.0137176513671875, 0.009246826171875, 0.0322113037109375, 0.05517578125, 0.0781402587890625, 0.101104736328125, 0.1240692138671875, 0.14703369140625, 0.1699981689453125, 0.192962646484375, 0.2159271240234375, 0.2388916015625, 0.2618560791015625, 0.284820556640625, 0.3077850341796875, 0.33074951171875, 0.3537139892578125, 0.376678466796875, 0.3996429443359375, 0.422607421875, 0.4455718994140625, 0.468536376953125, 0.4915008544921875, 0.51446533203125, 0.5374298095703125, 0.560394287109375, 0.5833587646484375, 0.6063232421875, 0.6292877197265625, 0.652252197265625, 0.6752166748046875, 0.69818115234375, 0.7211456298828125, 0.744110107421875, 0.7670745849609375, 0.7900390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 12.0, 34.0, 65.0, 115.0, 180.0, 250.0, 158.0, 91.0, 39.0, 29.0, 15.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3989129066467285, -4.091261386871338, -3.783609628677368, -3.4759578704833984, -3.168306350708008, -2.860654592514038, -2.5530028343200684, -2.2453513145446777, -1.937699556350708, -1.6300479173660278, -1.3223962783813477, -1.014744520187378, -0.7070928812026978, -0.3994412422180176, -0.09178948402404785, 0.21586203575134277, 0.5235137939453125, 0.8311654329299927, 1.1388170719146729, 1.4464688301086426, 1.7541204690933228, 2.061772108078003, 2.3694238662719727, 2.6770753860473633, 2.984727144241333, 3.2923789024353027, 3.6000304222106934, 3.907682180404663, 4.215333938598633, 4.522985458374023, 4.830636978149414, 5.138288497924805, 5.445940971374512, 5.753592491149902, 6.061244487762451, 6.368896007537842, 6.676547527313232, 6.984199523925781, 7.291851043701172, 7.5995025634765625, 7.907154083251953, 8.214805603027344, 8.522457122802734, 8.830108642578125, 9.137761116027832, 9.445412635803223, 9.753064155578613, 10.060715675354004, 10.368368148803711, 10.676019668579102, 10.983671188354492, 11.291322708129883, 11.59897518157959, 11.90662670135498, 12.214278221130371, 12.521929740905762, 12.829581260681152, 13.137232780456543, 13.444884300231934, 13.75253677368164, 14.060188293457031, 14.367839813232422, 14.675491333007812, 14.983142852783203, 15.290794372558594]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 6.0, 9.0, 5.0, 7.0, 10.0, 12.0, 14.0, 15.0, 12.0, 26.0, 23.0, 24.0, 31.0, 25.0, 22.0, 30.0, 36.0, 36.0, 26.0, 30.0, 31.0, 37.0, 29.0, 32.0, 28.0, 34.0, 33.0, 36.0, 40.0, 32.0, 31.0, 22.0, 21.0, 25.0, 13.0, 25.0, 12.0, 10.0, 16.0, 19.0, 9.0, 11.0, 7.0, 3.0, 4.0, 10.0, 0.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0], "bins": [-2.152097463607788, -2.0877439975738525, -2.023390293121338, -1.9590368270874023, -1.8946833610534668, -1.8303297758102417, -1.7659761905670166, -1.701622724533081, -1.6372692584991455, -1.5729156732559204, -1.5085622072219849, -1.4442086219787598, -1.3798551559448242, -1.3155015707015991, -1.251147985458374, -1.1867945194244385, -1.1224409341812134, -1.0580873489379883, -0.9937338829040527, -0.9293802976608276, -0.8650268316268921, -0.800673246383667, -0.7363197207450867, -0.6719661951065063, -0.607612669467926, -0.5432591438293457, -0.4789056181907654, -0.41455206274986267, -0.35019853711128235, -0.285845011472702, -0.22149145603179932, -0.157137930393219, -0.09278440475463867, -0.028430871665477753, 0.035922661423683167, 0.10027620196342468, 0.164629727602005, 0.22898325324058533, 0.29333680868148804, 0.35769033432006836, 0.4220438599586487, 0.486397385597229, 0.5507509112358093, 0.6151044368743896, 0.6794580221176147, 0.7438114881515503, 0.8081650733947754, 0.8725185990333557, 0.936872124671936, 1.0012257099151611, 1.0655791759490967, 1.1299327611923218, 1.1942862272262573, 1.2586398124694824, 1.322993278503418, 1.387346863746643, 1.4517004489898682, 1.5160540342330933, 1.5804075002670288, 1.644761085510254, 1.7091145515441895, 1.7734681367874146, 1.8378217220306396, 1.9021751880645752, 1.9665286540985107]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 2.0, 3.0, 10.0, 9.0, 13.0, 21.0, 22.0, 48.0, 64.0, 102.0, 193.0, 280.0, 536.0, 986.0, 1951.0, 4106.0, 8861.0, 21751.0, 59523.0, 404476.0, 444895.0, 60956.0, 22116.0, 9064.0, 4142.0, 2095.0, 1024.0, 511.0, 317.0, 183.0, 99.0, 52.0, 43.0, 27.0, 21.0, 17.0, 6.0, 12.0, 4.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.505859375, -2.427581787109375, -2.34930419921875, -2.271026611328125, -2.1927490234375, -2.114471435546875, -2.03619384765625, -1.957916259765625, -1.879638671875, -1.801361083984375, -1.72308349609375, -1.644805908203125, -1.5665283203125, -1.488250732421875, -1.40997314453125, -1.331695556640625, -1.25341796875, -1.175140380859375, -1.09686279296875, -1.018585205078125, -0.9403076171875, -0.862030029296875, -0.78375244140625, -0.705474853515625, -0.627197265625, -0.548919677734375, -0.47064208984375, -0.392364501953125, -0.3140869140625, -0.235809326171875, -0.15753173828125, -0.079254150390625, -0.0009765625, 0.077301025390625, 0.15557861328125, 0.233856201171875, 0.3121337890625, 0.390411376953125, 0.46868896484375, 0.546966552734375, 0.625244140625, 0.703521728515625, 0.78179931640625, 0.860076904296875, 0.9383544921875, 1.016632080078125, 1.09490966796875, 1.173187255859375, 1.25146484375, 1.329742431640625, 1.40802001953125, 1.486297607421875, 1.5645751953125, 1.642852783203125, 1.72113037109375, 1.799407958984375, 1.877685546875, 1.955963134765625, 2.03424072265625, 2.112518310546875, 2.1907958984375, 2.269073486328125, 2.34735107421875, 2.425628662109375, 2.50390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 6.0, 10.0, 12.0, 9.0, 8.0, 28.0, 22.0, 34.0, 32.0, 36.0, 48.0, 42.0, 70.0, 71.0, 66.0, 80.0, 59.0, 54.0, 62.0, 34.0, 42.0, 38.0, 36.0, 24.0, 15.0, 15.0, 15.0, 6.0, 11.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4049720764160156, -0.39368438720703125, -0.3823966979980469, -0.3711090087890625, -0.3598213195800781, -0.34853363037109375, -0.3372459411621094, -0.325958251953125, -0.3146705627441406, -0.30338287353515625, -0.2920951843261719, -0.2808074951171875, -0.2695198059082031, -0.25823211669921875, -0.24694442749023438, -0.23565673828125, -0.22436904907226562, -0.21308135986328125, -0.20179367065429688, -0.1905059814453125, -0.17921829223632812, -0.16793060302734375, -0.15664291381835938, -0.145355224609375, -0.13406753540039062, -0.12277984619140625, -0.11149215698242188, -0.1002044677734375, -0.08891677856445312, -0.07762908935546875, -0.06634140014648438, -0.0550537109375, -0.043766021728515625, -0.03247833251953125, -0.021190643310546875, -0.0099029541015625, 0.001384735107421875, 0.01267242431640625, 0.023960113525390625, 0.035247802734375, 0.046535491943359375, 0.05782318115234375, 0.06911087036132812, 0.0803985595703125, 0.09168624877929688, 0.10297393798828125, 0.11426162719726562, 0.12554931640625, 0.13683700561523438, 0.14812469482421875, 0.15941238403320312, 0.1707000732421875, 0.18198776245117188, 0.19327545166015625, 0.20456314086914062, 0.215850830078125, 0.22713851928710938, 0.23842620849609375, 0.24971389770507812, 0.2610015869140625, 0.2722892761230469, 0.28357696533203125, 0.2948646545410156, 0.30615234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 11.0, 11.0, 12.0, 19.0, 28.0, 20.0, 39.0, 65.0, 79.0, 131.0, 194.0, 310.0, 506.0, 1047.0, 2481.0, 7037.0, 22996.0, 88804.0, 733949.0, 141638.0, 33116.0, 9722.0, 3279.0, 1360.0, 649.0, 353.0, 214.0, 157.0, 88.0, 61.0, 49.0, 32.0, 29.0, 18.0, 15.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0], "bins": [-3.263671875, -3.18133544921875, -3.0989990234375, -3.01666259765625, -2.934326171875, -2.85198974609375, -2.7696533203125, -2.68731689453125, -2.60498046875, -2.52264404296875, -2.4403076171875, -2.35797119140625, -2.275634765625, -2.19329833984375, -2.1109619140625, -2.02862548828125, -1.9462890625, -1.86395263671875, -1.7816162109375, -1.69927978515625, -1.616943359375, -1.53460693359375, -1.4522705078125, -1.36993408203125, -1.28759765625, -1.20526123046875, -1.1229248046875, -1.04058837890625, -0.958251953125, -0.87591552734375, -0.7935791015625, -0.71124267578125, -0.62890625, -0.54656982421875, -0.4642333984375, -0.38189697265625, -0.299560546875, -0.21722412109375, -0.1348876953125, -0.05255126953125, 0.02978515625, 0.11212158203125, 0.1944580078125, 0.27679443359375, 0.359130859375, 0.44146728515625, 0.5238037109375, 0.60614013671875, 0.6884765625, 0.77081298828125, 0.8531494140625, 0.93548583984375, 1.017822265625, 1.10015869140625, 1.1824951171875, 1.26483154296875, 1.34716796875, 1.42950439453125, 1.5118408203125, 1.59417724609375, 1.676513671875, 1.75885009765625, 1.8411865234375, 1.92352294921875, 2.005859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 5.0, 9.0, 12.0, 10.0, 12.0, 18.0, 19.0, 30.0, 43.0, 31.0, 31.0, 46.0, 51.0, 54.0, 41.0, 55.0, 65.0, 51.0, 39.0, 48.0, 61.0, 44.0, 33.0, 34.0, 32.0, 23.0, 22.0, 17.0, 14.0, 7.0, 11.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1515045166015625, -1.108673095703125, -1.0658416748046875, -1.02301025390625, -0.9801788330078125, -0.937347412109375, -0.8945159912109375, -0.8516845703125, -0.8088531494140625, -0.766021728515625, -0.7231903076171875, -0.68035888671875, -0.6375274658203125, -0.594696044921875, -0.5518646240234375, -0.509033203125, -0.4662017822265625, -0.423370361328125, -0.3805389404296875, -0.33770751953125, -0.2948760986328125, -0.252044677734375, -0.2092132568359375, -0.1663818359375, -0.1235504150390625, -0.080718994140625, -0.0378875732421875, 0.00494384765625, 0.0477752685546875, 0.090606689453125, 0.1334381103515625, 0.17626953125, 0.2191009521484375, 0.261932373046875, 0.3047637939453125, 0.34759521484375, 0.3904266357421875, 0.433258056640625, 0.4760894775390625, 0.5189208984375, 0.5617523193359375, 0.604583740234375, 0.6474151611328125, 0.69024658203125, 0.7330780029296875, 0.775909423828125, 0.8187408447265625, 0.861572265625, 0.9044036865234375, 0.947235107421875, 0.9900665283203125, 1.03289794921875, 1.0757293701171875, 1.118560791015625, 1.1613922119140625, 1.2042236328125, 1.2470550537109375, 1.289886474609375, 1.3327178955078125, 1.37554931640625, 1.4183807373046875, 1.461212158203125, 1.5040435791015625, 1.546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 10.0, 17.0, 19.0, 22.0, 36.0, 48.0, 74.0, 109.0, 158.0, 231.0, 438.0, 735.0, 1392.0, 2580.0, 4904.0, 10532.0, 25826.0, 82476.0, 533557.0, 292446.0, 56120.0, 19477.0, 8295.0, 4076.0, 2119.0, 1126.0, 717.0, 361.0, 220.0, 151.0, 86.0, 47.0, 43.0, 30.0, 27.0, 15.0, 8.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0434341430664062, -1.0116729736328125, -0.9799118041992188, -0.948150634765625, -0.9163894653320312, -0.8846282958984375, -0.8528671264648438, -0.82110595703125, -0.7893447875976562, -0.7575836181640625, -0.7258224487304688, -0.694061279296875, -0.6623001098632812, -0.6305389404296875, -0.5987777709960938, -0.5670166015625, -0.5352554321289062, -0.5034942626953125, -0.47173309326171875, -0.439971923828125, -0.40821075439453125, -0.3764495849609375, -0.34468841552734375, -0.31292724609375, -0.28116607666015625, -0.2494049072265625, -0.21764373779296875, -0.185882568359375, -0.15412139892578125, -0.1223602294921875, -0.09059906005859375, -0.058837890625, -0.02707672119140625, 0.0046844482421875, 0.03644561767578125, 0.068206787109375, 0.09996795654296875, 0.1317291259765625, 0.16349029541015625, 0.19525146484375, 0.22701263427734375, 0.2587738037109375, 0.29053497314453125, 0.322296142578125, 0.35405731201171875, 0.3858184814453125, 0.41757965087890625, 0.4493408203125, 0.48110198974609375, 0.5128631591796875, 0.5446243286132812, 0.576385498046875, 0.6081466674804688, 0.6399078369140625, 0.6716690063476562, 0.70343017578125, 0.7351913452148438, 0.7669525146484375, 0.7987136840820312, 0.830474853515625, 0.8622360229492188, 0.8939971923828125, 0.9257583618164062, 0.95751953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 10.0, 10.0, 10.0, 25.0, 46.0, 70.0, 129.0, 220.0, 183.0, 114.0, 58.0, 35.0, 20.0, 15.0, 12.0, 7.0, 3.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004987716674804688, -0.0004856213927268982, -0.00047247111797332764, -0.0004593208432197571, -0.0004461705684661865, -0.00043302029371261597, -0.0004198700189590454, -0.00040671974420547485, -0.0003935694694519043, -0.00038041919469833374, -0.0003672689199447632, -0.0003541186451911926, -0.00034096837043762207, -0.0003278180956840515, -0.00031466782093048096, -0.0003015175461769104, -0.00028836727142333984, -0.0002752169966697693, -0.00026206672191619873, -0.0002489164471626282, -0.00023576617240905762, -0.00022261589765548706, -0.0002094656229019165, -0.00019631534814834595, -0.0001831650733947754, -0.00017001479864120483, -0.00015686452388763428, -0.00014371424913406372, -0.00013056397438049316, -0.00011741369962692261, -0.00010426342487335205, -9.11131501197815e-05, -7.796287536621094e-05, -6.481260061264038e-05, -5.1662325859069824e-05, -3.851205110549927e-05, -2.536177635192871e-05, -1.2211501598358154e-05, 9.387731552124023e-07, 1.4089047908782959e-05, 2.7239322662353516e-05, 4.038959741592407e-05, 5.353987216949463e-05, 6.669014692306519e-05, 7.984042167663574e-05, 9.29906964302063e-05, 0.00010614097118377686, 0.00011929124593734741, 0.00013244152069091797, 0.00014559179544448853, 0.00015874207019805908, 0.00017189234495162964, 0.0001850426197052002, 0.00019819289445877075, 0.0002113431692123413, 0.00022449344396591187, 0.00023764371871948242, 0.000250793993473053, 0.00026394426822662354, 0.0002770945429801941, 0.00029024481773376465, 0.0003033950924873352, 0.00031654536724090576, 0.0003296956419944763, 0.0003428459167480469]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 8.0, 9.0, 9.0, 14.0, 29.0, 27.0, 39.0, 69.0, 94.0, 159.0, 254.0, 451.0, 837.0, 1972.0, 5333.0, 16874.0, 75418.0, 679747.0, 218222.0, 33840.0, 9296.0, 3112.0, 1236.0, 571.0, 319.0, 208.0, 105.0, 82.0, 55.0, 40.0, 30.0, 21.0, 17.0, 9.0, 11.0, 8.0, 5.0, 9.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2768402099609375, -1.235321044921875, -1.1938018798828125, -1.15228271484375, -1.1107635498046875, -1.069244384765625, -1.0277252197265625, -0.9862060546875, -0.9446868896484375, -0.903167724609375, -0.8616485595703125, -0.82012939453125, -0.7786102294921875, -0.737091064453125, -0.6955718994140625, -0.654052734375, -0.6125335693359375, -0.571014404296875, -0.5294952392578125, -0.48797607421875, -0.4464569091796875, -0.404937744140625, -0.3634185791015625, -0.3218994140625, -0.2803802490234375, -0.238861083984375, -0.1973419189453125, -0.15582275390625, -0.1143035888671875, -0.072784423828125, -0.0312652587890625, 0.01025390625, 0.0517730712890625, 0.093292236328125, 0.1348114013671875, 0.17633056640625, 0.2178497314453125, 0.259368896484375, 0.3008880615234375, 0.3424072265625, 0.3839263916015625, 0.425445556640625, 0.4669647216796875, 0.50848388671875, 0.5500030517578125, 0.591522216796875, 0.6330413818359375, 0.674560546875, 0.7160797119140625, 0.757598876953125, 0.7991180419921875, 0.84063720703125, 0.8821563720703125, 0.923675537109375, 0.9651947021484375, 1.0067138671875, 1.0482330322265625, 1.089752197265625, 1.1312713623046875, 1.17279052734375, 1.2143096923828125, 1.255828857421875, 1.2973480224609375, 1.3388671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 11.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 16.0, 23.0, 19.0, 31.0, 43.0, 66.0, 78.0, 125.0, 137.0, 101.0, 69.0, 50.0, 43.0, 33.0, 16.0, 19.0, 12.0, 10.0, 10.0, 10.0, 6.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6767044067382812, -0.6556549072265625, -0.6346054077148438, -0.613555908203125, -0.5925064086914062, -0.5714569091796875, -0.5504074096679688, -0.52935791015625, -0.5083084106445312, -0.4872589111328125, -0.46620941162109375, -0.445159912109375, -0.42411041259765625, -0.4030609130859375, -0.38201141357421875, -0.3609619140625, -0.33991241455078125, -0.3188629150390625, -0.29781341552734375, -0.276763916015625, -0.25571441650390625, -0.2346649169921875, -0.21361541748046875, -0.19256591796875, -0.17151641845703125, -0.1504669189453125, -0.12941741943359375, -0.108367919921875, -0.08731842041015625, -0.0662689208984375, -0.04521942138671875, -0.024169921875, -0.00312042236328125, 0.0179290771484375, 0.03897857666015625, 0.060028076171875, 0.08107757568359375, 0.1021270751953125, 0.12317657470703125, 0.14422607421875, 0.16527557373046875, 0.1863250732421875, 0.20737457275390625, 0.228424072265625, 0.24947357177734375, 0.2705230712890625, 0.29157257080078125, 0.3126220703125, 0.33367156982421875, 0.3547210693359375, 0.37577056884765625, 0.396820068359375, 0.41786956787109375, 0.4389190673828125, 0.45996856689453125, 0.48101806640625, 0.5020675659179688, 0.5231170654296875, 0.5441665649414062, 0.565216064453125, 0.5862655639648438, 0.6073150634765625, 0.6283645629882812, 0.6494140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 8.0, 23.0, 43.0, 109.0, 206.0, 291.0, 180.0, 77.0, 44.0, 18.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.208810806274414, -25.37373924255371, -24.538667678833008, -23.703596115112305, -22.8685245513916, -22.033451080322266, -21.198379516601562, -20.36330795288086, -19.528236389160156, -18.693164825439453, -17.85809326171875, -17.023021697998047, -16.187950134277344, -15.352877616882324, -14.517806053161621, -13.682733535766602, -12.847662925720215, -12.012591361999512, -11.177519798278809, -10.342447280883789, -9.507375717163086, -8.672304153442383, -7.83723258972168, -7.002160549163818, -6.167088985443115, -5.332017421722412, -4.496945381164551, -3.6618738174438477, -2.8268020153045654, -1.9917302131652832, -1.15665864944458, -0.32158660888671875, 0.5134849548339844, 1.3485567569732666, 2.183628559112549, 3.018700122833252, 3.853771924972534, 4.688843727111816, 5.5239152908325195, 6.358987331390381, 7.194058895111084, 8.029130935668945, 8.864202499389648, 9.699274063110352, 10.534345626831055, 11.369417190551758, 12.204488754272461, 13.03956127166748, 13.874632835388184, 14.709704399108887, 15.54477596282959, 16.37984848022461, 17.214920043945312, 18.049991607666016, 18.88506317138672, 19.720134735107422, 20.555206298828125, 21.390277862548828, 22.22534942626953, 23.060420989990234, 23.895492553710938, 24.73056411743164, 25.565635681152344, 26.40070915222168, 27.235780715942383]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 2.0, 8.0, 12.0, 12.0, 7.0, 18.0, 11.0, 20.0, 22.0, 23.0, 37.0, 24.0, 33.0, 33.0, 35.0, 45.0, 43.0, 42.0, 40.0, 37.0, 41.0, 44.0, 42.0, 39.0, 28.0, 35.0, 28.0, 29.0, 31.0, 22.0, 19.0, 20.0, 21.0, 15.0, 10.0, 14.0, 12.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.088301658630371, -4.912003993988037, -4.735706329345703, -4.559408664703369, -4.383111000061035, -4.206813335418701, -4.030515670776367, -3.8542182445526123, -3.6779205799102783, -3.5016229152679443, -3.3253252506256104, -3.1490278244018555, -2.9727301597595215, -2.7964324951171875, -2.6201348304748535, -2.4438371658325195, -2.2675395011901855, -2.0912418365478516, -1.9149441719055176, -1.7386466264724731, -1.5623489618301392, -1.3860512971878052, -1.2097537517547607, -1.0334560871124268, -0.8571584224700928, -0.6808607578277588, -0.5045631527900696, -0.32826554775238037, -0.1519678831100464, 0.024329781532287598, 0.20062732696533203, 0.376924991607666, 0.55322265625, 0.729520320892334, 0.9058179259300232, 1.0821155309677124, 1.2584131956100464, 1.4347108602523804, 1.6110084056854248, 1.7873060703277588, 1.9636037349700928, 2.1399013996124268, 2.3161990642547607, 2.4924964904785156, 2.6687941551208496, 2.8450918197631836, 3.0213894844055176, 3.1976871490478516, 3.3739848136901855, 3.5502824783325195, 3.7265801429748535, 3.9028778076171875, 4.0791754722595215, 4.2554731369018555, 4.431770324707031, 4.608068466186523, 4.784365653991699, 4.960663318634033, 5.136960983276367, 5.313258647918701, 5.489556312561035, 5.665853977203369, 5.842151641845703, 6.018448829650879, 6.194746971130371]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 20.0, 22.0, 20.0, 38.0, 75.0, 96.0, 167.0, 282.0, 489.0, 877.0, 1587.0, 3565.0, 8991.0, 27750.0, 295490.0, 3790583.0, 42724.0, 12278.0, 4685.0, 2134.0, 1018.0, 543.0, 332.0, 195.0, 115.0, 60.0, 40.0, 31.0, 19.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.703033447265625, -3.57598876953125, -3.448944091796875, -3.3218994140625, -3.194854736328125, -3.06781005859375, -2.940765380859375, -2.813720703125, -2.686676025390625, -2.55963134765625, -2.432586669921875, -2.3055419921875, -2.178497314453125, -2.05145263671875, -1.924407958984375, -1.79736328125, -1.670318603515625, -1.54327392578125, -1.416229248046875, -1.2891845703125, -1.162139892578125, -1.03509521484375, -0.908050537109375, -0.781005859375, -0.653961181640625, -0.52691650390625, -0.399871826171875, -0.2728271484375, -0.145782470703125, -0.01873779296875, 0.108306884765625, 0.2353515625, 0.362396240234375, 0.48944091796875, 0.616485595703125, 0.7435302734375, 0.870574951171875, 0.99761962890625, 1.124664306640625, 1.251708984375, 1.378753662109375, 1.50579833984375, 1.632843017578125, 1.7598876953125, 1.886932373046875, 2.01397705078125, 2.141021728515625, 2.26806640625, 2.395111083984375, 2.52215576171875, 2.649200439453125, 2.7762451171875, 2.903289794921875, 3.03033447265625, 3.157379150390625, 3.284423828125, 3.411468505859375, 3.53851318359375, 3.665557861328125, 3.7926025390625, 3.919647216796875, 4.04669189453125, 4.173736572265625, 4.30078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 10.0, 10.0, 12.0, 13.0, 20.0, 13.0, 25.0, 29.0, 37.0, 37.0, 34.0, 59.0, 51.0, 46.0, 76.0, 65.0, 72.0, 52.0, 45.0, 51.0, 53.0, 37.0, 24.0, 32.0, 15.0, 18.0, 14.0, 11.0, 9.0, 6.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.416259765625, -0.4053306579589844, -0.39440155029296875, -0.3834724426269531, -0.3725433349609375, -0.3616142272949219, -0.35068511962890625, -0.3397560119628906, -0.328826904296875, -0.3178977966308594, -0.30696868896484375, -0.2960395812988281, -0.2851104736328125, -0.2741813659667969, -0.26325225830078125, -0.2523231506347656, -0.24139404296875, -0.23046493530273438, -0.21953582763671875, -0.20860671997070312, -0.1976776123046875, -0.18674850463867188, -0.17581939697265625, -0.16489028930664062, -0.153961181640625, -0.14303207397460938, -0.13210296630859375, -0.12117385864257812, -0.1102447509765625, -0.09931564331054688, -0.08838653564453125, -0.07745742797851562, -0.0665283203125, -0.055599212646484375, -0.04467010498046875, -0.033740997314453125, -0.0228118896484375, -0.011882781982421875, -0.00095367431640625, 0.009975433349609375, 0.020904541015625, 0.031833648681640625, 0.04276275634765625, 0.053691864013671875, 0.0646209716796875, 0.07555007934570312, 0.08647918701171875, 0.09740829467773438, 0.10833740234375, 0.11926651000976562, 0.13019561767578125, 0.14112472534179688, 0.1520538330078125, 0.16298294067382812, 0.17391204833984375, 0.18484115600585938, 0.195770263671875, 0.20669937133789062, 0.21762847900390625, 0.22855758666992188, 0.2394866943359375, 0.2504158020019531, 0.26134490966796875, 0.2722740173339844, 0.283203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 17.0, 17.0, 24.0, 28.0, 57.0, 62.0, 75.0, 172.0, 249.0, 362.0, 657.0, 1217.0, 1962.0, 3883.0, 7819.0, 16446.0, 40066.0, 153697.0, 3664680.0, 217304.0, 47676.0, 18690.0, 8853.0, 4416.0, 2472.0, 1428.0, 753.0, 437.0, 263.0, 184.0, 100.0, 67.0, 41.0, 34.0, 16.0, 19.0, 14.0, 8.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.818817138671875, -1.75286865234375, -1.686920166015625, -1.6209716796875, -1.555023193359375, -1.48907470703125, -1.423126220703125, -1.357177734375, -1.291229248046875, -1.22528076171875, -1.159332275390625, -1.0933837890625, -1.027435302734375, -0.96148681640625, -0.895538330078125, -0.82958984375, -0.763641357421875, -0.69769287109375, -0.631744384765625, -0.5657958984375, -0.499847412109375, -0.43389892578125, -0.367950439453125, -0.302001953125, -0.236053466796875, -0.17010498046875, -0.104156494140625, -0.0382080078125, 0.027740478515625, 0.09368896484375, 0.159637451171875, 0.2255859375, 0.291534423828125, 0.35748291015625, 0.423431396484375, 0.4893798828125, 0.555328369140625, 0.62127685546875, 0.687225341796875, 0.753173828125, 0.819122314453125, 0.88507080078125, 0.951019287109375, 1.0169677734375, 1.082916259765625, 1.14886474609375, 1.214813232421875, 1.28076171875, 1.346710205078125, 1.41265869140625, 1.478607177734375, 1.5445556640625, 1.610504150390625, 1.67645263671875, 1.742401123046875, 1.808349609375, 1.874298095703125, 1.94024658203125, 2.006195068359375, 2.0721435546875, 2.138092041015625, 2.20404052734375, 2.269989013671875, 2.3359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 16.0, 13.0, 11.0, 10.0, 21.0, 34.0, 45.0, 71.0, 90.0, 233.0, 1692.0, 1255.0, 208.0, 119.0, 52.0, 40.0, 36.0, 19.0, 15.0, 16.0, 13.0, 7.0, 4.0, 12.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8134765625, -0.78802490234375, -0.7625732421875, -0.73712158203125, -0.711669921875, -0.68621826171875, -0.6607666015625, -0.63531494140625, -0.60986328125, -0.58441162109375, -0.5589599609375, -0.53350830078125, -0.508056640625, -0.48260498046875, -0.4571533203125, -0.43170166015625, -0.40625, -0.38079833984375, -0.3553466796875, -0.32989501953125, -0.304443359375, -0.27899169921875, -0.2535400390625, -0.22808837890625, -0.20263671875, -0.17718505859375, -0.1517333984375, -0.12628173828125, -0.100830078125, -0.07537841796875, -0.0499267578125, -0.02447509765625, 0.0009765625, 0.02642822265625, 0.0518798828125, 0.07733154296875, 0.102783203125, 0.12823486328125, 0.1536865234375, 0.17913818359375, 0.20458984375, 0.23004150390625, 0.2554931640625, 0.28094482421875, 0.306396484375, 0.33184814453125, 0.3572998046875, 0.38275146484375, 0.408203125, 0.43365478515625, 0.4591064453125, 0.48455810546875, 0.510009765625, 0.53546142578125, 0.5609130859375, 0.58636474609375, 0.61181640625, 0.63726806640625, 0.6627197265625, 0.68817138671875, 0.713623046875, 0.73907470703125, 0.7645263671875, 0.78997802734375, 0.8154296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 11.0, 17.0, 36.0, 53.0, 72.0, 125.0, 158.0, 139.0, 115.0, 87.0, 70.0, 38.0, 29.0, 11.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.591280937194824, -5.402379512786865, -5.2134785652160645, -5.0245771408081055, -4.8356757164001465, -4.6467742919921875, -4.457873344421387, -4.268971920013428, -4.080070495605469, -3.891169309616089, -3.70226788520813, -3.51336669921875, -3.324465274810791, -3.135564088821411, -2.9466629028320312, -2.7577614784240723, -2.5688605308532715, -2.3799593448638916, -2.1910579204559326, -2.0021567344665527, -1.8132554292678833, -1.6243541240692139, -1.435452938079834, -1.2465516328811646, -1.0576503276824951, -0.8687490224838257, -0.679847776889801, -0.49094653129577637, -0.30204522609710693, -0.1131439208984375, 0.07575726509094238, 0.2646585702896118, 0.45356035232543945, 0.6424616575241089, 0.8313629031181335, 1.0202641487121582, 1.2091654539108276, 1.398066759109497, 1.586967945098877, 1.7758692502975464, 1.9647705554962158, 2.1536717414855957, 2.3425731658935547, 2.5314743518829346, 2.7203755378723145, 2.9092769622802734, 3.0981781482696533, 3.287079334259033, 3.475980758666992, 3.664881944656372, 3.853783369064331, 4.042684555053711, 4.23158597946167, 4.420487403869629, 4.60938835144043, 4.798289775848389, 4.987191200256348, 5.176092624664307, 5.364993572235107, 5.553894996643066, 5.742796421051025, 5.931697845458984, 6.120598793029785, 6.309500217437744, 6.498401165008545]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 5.0, 11.0, 13.0, 10.0, 9.0, 14.0, 20.0, 16.0, 26.0, 28.0, 30.0, 33.0, 35.0, 28.0, 43.0, 36.0, 59.0, 37.0, 40.0, 36.0, 40.0, 36.0, 35.0, 34.0, 30.0, 34.0, 25.0, 32.0, 30.0, 23.0, 20.0, 15.0, 21.0, 18.0, 11.0, 12.0, 8.0, 6.0, 7.0, 10.0, 1.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.4644687175750732, -2.3910274505615234, -2.3175859451293945, -2.2441444396972656, -2.170703172683716, -2.097261905670166, -2.023820400238037, -1.9503790140151978, -1.8769376277923584, -1.803496241569519, -1.7300548553466797, -1.6566134691238403, -1.583172082901001, -1.5097306966781616, -1.4362893104553223, -1.362847924232483, -1.2894065380096436, -1.2159651517868042, -1.1425237655639648, -1.0690823793411255, -0.9956409931182861, -0.9221996068954468, -0.8487582206726074, -0.7753168344497681, -0.7018754482269287, -0.6284340620040894, -0.55499267578125, -0.48155128955841064, -0.4081099033355713, -0.33466851711273193, -0.2612271308898926, -0.18778574466705322, -0.11434459686279297, -0.04090321063995361, 0.03253817558288574, 0.1059795618057251, 0.17942094802856445, 0.2528623342514038, 0.32630372047424316, 0.3997451066970825, 0.4731864929199219, 0.5466278791427612, 0.6200692653656006, 0.6935106515884399, 0.7669520378112793, 0.8403934240341187, 0.913834810256958, 0.9872761964797974, 1.0607175827026367, 1.134158968925476, 1.2076003551483154, 1.2810417413711548, 1.3544831275939941, 1.4279245138168335, 1.5013659000396729, 1.5748072862625122, 1.6482486724853516, 1.721690058708191, 1.7951314449310303, 1.8685728311538696, 1.942014217376709, 2.015455722808838, 2.0888969898223877, 2.1623382568359375, 2.2357797622680664]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 10.0, 10.0, 7.0, 16.0, 32.0, 48.0, 83.0, 108.0, 177.0, 320.0, 565.0, 1050.0, 1979.0, 4354.0, 10166.0, 26343.0, 78595.0, 667195.0, 187604.0, 41949.0, 15674.0, 6256.0, 2817.0, 1368.0, 737.0, 403.0, 236.0, 165.0, 102.0, 55.0, 42.0, 25.0, 12.0, 16.0, 14.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.478515625, -2.409149169921875, -2.33978271484375, -2.270416259765625, -2.2010498046875, -2.131683349609375, -2.06231689453125, -1.992950439453125, -1.923583984375, -1.854217529296875, -1.78485107421875, -1.715484619140625, -1.6461181640625, -1.576751708984375, -1.50738525390625, -1.438018798828125, -1.36865234375, -1.299285888671875, -1.22991943359375, -1.160552978515625, -1.0911865234375, -1.021820068359375, -0.95245361328125, -0.883087158203125, -0.813720703125, -0.744354248046875, -0.67498779296875, -0.605621337890625, -0.5362548828125, -0.466888427734375, -0.39752197265625, -0.328155517578125, -0.2587890625, -0.189422607421875, -0.12005615234375, -0.050689697265625, 0.0186767578125, 0.088043212890625, 0.15740966796875, 0.226776123046875, 0.296142578125, 0.365509033203125, 0.43487548828125, 0.504241943359375, 0.5736083984375, 0.642974853515625, 0.71234130859375, 0.781707763671875, 0.85107421875, 0.920440673828125, 0.98980712890625, 1.059173583984375, 1.1285400390625, 1.197906494140625, 1.26727294921875, 1.336639404296875, 1.406005859375, 1.475372314453125, 1.54473876953125, 1.614105224609375, 1.6834716796875, 1.752838134765625, 1.82220458984375, 1.891571044921875, 1.9609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 12.0, 13.0, 21.0, 18.0, 24.0, 29.0, 21.0, 31.0, 49.0, 39.0, 63.0, 67.0, 51.0, 53.0, 62.0, 58.0, 68.0, 51.0, 43.0, 36.0, 30.0, 30.0, 25.0, 15.0, 16.0, 11.0, 10.0, 6.0, 6.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.417724609375, -0.4068336486816406, -0.39594268798828125, -0.3850517272949219, -0.3741607666015625, -0.3632698059082031, -0.35237884521484375, -0.3414878845214844, -0.330596923828125, -0.3197059631347656, -0.30881500244140625, -0.2979240417480469, -0.2870330810546875, -0.2761421203613281, -0.26525115966796875, -0.2543601989746094, -0.24346923828125, -0.23257827758789062, -0.22168731689453125, -0.21079635620117188, -0.1999053955078125, -0.18901443481445312, -0.17812347412109375, -0.16723251342773438, -0.156341552734375, -0.14545059204101562, -0.13455963134765625, -0.12366867065429688, -0.1127777099609375, -0.10188674926757812, -0.09099578857421875, -0.08010482788085938, -0.0692138671875, -0.058322906494140625, -0.04743194580078125, -0.036540985107421875, -0.0256500244140625, -0.014759063720703125, -0.00386810302734375, 0.007022857666015625, 0.017913818359375, 0.028804779052734375, 0.03969573974609375, 0.050586700439453125, 0.0614776611328125, 0.07236862182617188, 0.08325958251953125, 0.09415054321289062, 0.10504150390625, 0.11593246459960938, 0.12682342529296875, 0.13771438598632812, 0.1486053466796875, 0.15949630737304688, 0.17038726806640625, 0.18127822875976562, 0.192169189453125, 0.20306015014648438, 0.21395111083984375, 0.22484207153320312, 0.2357330322265625, 0.24662399291992188, 0.25751495361328125, 0.2684059143066406, 0.279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 10.0, 9.0, 3.0, 4.0, 9.0, 15.0, 15.0, 20.0, 21.0, 36.0, 54.0, 84.0, 107.0, 194.0, 346.0, 558.0, 998.0, 1891.0, 3509.0, 6569.0, 13075.0, 27409.0, 66134.0, 502020.0, 320516.0, 56393.0, 24143.0, 11567.0, 5886.0, 3007.0, 1664.0, 936.0, 491.0, 295.0, 171.0, 116.0, 80.0, 67.0, 24.0, 25.0, 18.0, 10.0, 13.0, 11.0, 10.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5224609375, -1.4732208251953125, -1.423980712890625, -1.3747406005859375, -1.32550048828125, -1.2762603759765625, -1.227020263671875, -1.1777801513671875, -1.1285400390625, -1.0792999267578125, -1.030059814453125, -0.9808197021484375, -0.93157958984375, -0.8823394775390625, -0.833099365234375, -0.7838592529296875, -0.734619140625, -0.6853790283203125, -0.636138916015625, -0.5868988037109375, -0.53765869140625, -0.4884185791015625, -0.439178466796875, -0.3899383544921875, -0.3406982421875, -0.2914581298828125, -0.242218017578125, -0.1929779052734375, -0.14373779296875, -0.0944976806640625, -0.045257568359375, 0.0039825439453125, 0.05322265625, 0.1024627685546875, 0.151702880859375, 0.2009429931640625, 0.25018310546875, 0.2994232177734375, 0.348663330078125, 0.3979034423828125, 0.4471435546875, 0.4963836669921875, 0.545623779296875, 0.5948638916015625, 0.64410400390625, 0.6933441162109375, 0.742584228515625, 0.7918243408203125, 0.841064453125, 0.8903045654296875, 0.939544677734375, 0.9887847900390625, 1.03802490234375, 1.0872650146484375, 1.136505126953125, 1.1857452392578125, 1.2349853515625, 1.2842254638671875, 1.333465576171875, 1.3827056884765625, 1.43194580078125, 1.4811859130859375, 1.530426025390625, 1.5796661376953125, 1.62890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 9.0, 7.0, 12.0, 14.0, 16.0, 23.0, 21.0, 32.0, 32.0, 39.0, 39.0, 47.0, 49.0, 49.0, 51.0, 61.0, 46.0, 50.0, 46.0, 48.0, 48.0, 45.0, 38.0, 18.0, 26.0, 19.0, 16.0, 9.0, 13.0, 10.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.404296875, -1.3602447509765625, -1.316192626953125, -1.2721405029296875, -1.22808837890625, -1.1840362548828125, -1.139984130859375, -1.0959320068359375, -1.0518798828125, -1.0078277587890625, -0.963775634765625, -0.9197235107421875, -0.87567138671875, -0.8316192626953125, -0.787567138671875, -0.7435150146484375, -0.699462890625, -0.6554107666015625, -0.611358642578125, -0.5673065185546875, -0.52325439453125, -0.4792022705078125, -0.435150146484375, -0.3910980224609375, -0.3470458984375, -0.3029937744140625, -0.258941650390625, -0.2148895263671875, -0.17083740234375, -0.1267852783203125, -0.082733154296875, -0.0386810302734375, 0.00537109375, 0.0494232177734375, 0.093475341796875, 0.1375274658203125, 0.18157958984375, 0.2256317138671875, 0.269683837890625, 0.3137359619140625, 0.3577880859375, 0.4018402099609375, 0.445892333984375, 0.4899444580078125, 0.53399658203125, 0.5780487060546875, 0.622100830078125, 0.6661529541015625, 0.710205078125, 0.7542572021484375, 0.798309326171875, 0.8423614501953125, 0.88641357421875, 0.9304656982421875, 0.974517822265625, 1.0185699462890625, 1.0626220703125, 1.1066741943359375, 1.150726318359375, 1.1947784423828125, 1.23883056640625, 1.2828826904296875, 1.326934814453125, 1.3709869384765625, 1.4150390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 12.0, 21.0, 28.0, 48.0, 55.0, 74.0, 121.0, 201.0, 295.0, 538.0, 982.0, 1749.0, 3442.0, 7436.0, 18201.0, 57636.0, 370465.0, 480595.0, 69753.0, 20423.0, 8234.0, 3873.0, 1879.0, 1016.0, 522.0, 355.0, 200.0, 100.0, 91.0, 51.0, 43.0, 29.0, 23.0, 20.0, 10.0, 7.0, 6.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.90283203125, -0.8763275146484375, -0.849822998046875, -0.8233184814453125, -0.79681396484375, -0.7703094482421875, -0.743804931640625, -0.7173004150390625, -0.6907958984375, -0.6642913818359375, -0.637786865234375, -0.6112823486328125, -0.58477783203125, -0.5582733154296875, -0.531768798828125, -0.5052642822265625, -0.478759765625, -0.4522552490234375, -0.425750732421875, -0.3992462158203125, -0.37274169921875, -0.3462371826171875, -0.319732666015625, -0.2932281494140625, -0.2667236328125, -0.2402191162109375, -0.213714599609375, -0.1872100830078125, -0.16070556640625, -0.1342010498046875, -0.107696533203125, -0.0811920166015625, -0.0546875, -0.0281829833984375, -0.001678466796875, 0.0248260498046875, 0.05133056640625, 0.0778350830078125, 0.104339599609375, 0.1308441162109375, 0.1573486328125, 0.1838531494140625, 0.210357666015625, 0.2368621826171875, 0.26336669921875, 0.2898712158203125, 0.316375732421875, 0.3428802490234375, 0.369384765625, 0.3958892822265625, 0.422393798828125, 0.4488983154296875, 0.47540283203125, 0.5019073486328125, 0.528411865234375, 0.5549163818359375, 0.5814208984375, 0.6079254150390625, 0.634429931640625, 0.6609344482421875, 0.68743896484375, 0.7139434814453125, 0.740447998046875, 0.7669525146484375, 0.79345703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 23.0, 19.0, 39.0, 59.0, 102.0, 158.0, 192.0, 149.0, 75.0, 52.0, 38.0, 23.0, 18.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0004012584686279297, -0.0003915242850780487, -0.0003817901015281677, -0.00037205591797828674, -0.00036232173442840576, -0.0003525875508785248, -0.0003428533673286438, -0.0003331191837787628, -0.00032338500022888184, -0.00031365081667900085, -0.0003039166331291199, -0.0002941824495792389, -0.0002844482660293579, -0.00027471408247947693, -0.00026497989892959595, -0.00025524571537971497, -0.000245511531829834, -0.000235777348279953, -0.00022604316473007202, -0.00021630898118019104, -0.00020657479763031006, -0.00019684061408042908, -0.0001871064305305481, -0.00017737224698066711, -0.00016763806343078613, -0.00015790387988090515, -0.00014816969633102417, -0.0001384355127811432, -0.0001287013292312622, -0.00011896714568138123, -0.00010923296213150024, -9.949877858161926e-05, -8.976459503173828e-05, -8.00304114818573e-05, -7.029622793197632e-05, -6.056204438209534e-05, -5.0827860832214355e-05, -4.1093677282333374e-05, -3.135949373245239e-05, -2.162531018257141e-05, -1.189112663269043e-05, -2.1569430828094482e-06, 7.577240467071533e-06, 1.7311424016952515e-05, 2.7045607566833496e-05, 3.677979111671448e-05, 4.651397466659546e-05, 5.624815821647644e-05, 6.598234176635742e-05, 7.57165253162384e-05, 8.545070886611938e-05, 9.518489241600037e-05, 0.00010491907596588135, 0.00011465325951576233, 0.0001243874430656433, 0.0001341216266155243, 0.00014385581016540527, 0.00015358999371528625, 0.00016332417726516724, 0.00017305836081504822, 0.0001827925443649292, 0.00019252672791481018, 0.00020226091146469116, 0.00021199509501457214, 0.00022172927856445312]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 13.0, 30.0, 24.0, 51.0, 75.0, 147.0, 239.0, 462.0, 787.0, 1495.0, 3198.0, 7449.0, 23433.0, 125730.0, 713140.0, 133495.0, 24180.0, 7923.0, 3243.0, 1590.0, 807.0, 410.0, 242.0, 136.0, 87.0, 39.0, 27.0, 23.0, 15.0, 16.0, 10.0, 6.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.2060546875, -1.1739044189453125, -1.141754150390625, -1.1096038818359375, -1.07745361328125, -1.0453033447265625, -1.013153076171875, -0.9810028076171875, -0.9488525390625, -0.9167022705078125, -0.884552001953125, -0.8524017333984375, -0.82025146484375, -0.7881011962890625, -0.755950927734375, -0.7238006591796875, -0.691650390625, -0.6595001220703125, -0.627349853515625, -0.5951995849609375, -0.56304931640625, -0.5308990478515625, -0.498748779296875, -0.4665985107421875, -0.4344482421875, -0.4022979736328125, -0.370147705078125, -0.3379974365234375, -0.30584716796875, -0.2736968994140625, -0.241546630859375, -0.2093963623046875, -0.17724609375, -0.1450958251953125, -0.112945556640625, -0.0807952880859375, -0.04864501953125, -0.0164947509765625, 0.015655517578125, 0.0478057861328125, 0.0799560546875, 0.1121063232421875, 0.144256591796875, 0.1764068603515625, 0.20855712890625, 0.2407073974609375, 0.272857666015625, 0.3050079345703125, 0.337158203125, 0.3693084716796875, 0.401458740234375, 0.4336090087890625, 0.46575927734375, 0.4979095458984375, 0.530059814453125, 0.5622100830078125, 0.5943603515625, 0.6265106201171875, 0.658660888671875, 0.6908111572265625, 0.72296142578125, 0.7551116943359375, 0.787261962890625, 0.8194122314453125, 0.8515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 5.0, 16.0, 8.0, 20.0, 26.0, 25.0, 41.0, 45.0, 84.0, 127.0, 152.0, 99.0, 88.0, 56.0, 32.0, 37.0, 24.0, 17.0, 9.0, 15.0, 12.0, 12.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.65771484375, -0.6380386352539062, -0.6183624267578125, -0.5986862182617188, -0.579010009765625, -0.5593338012695312, -0.5396575927734375, -0.5199813842773438, -0.50030517578125, -0.48062896728515625, -0.4609527587890625, -0.44127655029296875, -0.421600341796875, -0.40192413330078125, -0.3822479248046875, -0.36257171630859375, -0.3428955078125, -0.32321929931640625, -0.3035430908203125, -0.28386688232421875, -0.264190673828125, -0.24451446533203125, -0.2248382568359375, -0.20516204833984375, -0.18548583984375, -0.16580963134765625, -0.1461334228515625, -0.12645721435546875, -0.106781005859375, -0.08710479736328125, -0.0674285888671875, -0.04775238037109375, -0.028076171875, -0.00839996337890625, 0.0112762451171875, 0.03095245361328125, 0.050628662109375, 0.07030487060546875, 0.0899810791015625, 0.10965728759765625, 0.12933349609375, 0.14900970458984375, 0.1686859130859375, 0.18836212158203125, 0.208038330078125, 0.22771453857421875, 0.2473907470703125, 0.26706695556640625, 0.2867431640625, 0.30641937255859375, 0.3260955810546875, 0.34577178955078125, 0.365447998046875, 0.38512420654296875, 0.4048004150390625, 0.42447662353515625, 0.44415283203125, 0.46382904052734375, 0.4835052490234375, 0.5031814575195312, 0.522857666015625, 0.5425338745117188, 0.5622100830078125, 0.5818862915039062, 0.6015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 17.0, 24.0, 44.0, 51.0, 66.0, 100.0, 105.0, 134.0, 118.0, 95.0, 70.0, 52.0, 27.0, 27.0, 19.0, 7.0, 8.0, 7.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.09968376159668, -11.737569808959961, -11.375455856323242, -11.013341903686523, -10.651227951049805, -10.289113998413086, -9.927000045776367, -9.564886093139648, -9.20277214050293, -8.840658187866211, -8.478544235229492, -8.116430282592773, -7.754316329956055, -7.392202377319336, -7.030088424682617, -6.667974472045898, -6.30586051940918, -5.943746566772461, -5.581632614135742, -5.219518661499023, -4.857404708862305, -4.495290756225586, -4.133176803588867, -3.7710628509521484, -3.4089488983154297, -3.046834945678711, -2.684720993041992, -2.3226070404052734, -1.9604930877685547, -1.598379135131836, -1.2362651824951172, -0.8741512298583984, -0.5120382308959961, -0.14992427825927734, 0.2121896743774414, 0.5743036270141602, 0.9364175796508789, 1.2985315322875977, 1.6606454849243164, 2.022759437561035, 2.384873390197754, 2.7469873428344727, 3.1091012954711914, 3.47121524810791, 3.833329200744629, 4.195443153381348, 4.557557106018066, 4.919671058654785, 5.281785011291504, 5.643898963928223, 6.006012916564941, 6.36812686920166, 6.730240821838379, 7.092354774475098, 7.454468727111816, 7.816582679748535, 8.178696632385254, 8.540810585021973, 8.902924537658691, 9.26503849029541, 9.627152442932129, 9.989266395568848, 10.351380348205566, 10.713494300842285, 11.075608253479004]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 3.0, 5.0, 6.0, 7.0, 12.0, 17.0, 25.0, 29.0, 28.0, 22.0, 39.0, 40.0, 36.0, 43.0, 44.0, 40.0, 39.0, 48.0, 51.0, 45.0, 45.0, 40.0, 55.0, 35.0, 27.0, 31.0, 26.0, 23.0, 26.0, 21.0, 20.0, 15.0, 11.0, 5.0, 5.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.871341228485107, -6.6572370529174805, -6.443133354187012, -6.229029178619385, -6.014925479888916, -5.800821304321289, -5.58671760559082, -5.372613430023193, -5.158509254455566, -4.9444050788879395, -4.730301380157471, -4.516197204589844, -4.302093505859375, -4.087989330291748, -3.8738853931427, -3.6597814559936523, -3.4456775188446045, -3.2315735816955566, -3.017469644546509, -2.803365707397461, -2.589261531829834, -2.375157594680786, -2.1610536575317383, -1.9469496011734009, -1.732845664024353, -1.5187417268753052, -1.3046376705169678, -1.09053373336792, -0.8764297366142273, -0.6623257398605347, -0.4482218027114868, -0.23411774635314941, -0.020013809204101562, 0.19409017264842987, 0.4081941545009613, 0.6222981214523315, 0.8364021182060242, 1.0505061149597168, 1.2646100521087646, 1.478714108467102, 1.69281804561615, 1.9069219827651978, 2.121026039123535, 2.335129976272583, 2.549233913421631, 2.763338088989258, 2.9774417877197266, 3.1915459632873535, 3.4056499004364014, 3.619753837585449, 3.833857774734497, 4.047961711883545, 4.262065887451172, 4.476169586181641, 4.690273761749268, 4.9043779373168945, 5.118481636047363, 5.33258581161499, 5.546689510345459, 5.760793685913086, 5.974897384643555, 6.189001560211182, 6.403105735778809, 6.617209434509277, 6.831313610076904]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 9.0, 11.0, 12.0, 10.0, 27.0, 41.0, 43.0, 56.0, 84.0, 126.0, 220.0, 486.0, 1272.0, 2897.0, 8888.0, 36737.0, 3842541.0, 267627.0, 22631.0, 6363.0, 2289.0, 927.0, 437.0, 234.0, 100.0, 70.0, 40.0, 33.0, 21.0, 15.0, 9.0, 10.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.56640625, -5.4019775390625, -5.237548828125, -5.0731201171875, -4.90869140625, -4.7442626953125, -4.579833984375, -4.4154052734375, -4.2509765625, -4.0865478515625, -3.922119140625, -3.7576904296875, -3.59326171875, -3.4288330078125, -3.264404296875, -3.0999755859375, -2.935546875, -2.7711181640625, -2.606689453125, -2.4422607421875, -2.27783203125, -2.1134033203125, -1.948974609375, -1.7845458984375, -1.6201171875, -1.4556884765625, -1.291259765625, -1.1268310546875, -0.96240234375, -0.7979736328125, -0.633544921875, -0.4691162109375, -0.3046875, -0.1402587890625, 0.024169921875, 0.1885986328125, 0.35302734375, 0.5174560546875, 0.681884765625, 0.8463134765625, 1.0107421875, 1.1751708984375, 1.339599609375, 1.5040283203125, 1.66845703125, 1.8328857421875, 1.997314453125, 2.1617431640625, 2.326171875, 2.4906005859375, 2.655029296875, 2.8194580078125, 2.98388671875, 3.1483154296875, 3.312744140625, 3.4771728515625, 3.6416015625, 3.8060302734375, 3.970458984375, 4.1348876953125, 4.29931640625, 4.4637451171875, 4.628173828125, 4.7926025390625, 4.95703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 10.0, 14.0, 19.0, 16.0, 23.0, 24.0, 35.0, 37.0, 33.0, 42.0, 49.0, 56.0, 58.0, 50.0, 56.0, 61.0, 64.0, 53.0, 48.0, 37.0, 42.0, 27.0, 20.0, 13.0, 26.0, 15.0, 6.0, 10.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.416748046875, -0.405731201171875, -0.39471435546875, -0.383697509765625, -0.3726806640625, -0.361663818359375, -0.35064697265625, -0.339630126953125, -0.32861328125, -0.317596435546875, -0.30657958984375, -0.295562744140625, -0.2845458984375, -0.273529052734375, -0.26251220703125, -0.251495361328125, -0.240478515625, -0.229461669921875, -0.21844482421875, -0.207427978515625, -0.1964111328125, -0.185394287109375, -0.17437744140625, -0.163360595703125, -0.15234375, -0.141326904296875, -0.13031005859375, -0.119293212890625, -0.1082763671875, -0.097259521484375, -0.08624267578125, -0.075225830078125, -0.064208984375, -0.053192138671875, -0.04217529296875, -0.031158447265625, -0.0201416015625, -0.009124755859375, 0.00189208984375, 0.012908935546875, 0.02392578125, 0.034942626953125, 0.04595947265625, 0.056976318359375, 0.0679931640625, 0.079010009765625, 0.09002685546875, 0.101043701171875, 0.112060546875, 0.123077392578125, 0.13409423828125, 0.145111083984375, 0.1561279296875, 0.167144775390625, 0.17816162109375, 0.189178466796875, 0.2001953125, 0.211212158203125, 0.22222900390625, 0.233245849609375, 0.2442626953125, 0.255279541015625, 0.26629638671875, 0.277313232421875, 0.288330078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 11.0, 18.0, 15.0, 33.0, 54.0, 84.0, 118.0, 199.0, 335.0, 535.0, 930.0, 1565.0, 2805.0, 5307.0, 10482.0, 21300.0, 51698.0, 232156.0, 3664925.0, 126785.0, 38933.0, 17202.0, 8500.0, 4513.0, 2393.0, 1373.0, 808.0, 470.0, 247.0, 190.0, 120.0, 75.0, 36.0, 19.0, 16.0, 10.0, 6.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.64453125, -2.569732666015625, -2.49493408203125, -2.420135498046875, -2.3453369140625, -2.270538330078125, -2.19573974609375, -2.120941162109375, -2.046142578125, -1.971343994140625, -1.89654541015625, -1.821746826171875, -1.7469482421875, -1.672149658203125, -1.59735107421875, -1.522552490234375, -1.44775390625, -1.372955322265625, -1.29815673828125, -1.223358154296875, -1.1485595703125, -1.073760986328125, -0.99896240234375, -0.924163818359375, -0.849365234375, -0.774566650390625, -0.69976806640625, -0.624969482421875, -0.5501708984375, -0.475372314453125, -0.40057373046875, -0.325775146484375, -0.2509765625, -0.176177978515625, -0.10137939453125, -0.026580810546875, 0.0482177734375, 0.123016357421875, 0.19781494140625, 0.272613525390625, 0.347412109375, 0.422210693359375, 0.49700927734375, 0.571807861328125, 0.6466064453125, 0.721405029296875, 0.79620361328125, 0.871002197265625, 0.94580078125, 1.020599365234375, 1.09539794921875, 1.170196533203125, 1.2449951171875, 1.319793701171875, 1.39459228515625, 1.469390869140625, 1.544189453125, 1.618988037109375, 1.69378662109375, 1.768585205078125, 1.8433837890625, 1.918182373046875, 1.99298095703125, 2.067779541015625, 2.142578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 5.0, 6.0, 4.0, 8.0, 11.0, 9.0, 6.0, 16.0, 20.0, 16.0, 15.0, 24.0, 33.0, 59.0, 85.0, 143.0, 416.0, 2401.0, 387.0, 136.0, 52.0, 38.0, 37.0, 25.0, 18.0, 15.0, 15.0, 12.0, 7.0, 10.0, 11.0, 5.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.737030029296875, -0.71282958984375, -0.688629150390625, -0.6644287109375, -0.640228271484375, -0.61602783203125, -0.591827392578125, -0.567626953125, -0.543426513671875, -0.51922607421875, -0.495025634765625, -0.4708251953125, -0.446624755859375, -0.42242431640625, -0.398223876953125, -0.3740234375, -0.349822998046875, -0.32562255859375, -0.301422119140625, -0.2772216796875, -0.253021240234375, -0.22882080078125, -0.204620361328125, -0.180419921875, -0.156219482421875, -0.13201904296875, -0.107818603515625, -0.0836181640625, -0.059417724609375, -0.03521728515625, -0.011016845703125, 0.01318359375, 0.037384033203125, 0.06158447265625, 0.085784912109375, 0.1099853515625, 0.134185791015625, 0.15838623046875, 0.182586669921875, 0.206787109375, 0.230987548828125, 0.25518798828125, 0.279388427734375, 0.3035888671875, 0.327789306640625, 0.35198974609375, 0.376190185546875, 0.400390625, 0.424591064453125, 0.44879150390625, 0.472991943359375, 0.4971923828125, 0.521392822265625, 0.54559326171875, 0.569793701171875, 0.593994140625, 0.618194580078125, 0.64239501953125, 0.666595458984375, 0.6907958984375, 0.714996337890625, 0.73919677734375, 0.763397216796875, 0.78759765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 9.0, 12.0, 26.0, 16.0, 37.0, 59.0, 72.0, 91.0, 99.0, 95.0, 93.0, 104.0, 79.0, 51.0, 43.0, 35.0, 22.0, 14.0, 13.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.523571491241455, -4.372081756591797, -4.220592498779297, -4.069102764129639, -3.9176132678985596, -3.7661237716674805, -3.6146342754364014, -3.4631447792053223, -3.311655044555664, -3.160165548324585, -3.008676052093506, -2.8571863174438477, -2.7056968212127686, -2.5542073249816895, -2.4027178287506104, -2.2512283325195312, -2.099738836288452, -1.948249340057373, -1.7967597246170044, -1.6452702283859253, -1.4937806129455566, -1.3422911167144775, -1.1908016204833984, -1.0393120050430298, -0.8878225088119507, -0.7363329529762268, -0.5848433971405029, -0.43335390090942383, -0.28186434507369995, -0.13037478923797607, 0.021114706993103027, 0.17260432243347168, 0.3240938186645508, 0.47558337450027466, 0.6270729303359985, 0.7785624265670776, 0.9300519824028015, 1.0815415382385254, 1.2330310344696045, 1.3845206499099731, 1.5360101461410522, 1.6874996423721313, 1.8389892578125, 1.990478754043579, 2.141968250274658, 2.2934579849243164, 2.4449472427368164, 2.5964369773864746, 2.7479264736175537, 2.899415969848633, 3.050905466079712, 3.202394962310791, 3.353884696960449, 3.5053741931915283, 3.6568636894226074, 3.8083534240722656, 3.9598426818847656, 4.111332416534424, 4.262821674346924, 4.414311408996582, 4.565800666809082, 4.71729040145874, 4.868780136108398, 5.020269393920898, 5.171759128570557]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 4.0, 4.0, 7.0, 6.0, 10.0, 8.0, 15.0, 18.0, 9.0, 14.0, 34.0, 37.0, 37.0, 38.0, 27.0, 30.0, 35.0, 34.0, 35.0, 44.0, 39.0, 43.0, 37.0, 31.0, 40.0, 30.0, 30.0, 33.0, 31.0, 30.0, 24.0, 22.0, 23.0, 18.0, 17.0, 13.0, 13.0, 12.0, 12.0, 5.0, 6.0, 4.0, 8.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.2546870708465576, -2.184597969055176, -2.114509105682373, -2.044420003890991, -1.9743309020996094, -1.9042418003082275, -1.8341528177261353, -1.764063835144043, -1.6939747333526611, -1.6238856315612793, -1.553796648979187, -1.4837076663970947, -1.413618564605713, -1.343529462814331, -1.2734404802322388, -1.2033514976501465, -1.1332623958587646, -1.0631732940673828, -0.9930843114852905, -0.9229952692985535, -0.8529062271118164, -0.7828171849250793, -0.7127281427383423, -0.6426391005516052, -0.5725500583648682, -0.5024610161781311, -0.43237197399139404, -0.362282931804657, -0.2921938896179199, -0.22210484743118286, -0.1520158052444458, -0.08192676305770874, -0.011837482452392578, 0.05825155973434448, 0.12834060192108154, 0.1984296441078186, 0.26851868629455566, 0.3386077284812927, 0.4086967706680298, 0.47878581285476685, 0.5488748550415039, 0.618963897228241, 0.689052939414978, 0.7591419816017151, 0.8292310237884521, 0.8993200659751892, 0.9694091081619263, 1.0394980907440186, 1.1095871925354004, 1.1796762943267822, 1.2497652769088745, 1.3198542594909668, 1.3899433612823486, 1.4600324630737305, 1.5301214456558228, 1.600210428237915, 1.6702995300292969, 1.7403886318206787, 1.810477614402771, 1.8805665969848633, 1.9506556987762451, 2.020744800567627, 2.0908336639404297, 2.1609227657318115, 2.2310118675231934]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 4.0, 6.0, 13.0, 14.0, 24.0, 35.0, 59.0, 93.0, 131.0, 195.0, 289.0, 433.0, 806.0, 1401.0, 2581.0, 4812.0, 9775.0, 20058.0, 44013.0, 100627.0, 300667.0, 358172.0, 111615.0, 48378.0, 22206.0, 10495.0, 5179.0, 2666.0, 1546.0, 832.0, 527.0, 272.0, 204.0, 116.0, 83.0, 54.0, 45.0, 36.0, 17.0, 15.0, 10.0, 13.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.837890625, -1.7805633544921875, -1.723236083984375, -1.6659088134765625, -1.60858154296875, -1.5512542724609375, -1.493927001953125, -1.4365997314453125, -1.3792724609375, -1.3219451904296875, -1.264617919921875, -1.2072906494140625, -1.14996337890625, -1.0926361083984375, -1.035308837890625, -0.9779815673828125, -0.920654296875, -0.8633270263671875, -0.805999755859375, -0.7486724853515625, -0.69134521484375, -0.6340179443359375, -0.576690673828125, -0.5193634033203125, -0.4620361328125, -0.4047088623046875, -0.347381591796875, -0.2900543212890625, -0.23272705078125, -0.1753997802734375, -0.118072509765625, -0.0607452392578125, -0.00341796875, 0.0539093017578125, 0.111236572265625, 0.1685638427734375, 0.22589111328125, 0.2832183837890625, 0.340545654296875, 0.3978729248046875, 0.4552001953125, 0.5125274658203125, 0.569854736328125, 0.6271820068359375, 0.68450927734375, 0.7418365478515625, 0.799163818359375, 0.8564910888671875, 0.913818359375, 0.9711456298828125, 1.028472900390625, 1.0858001708984375, 1.14312744140625, 1.2004547119140625, 1.257781982421875, 1.3151092529296875, 1.3724365234375, 1.4297637939453125, 1.487091064453125, 1.5444183349609375, 1.60174560546875, 1.6590728759765625, 1.716400146484375, 1.7737274169921875, 1.8310546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 5.0, 8.0, 5.0, 8.0, 9.0, 15.0, 16.0, 14.0, 22.0, 24.0, 29.0, 34.0, 36.0, 36.0, 49.0, 49.0, 65.0, 56.0, 55.0, 56.0, 69.0, 47.0, 50.0, 39.0, 49.0, 26.0, 34.0, 19.0, 10.0, 17.0, 9.0, 14.0, 9.0, 2.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.432861328125, -0.4215126037597656, -0.41016387939453125, -0.3988151550292969, -0.3874664306640625, -0.3761177062988281, -0.36476898193359375, -0.3534202575683594, -0.342071533203125, -0.3307228088378906, -0.31937408447265625, -0.3080253601074219, -0.2966766357421875, -0.2853279113769531, -0.27397918701171875, -0.2626304626464844, -0.25128173828125, -0.23993301391601562, -0.22858428955078125, -0.21723556518554688, -0.2058868408203125, -0.19453811645507812, -0.18318939208984375, -0.17184066772460938, -0.160491943359375, -0.14914321899414062, -0.13779449462890625, -0.12644577026367188, -0.1150970458984375, -0.10374832153320312, -0.09239959716796875, -0.08105087280273438, -0.0697021484375, -0.058353424072265625, -0.04700469970703125, -0.035655975341796875, -0.0243072509765625, -0.012958526611328125, -0.00160980224609375, 0.009738922119140625, 0.021087646484375, 0.032436370849609375, 0.04378509521484375, 0.055133819580078125, 0.0664825439453125, 0.07783126831054688, 0.08917999267578125, 0.10052871704101562, 0.11187744140625, 0.12322616577148438, 0.13457489013671875, 0.14592361450195312, 0.1572723388671875, 0.16862106323242188, 0.17996978759765625, 0.19131851196289062, 0.202667236328125, 0.21401596069335938, 0.22536468505859375, 0.23671340942382812, 0.2480621337890625, 0.2594108581542969, 0.27075958251953125, 0.2821083068847656, 0.29345703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 0.0, 7.0, 6.0, 9.0, 14.0, 18.0, 21.0, 21.0, 21.0, 39.0, 54.0, 85.0, 101.0, 119.0, 161.0, 247.0, 328.0, 521.0, 928.0, 1801.0, 4207.0, 11296.0, 35453.0, 123905.0, 544999.0, 231385.0, 61793.0, 18764.0, 6460.0, 2453.0, 1252.0, 620.0, 402.0, 287.0, 199.0, 128.0, 97.0, 86.0, 61.0, 58.0, 34.0, 32.0, 21.0, 18.0, 15.0, 11.0, 6.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9580078125, -1.8898468017578125, -1.821685791015625, -1.7535247802734375, -1.68536376953125, -1.6172027587890625, -1.549041748046875, -1.4808807373046875, -1.4127197265625, -1.3445587158203125, -1.276397705078125, -1.2082366943359375, -1.14007568359375, -1.0719146728515625, -1.003753662109375, -0.9355926513671875, -0.867431640625, -0.7992706298828125, -0.731109619140625, -0.6629486083984375, -0.59478759765625, -0.5266265869140625, -0.458465576171875, -0.3903045654296875, -0.3221435546875, -0.2539825439453125, -0.185821533203125, -0.1176605224609375, -0.04949951171875, 0.0186614990234375, 0.086822509765625, 0.1549835205078125, 0.22314453125, 0.2913055419921875, 0.359466552734375, 0.4276275634765625, 0.49578857421875, 0.5639495849609375, 0.632110595703125, 0.7002716064453125, 0.7684326171875, 0.8365936279296875, 0.904754638671875, 0.9729156494140625, 1.04107666015625, 1.1092376708984375, 1.177398681640625, 1.2455596923828125, 1.313720703125, 1.3818817138671875, 1.450042724609375, 1.5182037353515625, 1.58636474609375, 1.6545257568359375, 1.722686767578125, 1.7908477783203125, 1.8590087890625, 1.9271697998046875, 1.995330810546875, 2.0634918212890625, 2.13165283203125, 2.1998138427734375, 2.267974853515625, 2.3361358642578125, 2.404296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 9.0, 5.0, 7.0, 8.0, 11.0, 20.0, 17.0, 26.0, 32.0, 36.0, 35.0, 35.0, 51.0, 51.0, 51.0, 57.0, 56.0, 59.0, 52.0, 57.0, 45.0, 51.0, 32.0, 36.0, 35.0, 29.0, 24.0, 16.0, 17.0, 14.0, 7.0, 4.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.6148681640625, -1.558837890625, -1.5028076171875, -1.44677734375, -1.3907470703125, -1.334716796875, -1.2786865234375, -1.22265625, -1.1666259765625, -1.110595703125, -1.0545654296875, -0.99853515625, -0.9425048828125, -0.886474609375, -0.8304443359375, -0.7744140625, -0.7183837890625, -0.662353515625, -0.6063232421875, -0.55029296875, -0.4942626953125, -0.438232421875, -0.3822021484375, -0.326171875, -0.2701416015625, -0.214111328125, -0.1580810546875, -0.10205078125, -0.0460205078125, 0.010009765625, 0.0660400390625, 0.1220703125, 0.1781005859375, 0.234130859375, 0.2901611328125, 0.34619140625, 0.4022216796875, 0.458251953125, 0.5142822265625, 0.5703125, 0.6263427734375, 0.682373046875, 0.7384033203125, 0.79443359375, 0.8504638671875, 0.906494140625, 0.9625244140625, 1.0185546875, 1.0745849609375, 1.130615234375, 1.1866455078125, 1.24267578125, 1.2987060546875, 1.354736328125, 1.4107666015625, 1.466796875, 1.5228271484375, 1.578857421875, 1.6348876953125, 1.69091796875, 1.7469482421875, 1.802978515625, 1.8590087890625, 1.9150390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 6.0, 10.0, 8.0, 16.0, 26.0, 35.0, 41.0, 67.0, 127.0, 196.0, 390.0, 746.0, 1653.0, 3674.0, 9192.0, 25098.0, 90500.0, 589062.0, 251948.0, 48903.0, 15800.0, 6114.0, 2499.0, 1148.0, 530.0, 304.0, 159.0, 100.0, 60.0, 42.0, 22.0, 20.0, 14.0, 7.0, 10.0, 11.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90380859375, -0.8687515258789062, -0.8336944580078125, -0.7986373901367188, -0.763580322265625, -0.7285232543945312, -0.6934661865234375, -0.6584091186523438, -0.62335205078125, -0.5882949829101562, -0.5532379150390625, -0.5181808471679688, -0.483123779296875, -0.44806671142578125, -0.4130096435546875, -0.37795257568359375, -0.3428955078125, -0.30783843994140625, -0.2727813720703125, -0.23772430419921875, -0.202667236328125, -0.16761016845703125, -0.1325531005859375, -0.09749603271484375, -0.06243896484375, -0.02738189697265625, 0.0076751708984375, 0.04273223876953125, 0.077789306640625, 0.11284637451171875, 0.1479034423828125, 0.18296051025390625, 0.218017578125, 0.25307464599609375, 0.2881317138671875, 0.32318878173828125, 0.358245849609375, 0.39330291748046875, 0.4283599853515625, 0.46341705322265625, 0.49847412109375, 0.5335311889648438, 0.5685882568359375, 0.6036453247070312, 0.638702392578125, 0.6737594604492188, 0.7088165283203125, 0.7438735961914062, 0.7789306640625, 0.8139877319335938, 0.8490447998046875, 0.8841018676757812, 0.919158935546875, 0.9542160034179688, 0.9892730712890625, 1.0243301391601562, 1.05938720703125, 1.0944442749023438, 1.1295013427734375, 1.1645584106445312, 1.199615478515625, 1.2346725463867188, 1.2697296142578125, 1.3047866821289062, 1.33984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 8.0, 4.0, 6.0, 7.0, 14.0, 7.0, 12.0, 26.0, 25.0, 33.0, 28.0, 40.0, 57.0, 79.0, 82.0, 109.0, 98.0, 84.0, 61.0, 43.0, 36.0, 26.0, 25.0, 14.0, 14.0, 14.0, 7.0, 7.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018227100372314453, -0.00017648003995418549, -0.00017068907618522644, -0.0001648981124162674, -0.00015910714864730835, -0.0001533161848783493, -0.00014752522110939026, -0.0001417342573404312, -0.00013594329357147217, -0.00013015232980251312, -0.00012436136603355408, -0.00011857040226459503, -0.00011277943849563599, -0.00010698847472667694, -0.0001011975109577179, -9.540654718875885e-05, -8.96155834197998e-05, -8.382461965084076e-05, -7.803365588188171e-05, -7.224269211292267e-05, -6.645172834396362e-05, -6.066076457500458e-05, -5.486980080604553e-05, -4.907883703708649e-05, -4.328787326812744e-05, -3.7496909499168396e-05, -3.170594573020935e-05, -2.5914981961250305e-05, -2.012401819229126e-05, -1.4333054423332214e-05, -8.542090654373169e-06, -2.7511268854141235e-06, 3.039836883544922e-06, 8.830800652503967e-06, 1.4621764421463013e-05, 2.0412728190422058e-05, 2.6203691959381104e-05, 3.199465572834015e-05, 3.7785619497299194e-05, 4.357658326625824e-05, 4.9367547035217285e-05, 5.515851080417633e-05, 6.0949474573135376e-05, 6.674043834209442e-05, 7.253140211105347e-05, 7.832236588001251e-05, 8.411332964897156e-05, 8.99042934179306e-05, 9.569525718688965e-05, 0.0001014862209558487, 0.00010727718472480774, 0.00011306814849376678, 0.00011885911226272583, 0.00012465007603168488, 0.00013044103980064392, 0.00013623200356960297, 0.000142022967338562, 0.00014781393110752106, 0.0001536048948764801, 0.00015939585864543915, 0.0001651868224143982, 0.00017097778618335724, 0.00017676874995231628, 0.00018255971372127533, 0.00018835067749023438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 13.0, 6.0, 21.0, 24.0, 29.0, 30.0, 53.0, 53.0, 105.0, 160.0, 316.0, 508.0, 1014.0, 2300.0, 6007.0, 18793.0, 88705.0, 657734.0, 223445.0, 33546.0, 9261.0, 3330.0, 1409.0, 695.0, 352.0, 213.0, 130.0, 71.0, 57.0, 31.0, 26.0, 22.0, 19.0, 17.0, 10.0, 10.0, 7.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5791015625, -1.534881591796875, -1.49066162109375, -1.446441650390625, -1.4022216796875, -1.358001708984375, -1.31378173828125, -1.269561767578125, -1.225341796875, -1.181121826171875, -1.13690185546875, -1.092681884765625, -1.0484619140625, -1.004241943359375, -0.96002197265625, -0.915802001953125, -0.87158203125, -0.827362060546875, -0.78314208984375, -0.738922119140625, -0.6947021484375, -0.650482177734375, -0.60626220703125, -0.562042236328125, -0.517822265625, -0.473602294921875, -0.42938232421875, -0.385162353515625, -0.3409423828125, -0.296722412109375, -0.25250244140625, -0.208282470703125, -0.1640625, -0.119842529296875, -0.07562255859375, -0.031402587890625, 0.0128173828125, 0.057037353515625, 0.10125732421875, 0.145477294921875, 0.189697265625, 0.233917236328125, 0.27813720703125, 0.322357177734375, 0.3665771484375, 0.410797119140625, 0.45501708984375, 0.499237060546875, 0.54345703125, 0.587677001953125, 0.63189697265625, 0.676116943359375, 0.7203369140625, 0.764556884765625, 0.80877685546875, 0.852996826171875, 0.897216796875, 0.941436767578125, 0.98565673828125, 1.029876708984375, 1.0740966796875, 1.118316650390625, 1.16253662109375, 1.206756591796875, 1.2509765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 0.0, 4.0, 6.0, 14.0, 14.0, 21.0, 13.0, 20.0, 19.0, 37.0, 42.0, 65.0, 53.0, 67.0, 107.0, 102.0, 87.0, 63.0, 54.0, 47.0, 41.0, 28.0, 13.0, 15.0, 11.0, 16.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.7568359375, -0.7346343994140625, -0.712432861328125, -0.6902313232421875, -0.66802978515625, -0.6458282470703125, -0.623626708984375, -0.6014251708984375, -0.5792236328125, -0.5570220947265625, -0.534820556640625, -0.5126190185546875, -0.49041748046875, -0.4682159423828125, -0.446014404296875, -0.4238128662109375, -0.401611328125, -0.3794097900390625, -0.357208251953125, -0.3350067138671875, -0.31280517578125, -0.2906036376953125, -0.268402099609375, -0.2462005615234375, -0.2239990234375, -0.2017974853515625, -0.179595947265625, -0.1573944091796875, -0.13519287109375, -0.1129913330078125, -0.090789794921875, -0.0685882568359375, -0.04638671875, -0.0241851806640625, -0.001983642578125, 0.0202178955078125, 0.04241943359375, 0.0646209716796875, 0.086822509765625, 0.1090240478515625, 0.1312255859375, 0.1534271240234375, 0.175628662109375, 0.1978302001953125, 0.22003173828125, 0.2422332763671875, 0.264434814453125, 0.2866363525390625, 0.308837890625, 0.3310394287109375, 0.353240966796875, 0.3754425048828125, 0.39764404296875, 0.4198455810546875, 0.442047119140625, 0.4642486572265625, 0.4864501953125, 0.5086517333984375, 0.530853271484375, 0.5530548095703125, 0.57525634765625, 0.5974578857421875, 0.619659423828125, 0.6418609619140625, 0.6640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 10.0, 9.0, 12.0, 36.0, 40.0, 86.0, 138.0, 167.0, 173.0, 145.0, 93.0, 33.0, 34.0, 16.0, 10.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.237560272216797, -16.597808837890625, -15.958057403564453, -15.318305969238281, -14.67855453491211, -14.038803100585938, -13.39905071258545, -12.759299278259277, -12.119547843933105, -11.479796409606934, -10.840044975280762, -10.20029354095459, -9.560541152954102, -8.92078971862793, -8.281038284301758, -7.641286849975586, -7.001535415649414, -6.361783981323242, -5.72203254699707, -5.08228063583374, -4.442529201507568, -3.8027777671813965, -3.1630260944366455, -2.5232744216918945, -1.8835229873657227, -1.2437714338302612, -0.6040198802947998, 0.03573167324066162, 0.675483226776123, 1.315234661102295, 1.954986333847046, 2.594738006591797, 3.2344913482666016, 3.8742427825927734, 4.513994216918945, 5.153746128082275, 5.793497562408447, 6.433248996734619, 7.073000907897949, 7.712752342224121, 8.352503776550293, 8.992255210876465, 9.632006645202637, 10.271758079528809, 10.911510467529297, 11.551261901855469, 12.19101333618164, 12.830764770507812, 13.470516204833984, 14.110267639160156, 14.750019073486328, 15.3897705078125, 16.029521942138672, 16.669273376464844, 17.309024810791016, 17.948776245117188, 18.58852767944336, 19.22827911376953, 19.868030548095703, 20.507781982421875, 21.147533416748047, 21.78728485107422, 22.42703628540039, 23.066787719726562, 23.706541061401367]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 7.0, 6.0, 9.0, 6.0, 7.0, 5.0, 15.0, 5.0, 7.0, 20.0, 22.0, 21.0, 20.0, 20.0, 27.0, 29.0, 34.0, 38.0, 33.0, 29.0, 45.0, 40.0, 46.0, 36.0, 45.0, 45.0, 38.0, 35.0, 49.0, 26.0, 27.0, 36.0, 28.0, 19.0, 23.0, 15.0, 11.0, 13.0, 11.0, 9.0, 11.0, 13.0, 4.0, 8.0, 1.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.188767910003662, -6.961972236633301, -6.7351765632629395, -6.508380889892578, -6.281585216522217, -6.0547895431518555, -5.827993392944336, -5.601198196411133, -5.374402046203613, -5.147606372833252, -4.920810699462891, -4.694015026092529, -4.467219352722168, -4.240423679351807, -4.013628005981445, -3.786832094192505, -3.5600366592407227, -3.3332409858703613, -3.1064453125, -2.8796496391296387, -2.6528539657592773, -2.426058292388916, -2.1992623805999756, -1.9724667072296143, -1.745671033859253, -1.5188753604888916, -1.2920796871185303, -1.0652838945388794, -0.8384882211685181, -0.6116925477981567, -0.38489675521850586, -0.15810108184814453, 0.068695068359375, 0.2954907715320587, 0.5222864747047424, 0.7490822076797485, 0.9758778810501099, 1.2026735544204712, 1.429469347000122, 1.6562650203704834, 1.8830606937408447, 2.109856367111206, 2.3366520404815674, 2.563447952270508, 2.790243625640869, 3.0170392990112305, 3.243834972381592, 3.470630645751953, 3.6974263191223145, 3.924221992492676, 4.151017665863037, 4.377813339233398, 4.60460901260376, 4.831404685974121, 5.058200836181641, 5.284996032714844, 5.511792182922363, 5.738587856292725, 5.965383529663086, 6.192179203033447, 6.418974876403809, 6.64577054977417, 6.872566223144531, 7.099362373352051, 7.326157569885254]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 8.0, 15.0, 16.0, 20.0, 29.0, 46.0, 59.0, 134.0, 184.0, 326.0, 619.0, 1258.0, 2927.0, 9204.0, 39699.0, 3464227.0, 629466.0, 32410.0, 8276.0, 2760.0, 1232.0, 603.0, 288.0, 187.0, 104.0, 69.0, 41.0, 22.0, 16.0, 6.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.7838134765625, -4.634033203125, -4.4842529296875, -4.33447265625, -4.1846923828125, -4.034912109375, -3.8851318359375, -3.7353515625, -3.5855712890625, -3.435791015625, -3.2860107421875, -3.13623046875, -2.9864501953125, -2.836669921875, -2.6868896484375, -2.537109375, -2.3873291015625, -2.237548828125, -2.0877685546875, -1.93798828125, -1.7882080078125, -1.638427734375, -1.4886474609375, -1.3388671875, -1.1890869140625, -1.039306640625, -0.8895263671875, -0.73974609375, -0.5899658203125, -0.440185546875, -0.2904052734375, -0.140625, 0.0091552734375, 0.158935546875, 0.3087158203125, 0.45849609375, 0.6082763671875, 0.758056640625, 0.9078369140625, 1.0576171875, 1.2073974609375, 1.357177734375, 1.5069580078125, 1.65673828125, 1.8065185546875, 1.956298828125, 2.1060791015625, 2.255859375, 2.4056396484375, 2.555419921875, 2.7052001953125, 2.85498046875, 3.0047607421875, 3.154541015625, 3.3043212890625, 3.4541015625, 3.6038818359375, 3.753662109375, 3.9034423828125, 4.05322265625, 4.2030029296875, 4.352783203125, 4.5025634765625, 4.65234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 4.0, 4.0, 8.0, 11.0, 18.0, 21.0, 14.0, 30.0, 30.0, 35.0, 43.0, 41.0, 36.0, 49.0, 54.0, 54.0, 67.0, 46.0, 51.0, 47.0, 49.0, 44.0, 37.0, 32.0, 32.0, 23.0, 26.0, 20.0, 17.0, 10.0, 12.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.427978515625, -0.4166069030761719, -0.40523529052734375, -0.3938636779785156, -0.3824920654296875, -0.3711204528808594, -0.35974884033203125, -0.3483772277832031, -0.337005615234375, -0.3256340026855469, -0.31426239013671875, -0.3028907775878906, -0.2915191650390625, -0.2801475524902344, -0.26877593994140625, -0.2574043273925781, -0.24603271484375, -0.23466110229492188, -0.22328948974609375, -0.21191787719726562, -0.2005462646484375, -0.18917465209960938, -0.17780303955078125, -0.16643142700195312, -0.155059814453125, -0.14368820190429688, -0.13231658935546875, -0.12094497680664062, -0.1095733642578125, -0.09820175170898438, -0.08683013916015625, -0.07545852661132812, -0.0640869140625, -0.052715301513671875, -0.04134368896484375, -0.029972076416015625, -0.0186004638671875, -0.007228851318359375, 0.00414276123046875, 0.015514373779296875, 0.026885986328125, 0.038257598876953125, 0.04962921142578125, 0.061000823974609375, 0.0723724365234375, 0.08374404907226562, 0.09511566162109375, 0.10648727416992188, 0.11785888671875, 0.12923049926757812, 0.14060211181640625, 0.15197372436523438, 0.1633453369140625, 0.17471694946289062, 0.18608856201171875, 0.19746017456054688, 0.208831787109375, 0.22020339965820312, 0.23157501220703125, 0.24294662475585938, 0.2543182373046875, 0.2656898498535156, 0.27706146240234375, 0.2884330749511719, 0.2998046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 14.0, 17.0, 22.0, 32.0, 60.0, 89.0, 127.0, 170.0, 265.0, 410.0, 631.0, 1054.0, 1878.0, 2993.0, 5524.0, 10481.0, 20797.0, 46576.0, 141093.0, 3298407.0, 512858.0, 84010.0, 32611.0, 15376.0, 7982.0, 4324.0, 2456.0, 1478.0, 964.0, 553.0, 385.0, 228.0, 148.0, 86.0, 63.0, 44.0, 24.0, 19.0, 12.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.087890625, -2.0261077880859375, -1.964324951171875, -1.9025421142578125, -1.84075927734375, -1.7789764404296875, -1.717193603515625, -1.6554107666015625, -1.5936279296875, -1.5318450927734375, -1.470062255859375, -1.4082794189453125, -1.34649658203125, -1.2847137451171875, -1.222930908203125, -1.1611480712890625, -1.099365234375, -1.0375823974609375, -0.975799560546875, -0.9140167236328125, -0.85223388671875, -0.7904510498046875, -0.728668212890625, -0.6668853759765625, -0.6051025390625, -0.5433197021484375, -0.481536865234375, -0.4197540283203125, -0.35797119140625, -0.2961883544921875, -0.234405517578125, -0.1726226806640625, -0.11083984375, -0.0490570068359375, 0.012725830078125, 0.0745086669921875, 0.13629150390625, 0.1980743408203125, 0.259857177734375, 0.3216400146484375, 0.3834228515625, 0.4452056884765625, 0.506988525390625, 0.5687713623046875, 0.63055419921875, 0.6923370361328125, 0.754119873046875, 0.8159027099609375, 0.877685546875, 0.9394683837890625, 1.001251220703125, 1.0630340576171875, 1.12481689453125, 1.1865997314453125, 1.248382568359375, 1.3101654052734375, 1.3719482421875, 1.4337310791015625, 1.495513916015625, 1.5572967529296875, 1.61907958984375, 1.6808624267578125, 1.742645263671875, 1.8044281005859375, 1.8662109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 3.0, 7.0, 6.0, 9.0, 11.0, 9.0, 12.0, 24.0, 25.0, 21.0, 44.0, 50.0, 77.0, 133.0, 235.0, 996.0, 1662.0, 287.0, 126.0, 75.0, 54.0, 47.0, 20.0, 22.0, 25.0, 9.0, 14.0, 16.0, 7.0, 5.0, 7.0, 6.0, 3.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.0673828125, -1.0385818481445312, -1.0097808837890625, -0.9809799194335938, -0.952178955078125, -0.9233779907226562, -0.8945770263671875, -0.8657760620117188, -0.83697509765625, -0.8081741333007812, -0.7793731689453125, -0.7505722045898438, -0.721771240234375, -0.6929702758789062, -0.6641693115234375, -0.6353683471679688, -0.6065673828125, -0.5777664184570312, -0.5489654541015625, -0.5201644897460938, -0.491363525390625, -0.46256256103515625, -0.4337615966796875, -0.40496063232421875, -0.37615966796875, -0.34735870361328125, -0.3185577392578125, -0.28975677490234375, -0.260955810546875, -0.23215484619140625, -0.2033538818359375, -0.17455291748046875, -0.145751953125, -0.11695098876953125, -0.0881500244140625, -0.05934906005859375, -0.030548095703125, -0.00174713134765625, 0.0270538330078125, 0.05585479736328125, 0.08465576171875, 0.11345672607421875, 0.1422576904296875, 0.17105865478515625, 0.199859619140625, 0.22866058349609375, 0.2574615478515625, 0.28626251220703125, 0.3150634765625, 0.34386444091796875, 0.3726654052734375, 0.40146636962890625, 0.430267333984375, 0.45906829833984375, 0.4878692626953125, 0.5166702270507812, 0.54547119140625, 0.5742721557617188, 0.6030731201171875, 0.6318740844726562, 0.660675048828125, 0.6894760131835938, 0.7182769775390625, 0.7470779418945312, 0.77587890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 7.0, 10.0, 11.0, 32.0, 32.0, 56.0, 93.0, 123.0, 131.0, 121.0, 113.0, 83.0, 61.0, 46.0, 22.0, 18.0, 12.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4877519607543945, -4.250966548919678, -4.014181137084961, -3.777395725250244, -3.5406103134155273, -3.3038249015808105, -3.0670394897460938, -2.830254077911377, -2.59346866607666, -2.3566832542419434, -2.1198978424072266, -1.8831124305725098, -1.646327018737793, -1.4095414876937866, -1.1727560758590698, -0.935970664024353, -0.6991851329803467, -0.4623997211456299, -0.2256142795085907, 0.011171162128448486, 0.24795657396316528, 0.48474204540252686, 0.7215274572372437, 0.9583128690719604, 1.1950982809066772, 1.431883692741394, 1.6686691045761108, 1.9054546356201172, 2.142240047454834, 2.379025459289551, 2.6158108711242676, 2.8525962829589844, 3.089381694793701, 3.326167106628418, 3.5629525184631348, 3.7997379302978516, 4.036523342132568, 4.273308753967285, 4.510094165802002, 4.746879577636719, 4.9836649894714355, 5.220450401306152, 5.457235813140869, 5.694021224975586, 5.930806636810303, 6.1675920486450195, 6.404377460479736, 6.641162872314453, 6.877948760986328, 7.114734172821045, 7.351519584655762, 7.5883049964904785, 7.825090408325195, 8.06187629699707, 8.298661231994629, 8.535447120666504, 8.772232055664062, 9.009017944335938, 9.245802879333496, 9.482588768005371, 9.71937370300293, 9.956159591674805, 10.192944526672363, 10.429730415344238, 10.666515350341797]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 9.0, 10.0, 5.0, 14.0, 13.0, 13.0, 14.0, 12.0, 27.0, 31.0, 24.0, 30.0, 53.0, 36.0, 50.0, 44.0, 41.0, 49.0, 33.0, 48.0, 44.0, 41.0, 42.0, 46.0, 43.0, 32.0, 24.0, 34.0, 19.0, 28.0, 15.0, 18.0, 11.0, 8.0, 11.0, 4.0, 11.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29060435295105, -3.182262897491455, -3.0739214420318604, -2.9655799865722656, -2.857238531112671, -2.748897075653076, -2.6405553817749023, -2.5322141647338867, -2.423872470855713, -2.315531015396118, -2.2071895599365234, -2.0988481044769287, -1.990506649017334, -1.8821651935577393, -1.773823618888855, -1.6654821634292603, -1.557140827178955, -1.4487993717193604, -1.3404579162597656, -1.232116460800171, -1.1237750053405762, -1.0154335498809814, -0.9070919752120972, -0.7987505197525024, -0.6904090642929077, -0.582067608833313, -0.4737261235713959, -0.36538463830947876, -0.25704318284988403, -0.1487017273902893, -0.040360212326049805, 0.06798124313354492, 0.17632293701171875, 0.2846643924713135, 0.3930058777332306, 0.5013473629951477, 0.6096888184547424, 0.7180302739143372, 0.8263717889785767, 0.9347132444381714, 1.0430546998977661, 1.1513961553573608, 1.2597376108169556, 1.3680791854858398, 1.4764206409454346, 1.5847620964050293, 1.693103551864624, 1.8014450073242188, 1.9097864627838135, 2.018127918243408, 2.126469373703003, 2.2348108291625977, 2.3431522846221924, 2.451493740081787, 2.559835433959961, 2.6681766510009766, 2.7765183448791504, 2.884859800338745, 2.99320125579834, 3.1015427112579346, 3.2098841667175293, 3.318225622177124, 3.4265670776367188, 3.5349087715148926, 3.643249988555908]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 15.0, 13.0, 23.0, 45.0, 58.0, 77.0, 137.0, 231.0, 346.0, 598.0, 1050.0, 2103.0, 4220.0, 8726.0, 20172.0, 50706.0, 138475.0, 335977.0, 297112.0, 114015.0, 42014.0, 16935.0, 7573.0, 3569.0, 1856.0, 1008.0, 575.0, 328.0, 212.0, 124.0, 74.0, 51.0, 36.0, 32.0, 17.0, 11.0, 4.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.966796875, -1.912017822265625, -1.85723876953125, -1.802459716796875, -1.7476806640625, -1.692901611328125, -1.63812255859375, -1.583343505859375, -1.528564453125, -1.473785400390625, -1.41900634765625, -1.364227294921875, -1.3094482421875, -1.254669189453125, -1.19989013671875, -1.145111083984375, -1.09033203125, -1.035552978515625, -0.98077392578125, -0.925994873046875, -0.8712158203125, -0.816436767578125, -0.76165771484375, -0.706878662109375, -0.652099609375, -0.597320556640625, -0.54254150390625, -0.487762451171875, -0.4329833984375, -0.378204345703125, -0.32342529296875, -0.268646240234375, -0.2138671875, -0.159088134765625, -0.10430908203125, -0.049530029296875, 0.0052490234375, 0.060028076171875, 0.11480712890625, 0.169586181640625, 0.224365234375, 0.279144287109375, 0.33392333984375, 0.388702392578125, 0.4434814453125, 0.498260498046875, 0.55303955078125, 0.607818603515625, 0.66259765625, 0.717376708984375, 0.77215576171875, 0.826934814453125, 0.8817138671875, 0.936492919921875, 0.99127197265625, 1.046051025390625, 1.100830078125, 1.155609130859375, 1.21038818359375, 1.265167236328125, 1.3199462890625, 1.374725341796875, 1.42950439453125, 1.484283447265625, 1.5390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 3.0, 10.0, 22.0, 20.0, 28.0, 26.0, 33.0, 33.0, 40.0, 46.0, 37.0, 47.0, 51.0, 46.0, 43.0, 62.0, 58.0, 48.0, 42.0, 54.0, 43.0, 31.0, 31.0, 26.0, 20.0, 16.0, 10.0, 14.0, 12.0, 7.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.454345703125, -0.4422874450683594, -0.43022918701171875, -0.4181709289550781, -0.4061126708984375, -0.3940544128417969, -0.38199615478515625, -0.3699378967285156, -0.357879638671875, -0.3458213806152344, -0.33376312255859375, -0.3217048645019531, -0.3096466064453125, -0.2975883483886719, -0.28553009033203125, -0.2734718322753906, -0.26141357421875, -0.24935531616210938, -0.23729705810546875, -0.22523880004882812, -0.2131805419921875, -0.20112228393554688, -0.18906402587890625, -0.17700576782226562, -0.164947509765625, -0.15288925170898438, -0.14083099365234375, -0.12877273559570312, -0.1167144775390625, -0.10465621948242188, -0.09259796142578125, -0.08053970336914062, -0.0684814453125, -0.056423187255859375, -0.04436492919921875, -0.032306671142578125, -0.0202484130859375, -0.008190155029296875, 0.00386810302734375, 0.015926361083984375, 0.027984619140625, 0.040042877197265625, 0.05210113525390625, 0.06415939331054688, 0.0762176513671875, 0.08827590942382812, 0.10033416748046875, 0.11239242553710938, 0.12445068359375, 0.13650894165039062, 0.14856719970703125, 0.16062545776367188, 0.1726837158203125, 0.18474197387695312, 0.19680023193359375, 0.20885848999023438, 0.220916748046875, 0.23297500610351562, 0.24503326416015625, 0.2570915222167969, 0.2691497802734375, 0.2812080383300781, 0.29326629638671875, 0.3053245544433594, 0.3173828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 9.0, 5.0, 21.0, 25.0, 27.0, 50.0, 72.0, 97.0, 144.0, 192.0, 338.0, 564.0, 1072.0, 2392.0, 7452.0, 31625.0, 209640.0, 639247.0, 124643.0, 21396.0, 5478.0, 1927.0, 853.0, 432.0, 264.0, 186.0, 118.0, 95.0, 54.0, 45.0, 28.0, 25.0, 11.0, 10.0, 3.0, 0.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.410552978515625, -2.31915283203125, -2.227752685546875, -2.1363525390625, -2.044952392578125, -1.95355224609375, -1.862152099609375, -1.770751953125, -1.679351806640625, -1.58795166015625, -1.496551513671875, -1.4051513671875, -1.313751220703125, -1.22235107421875, -1.130950927734375, -1.03955078125, -0.948150634765625, -0.85675048828125, -0.765350341796875, -0.6739501953125, -0.582550048828125, -0.49114990234375, -0.399749755859375, -0.308349609375, -0.216949462890625, -0.12554931640625, -0.034149169921875, 0.0572509765625, 0.148651123046875, 0.24005126953125, 0.331451416015625, 0.4228515625, 0.514251708984375, 0.60565185546875, 0.697052001953125, 0.7884521484375, 0.879852294921875, 0.97125244140625, 1.062652587890625, 1.154052734375, 1.245452880859375, 1.33685302734375, 1.428253173828125, 1.5196533203125, 1.611053466796875, 1.70245361328125, 1.793853759765625, 1.88525390625, 1.976654052734375, 2.06805419921875, 2.159454345703125, 2.2508544921875, 2.342254638671875, 2.43365478515625, 2.525054931640625, 2.616455078125, 2.707855224609375, 2.79925537109375, 2.890655517578125, 2.9820556640625, 3.073455810546875, 3.16485595703125, 3.256256103515625, 3.34765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 15.0, 18.0, 21.0, 24.0, 27.0, 29.0, 24.0, 35.0, 39.0, 33.0, 45.0, 48.0, 49.0, 48.0, 54.0, 59.0, 51.0, 48.0, 51.0, 41.0, 36.0, 28.0, 24.0, 25.0, 19.0, 23.0, 13.0, 14.0, 13.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.1484375, -2.0889434814453125, -2.029449462890625, -1.9699554443359375, -1.91046142578125, -1.8509674072265625, -1.791473388671875, -1.7319793701171875, -1.6724853515625, -1.6129913330078125, -1.553497314453125, -1.4940032958984375, -1.43450927734375, -1.3750152587890625, -1.315521240234375, -1.2560272216796875, -1.196533203125, -1.1370391845703125, -1.077545166015625, -1.0180511474609375, -0.95855712890625, -0.8990631103515625, -0.839569091796875, -0.7800750732421875, -0.7205810546875, -0.6610870361328125, -0.601593017578125, -0.5420989990234375, -0.48260498046875, -0.4231109619140625, -0.363616943359375, -0.3041229248046875, -0.24462890625, -0.1851348876953125, -0.125640869140625, -0.0661468505859375, -0.00665283203125, 0.0528411865234375, 0.112335205078125, 0.1718292236328125, 0.2313232421875, 0.2908172607421875, 0.350311279296875, 0.4098052978515625, 0.46929931640625, 0.5287933349609375, 0.588287353515625, 0.6477813720703125, 0.707275390625, 0.7667694091796875, 0.826263427734375, 0.8857574462890625, 0.94525146484375, 1.0047454833984375, 1.064239501953125, 1.1237335205078125, 1.1832275390625, 1.2427215576171875, 1.302215576171875, 1.3617095947265625, 1.42120361328125, 1.4806976318359375, 1.540191650390625, 1.5996856689453125, 1.6591796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 9.0, 3.0, 15.0, 17.0, 28.0, 45.0, 64.0, 133.0, 192.0, 334.0, 630.0, 1443.0, 3304.0, 9158.0, 30710.0, 141334.0, 575766.0, 221502.0, 43923.0, 12124.0, 4235.0, 1675.0, 808.0, 406.0, 234.0, 141.0, 108.0, 61.0, 53.0, 23.0, 17.0, 12.0, 11.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.6220703125, -1.5789642333984375, -1.535858154296875, -1.4927520751953125, -1.44964599609375, -1.4065399169921875, -1.363433837890625, -1.3203277587890625, -1.2772216796875, -1.2341156005859375, -1.191009521484375, -1.1479034423828125, -1.10479736328125, -1.0616912841796875, -1.018585205078125, -0.9754791259765625, -0.932373046875, -0.8892669677734375, -0.846160888671875, -0.8030548095703125, -0.75994873046875, -0.7168426513671875, -0.673736572265625, -0.6306304931640625, -0.5875244140625, -0.5444183349609375, -0.501312255859375, -0.4582061767578125, -0.41510009765625, -0.3719940185546875, -0.328887939453125, -0.2857818603515625, -0.24267578125, -0.1995697021484375, -0.156463623046875, -0.1133575439453125, -0.07025146484375, -0.0271453857421875, 0.015960693359375, 0.0590667724609375, 0.1021728515625, 0.1452789306640625, 0.188385009765625, 0.2314910888671875, 0.27459716796875, 0.3177032470703125, 0.360809326171875, 0.4039154052734375, 0.447021484375, 0.4901275634765625, 0.533233642578125, 0.5763397216796875, 0.61944580078125, 0.6625518798828125, 0.705657958984375, 0.7487640380859375, 0.7918701171875, 0.8349761962890625, 0.878082275390625, 0.9211883544921875, 0.96429443359375, 1.0074005126953125, 1.050506591796875, 1.0936126708984375, 1.13671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 7.0, 11.0, 11.0, 17.0, 31.0, 19.0, 33.0, 40.0, 49.0, 50.0, 70.0, 71.0, 65.0, 87.0, 77.0, 53.0, 46.0, 52.0, 34.0, 39.0, 31.0, 18.0, 25.0, 15.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014352798461914062, -0.00013797171413898468, -0.00013241544365882874, -0.0001268591731786728, -0.00012130290269851685, -0.0001157466322183609, -0.00011019036173820496, -0.00010463409125804901, -9.907782077789307e-05, -9.352155029773712e-05, -8.796527981758118e-05, -8.240900933742523e-05, -7.685273885726929e-05, -7.129646837711334e-05, -6.57401978969574e-05, -6.018392741680145e-05, -5.462765693664551e-05, -4.907138645648956e-05, -4.351511597633362e-05, -3.795884549617767e-05, -3.240257501602173e-05, -2.6846304535865784e-05, -2.129003405570984e-05, -1.5733763575553894e-05, -1.017749309539795e-05, -4.621222615242004e-06, 9.350478649139404e-07, 6.491318345069885e-06, 1.204758882522583e-05, 1.7603859305381775e-05, 2.316012978553772e-05, 2.8716400265693665e-05, 3.427267074584961e-05, 3.9828941226005554e-05, 4.53852117061615e-05, 5.0941482186317444e-05, 5.649775266647339e-05, 6.205402314662933e-05, 6.761029362678528e-05, 7.316656410694122e-05, 7.872283458709717e-05, 8.427910506725311e-05, 8.983537554740906e-05, 9.5391646027565e-05, 0.00010094791650772095, 0.00010650418698787689, 0.00011206045746803284, 0.00011761672794818878, 0.00012317299842834473, 0.00012872926890850067, 0.00013428553938865662, 0.00013984180986881256, 0.0001453980803489685, 0.00015095435082912445, 0.0001565106213092804, 0.00016206689178943634, 0.00016762316226959229, 0.00017317943274974823, 0.00017873570322990417, 0.00018429197371006012, 0.00018984824419021606, 0.000195404514670372, 0.00020096078515052795, 0.0002065170556306839, 0.00021207332611083984]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 11.0, 27.0, 36.0, 59.0, 72.0, 141.0, 246.0, 365.0, 748.0, 1719.0, 4527.0, 16941.0, 99951.0, 642991.0, 236394.0, 32193.0, 7387.0, 2427.0, 1034.0, 529.0, 256.0, 167.0, 108.0, 53.0, 49.0, 29.0, 18.0, 13.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.71875, -1.6627655029296875, -1.606781005859375, -1.5507965087890625, -1.49481201171875, -1.4388275146484375, -1.382843017578125, -1.3268585205078125, -1.2708740234375, -1.2148895263671875, -1.158905029296875, -1.1029205322265625, -1.04693603515625, -0.9909515380859375, -0.934967041015625, -0.8789825439453125, -0.822998046875, -0.7670135498046875, -0.711029052734375, -0.6550445556640625, -0.59906005859375, -0.5430755615234375, -0.487091064453125, -0.4311065673828125, -0.3751220703125, -0.3191375732421875, -0.263153076171875, -0.2071685791015625, -0.15118408203125, -0.0951995849609375, -0.039215087890625, 0.0167694091796875, 0.07275390625, 0.1287384033203125, 0.184722900390625, 0.2407073974609375, 0.29669189453125, 0.3526763916015625, 0.408660888671875, 0.4646453857421875, 0.5206298828125, 0.5766143798828125, 0.632598876953125, 0.6885833740234375, 0.74456787109375, 0.8005523681640625, 0.856536865234375, 0.9125213623046875, 0.968505859375, 1.0244903564453125, 1.080474853515625, 1.1364593505859375, 1.19244384765625, 1.2484283447265625, 1.304412841796875, 1.3603973388671875, 1.4163818359375, 1.4723663330078125, 1.528350830078125, 1.5843353271484375, 1.64031982421875, 1.6963043212890625, 1.752288818359375, 1.8082733154296875, 1.8642578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 10.0, 13.0, 18.0, 25.0, 29.0, 26.0, 37.0, 59.0, 58.0, 65.0, 72.0, 92.0, 82.0, 85.0, 64.0, 51.0, 53.0, 42.0, 35.0, 20.0, 15.0, 14.0, 5.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2481689453125, -1.216064453125, -1.1839599609375, -1.15185546875, -1.1197509765625, -1.087646484375, -1.0555419921875, -1.0234375, -0.9913330078125, -0.959228515625, -0.9271240234375, -0.89501953125, -0.8629150390625, -0.830810546875, -0.7987060546875, -0.7666015625, -0.7344970703125, -0.702392578125, -0.6702880859375, -0.63818359375, -0.6060791015625, -0.573974609375, -0.5418701171875, -0.509765625, -0.4776611328125, -0.445556640625, -0.4134521484375, -0.38134765625, -0.3492431640625, -0.317138671875, -0.2850341796875, -0.2529296875, -0.2208251953125, -0.188720703125, -0.1566162109375, -0.12451171875, -0.0924072265625, -0.060302734375, -0.0281982421875, 0.00390625, 0.0360107421875, 0.068115234375, 0.1002197265625, 0.13232421875, 0.1644287109375, 0.196533203125, 0.2286376953125, 0.2607421875, 0.2928466796875, 0.324951171875, 0.3570556640625, 0.38916015625, 0.4212646484375, 0.453369140625, 0.4854736328125, 0.517578125, 0.5496826171875, 0.581787109375, 0.6138916015625, 0.64599609375, 0.6781005859375, 0.710205078125, 0.7423095703125, 0.7744140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 18.0, 28.0, 56.0, 94.0, 196.0, 216.0, 176.0, 104.0, 55.0, 32.0, 14.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.35030746459961, -30.536706924438477, -29.723108291625977, -28.909507751464844, -28.09590721130371, -27.28230857849121, -26.468708038330078, -25.655109405517578, -24.841508865356445, -24.027908325195312, -23.214309692382812, -22.40070915222168, -21.587108612060547, -20.773509979248047, -19.959909439086914, -19.14630889892578, -18.33271026611328, -17.51910972595215, -16.70551109313965, -15.891910552978516, -15.0783109664917, -14.264711380004883, -13.45111083984375, -12.637511253356934, -11.823909759521484, -11.010310173034668, -10.196709632873535, -9.383110046386719, -8.569510459899902, -7.755910396575928, -6.942310333251953, -6.128710746765137, -5.31511116027832, -4.501511096954346, -3.6879115104675293, -2.8743114471435547, -2.060711622238159, -1.2471117973327637, -0.43351173400878906, 0.38008785247802734, 1.193687915802002, 2.0072877407073975, 2.820887565612793, 3.6344876289367676, 4.448087692260742, 5.261687278747559, 6.075287342071533, 6.88888692855835, 7.702486991882324, 8.51608657836914, 9.329687118530273, 10.14328670501709, 10.956886291503906, 11.770486831665039, 12.584086418151855, 13.397686004638672, 14.211286544799805, 15.024886131286621, 15.838486671447754, 16.65208625793457, 17.465686798095703, 18.279285430908203, 19.092885971069336, 19.90648651123047, 20.72008514404297]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 9.0, 6.0, 4.0, 13.0, 9.0, 14.0, 11.0, 20.0, 21.0, 30.0, 28.0, 40.0, 37.0, 38.0, 41.0, 42.0, 43.0, 45.0, 43.0, 47.0, 43.0, 45.0, 45.0, 32.0, 43.0, 36.0, 29.0, 25.0, 28.0, 25.0, 23.0, 15.0, 10.0, 10.0, 11.0, 7.0, 8.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.550844192504883, -9.25841236114502, -8.965980529785156, -8.67354965209961, -8.381117820739746, -8.088685989379883, -7.7962541580200195, -7.503822326660156, -7.211390495300293, -6.91895866394043, -6.626527309417725, -6.334095478057861, -6.041663646697998, -5.749232292175293, -5.45680046081543, -5.164368629455566, -4.871937274932861, -4.579505443572998, -4.287074089050293, -3.9946422576904297, -3.7022104263305664, -3.4097788333892822, -3.117347240447998, -2.8249154090881348, -2.5324838161468506, -2.2400522232055664, -1.9476203918457031, -1.655188798904419, -1.3627570867538452, -1.0703253746032715, -0.7778937816619873, -0.485461950302124, -0.19303035736083984, 0.0994013249874115, 0.39183300733566284, 0.6842646598815918, 0.9766963720321655, 1.2691280841827393, 1.5615596771240234, 1.8539915084838867, 2.146423101425171, 2.438854694366455, 2.7312865257263184, 3.0237181186676025, 3.3161497116088867, 3.60858154296875, 3.901013135910034, 4.193445205688477, 4.485876560211182, 4.778308391571045, 5.07073974609375, 5.363171577453613, 5.655603408813477, 5.94803524017334, 6.240466594696045, 6.532898426055908, 6.825329780578613, 7.117761611938477, 7.410192966461182, 7.702624797821045, 7.995056629180908, 8.287487983703613, 8.579919815063477, 8.87235164642334, 9.164783477783203]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 18.0, 21.0, 25.0, 52.0, 76.0, 125.0, 184.0, 443.0, 1557.0, 17737.0, 4168487.0, 3974.0, 828.0, 305.0, 181.0, 97.0, 48.0, 39.0, 26.0, 23.0, 7.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.699951171875, -15.22802734375, -14.756103515625, -14.2841796875, -13.812255859375, -13.34033203125, -12.868408203125, -12.396484375, -11.924560546875, -11.45263671875, -10.980712890625, -10.5087890625, -10.036865234375, -9.56494140625, -9.093017578125, -8.62109375, -8.149169921875, -7.67724609375, -7.205322265625, -6.7333984375, -6.261474609375, -5.78955078125, -5.317626953125, -4.845703125, -4.373779296875, -3.90185546875, -3.429931640625, -2.9580078125, -2.486083984375, -2.01416015625, -1.542236328125, -1.0703125, -0.598388671875, -0.12646484375, 0.345458984375, 0.8173828125, 1.289306640625, 1.76123046875, 2.233154296875, 2.705078125, 3.177001953125, 3.64892578125, 4.120849609375, 4.5927734375, 5.064697265625, 5.53662109375, 6.008544921875, 6.48046875, 6.952392578125, 7.42431640625, 7.896240234375, 8.3681640625, 8.840087890625, 9.31201171875, 9.783935546875, 10.255859375, 10.727783203125, 11.19970703125, 11.671630859375, 12.1435546875, 12.615478515625, 13.08740234375, 13.559326171875, 14.03125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 1.0, 2.0, 7.0, 8.0, 4.0, 14.0, 14.0, 20.0, 24.0, 30.0, 29.0, 36.0, 34.0, 35.0, 38.0, 60.0, 48.0, 54.0, 57.0, 42.0, 53.0, 60.0, 34.0, 46.0, 45.0, 34.0, 23.0, 27.0, 25.0, 23.0, 11.0, 13.0, 16.0, 5.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44580078125, -0.4326324462890625, -0.419464111328125, -0.4062957763671875, -0.39312744140625, -0.3799591064453125, -0.366790771484375, -0.3536224365234375, -0.3404541015625, -0.3272857666015625, -0.314117431640625, -0.3009490966796875, -0.28778076171875, -0.2746124267578125, -0.261444091796875, -0.2482757568359375, -0.235107421875, -0.2219390869140625, -0.208770751953125, -0.1956024169921875, -0.18243408203125, -0.1692657470703125, -0.156097412109375, -0.1429290771484375, -0.1297607421875, -0.1165924072265625, -0.103424072265625, -0.0902557373046875, -0.07708740234375, -0.0639190673828125, -0.050750732421875, -0.0375823974609375, -0.0244140625, -0.0112457275390625, 0.001922607421875, 0.0150909423828125, 0.02825927734375, 0.0414276123046875, 0.054595947265625, 0.0677642822265625, 0.0809326171875, 0.0941009521484375, 0.107269287109375, 0.1204376220703125, 0.13360595703125, 0.1467742919921875, 0.159942626953125, 0.1731109619140625, 0.186279296875, 0.1994476318359375, 0.212615966796875, 0.2257843017578125, 0.23895263671875, 0.2521209716796875, 0.265289306640625, 0.2784576416015625, 0.2916259765625, 0.3047943115234375, 0.317962646484375, 0.3311309814453125, 0.34429931640625, 0.3574676513671875, 0.370635986328125, 0.3838043212890625, 0.39697265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 13.0, 23.0, 29.0, 39.0, 65.0, 83.0, 146.0, 237.0, 350.0, 562.0, 1047.0, 2092.0, 4011.0, 9810.0, 51644.0, 4077427.0, 30875.0, 7988.0, 3543.0, 1771.0, 1002.0, 494.0, 349.0, 190.0, 120.0, 96.0, 77.0, 46.0, 28.0, 24.0, 24.0, 19.0, 15.0, 7.0, 10.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.50390625, -2.4090576171875, -2.314208984375, -2.2193603515625, -2.12451171875, -2.0296630859375, -1.934814453125, -1.8399658203125, -1.7451171875, -1.6502685546875, -1.555419921875, -1.4605712890625, -1.36572265625, -1.2708740234375, -1.176025390625, -1.0811767578125, -0.986328125, -0.8914794921875, -0.796630859375, -0.7017822265625, -0.60693359375, -0.5120849609375, -0.417236328125, -0.3223876953125, -0.2275390625, -0.1326904296875, -0.037841796875, 0.0570068359375, 0.15185546875, 0.2467041015625, 0.341552734375, 0.4364013671875, 0.53125, 0.6260986328125, 0.720947265625, 0.8157958984375, 0.91064453125, 1.0054931640625, 1.100341796875, 1.1951904296875, 1.2900390625, 1.3848876953125, 1.479736328125, 1.5745849609375, 1.66943359375, 1.7642822265625, 1.859130859375, 1.9539794921875, 2.048828125, 2.1436767578125, 2.238525390625, 2.3333740234375, 2.42822265625, 2.5230712890625, 2.617919921875, 2.7127685546875, 2.8076171875, 2.9024658203125, 2.997314453125, 3.0921630859375, 3.18701171875, 3.2818603515625, 3.376708984375, 3.4715576171875, 3.56640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 1.0, 6.0, 6.0, 5.0, 14.0, 25.0, 46.0, 166.0, 3522.0, 154.0, 52.0, 21.0, 16.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3408203125, -0.3263092041015625, -0.311798095703125, -0.2972869873046875, -0.28277587890625, -0.2682647705078125, -0.253753662109375, -0.2392425537109375, -0.2247314453125, -0.2102203369140625, -0.195709228515625, -0.1811981201171875, -0.16668701171875, -0.1521759033203125, -0.137664794921875, -0.1231536865234375, -0.108642578125, -0.0941314697265625, -0.079620361328125, -0.0651092529296875, -0.05059814453125, -0.0360870361328125, -0.021575927734375, -0.0070648193359375, 0.0074462890625, 0.0219573974609375, 0.036468505859375, 0.0509796142578125, 0.06549072265625, 0.0800018310546875, 0.094512939453125, 0.1090240478515625, 0.12353515625, 0.1380462646484375, 0.152557373046875, 0.1670684814453125, 0.18157958984375, 0.1960906982421875, 0.210601806640625, 0.2251129150390625, 0.2396240234375, 0.2541351318359375, 0.268646240234375, 0.2831573486328125, 0.29766845703125, 0.3121795654296875, 0.326690673828125, 0.3412017822265625, 0.355712890625, 0.3702239990234375, 0.384735107421875, 0.3992462158203125, 0.41375732421875, 0.4282684326171875, 0.442779541015625, 0.4572906494140625, 0.4718017578125, 0.4863128662109375, 0.500823974609375, 0.5153350830078125, 0.52984619140625, 0.5443572998046875, 0.558868408203125, 0.5733795166015625, 0.587890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 5.0, 16.0, 42.0, 167.0, 308.0, 288.0, 134.0, 36.0, 13.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9276905655860901, -0.7617236375808716, -0.5957567691802979, -0.42978987097740173, -0.2638229727745056, -0.09785610437393188, 0.06811082363128662, 0.23407775163650513, 0.40004462003707886, 0.5660115480422974, 0.7319784164428711, 0.8979452848434448, 1.0639121532440186, 1.2298791408538818, 1.3958460092544556, 1.5618128776550293, 1.7277798652648926, 1.8937467336654663, 2.05971360206604, 2.2256805896759033, 2.3916473388671875, 2.557614326477051, 2.723581314086914, 2.8895483016967773, 3.0555150508880615, 3.221482038497925, 3.387448787689209, 3.5534157752990723, 3.7193827629089355, 3.8853495121002197, 4.051316261291504, 4.217283248901367, 4.3832502365112305, 4.549217224121094, 4.715184211730957, 4.881150722503662, 5.047117710113525, 5.213084697723389, 5.379051685333252, 5.545018672943115, 5.71098518371582, 5.876952171325684, 6.042919158935547, 6.208885669708252, 6.374852657318115, 6.5408196449279785, 6.706786632537842, 6.872753620147705, 7.038720607757568, 7.204687595367432, 7.370654582977295, 7.53662109375, 7.702588081359863, 7.868555068969727, 8.03452205657959, 8.200489044189453, 8.366456031799316, 8.53242301940918, 8.698390007019043, 8.864356994628906, 9.03032398223877, 9.196290969848633, 9.36225700378418, 9.528223991394043, 9.694190979003906]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 11.0, 9.0, 13.0, 19.0, 20.0, 25.0, 24.0, 25.0, 27.0, 32.0, 35.0, 46.0, 39.0, 39.0, 39.0, 44.0, 45.0, 47.0, 41.0, 50.0, 38.0, 46.0, 32.0, 39.0, 25.0, 25.0, 28.0, 17.0, 20.0, 14.0, 14.0, 9.0, 13.0, 7.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8888269066810608, -0.8589125275611877, -0.8289980888366699, -0.7990837097167969, -0.7691693305969238, -0.739254891872406, -0.709340512752533, -0.6794260740280151, -0.6495116949081421, -0.619597315788269, -0.5896828770637512, -0.5597684979438782, -0.5298540592193604, -0.4999396800994873, -0.47002530097961426, -0.4401108920574188, -0.4101964831352234, -0.38028207421302795, -0.3503676652908325, -0.3204532861709595, -0.29053887724876404, -0.2606244683265686, -0.23071007430553436, -0.20079568028450012, -0.1708812713623047, -0.14096686244010925, -0.11105246841907501, -0.08113806694746017, -0.05122366547584534, -0.021309256553649902, 0.008605137467384338, 0.03851953148841858, 0.06843400001525879, 0.09834840148687363, 0.12826280295848846, 0.1581771969795227, 0.18809160590171814, 0.21800601482391357, 0.24792040884494781, 0.27783480286598206, 0.3077492117881775, 0.3376636207103729, 0.36757802963256836, 0.3974924087524414, 0.42740681767463684, 0.4573212265968323, 0.4872356057167053, 0.5171500444412231, 0.5470644235610962, 0.5769788026809692, 0.6068932414054871, 0.6368076205253601, 0.6667220592498779, 0.696636438369751, 0.726550817489624, 0.7564651966094971, 0.7863796353340149, 0.8162940144538879, 0.8462084531784058, 0.8761228322982788, 0.9060372114181519, 0.9359516501426697, 0.9658660292625427, 0.9957804679870605, 1.0256948471069336]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 8.0, 16.0, 28.0, 24.0, 42.0, 55.0, 77.0, 94.0, 171.0, 240.0, 440.0, 747.0, 1428.0, 2756.0, 5669.0, 12050.0, 27677.0, 64960.0, 154296.0, 293918.0, 263610.0, 125249.0, 52591.0, 22430.0, 10012.0, 4763.0, 2242.0, 1234.0, 638.0, 386.0, 233.0, 152.0, 65.0, 67.0, 36.0, 34.0, 16.0, 27.0, 12.0, 14.0, 13.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.326171875, -1.2817840576171875, -1.237396240234375, -1.1930084228515625, -1.14862060546875, -1.1042327880859375, -1.059844970703125, -1.0154571533203125, -0.9710693359375, -0.9266815185546875, -0.882293701171875, -0.8379058837890625, -0.79351806640625, -0.7491302490234375, -0.704742431640625, -0.6603546142578125, -0.615966796875, -0.5715789794921875, -0.527191162109375, -0.4828033447265625, -0.43841552734375, -0.3940277099609375, -0.349639892578125, -0.3052520751953125, -0.2608642578125, -0.2164764404296875, -0.172088623046875, -0.1277008056640625, -0.08331298828125, -0.0389251708984375, 0.005462646484375, 0.0498504638671875, 0.09423828125, 0.1386260986328125, 0.183013916015625, 0.2274017333984375, 0.27178955078125, 0.3161773681640625, 0.360565185546875, 0.4049530029296875, 0.4493408203125, 0.4937286376953125, 0.538116455078125, 0.5825042724609375, 0.62689208984375, 0.6712799072265625, 0.715667724609375, 0.7600555419921875, 0.804443359375, 0.8488311767578125, 0.893218994140625, 0.9376068115234375, 0.98199462890625, 1.0263824462890625, 1.070770263671875, 1.1151580810546875, 1.1595458984375, 1.2039337158203125, 1.248321533203125, 1.2927093505859375, 1.33709716796875, 1.3814849853515625, 1.425872802734375, 1.4702606201171875, 1.5146484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 10.0, 5.0, 11.0, 17.0, 18.0, 16.0, 25.0, 25.0, 28.0, 33.0, 34.0, 35.0, 36.0, 48.0, 40.0, 47.0, 57.0, 41.0, 47.0, 44.0, 46.0, 38.0, 42.0, 33.0, 35.0, 30.0, 26.0, 25.0, 24.0, 12.0, 15.0, 14.0, 7.0, 4.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.43896484375, -0.42620849609375, -0.4134521484375, -0.40069580078125, -0.387939453125, -0.37518310546875, -0.3624267578125, -0.34967041015625, -0.3369140625, -0.32415771484375, -0.3114013671875, -0.29864501953125, -0.285888671875, -0.27313232421875, -0.2603759765625, -0.24761962890625, -0.23486328125, -0.22210693359375, -0.2093505859375, -0.19659423828125, -0.183837890625, -0.17108154296875, -0.1583251953125, -0.14556884765625, -0.1328125, -0.12005615234375, -0.1072998046875, -0.09454345703125, -0.081787109375, -0.06903076171875, -0.0562744140625, -0.04351806640625, -0.03076171875, -0.01800537109375, -0.0052490234375, 0.00750732421875, 0.020263671875, 0.03302001953125, 0.0457763671875, 0.05853271484375, 0.0712890625, 0.08404541015625, 0.0968017578125, 0.10955810546875, 0.122314453125, 0.13507080078125, 0.1478271484375, 0.16058349609375, 0.17333984375, 0.18609619140625, 0.1988525390625, 0.21160888671875, 0.224365234375, 0.23712158203125, 0.2498779296875, 0.26263427734375, 0.275390625, 0.28814697265625, 0.3009033203125, 0.31365966796875, 0.326416015625, 0.33917236328125, 0.3519287109375, 0.36468505859375, 0.37744140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 7.0, 18.0, 27.0, 44.0, 64.0, 99.0, 158.0, 271.0, 450.0, 829.0, 1756.0, 5779.0, 35517.0, 446110.0, 507297.0, 40028.0, 6163.0, 1844.0, 904.0, 470.0, 242.0, 179.0, 106.0, 60.0, 36.0, 35.0, 21.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.8643798828125, -3.760009765625, -3.6556396484375, -3.55126953125, -3.4468994140625, -3.342529296875, -3.2381591796875, -3.1337890625, -3.0294189453125, -2.925048828125, -2.8206787109375, -2.71630859375, -2.6119384765625, -2.507568359375, -2.4031982421875, -2.298828125, -2.1944580078125, -2.090087890625, -1.9857177734375, -1.88134765625, -1.7769775390625, -1.672607421875, -1.5682373046875, -1.4638671875, -1.3594970703125, -1.255126953125, -1.1507568359375, -1.04638671875, -0.9420166015625, -0.837646484375, -0.7332763671875, -0.62890625, -0.5245361328125, -0.420166015625, -0.3157958984375, -0.21142578125, -0.1070556640625, -0.002685546875, 0.1016845703125, 0.2060546875, 0.3104248046875, 0.414794921875, 0.5191650390625, 0.62353515625, 0.7279052734375, 0.832275390625, 0.9366455078125, 1.041015625, 1.1453857421875, 1.249755859375, 1.3541259765625, 1.45849609375, 1.5628662109375, 1.667236328125, 1.7716064453125, 1.8759765625, 1.9803466796875, 2.084716796875, 2.1890869140625, 2.29345703125, 2.3978271484375, 2.502197265625, 2.6065673828125, 2.7109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 10.0, 7.0, 6.0, 11.0, 13.0, 15.0, 18.0, 26.0, 30.0, 20.0, 40.0, 44.0, 45.0, 50.0, 53.0, 47.0, 45.0, 55.0, 48.0, 39.0, 47.0, 36.0, 49.0, 47.0, 30.0, 34.0, 27.0, 24.0, 19.0, 9.0, 16.0, 7.0, 7.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.1881103515625, -2.118408203125, -2.0487060546875, -1.97900390625, -1.9093017578125, -1.839599609375, -1.7698974609375, -1.7001953125, -1.6304931640625, -1.560791015625, -1.4910888671875, -1.42138671875, -1.3516845703125, -1.281982421875, -1.2122802734375, -1.142578125, -1.0728759765625, -1.003173828125, -0.9334716796875, -0.86376953125, -0.7940673828125, -0.724365234375, -0.6546630859375, -0.5849609375, -0.5152587890625, -0.445556640625, -0.3758544921875, -0.30615234375, -0.2364501953125, -0.166748046875, -0.0970458984375, -0.02734375, 0.0423583984375, 0.112060546875, 0.1817626953125, 0.25146484375, 0.3211669921875, 0.390869140625, 0.4605712890625, 0.5302734375, 0.5999755859375, 0.669677734375, 0.7393798828125, 0.80908203125, 0.8787841796875, 0.948486328125, 1.0181884765625, 1.087890625, 1.1575927734375, 1.227294921875, 1.2969970703125, 1.36669921875, 1.4364013671875, 1.506103515625, 1.5758056640625, 1.6455078125, 1.7152099609375, 1.784912109375, 1.8546142578125, 1.92431640625, 1.9940185546875, 2.063720703125, 2.1334228515625, 2.203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 11.0, 6.0, 10.0, 13.0, 12.0, 32.0, 47.0, 73.0, 138.0, 255.0, 623.0, 1376.0, 3652.0, 12543.0, 57839.0, 436459.0, 456643.0, 59562.0, 12932.0, 3720.0, 1364.0, 596.0, 284.0, 139.0, 78.0, 47.0, 23.0, 20.0, 17.0, 8.0, 6.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.5263671875, -1.483978271484375, -1.44158935546875, -1.399200439453125, -1.3568115234375, -1.314422607421875, -1.27203369140625, -1.229644775390625, -1.187255859375, -1.144866943359375, -1.10247802734375, -1.060089111328125, -1.0177001953125, -0.975311279296875, -0.93292236328125, -0.890533447265625, -0.84814453125, -0.805755615234375, -0.76336669921875, -0.720977783203125, -0.6785888671875, -0.636199951171875, -0.59381103515625, -0.551422119140625, -0.509033203125, -0.466644287109375, -0.42425537109375, -0.381866455078125, -0.3394775390625, -0.297088623046875, -0.25469970703125, -0.212310791015625, -0.169921875, -0.127532958984375, -0.08514404296875, -0.042755126953125, -0.0003662109375, 0.042022705078125, 0.08441162109375, 0.126800537109375, 0.169189453125, 0.211578369140625, 0.25396728515625, 0.296356201171875, 0.3387451171875, 0.381134033203125, 0.42352294921875, 0.465911865234375, 0.50830078125, 0.550689697265625, 0.59307861328125, 0.635467529296875, 0.6778564453125, 0.720245361328125, 0.76263427734375, 0.805023193359375, 0.847412109375, 0.889801025390625, 0.93218994140625, 0.974578857421875, 1.0169677734375, 1.059356689453125, 1.10174560546875, 1.144134521484375, 1.1865234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 6.0, 19.0, 17.0, 19.0, 16.0, 23.0, 28.0, 41.0, 44.0, 60.0, 47.0, 70.0, 50.0, 61.0, 66.0, 61.0, 68.0, 36.0, 49.0, 36.0, 28.0, 23.0, 22.0, 22.0, 12.0, 15.0, 12.0, 6.0, 9.0, 2.0, 4.0, 4.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001556873321533203, -0.00015095993876457214, -0.00014623254537582397, -0.0001415051519870758, -0.00013677775859832764, -0.00013205036520957947, -0.0001273229718208313, -0.00012259557843208313, -0.00011786818504333496, -0.00011314079165458679, -0.00010841339826583862, -0.00010368600487709045, -9.895861148834229e-05, -9.423121809959412e-05, -8.950382471084595e-05, -8.477643132209778e-05, -8.004903793334961e-05, -7.532164454460144e-05, -7.059425115585327e-05, -6.58668577671051e-05, -6.113946437835693e-05, -5.6412070989608765e-05, -5.1684677600860596e-05, -4.695728421211243e-05, -4.222989082336426e-05, -3.750249743461609e-05, -3.277510404586792e-05, -2.804771065711975e-05, -2.3320317268371582e-05, -1.8592923879623413e-05, -1.3865530490875244e-05, -9.138137102127075e-06, -4.410743713378906e-06, 3.166496753692627e-07, 5.044043064117432e-06, 9.7714364528656e-06, 1.449882984161377e-05, 1.922622323036194e-05, 2.3953616619110107e-05, 2.8681010007858276e-05, 3.3408403396606445e-05, 3.8135796785354614e-05, 4.286319017410278e-05, 4.759058356285095e-05, 5.231797695159912e-05, 5.704537034034729e-05, 6.177276372909546e-05, 6.650015711784363e-05, 7.12275505065918e-05, 7.595494389533997e-05, 8.068233728408813e-05, 8.54097306728363e-05, 9.013712406158447e-05, 9.486451745033264e-05, 9.959191083908081e-05, 0.00010431930422782898, 0.00010904669761657715, 0.00011377409100532532, 0.00011850148439407349, 0.00012322887778282166, 0.00012795627117156982, 0.000132683664560318, 0.00013741105794906616, 0.00014213845133781433, 0.0001468658447265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 8.0, 11.0, 10.0, 10.0, 27.0, 39.0, 63.0, 115.0, 249.0, 408.0, 958.0, 2506.0, 10170.0, 108726.0, 818725.0, 92901.0, 9495.0, 2278.0, 901.0, 375.0, 205.0, 133.0, 83.0, 41.0, 29.0, 21.0, 16.0, 8.0, 3.0, 7.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.8362274169921875, -1.775970458984375, -1.7157135009765625, -1.65545654296875, -1.5951995849609375, -1.534942626953125, -1.4746856689453125, -1.4144287109375, -1.3541717529296875, -1.293914794921875, -1.2336578369140625, -1.17340087890625, -1.1131439208984375, -1.052886962890625, -0.9926300048828125, -0.932373046875, -0.8721160888671875, -0.811859130859375, -0.7516021728515625, -0.69134521484375, -0.6310882568359375, -0.570831298828125, -0.5105743408203125, -0.4503173828125, -0.3900604248046875, -0.329803466796875, -0.2695465087890625, -0.20928955078125, -0.1490325927734375, -0.088775634765625, -0.0285186767578125, 0.03173828125, 0.0919952392578125, 0.152252197265625, 0.2125091552734375, 0.27276611328125, 0.3330230712890625, 0.393280029296875, 0.4535369873046875, 0.5137939453125, 0.5740509033203125, 0.634307861328125, 0.6945648193359375, 0.75482177734375, 0.8150787353515625, 0.875335693359375, 0.9355926513671875, 0.995849609375, 1.0561065673828125, 1.116363525390625, 1.1766204833984375, 1.23687744140625, 1.2971343994140625, 1.357391357421875, 1.4176483154296875, 1.4779052734375, 1.5381622314453125, 1.598419189453125, 1.6586761474609375, 1.71893310546875, 1.7791900634765625, 1.839447021484375, 1.8997039794921875, 1.9599609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 7.0, 13.0, 23.0, 29.0, 37.0, 53.0, 70.0, 107.0, 93.0, 102.0, 100.0, 91.0, 61.0, 48.0, 41.0, 30.0, 20.0, 17.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.487579345703125, -1.44781494140625, -1.408050537109375, -1.3682861328125, -1.328521728515625, -1.28875732421875, -1.248992919921875, -1.209228515625, -1.169464111328125, -1.12969970703125, -1.089935302734375, -1.0501708984375, -1.010406494140625, -0.97064208984375, -0.930877685546875, -0.89111328125, -0.851348876953125, -0.81158447265625, -0.771820068359375, -0.7320556640625, -0.692291259765625, -0.65252685546875, -0.612762451171875, -0.572998046875, -0.533233642578125, -0.49346923828125, -0.453704833984375, -0.4139404296875, -0.374176025390625, -0.33441162109375, -0.294647216796875, -0.2548828125, -0.215118408203125, -0.17535400390625, -0.135589599609375, -0.0958251953125, -0.056060791015625, -0.01629638671875, 0.023468017578125, 0.063232421875, 0.102996826171875, 0.14276123046875, 0.182525634765625, 0.2222900390625, 0.262054443359375, 0.30181884765625, 0.341583251953125, 0.38134765625, 0.421112060546875, 0.46087646484375, 0.500640869140625, 0.5404052734375, 0.580169677734375, 0.61993408203125, 0.659698486328125, 0.699462890625, 0.739227294921875, 0.77899169921875, 0.818756103515625, 0.8585205078125, 0.898284912109375, 0.93804931640625, 0.977813720703125, 1.017578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 6.0, 9.0, 7.0, 15.0, 16.0, 27.0, 45.0, 87.0, 95.0, 118.0, 132.0, 126.0, 115.0, 81.0, 52.0, 27.0, 16.0, 5.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.357519149780273, -9.861992835998535, -9.366466522216797, -8.870939254760742, -8.375412940979004, -7.879886627197266, -7.384360313415527, -6.888833999633789, -6.393307209014893, -5.897780895233154, -5.402254104614258, -4.9067277908325195, -4.411201477050781, -3.9156746864318848, -3.4201483726501465, -2.924621820449829, -2.4290952682495117, -1.9335687160491943, -1.4380422830581665, -0.9425158500671387, -0.4469892978668213, 0.048537254333496094, 0.5440635681152344, 1.0395901203155518, 1.5351166725158691, 2.0306432247161865, 2.526169776916504, 3.021696090698242, 3.5172226428985596, 4.012749195098877, 4.508275508880615, 5.003802299499512, 5.49932861328125, 5.994854927062988, 6.490381717681885, 6.985908031463623, 7.4814348220825195, 7.976961135864258, 8.472487449645996, 8.968013763427734, 9.463541030883789, 9.959067344665527, 10.454593658447266, 10.95012092590332, 11.445647239685059, 11.941173553466797, 12.436699867248535, 12.932226181030273, 13.427752494812012, 13.92327880859375, 14.418805122375488, 14.914331436157227, 15.409858703613281, 15.90538501739502, 16.400911331176758, 16.896438598632812, 17.391963958740234, 17.88749122619629, 18.38301658630371, 18.878543853759766, 19.374069213867188, 19.869596481323242, 20.365123748779297, 20.86064910888672, 21.356176376342773]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 6.0, 4.0, 6.0, 13.0, 9.0, 13.0, 14.0, 23.0, 34.0, 24.0, 32.0, 44.0, 38.0, 45.0, 51.0, 59.0, 48.0, 57.0, 61.0, 55.0, 52.0, 43.0, 34.0, 27.0, 40.0, 36.0, 27.0, 15.0, 20.0, 16.0, 13.0, 10.0, 4.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.27833366394043, -12.89414119720459, -12.50994873046875, -12.12575626373291, -11.74156379699707, -11.357370376586914, -10.97317886352539, -10.588985443115234, -10.204792976379395, -9.820600509643555, -9.436408042907715, -9.052215576171875, -8.668023109436035, -8.283830642700195, -7.899637699127197, -7.515444755554199, -7.131252765655518, -6.747060298919678, -6.362867832183838, -5.97867488861084, -5.594482421875, -5.21028995513916, -4.82609748840332, -4.4419050216674805, -4.057712554931641, -3.673520088195801, -3.289327383041382, -2.905134916305542, -2.520942211151123, -2.136749744415283, -1.7525572776794434, -1.3683645725250244, -0.9841718673706055, -0.5999792814254761, -0.21578675508499146, 0.16840577125549316, 0.5525983572006226, 0.936790943145752, 1.3209834098815918, 1.7051761150360107, 2.0893685817718506, 2.4735610485076904, 2.8577537536621094, 3.241946220397949, 3.626138687133789, 4.010331153869629, 4.394523620605469, 4.778716564178467, 5.162909030914307, 5.5471014976501465, 5.931293964385986, 6.315486907958984, 6.699679374694824, 7.083871841430664, 7.468064308166504, 7.852256774902344, 8.236449241638184, 8.620641708374023, 9.004834175109863, 9.389026641845703, 9.773219108581543, 10.157411575317383, 10.541604995727539, 10.925797462463379, 11.309989929199219]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 13.0, 17.0, 17.0, 39.0, 45.0, 79.0, 92.0, 160.0, 347.0, 858.0, 2889.0, 23263.0, 4153174.0, 9981.0, 1938.0, 629.0, 297.0, 152.0, 91.0, 57.0, 47.0, 23.0, 30.0, 14.0, 6.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.240966796875, -9.94287109375, -9.644775390625, -9.3466796875, -9.048583984375, -8.75048828125, -8.452392578125, -8.154296875, -7.856201171875, -7.55810546875, -7.260009765625, -6.9619140625, -6.663818359375, -6.36572265625, -6.067626953125, -5.76953125, -5.471435546875, -5.17333984375, -4.875244140625, -4.5771484375, -4.279052734375, -3.98095703125, -3.682861328125, -3.384765625, -3.086669921875, -2.78857421875, -2.490478515625, -2.1923828125, -1.894287109375, -1.59619140625, -1.298095703125, -1.0, -0.701904296875, -0.40380859375, -0.105712890625, 0.1923828125, 0.490478515625, 0.78857421875, 1.086669921875, 1.384765625, 1.682861328125, 1.98095703125, 2.279052734375, 2.5771484375, 2.875244140625, 3.17333984375, 3.471435546875, 3.76953125, 4.067626953125, 4.36572265625, 4.663818359375, 4.9619140625, 5.260009765625, 5.55810546875, 5.856201171875, 6.154296875, 6.452392578125, 6.75048828125, 7.048583984375, 7.3466796875, 7.644775390625, 7.94287109375, 8.240966796875, 8.5390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 14.0, 15.0, 21.0, 26.0, 29.0, 31.0, 25.0, 36.0, 52.0, 48.0, 51.0, 61.0, 52.0, 67.0, 58.0, 55.0, 62.0, 46.0, 33.0, 34.0, 43.0, 23.0, 19.0, 16.0, 8.0, 13.0, 9.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4556465148925781, -0.43985748291015625, -0.4240684509277344, -0.4082794189453125, -0.3924903869628906, -0.37670135498046875, -0.3609123229980469, -0.345123291015625, -0.3293342590332031, -0.31354522705078125, -0.2977561950683594, -0.2819671630859375, -0.2661781311035156, -0.25038909912109375, -0.23460006713867188, -0.21881103515625, -0.20302200317382812, -0.18723297119140625, -0.17144393920898438, -0.1556549072265625, -0.13986587524414062, -0.12407684326171875, -0.10828781127929688, -0.092498779296875, -0.07670974731445312, -0.06092071533203125, -0.045131683349609375, -0.0293426513671875, -0.013553619384765625, 0.00223541259765625, 0.018024444580078125, 0.0338134765625, 0.049602508544921875, 0.06539154052734375, 0.08118057250976562, 0.0969696044921875, 0.11275863647460938, 0.12854766845703125, 0.14433670043945312, 0.160125732421875, 0.17591476440429688, 0.19170379638671875, 0.20749282836914062, 0.2232818603515625, 0.23907089233398438, 0.25485992431640625, 0.2706489562988281, 0.28643798828125, 0.3022270202636719, 0.31801605224609375, 0.3338050842285156, 0.3495941162109375, 0.3653831481933594, 0.38117218017578125, 0.3969612121582031, 0.412750244140625, 0.4285392761230469, 0.44432830810546875, 0.4601173400878906, 0.4759063720703125, 0.4916954040527344, 0.5074844360351562, 0.5232734680175781, 0.5390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 7.0, 10.0, 10.0, 20.0, 20.0, 25.0, 35.0, 47.0, 79.0, 91.0, 138.0, 172.0, 239.0, 336.0, 398.0, 573.0, 817.0, 1258.0, 1883.0, 3037.0, 5392.0, 10289.0, 29552.0, 364165.0, 3711262.0, 37091.0, 11719.0, 5772.0, 3271.0, 2030.0, 1345.0, 850.0, 620.0, 432.0, 297.0, 232.0, 180.0, 129.0, 113.0, 83.0, 58.0, 46.0, 37.0, 33.0, 21.0, 14.0, 14.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6279296875, -1.5738067626953125, -1.519683837890625, -1.4655609130859375, -1.41143798828125, -1.3573150634765625, -1.303192138671875, -1.2490692138671875, -1.1949462890625, -1.1408233642578125, -1.086700439453125, -1.0325775146484375, -0.97845458984375, -0.9243316650390625, -0.870208740234375, -0.8160858154296875, -0.761962890625, -0.7078399658203125, -0.653717041015625, -0.5995941162109375, -0.54547119140625, -0.4913482666015625, -0.437225341796875, -0.3831024169921875, -0.3289794921875, -0.2748565673828125, -0.220733642578125, -0.1666107177734375, -0.11248779296875, -0.0583648681640625, -0.004241943359375, 0.0498809814453125, 0.10400390625, 0.1581268310546875, 0.212249755859375, 0.2663726806640625, 0.32049560546875, 0.3746185302734375, 0.428741455078125, 0.4828643798828125, 0.5369873046875, 0.5911102294921875, 0.645233154296875, 0.6993560791015625, 0.75347900390625, 0.8076019287109375, 0.861724853515625, 0.9158477783203125, 0.969970703125, 1.0240936279296875, 1.078216552734375, 1.1323394775390625, 1.18646240234375, 1.2405853271484375, 1.294708251953125, 1.3488311767578125, 1.4029541015625, 1.4570770263671875, 1.511199951171875, 1.5653228759765625, 1.61944580078125, 1.6735687255859375, 1.727691650390625, 1.7818145751953125, 1.8359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 15.0, 17.0, 36.0, 106.0, 3356.0, 375.0, 65.0, 35.0, 14.0, 5.0, 12.0, 8.0, 7.0, 2.0, 0.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61572265625, -0.5936203002929688, -0.5715179443359375, -0.5494155883789062, -0.527313232421875, -0.5052108764648438, -0.4831085205078125, -0.46100616455078125, -0.43890380859375, -0.41680145263671875, -0.3946990966796875, -0.37259674072265625, -0.350494384765625, -0.32839202880859375, -0.3062896728515625, -0.28418731689453125, -0.2620849609375, -0.23998260498046875, -0.2178802490234375, -0.19577789306640625, -0.173675537109375, -0.15157318115234375, -0.1294708251953125, -0.10736846923828125, -0.08526611328125, -0.06316375732421875, -0.0410614013671875, -0.01895904541015625, 0.003143310546875, 0.02524566650390625, 0.0473480224609375, 0.06945037841796875, 0.091552734375, 0.11365509033203125, 0.1357574462890625, 0.15785980224609375, 0.179962158203125, 0.20206451416015625, 0.2241668701171875, 0.24626922607421875, 0.26837158203125, 0.29047393798828125, 0.3125762939453125, 0.33467864990234375, 0.356781005859375, 0.37888336181640625, 0.4009857177734375, 0.42308807373046875, 0.4451904296875, 0.46729278564453125, 0.4893951416015625, 0.5114974975585938, 0.533599853515625, 0.5557022094726562, 0.5778045654296875, 0.5999069213867188, 0.62200927734375, 0.6441116333007812, 0.6662139892578125, 0.6883163452148438, 0.710418701171875, 0.7325210571289062, 0.7546234130859375, 0.7767257690429688, 0.798828125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 22.0, 39.0, 85.0, 115.0, 161.0, 184.0, 156.0, 98.0, 60.0, 33.0, 12.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6858787536621094, -2.5830469131469727, -2.480215072631836, -2.377383232116699, -2.2745513916015625, -2.171719551086426, -2.068887710571289, -1.966055989265442, -1.8632241487503052, -1.7603923082351685, -1.6575604677200317, -1.5547287464141846, -1.4518969058990479, -1.3490650653839111, -1.2462332248687744, -1.1434013843536377, -1.040569543838501, -0.9377377033233643, -0.8349058628082275, -0.7320740818977356, -0.6292422413825989, -0.5264104008674622, -0.4235786199569702, -0.3207467794418335, -0.21791493892669678, -0.11508311331272125, -0.012251287698745728, 0.0905805230140686, 0.19341236352920532, 0.29624420404434204, 0.399075984954834, 0.5019078254699707, 0.6047396659851074, 0.7075715065002441, 0.8104033470153809, 0.9132351279258728, 1.0160670280456543, 1.118898868560791, 1.2217305898666382, 1.324562430381775, 1.4273942708969116, 1.5302261114120483, 1.633057951927185, 1.7358896732330322, 1.838721513748169, 1.9415533542633057, 2.0443851947784424, 2.147217035293579, 2.250048875808716, 2.3528807163238525, 2.4557125568389893, 2.558544397354126, 2.6613762378692627, 2.7642080783843994, 2.867039680480957, 2.9698715209960938, 3.0727033615112305, 3.175535202026367, 3.278367042541504, 3.3811988830566406, 3.4840307235717773, 3.586862564086914, 3.689694404602051, 3.7925262451171875, 3.895358085632324]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 12.0, 17.0, 10.0, 32.0, 36.0, 31.0, 44.0, 54.0, 69.0, 76.0, 84.0, 63.0, 79.0, 65.0, 62.0, 47.0, 42.0, 41.0, 30.0, 25.0, 27.0, 19.0, 9.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2540318965911865, -1.1996937990188599, -1.1453555822372437, -1.091017484664917, -1.0366792678833008, -0.9823411703109741, -0.9280030727386475, -0.873664915561676, -0.8193267583847046, -0.7649886012077332, -0.7106504440307617, -0.6563123464584351, -0.6019741892814636, -0.5476360321044922, -0.49329790472984314, -0.4389597773551941, -0.38462162017822266, -0.3302834630012512, -0.2759453356266022, -0.22160719335079193, -0.1672690510749817, -0.11293089389801025, -0.058592766523361206, -0.004254639148712158, 0.05008351802825928, 0.10442166030406952, 0.15875980257987976, 0.21309794485569, 0.26743608713150024, 0.3217742443084717, 0.3761123716831207, 0.4304504990577698, 0.4847886562347412, 0.5391268134117126, 0.5934649705886841, 0.6478030681610107, 0.7021412253379822, 0.7564793825149536, 0.8108174800872803, 0.8651556372642517, 0.9194937944412231, 0.9738319516181946, 1.028170108795166, 1.0825082063674927, 1.1368463039398193, 1.1911845207214355, 1.2455226182937622, 1.2998607158660889, 1.354198932647705, 1.4085370302200317, 1.462875247001648, 1.5172133445739746, 1.5715515613555908, 1.6258896589279175, 1.6802277565002441, 1.7345659732818604, 1.788904070854187, 1.8432421684265137, 1.8975803852081299, 1.9519184827804565, 2.006256580352783, 2.0605947971343994, 2.1149330139160156, 2.1692709922790527, 2.223609209060669]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 10.0, 18.0, 22.0, 27.0, 43.0, 47.0, 82.0, 110.0, 184.0, 272.0, 448.0, 786.0, 1286.0, 2335.0, 4525.0, 8945.0, 18157.0, 39538.0, 89461.0, 199169.0, 304606.0, 205620.0, 93439.0, 41257.0, 18716.0, 9043.0, 4571.0, 2353.0, 1365.0, 784.0, 467.0, 283.0, 188.0, 124.0, 72.0, 50.0, 29.0, 23.0, 27.0, 19.0, 9.0, 6.0, 5.0, 7.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.998046875, -0.9663848876953125, -0.934722900390625, -0.9030609130859375, -0.87139892578125, -0.8397369384765625, -0.808074951171875, -0.7764129638671875, -0.7447509765625, -0.7130889892578125, -0.681427001953125, -0.6497650146484375, -0.61810302734375, -0.5864410400390625, -0.554779052734375, -0.5231170654296875, -0.491455078125, -0.4597930908203125, -0.428131103515625, -0.3964691162109375, -0.36480712890625, -0.3331451416015625, -0.301483154296875, -0.2698211669921875, -0.2381591796875, -0.2064971923828125, -0.174835205078125, -0.1431732177734375, -0.11151123046875, -0.0798492431640625, -0.048187255859375, -0.0165252685546875, 0.01513671875, 0.0467987060546875, 0.078460693359375, 0.1101226806640625, 0.14178466796875, 0.1734466552734375, 0.205108642578125, 0.2367706298828125, 0.2684326171875, 0.3000946044921875, 0.331756591796875, 0.3634185791015625, 0.39508056640625, 0.4267425537109375, 0.458404541015625, 0.4900665283203125, 0.521728515625, 0.5533905029296875, 0.585052490234375, 0.6167144775390625, 0.64837646484375, 0.6800384521484375, 0.711700439453125, 0.7433624267578125, 0.7750244140625, 0.8066864013671875, 0.838348388671875, 0.8700103759765625, 0.90167236328125, 0.9333343505859375, 0.964996337890625, 0.9966583251953125, 1.0283203125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 12.0, 21.0, 27.0, 27.0, 30.0, 20.0, 42.0, 49.0, 40.0, 47.0, 54.0, 64.0, 53.0, 66.0, 51.0, 53.0, 56.0, 36.0, 28.0, 44.0, 36.0, 19.0, 18.0, 17.0, 11.0, 9.0, 5.0, 4.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.51123046875, -0.4953460693359375, -0.479461669921875, -0.4635772705078125, -0.44769287109375, -0.4318084716796875, -0.415924072265625, -0.4000396728515625, -0.3841552734375, -0.3682708740234375, -0.352386474609375, -0.3365020751953125, -0.32061767578125, -0.3047332763671875, -0.288848876953125, -0.2729644775390625, -0.257080078125, -0.2411956787109375, -0.225311279296875, -0.2094268798828125, -0.19354248046875, -0.1776580810546875, -0.161773681640625, -0.1458892822265625, -0.1300048828125, -0.1141204833984375, -0.098236083984375, -0.0823516845703125, -0.06646728515625, -0.0505828857421875, -0.034698486328125, -0.0188140869140625, -0.0029296875, 0.0129547119140625, 0.028839111328125, 0.0447235107421875, 0.06060791015625, 0.0764923095703125, 0.092376708984375, 0.1082611083984375, 0.1241455078125, 0.1400299072265625, 0.155914306640625, 0.1717987060546875, 0.18768310546875, 0.2035675048828125, 0.219451904296875, 0.2353363037109375, 0.251220703125, 0.2671051025390625, 0.282989501953125, 0.2988739013671875, 0.31475830078125, 0.3306427001953125, 0.346527099609375, 0.3624114990234375, 0.3782958984375, 0.3941802978515625, 0.410064697265625, 0.4259490966796875, 0.44183349609375, 0.4577178955078125, 0.473602294921875, 0.4894866943359375, 0.50537109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 14.0, 13.0, 11.0, 39.0, 50.0, 73.0, 162.0, 253.0, 425.0, 781.0, 1714.0, 4851.0, 44383.0, 807355.0, 173337.0, 10287.0, 2392.0, 1057.0, 586.0, 327.0, 165.0, 107.0, 57.0, 38.0, 23.0, 23.0, 3.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.75390625, -2.654510498046875, -2.55511474609375, -2.455718994140625, -2.3563232421875, -2.256927490234375, -2.15753173828125, -2.058135986328125, -1.958740234375, -1.859344482421875, -1.75994873046875, -1.660552978515625, -1.5611572265625, -1.461761474609375, -1.36236572265625, -1.262969970703125, -1.16357421875, -1.064178466796875, -0.96478271484375, -0.865386962890625, -0.7659912109375, -0.666595458984375, -0.56719970703125, -0.467803955078125, -0.368408203125, -0.269012451171875, -0.16961669921875, -0.070220947265625, 0.0291748046875, 0.128570556640625, 0.22796630859375, 0.327362060546875, 0.4267578125, 0.526153564453125, 0.62554931640625, 0.724945068359375, 0.8243408203125, 0.923736572265625, 1.02313232421875, 1.122528076171875, 1.221923828125, 1.321319580078125, 1.42071533203125, 1.520111083984375, 1.6195068359375, 1.718902587890625, 1.81829833984375, 1.917694091796875, 2.01708984375, 2.116485595703125, 2.21588134765625, 2.315277099609375, 2.4146728515625, 2.514068603515625, 2.61346435546875, 2.712860107421875, 2.812255859375, 2.911651611328125, 3.01104736328125, 3.110443115234375, 3.2098388671875, 3.309234619140625, 3.40863037109375, 3.508026123046875, 3.607421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 9.0, 7.0, 14.0, 16.0, 22.0, 11.0, 15.0, 33.0, 35.0, 47.0, 42.0, 48.0, 52.0, 46.0, 55.0, 63.0, 69.0, 63.0, 48.0, 35.0, 33.0, 47.0, 31.0, 40.0, 25.0, 20.0, 13.0, 9.0, 11.0, 12.0, 8.0, 8.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.258270263671875, -2.18646240234375, -2.114654541015625, -2.0428466796875, -1.971038818359375, -1.89923095703125, -1.827423095703125, -1.755615234375, -1.683807373046875, -1.61199951171875, -1.540191650390625, -1.4683837890625, -1.396575927734375, -1.32476806640625, -1.252960205078125, -1.18115234375, -1.109344482421875, -1.03753662109375, -0.965728759765625, -0.8939208984375, -0.822113037109375, -0.75030517578125, -0.678497314453125, -0.606689453125, -0.534881591796875, -0.46307373046875, -0.391265869140625, -0.3194580078125, -0.247650146484375, -0.17584228515625, -0.104034423828125, -0.0322265625, 0.039581298828125, 0.11138916015625, 0.183197021484375, 0.2550048828125, 0.326812744140625, 0.39862060546875, 0.470428466796875, 0.542236328125, 0.614044189453125, 0.68585205078125, 0.757659912109375, 0.8294677734375, 0.901275634765625, 0.97308349609375, 1.044891357421875, 1.11669921875, 1.188507080078125, 1.26031494140625, 1.332122802734375, 1.4039306640625, 1.475738525390625, 1.54754638671875, 1.619354248046875, 1.691162109375, 1.762969970703125, 1.83477783203125, 1.906585693359375, 1.9783935546875, 2.050201416015625, 2.12200927734375, 2.193817138671875, 2.265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 14.0, 8.0, 13.0, 17.0, 19.0, 23.0, 33.0, 47.0, 47.0, 78.0, 78.0, 150.0, 216.0, 338.0, 553.0, 1002.0, 2003.0, 4155.0, 10877.0, 35655.0, 186806.0, 623610.0, 137439.0, 28561.0, 8927.0, 3602.0, 1694.0, 954.0, 544.0, 324.0, 223.0, 165.0, 85.0, 68.0, 41.0, 25.0, 24.0, 24.0, 26.0, 13.0, 14.0, 14.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.0986328125, -1.0647430419921875, -1.030853271484375, -0.9969635009765625, -0.96307373046875, -0.9291839599609375, -0.895294189453125, -0.8614044189453125, -0.8275146484375, -0.7936248779296875, -0.759735107421875, -0.7258453369140625, -0.69195556640625, -0.6580657958984375, -0.624176025390625, -0.5902862548828125, -0.556396484375, -0.5225067138671875, -0.488616943359375, -0.4547271728515625, -0.42083740234375, -0.3869476318359375, -0.353057861328125, -0.3191680908203125, -0.2852783203125, -0.2513885498046875, -0.217498779296875, -0.1836090087890625, -0.14971923828125, -0.1158294677734375, -0.081939697265625, -0.0480499267578125, -0.01416015625, 0.0197296142578125, 0.053619384765625, 0.0875091552734375, 0.12139892578125, 0.1552886962890625, 0.189178466796875, 0.2230682373046875, 0.2569580078125, 0.2908477783203125, 0.324737548828125, 0.3586273193359375, 0.39251708984375, 0.4264068603515625, 0.460296630859375, 0.4941864013671875, 0.528076171875, 0.5619659423828125, 0.595855712890625, 0.6297454833984375, 0.66363525390625, 0.6975250244140625, 0.731414794921875, 0.7653045654296875, 0.7991943359375, 0.8330841064453125, 0.866973876953125, 0.9008636474609375, 0.93475341796875, 0.9686431884765625, 1.002532958984375, 1.0364227294921875, 1.0703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 20.0, 34.0, 27.0, 38.0, 45.0, 63.0, 71.0, 87.0, 75.0, 80.0, 78.0, 72.0, 42.0, 47.0, 41.0, 29.0, 21.0, 23.0, 9.0, 15.0, 5.0, 11.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016307830810546875, -0.0001577623188495636, -0.00015244632959365845, -0.0001471303403377533, -0.00014181435108184814, -0.000136498361825943, -0.00013118237257003784, -0.0001258663833141327, -0.00012055039405822754, -0.00011523440480232239, -0.00010991841554641724, -0.00010460242629051208, -9.928643703460693e-05, -9.397044777870178e-05, -8.865445852279663e-05, -8.333846926689148e-05, -7.802248001098633e-05, -7.270649075508118e-05, -6.739050149917603e-05, -6.207451224327087e-05, -5.675852298736572e-05, -5.144253373146057e-05, -4.612654447555542e-05, -4.081055521965027e-05, -3.549456596374512e-05, -3.0178576707839966e-05, -2.4862587451934814e-05, -1.9546598196029663e-05, -1.4230608940124512e-05, -8.91461968421936e-06, -3.598630428314209e-06, 1.7173588275909424e-06, 7.033348083496094e-06, 1.2349337339401245e-05, 1.7665326595306396e-05, 2.2981315851211548e-05, 2.82973051071167e-05, 3.361329436302185e-05, 3.8929283618927e-05, 4.424527287483215e-05, 4.9561262130737305e-05, 5.4877251386642456e-05, 6.019324064254761e-05, 6.550922989845276e-05, 7.082521915435791e-05, 7.614120841026306e-05, 8.145719766616821e-05, 8.677318692207336e-05, 9.208917617797852e-05, 9.740516543388367e-05, 0.00010272115468978882, 0.00010803714394569397, 0.00011335313320159912, 0.00011866912245750427, 0.00012398511171340942, 0.00012930110096931458, 0.00013461709022521973, 0.00013993307948112488, 0.00014524906873703003, 0.00015056505799293518, 0.00015588104724884033, 0.00016119703650474548, 0.00016651302576065063, 0.00017182901501655579, 0.00017714500427246094]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 10.0, 15.0, 17.0, 41.0, 79.0, 160.0, 291.0, 681.0, 1897.0, 7804.0, 97713.0, 891119.0, 41138.0, 5063.0, 1425.0, 556.0, 239.0, 120.0, 61.0, 35.0, 29.0, 15.0, 11.0, 10.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.853515625, -2.76800537109375, -2.6824951171875, -2.59698486328125, -2.511474609375, -2.42596435546875, -2.3404541015625, -2.25494384765625, -2.16943359375, -2.08392333984375, -1.9984130859375, -1.91290283203125, -1.827392578125, -1.74188232421875, -1.6563720703125, -1.57086181640625, -1.4853515625, -1.39984130859375, -1.3143310546875, -1.22882080078125, -1.143310546875, -1.05780029296875, -0.9722900390625, -0.88677978515625, -0.80126953125, -0.71575927734375, -0.6302490234375, -0.54473876953125, -0.459228515625, -0.37371826171875, -0.2882080078125, -0.20269775390625, -0.1171875, -0.03167724609375, 0.0538330078125, 0.13934326171875, 0.224853515625, 0.31036376953125, 0.3958740234375, 0.48138427734375, 0.56689453125, 0.65240478515625, 0.7379150390625, 0.82342529296875, 0.908935546875, 0.99444580078125, 1.0799560546875, 1.16546630859375, 1.2509765625, 1.33648681640625, 1.4219970703125, 1.50750732421875, 1.593017578125, 1.67852783203125, 1.7640380859375, 1.84954833984375, 1.93505859375, 2.02056884765625, 2.1060791015625, 2.19158935546875, 2.277099609375, 2.36260986328125, 2.4481201171875, 2.53363037109375, 2.619140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 14.0, 17.0, 27.0, 38.0, 62.0, 102.0, 110.0, 112.0, 135.0, 116.0, 67.0, 48.0, 41.0, 30.0, 24.0, 14.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6611328125, -1.6173095703125, -1.573486328125, -1.5296630859375, -1.48583984375, -1.4420166015625, -1.398193359375, -1.3543701171875, -1.310546875, -1.2667236328125, -1.222900390625, -1.1790771484375, -1.13525390625, -1.0914306640625, -1.047607421875, -1.0037841796875, -0.9599609375, -0.9161376953125, -0.872314453125, -0.8284912109375, -0.78466796875, -0.7408447265625, -0.697021484375, -0.6531982421875, -0.609375, -0.5655517578125, -0.521728515625, -0.4779052734375, -0.43408203125, -0.3902587890625, -0.346435546875, -0.3026123046875, -0.2587890625, -0.2149658203125, -0.171142578125, -0.1273193359375, -0.08349609375, -0.0396728515625, 0.004150390625, 0.0479736328125, 0.091796875, 0.1356201171875, 0.179443359375, 0.2232666015625, 0.26708984375, 0.3109130859375, 0.354736328125, 0.3985595703125, 0.4423828125, 0.4862060546875, 0.530029296875, 0.5738525390625, 0.61767578125, 0.6614990234375, 0.705322265625, 0.7491455078125, 0.79296875, 0.8367919921875, 0.880615234375, 0.9244384765625, 0.96826171875, 1.0120849609375, 1.055908203125, 1.0997314453125, 1.1435546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 18.0, 38.0, 95.0, 214.0, 336.0, 197.0, 71.0, 23.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.997406005859375, -53.73543930053711, -52.473472595214844, -51.21150588989258, -49.94953918457031, -48.68757247924805, -47.42560577392578, -46.16364288330078, -44.90167236328125, -43.639705657958984, -42.37773895263672, -41.11577224731445, -39.85380554199219, -38.59183883666992, -37.329872131347656, -36.067909240722656, -34.80594253540039, -33.543975830078125, -32.28200912475586, -31.020042419433594, -29.758075714111328, -28.496109008789062, -27.23414421081543, -25.972177505493164, -24.7102108001709, -23.448244094848633, -22.186277389526367, -20.9243106842041, -19.66234588623047, -18.400379180908203, -17.138412475585938, -15.876445770263672, -14.614479064941406, -13.35251235961914, -12.090545654296875, -10.828579902648926, -9.56661319732666, -8.304646492004395, -7.042680263519287, -5.78071403503418, -4.518747329711914, -3.2567808628082275, -1.994814395904541, -0.7328479290008545, 0.529118537902832, 1.7910852432250977, 3.053051471710205, 4.3150177001953125, 5.576984405517578, 6.838951110839844, 8.10091781616211, 9.362883567810059, 10.624850273132324, 11.88681697845459, 13.148782730102539, 14.410749435424805, 15.67271614074707, 16.934682846069336, 18.1966495513916, 19.458616256713867, 20.7205810546875, 21.982547760009766, 23.24451446533203, 24.506481170654297, 25.768447875976562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 7.0, 5.0, 13.0, 23.0, 13.0, 20.0, 21.0, 35.0, 38.0, 32.0, 34.0, 41.0, 51.0, 42.0, 42.0, 54.0, 49.0, 54.0, 50.0, 60.0, 37.0, 42.0, 34.0, 35.0, 32.0, 22.0, 23.0, 12.0, 12.0, 17.0, 10.0, 7.0, 5.0, 7.0, 2.0, 6.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.820595741271973, -10.512228965759277, -10.203863143920898, -9.895496368408203, -9.587129592895508, -9.278763771057129, -8.970396995544434, -8.662031173706055, -8.35366439819336, -8.045297622680664, -7.736931800842285, -7.42856502532959, -7.120198726654053, -6.811832427978516, -6.50346565246582, -6.195099353790283, -5.886733055114746, -5.578366756439209, -5.270000457763672, -4.961633682250977, -4.6532673835754395, -4.344901084899902, -4.036534309387207, -3.72816801071167, -3.419801712036133, -3.1114354133605957, -2.8030688762664795, -2.4947023391723633, -2.186336040496826, -1.8779696226119995, -1.5696032047271729, -1.2612366676330566, -0.9528703689575195, -0.6445039510726929, -0.3361375331878662, -0.02777111530303955, 0.2805953025817871, 0.5889617204666138, 0.8973281383514404, 1.2056946754455566, 1.5140609741210938, 1.8224273920059204, 2.130793809890747, 2.4391603469848633, 2.7475266456604004, 3.0558929443359375, 3.3642594814300537, 3.67262601852417, 3.980992317199707, 4.289358615875244, 4.597724914550781, 4.906091690063477, 5.214457988739014, 5.522824287414551, 5.831191062927246, 6.139557361602783, 6.44792366027832, 6.756289958953857, 7.0646562576293945, 7.37302303314209, 7.681389331817627, 7.989755630493164, 8.29812240600586, 8.606489181518555, 8.914855003356934]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 11.0, 11.0, 19.0, 26.0, 35.0, 67.0, 98.0, 175.0, 364.0, 812.0, 3505.0, 4158087.0, 27903.0, 1901.0, 580.0, 277.0, 142.0, 84.0, 69.0, 30.0, 26.0, 7.0, 14.0, 8.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.7890625, -12.43212890625, -12.0751953125, -11.71826171875, -11.361328125, -11.00439453125, -10.6474609375, -10.29052734375, -9.93359375, -9.57666015625, -9.2197265625, -8.86279296875, -8.505859375, -8.14892578125, -7.7919921875, -7.43505859375, -7.078125, -6.72119140625, -6.3642578125, -6.00732421875, -5.650390625, -5.29345703125, -4.9365234375, -4.57958984375, -4.22265625, -3.86572265625, -3.5087890625, -3.15185546875, -2.794921875, -2.43798828125, -2.0810546875, -1.72412109375, -1.3671875, -1.01025390625, -0.6533203125, -0.29638671875, 0.060546875, 0.41748046875, 0.7744140625, 1.13134765625, 1.48828125, 1.84521484375, 2.2021484375, 2.55908203125, 2.916015625, 3.27294921875, 3.6298828125, 3.98681640625, 4.34375, 4.70068359375, 5.0576171875, 5.41455078125, 5.771484375, 6.12841796875, 6.4853515625, 6.84228515625, 7.19921875, 7.55615234375, 7.9130859375, 8.27001953125, 8.626953125, 8.98388671875, 9.3408203125, 9.69775390625, 10.0546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 9.0, 10.0, 18.0, 17.0, 26.0, 31.0, 35.0, 48.0, 47.0, 62.0, 65.0, 79.0, 69.0, 79.0, 64.0, 66.0, 46.0, 63.0, 36.0, 32.0, 20.0, 20.0, 12.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.82080078125, -0.8004226684570312, -0.7800445556640625, -0.7596664428710938, -0.739288330078125, -0.7189102172851562, -0.6985321044921875, -0.6781539916992188, -0.65777587890625, -0.6373977661132812, -0.6170196533203125, -0.5966415405273438, -0.576263427734375, -0.5558853149414062, -0.5355072021484375, -0.5151290893554688, -0.4947509765625, -0.47437286376953125, -0.4539947509765625, -0.43361663818359375, -0.413238525390625, -0.39286041259765625, -0.3724822998046875, -0.35210418701171875, -0.33172607421875, -0.31134796142578125, -0.2909698486328125, -0.27059173583984375, -0.250213623046875, -0.22983551025390625, -0.2094573974609375, -0.18907928466796875, -0.168701171875, -0.14832305908203125, -0.1279449462890625, -0.10756683349609375, -0.087188720703125, -0.06681060791015625, -0.0464324951171875, -0.02605438232421875, -0.00567626953125, 0.01470184326171875, 0.0350799560546875, 0.05545806884765625, 0.075836181640625, 0.09621429443359375, 0.1165924072265625, 0.13697052001953125, 0.1573486328125, 0.17772674560546875, 0.1981048583984375, 0.21848297119140625, 0.238861083984375, 0.25923919677734375, 0.2796173095703125, 0.29999542236328125, 0.32037353515625, 0.34075164794921875, 0.3611297607421875, 0.38150787353515625, 0.401885986328125, 0.42226409912109375, 0.4426422119140625, 0.46302032470703125, 0.4833984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 8.0, 12.0, 18.0, 38.0, 35.0, 69.0, 63.0, 120.0, 176.0, 241.0, 360.0, 496.0, 781.0, 1130.0, 1873.0, 3095.0, 6144.0, 16125.0, 199071.0, 3927313.0, 20599.0, 7099.0, 3512.0, 1957.0, 1274.0, 869.0, 580.0, 359.0, 255.0, 170.0, 127.0, 89.0, 50.0, 59.0, 33.0, 13.0, 22.0, 11.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.5521697998046875, -1.496917724609375, -1.4416656494140625, -1.38641357421875, -1.3311614990234375, -1.275909423828125, -1.2206573486328125, -1.1654052734375, -1.1101531982421875, -1.054901123046875, -0.9996490478515625, -0.94439697265625, -0.8891448974609375, -0.833892822265625, -0.7786407470703125, -0.723388671875, -0.6681365966796875, -0.612884521484375, -0.5576324462890625, -0.50238037109375, -0.4471282958984375, -0.391876220703125, -0.3366241455078125, -0.2813720703125, -0.2261199951171875, -0.170867919921875, -0.1156158447265625, -0.06036376953125, -0.0051116943359375, 0.050140380859375, 0.1053924560546875, 0.16064453125, 0.2158966064453125, 0.271148681640625, 0.3264007568359375, 0.38165283203125, 0.4369049072265625, 0.492156982421875, 0.5474090576171875, 0.6026611328125, 0.6579132080078125, 0.713165283203125, 0.7684173583984375, 0.82366943359375, 0.8789215087890625, 0.934173583984375, 0.9894256591796875, 1.044677734375, 1.0999298095703125, 1.155181884765625, 1.2104339599609375, 1.26568603515625, 1.3209381103515625, 1.376190185546875, 1.4314422607421875, 1.4866943359375, 1.5419464111328125, 1.597198486328125, 1.6524505615234375, 1.70770263671875, 1.7629547119140625, 1.818206787109375, 1.8734588623046875, 1.9287109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 20.0, 48.0, 213.0, 3630.0, 59.0, 35.0, 12.0, 10.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.493743896484375, -0.47625732421875, -0.458770751953125, -0.4412841796875, -0.423797607421875, -0.40631103515625, -0.388824462890625, -0.371337890625, -0.353851318359375, -0.33636474609375, -0.318878173828125, -0.3013916015625, -0.283905029296875, -0.26641845703125, -0.248931884765625, -0.2314453125, -0.213958740234375, -0.19647216796875, -0.178985595703125, -0.1614990234375, -0.144012451171875, -0.12652587890625, -0.109039306640625, -0.091552734375, -0.074066162109375, -0.05657958984375, -0.039093017578125, -0.0216064453125, -0.004119873046875, 0.01336669921875, 0.030853271484375, 0.04833984375, 0.065826416015625, 0.08331298828125, 0.100799560546875, 0.1182861328125, 0.135772705078125, 0.15325927734375, 0.170745849609375, 0.188232421875, 0.205718994140625, 0.22320556640625, 0.240692138671875, 0.2581787109375, 0.275665283203125, 0.29315185546875, 0.310638427734375, 0.328125, 0.345611572265625, 0.36309814453125, 0.380584716796875, 0.3980712890625, 0.415557861328125, 0.43304443359375, 0.450531005859375, 0.468017578125, 0.485504150390625, 0.50299072265625, 0.520477294921875, 0.5379638671875, 0.555450439453125, 0.57293701171875, 0.590423583984375, 0.60791015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 8.0, 13.0, 14.0, 36.0, 55.0, 64.0, 91.0, 122.0, 125.0, 114.0, 109.0, 82.0, 60.0, 37.0, 25.0, 16.0, 8.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.923123836517334, -1.8708850145339966, -1.8186461925506592, -1.7664073705673218, -1.7141685485839844, -1.661929726600647, -1.6096909046173096, -1.5574522018432617, -1.5052132606506348, -1.4529744386672974, -1.40073561668396, -1.3484967947006226, -1.2962579727172852, -1.2440191507339478, -1.1917803287506104, -1.1395416259765625, -1.087302803993225, -1.0350639820098877, -0.9828251600265503, -0.9305863380432129, -0.8783475160598755, -0.8261086940765381, -0.7738699316978455, -0.7216311097145081, -0.6693922877311707, -0.6171534657478333, -0.5649146437644958, -0.5126758813858032, -0.46043702960014343, -0.40819820761680603, -0.355959415435791, -0.3037205934524536, -0.2514817714691162, -0.1992429494857788, -0.1470041424036026, -0.09476533532142639, -0.04252651333808899, 0.009712308645248413, 0.06195110082626343, 0.11418992280960083, 0.16642874479293823, 0.21866756677627563, 0.27090638875961304, 0.32314518094062805, 0.37538400292396545, 0.42762282490730286, 0.47986161708831787, 0.5321004390716553, 0.5843392610549927, 0.6365780830383301, 0.6888169050216675, 0.7410557270050049, 0.7932945489883423, 0.8455333709716797, 0.8977721333503723, 0.9500109553337097, 1.0022497177124023, 1.0544885396957397, 1.1067273616790771, 1.1589661836624146, 1.211205005645752, 1.2634438276290894, 1.3156826496124268, 1.3679213523864746, 1.4201602935791016]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 6.0, 12.0, 14.0, 13.0, 16.0, 28.0, 30.0, 39.0, 35.0, 36.0, 79.0, 51.0, 55.0, 56.0, 70.0, 53.0, 62.0, 54.0, 50.0, 43.0, 44.0, 30.0, 25.0, 15.0, 24.0, 12.0, 14.0, 10.0, 7.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7469944357872009, -0.7120823264122009, -0.6771702766418457, -0.6422581672668457, -0.6073460578918457, -0.5724339485168457, -0.5375218391418457, -0.5026097893714905, -0.4676976799964905, -0.4327855706214905, -0.39787349104881287, -0.36296141147613525, -0.32804930210113525, -0.29313719272613525, -0.25822511315345764, -0.22331301867961884, -0.18840092420578003, -0.15348882973194122, -0.11857673525810242, -0.08366464078426361, -0.048752546310424805, -0.013840451836585999, 0.021071642637252808, 0.055983737111091614, 0.09089583158493042, 0.12580792605876923, 0.16072002053260803, 0.19563211500644684, 0.23054420948028564, 0.26545631885528564, 0.30036839842796326, 0.33528047800064087, 0.3701925277709961, 0.4051046371459961, 0.4400167167186737, 0.4749287962913513, 0.5098409056663513, 0.5447530150413513, 0.5796650648117065, 0.6145771741867065, 0.6494892835617065, 0.6844013929367065, 0.7193135023117065, 0.7542255520820618, 0.7891376614570618, 0.8240497708320618, 0.858961820602417, 0.893873929977417, 0.928786039352417, 0.963698148727417, 0.998610258102417, 1.033522367477417, 1.068434476852417, 1.1033464670181274, 1.1382585763931274, 1.1731706857681274, 1.2080827951431274, 1.2429949045181274, 1.2779070138931274, 1.3128191232681274, 1.347731113433838, 1.382643222808838, 1.417555332183838, 1.452467441558838, 1.487379550933838]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 1.0, 7.0, 18.0, 19.0, 18.0, 39.0, 52.0, 88.0, 128.0, 242.0, 475.0, 919.0, 1815.0, 4136.0, 9789.0, 25095.0, 69456.0, 206105.0, 435822.0, 190161.0, 64153.0, 23355.0, 9150.0, 3875.0, 1713.0, 833.0, 443.0, 254.0, 137.0, 75.0, 53.0, 44.0, 29.0, 17.0, 13.0, 7.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8612442016601562, -0.8245391845703125, -0.7878341674804688, -0.751129150390625, -0.7144241333007812, -0.6777191162109375, -0.6410140991210938, -0.60430908203125, -0.5676040649414062, -0.5308990478515625, -0.49419403076171875, -0.457489013671875, -0.42078399658203125, -0.3840789794921875, -0.34737396240234375, -0.3106689453125, -0.27396392822265625, -0.2372589111328125, -0.20055389404296875, -0.163848876953125, -0.12714385986328125, -0.0904388427734375, -0.05373382568359375, -0.01702880859375, 0.01967620849609375, 0.0563812255859375, 0.09308624267578125, 0.129791259765625, 0.16649627685546875, 0.2032012939453125, 0.23990631103515625, 0.276611328125, 0.31331634521484375, 0.3500213623046875, 0.38672637939453125, 0.423431396484375, 0.46013641357421875, 0.4968414306640625, 0.5335464477539062, 0.57025146484375, 0.6069564819335938, 0.6436614990234375, 0.6803665161132812, 0.717071533203125, 0.7537765502929688, 0.7904815673828125, 0.8271865844726562, 0.8638916015625, 0.9005966186523438, 0.9373016357421875, 0.9740066528320312, 1.010711669921875, 1.0474166870117188, 1.0841217041015625, 1.1208267211914062, 1.15753173828125, 1.1942367553710938, 1.2309417724609375, 1.2676467895507812, 1.304351806640625, 1.3410568237304688, 1.3777618408203125, 1.4144668579101562, 1.451171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 8.0, 6.0, 7.0, 11.0, 18.0, 24.0, 28.0, 33.0, 42.0, 46.0, 55.0, 58.0, 64.0, 85.0, 69.0, 69.0, 75.0, 53.0, 46.0, 59.0, 37.0, 31.0, 19.0, 18.0, 14.0, 3.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.81451416015625, -0.7930908203125, -0.77166748046875, -0.750244140625, -0.72882080078125, -0.7073974609375, -0.68597412109375, -0.66455078125, -0.64312744140625, -0.6217041015625, -0.60028076171875, -0.578857421875, -0.55743408203125, -0.5360107421875, -0.51458740234375, -0.4931640625, -0.47174072265625, -0.4503173828125, -0.42889404296875, -0.407470703125, -0.38604736328125, -0.3646240234375, -0.34320068359375, -0.32177734375, -0.30035400390625, -0.2789306640625, -0.25750732421875, -0.236083984375, -0.21466064453125, -0.1932373046875, -0.17181396484375, -0.150390625, -0.12896728515625, -0.1075439453125, -0.08612060546875, -0.064697265625, -0.04327392578125, -0.0218505859375, -0.00042724609375, 0.02099609375, 0.04241943359375, 0.0638427734375, 0.08526611328125, 0.106689453125, 0.12811279296875, 0.1495361328125, 0.17095947265625, 0.1923828125, 0.21380615234375, 0.2352294921875, 0.25665283203125, 0.278076171875, 0.29949951171875, 0.3209228515625, 0.34234619140625, 0.36376953125, 0.38519287109375, 0.4066162109375, 0.42803955078125, 0.449462890625, 0.47088623046875, 0.4923095703125, 0.51373291015625, 0.53515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 16.0, 27.0, 23.0, 47.0, 60.0, 87.0, 115.0, 186.0, 219.0, 442.0, 648.0, 1147.0, 2569.0, 9606.0, 90286.0, 818316.0, 108101.0, 10651.0, 2812.0, 1209.0, 635.0, 458.0, 281.0, 189.0, 131.0, 91.0, 53.0, 36.0, 38.0, 18.0, 12.0, 10.0, 6.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.32708740234375, -2.2576904296875, -2.18829345703125, -2.118896484375, -2.04949951171875, -1.9801025390625, -1.91070556640625, -1.84130859375, -1.77191162109375, -1.7025146484375, -1.63311767578125, -1.563720703125, -1.49432373046875, -1.4249267578125, -1.35552978515625, -1.2861328125, -1.21673583984375, -1.1473388671875, -1.07794189453125, -1.008544921875, -0.93914794921875, -0.8697509765625, -0.80035400390625, -0.73095703125, -0.66156005859375, -0.5921630859375, -0.52276611328125, -0.453369140625, -0.38397216796875, -0.3145751953125, -0.24517822265625, -0.17578125, -0.10638427734375, -0.0369873046875, 0.03240966796875, 0.101806640625, 0.17120361328125, 0.2406005859375, 0.30999755859375, 0.37939453125, 0.44879150390625, 0.5181884765625, 0.58758544921875, 0.656982421875, 0.72637939453125, 0.7957763671875, 0.86517333984375, 0.9345703125, 1.00396728515625, 1.0733642578125, 1.14276123046875, 1.212158203125, 1.28155517578125, 1.3509521484375, 1.42034912109375, 1.48974609375, 1.55914306640625, 1.6285400390625, 1.69793701171875, 1.767333984375, 1.83673095703125, 1.9061279296875, 1.97552490234375, 2.044921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 8.0, 5.0, 10.0, 14.0, 11.0, 11.0, 24.0, 31.0, 28.0, 36.0, 29.0, 35.0, 35.0, 41.0, 44.0, 41.0, 61.0, 51.0, 37.0, 42.0, 42.0, 52.0, 44.0, 45.0, 24.0, 36.0, 21.0, 23.0, 22.0, 18.0, 13.0, 13.0, 9.0, 6.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8683319091796875, -1.804046630859375, -1.7397613525390625, -1.67547607421875, -1.6111907958984375, -1.546905517578125, -1.4826202392578125, -1.4183349609375, -1.3540496826171875, -1.289764404296875, -1.2254791259765625, -1.16119384765625, -1.0969085693359375, -1.032623291015625, -0.9683380126953125, -0.904052734375, -0.8397674560546875, -0.775482177734375, -0.7111968994140625, -0.64691162109375, -0.5826263427734375, -0.518341064453125, -0.4540557861328125, -0.3897705078125, -0.3254852294921875, -0.261199951171875, -0.1969146728515625, -0.13262939453125, -0.0683441162109375, -0.004058837890625, 0.0602264404296875, 0.12451171875, 0.1887969970703125, 0.253082275390625, 0.3173675537109375, 0.38165283203125, 0.4459381103515625, 0.510223388671875, 0.5745086669921875, 0.6387939453125, 0.7030792236328125, 0.767364501953125, 0.8316497802734375, 0.89593505859375, 0.9602203369140625, 1.024505615234375, 1.0887908935546875, 1.153076171875, 1.2173614501953125, 1.281646728515625, 1.3459320068359375, 1.41021728515625, 1.4745025634765625, 1.538787841796875, 1.6030731201171875, 1.6673583984375, 1.7316436767578125, 1.795928955078125, 1.8602142333984375, 1.92449951171875, 1.9887847900390625, 2.053070068359375, 2.1173553466796875, 2.181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 6.0, 8.0, 12.0, 12.0, 18.0, 20.0, 27.0, 48.0, 76.0, 126.0, 218.0, 406.0, 1240.0, 7635.0, 208627.0, 809317.0, 17322.0, 2155.0, 594.0, 253.0, 144.0, 104.0, 54.0, 40.0, 24.0, 23.0, 14.0, 9.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.95703125, -1.89215087890625, -1.8272705078125, -1.76239013671875, -1.697509765625, -1.63262939453125, -1.5677490234375, -1.50286865234375, -1.43798828125, -1.37310791015625, -1.3082275390625, -1.24334716796875, -1.178466796875, -1.11358642578125, -1.0487060546875, -0.98382568359375, -0.9189453125, -0.85406494140625, -0.7891845703125, -0.72430419921875, -0.659423828125, -0.59454345703125, -0.5296630859375, -0.46478271484375, -0.39990234375, -0.33502197265625, -0.2701416015625, -0.20526123046875, -0.140380859375, -0.07550048828125, -0.0106201171875, 0.05426025390625, 0.119140625, 0.18402099609375, 0.2489013671875, 0.31378173828125, 0.378662109375, 0.44354248046875, 0.5084228515625, 0.57330322265625, 0.63818359375, 0.70306396484375, 0.7679443359375, 0.83282470703125, 0.897705078125, 0.96258544921875, 1.0274658203125, 1.09234619140625, 1.1572265625, 1.22210693359375, 1.2869873046875, 1.35186767578125, 1.416748046875, 1.48162841796875, 1.5465087890625, 1.61138916015625, 1.67626953125, 1.74114990234375, 1.8060302734375, 1.87091064453125, 1.935791015625, 2.00067138671875, 2.0655517578125, 2.13043212890625, 2.1953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 15.0, 14.0, 16.0, 18.0, 29.0, 30.0, 60.0, 55.0, 85.0, 117.0, 141.0, 111.0, 66.0, 53.0, 45.0, 34.0, 34.0, 13.0, 14.0, 11.0, 7.0, 11.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017380714416503906, -0.00016842782497406006, -0.00016304850578308105, -0.00015766918659210205, -0.00015228986740112305, -0.00014691054821014404, -0.00014153122901916504, -0.00013615190982818604, -0.00013077259063720703, -0.00012539327144622803, -0.00012001395225524902, -0.00011463463306427002, -0.00010925531387329102, -0.00010387599468231201, -9.849667549133301e-05, -9.3117356300354e-05, -8.7738037109375e-05, -8.2358717918396e-05, -7.697939872741699e-05, -7.160007953643799e-05, -6.622076034545898e-05, -6.084144115447998e-05, -5.5462121963500977e-05, -5.008280277252197e-05, -4.470348358154297e-05, -3.9324164390563965e-05, -3.394484519958496e-05, -2.8565526008605957e-05, -2.3186206817626953e-05, -1.780688762664795e-05, -1.2427568435668945e-05, -7.048249244689941e-06, -1.6689300537109375e-06, 3.7103891372680664e-06, 9.08970832824707e-06, 1.4469027519226074e-05, 1.9848346710205078e-05, 2.5227665901184082e-05, 3.0606985092163086e-05, 3.598630428314209e-05, 4.1365623474121094e-05, 4.67449426651001e-05, 5.21242618560791e-05, 5.7503581047058105e-05, 6.288290023803711e-05, 6.826221942901611e-05, 7.364153861999512e-05, 7.902085781097412e-05, 8.440017700195312e-05, 8.977949619293213e-05, 9.515881538391113e-05, 0.00010053813457489014, 0.00010591745376586914, 0.00011129677295684814, 0.00011667609214782715, 0.00012205541133880615, 0.00012743473052978516, 0.00013281404972076416, 0.00013819336891174316, 0.00014357268810272217, 0.00014895200729370117, 0.00015433132648468018, 0.00015971064567565918, 0.00016508996486663818, 0.0001704692840576172]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 8.0, 4.0, 12.0, 16.0, 23.0, 41.0, 59.0, 104.0, 166.0, 269.0, 494.0, 1069.0, 2783.0, 9899.0, 64817.0, 774618.0, 169400.0, 17615.0, 4110.0, 1482.0, 697.0, 370.0, 182.0, 91.0, 70.0, 53.0, 32.0, 20.0, 14.0, 11.0, 8.0, 3.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.384765625, -1.3423919677734375, -1.300018310546875, -1.2576446533203125, -1.21527099609375, -1.1728973388671875, -1.130523681640625, -1.0881500244140625, -1.0457763671875, -1.0034027099609375, -0.961029052734375, -0.9186553955078125, -0.87628173828125, -0.8339080810546875, -0.791534423828125, -0.7491607666015625, -0.706787109375, -0.6644134521484375, -0.622039794921875, -0.5796661376953125, -0.53729248046875, -0.4949188232421875, -0.452545166015625, -0.4101715087890625, -0.3677978515625, -0.3254241943359375, -0.283050537109375, -0.2406768798828125, -0.19830322265625, -0.1559295654296875, -0.113555908203125, -0.0711822509765625, -0.02880859375, 0.0135650634765625, 0.055938720703125, 0.0983123779296875, 0.14068603515625, 0.1830596923828125, 0.225433349609375, 0.2678070068359375, 0.3101806640625, 0.3525543212890625, 0.394927978515625, 0.4373016357421875, 0.47967529296875, 0.5220489501953125, 0.564422607421875, 0.6067962646484375, 0.649169921875, 0.6915435791015625, 0.733917236328125, 0.7762908935546875, 0.81866455078125, 0.8610382080078125, 0.903411865234375, 0.9457855224609375, 0.9881591796875, 1.0305328369140625, 1.072906494140625, 1.1152801513671875, 1.15765380859375, 1.2000274658203125, 1.242401123046875, 1.2847747802734375, 1.3271484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 6.0, 13.0, 8.0, 9.0, 13.0, 20.0, 28.0, 35.0, 59.0, 73.0, 94.0, 104.0, 105.0, 98.0, 82.0, 73.0, 51.0, 22.0, 24.0, 18.0, 17.0, 15.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2265625, -1.1961212158203125, -1.165679931640625, -1.1352386474609375, -1.10479736328125, -1.0743560791015625, -1.043914794921875, -1.0134735107421875, -0.9830322265625, -0.9525909423828125, -0.922149658203125, -0.8917083740234375, -0.86126708984375, -0.8308258056640625, -0.800384521484375, -0.7699432373046875, -0.739501953125, -0.7090606689453125, -0.678619384765625, -0.6481781005859375, -0.61773681640625, -0.5872955322265625, -0.556854248046875, -0.5264129638671875, -0.4959716796875, -0.4655303955078125, -0.435089111328125, -0.4046478271484375, -0.37420654296875, -0.3437652587890625, -0.313323974609375, -0.2828826904296875, -0.25244140625, -0.2220001220703125, -0.191558837890625, -0.1611175537109375, -0.13067626953125, -0.1002349853515625, -0.069793701171875, -0.0393524169921875, -0.0089111328125, 0.0215301513671875, 0.051971435546875, 0.0824127197265625, 0.11285400390625, 0.1432952880859375, 0.173736572265625, 0.2041778564453125, 0.234619140625, 0.2650604248046875, 0.295501708984375, 0.3259429931640625, 0.35638427734375, 0.3868255615234375, 0.417266845703125, 0.4477081298828125, 0.4781494140625, 0.5085906982421875, 0.539031982421875, 0.5694732666015625, 0.59991455078125, 0.6303558349609375, 0.660797119140625, 0.6912384033203125, 0.7216796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 27.0, 76.0, 210.0, 309.0, 239.0, 98.0, 27.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.731754302978516, -38.856903076171875, -37.982051849365234, -37.107200622558594, -36.23234939575195, -35.35749816894531, -34.482643127441406, -33.607791900634766, -32.732940673828125, -31.858089447021484, -30.983238220214844, -30.108386993408203, -29.23353385925293, -28.35868263244629, -27.48383140563965, -26.608980178833008, -25.734128952026367, -24.859277725219727, -23.984426498413086, -23.109573364257812, -22.234722137451172, -21.35987091064453, -20.48501968383789, -19.61016845703125, -18.73531723022461, -17.86046600341797, -16.985614776611328, -16.110763549804688, -15.235910415649414, -14.361059188842773, -13.486207962036133, -12.611356735229492, -11.736505508422852, -10.861654281616211, -9.986802101135254, -9.111950874328613, -8.237098693847656, -7.362247467041016, -6.487396240234375, -5.612544536590576, -4.737692832946777, -3.8628411293029785, -2.987989664077759, -2.113138198852539, -1.2382864952087402, -0.3634347915649414, 0.5114164352416992, 1.386268138885498, 2.261119842529297, 3.1359715461730957, 4.0108232498168945, 4.885674476623535, 5.760526180267334, 6.635377883911133, 7.510229110717773, 8.385080337524414, 9.259932518005371, 10.134783744812012, 11.009635925292969, 11.88448715209961, 12.75933837890625, 13.634190559387207, 14.509041786193848, 15.383893966674805, 16.258745193481445]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 13.0, 6.0, 12.0, 19.0, 16.0, 25.0, 31.0, 23.0, 26.0, 33.0, 29.0, 46.0, 52.0, 53.0, 55.0, 52.0, 51.0, 41.0, 46.0, 45.0, 46.0, 34.0, 33.0, 29.0, 24.0, 19.0, 19.0, 14.0, 15.0, 16.0, 10.0, 10.0, 7.0, 9.0, 2.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.301469802856445, -8.998381614685059, -8.695293426513672, -8.392206192016602, -8.089118003845215, -7.786029815673828, -7.482941627502441, -7.179853439331055, -6.876765251159668, -6.573677062988281, -6.270589351654053, -5.967501163482666, -5.664412975311279, -5.361325263977051, -5.058237075805664, -4.755148887634277, -4.452061176300049, -4.148972988128662, -3.8458850383758545, -3.542797088623047, -3.23970890045166, -2.9366209506988525, -2.633533000946045, -2.330444812774658, -2.0273568630218506, -1.7242687940597534, -1.4211807250976562, -1.1180927753448486, -0.8150047063827515, -0.5119166374206543, -0.20882868766784668, 0.09425950050354004, 0.39734745025634766, 0.7004355192184448, 1.003523588180542, 1.3066115379333496, 1.6096996068954468, 1.912787675857544, 2.2158756256103516, 2.5189638137817383, 2.822051763534546, 3.1251397132873535, 3.4282279014587402, 3.731315851211548, 4.0344038009643555, 4.337491989135742, 4.640580177307129, 4.943668365478516, 5.246756076812744, 5.549844264984131, 5.852931976318359, 6.156020164489746, 6.459108352661133, 6.7621965408325195, 7.065284252166748, 7.368372440338135, 7.671460151672363, 7.97454833984375, 8.277636528015137, 8.580724716186523, 8.883811950683594, 9.18690013885498, 9.489988327026367, 9.793076515197754, 10.09616470336914]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 19.0, 32.0, 43.0, 58.0, 90.0, 161.0, 289.0, 810.0, 4558.0, 4080419.0, 103645.0, 2885.0, 608.0, 243.0, 133.0, 86.0, 55.0, 39.0, 29.0, 17.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.0, -8.756103515625, -8.51220703125, -8.268310546875, -8.0244140625, -7.780517578125, -7.53662109375, -7.292724609375, -7.048828125, -6.804931640625, -6.56103515625, -6.317138671875, -6.0732421875, -5.829345703125, -5.58544921875, -5.341552734375, -5.09765625, -4.853759765625, -4.60986328125, -4.365966796875, -4.1220703125, -3.878173828125, -3.63427734375, -3.390380859375, -3.146484375, -2.902587890625, -2.65869140625, -2.414794921875, -2.1708984375, -1.927001953125, -1.68310546875, -1.439208984375, -1.1953125, -0.951416015625, -0.70751953125, -0.463623046875, -0.2197265625, 0.024169921875, 0.26806640625, 0.511962890625, 0.755859375, 0.999755859375, 1.24365234375, 1.487548828125, 1.7314453125, 1.975341796875, 2.21923828125, 2.463134765625, 2.70703125, 2.950927734375, 3.19482421875, 3.438720703125, 3.6826171875, 3.926513671875, 4.17041015625, 4.414306640625, 4.658203125, 4.902099609375, 5.14599609375, 5.389892578125, 5.6337890625, 5.877685546875, 6.12158203125, 6.365478515625, 6.609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 2.0, 14.0, 3.0, 20.0, 17.0, 26.0, 20.0, 19.0, 23.0, 37.0, 46.0, 48.0, 52.0, 50.0, 51.0, 61.0, 67.0, 64.0, 50.0, 49.0, 45.0, 33.0, 41.0, 26.0, 23.0, 24.0, 18.0, 10.0, 13.0, 13.0, 9.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5634765625, -0.5485038757324219, -0.5335311889648438, -0.5185585021972656, -0.5035858154296875, -0.4886131286621094, -0.47364044189453125, -0.4586677551269531, -0.443695068359375, -0.4287223815917969, -0.41374969482421875, -0.3987770080566406, -0.3838043212890625, -0.3688316345214844, -0.35385894775390625, -0.3388862609863281, -0.32391357421875, -0.3089408874511719, -0.29396820068359375, -0.2789955139160156, -0.2640228271484375, -0.24905014038085938, -0.23407745361328125, -0.21910476684570312, -0.204132080078125, -0.18915939331054688, -0.17418670654296875, -0.15921401977539062, -0.1442413330078125, -0.12926864624023438, -0.11429595947265625, -0.09932327270507812, -0.0843505859375, -0.06937789916992188, -0.05440521240234375, -0.039432525634765625, -0.0244598388671875, -0.009487152099609375, 0.00548553466796875, 0.020458221435546875, 0.035430908203125, 0.050403594970703125, 0.06537628173828125, 0.08034896850585938, 0.0953216552734375, 0.11029434204101562, 0.12526702880859375, 0.14023971557617188, 0.15521240234375, 0.17018508911132812, 0.18515777587890625, 0.20013046264648438, 0.2151031494140625, 0.23007583618164062, 0.24504852294921875, 0.2600212097167969, 0.274993896484375, 0.2899665832519531, 0.30493927001953125, 0.3199119567871094, 0.3348846435546875, 0.3498573303222656, 0.36483001708984375, 0.3798027038574219, 0.394775390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 9.0, 10.0, 22.0, 33.0, 47.0, 70.0, 97.0, 133.0, 235.0, 414.0, 731.0, 1510.0, 3152.0, 7969.0, 34204.0, 4027888.0, 96913.0, 12190.0, 4403.0, 2033.0, 958.0, 498.0, 245.0, 175.0, 112.0, 47.0, 45.0, 37.0, 34.0, 20.0, 12.0, 7.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6433868408203125, -1.576812744140625, -1.5102386474609375, -1.44366455078125, -1.3770904541015625, -1.310516357421875, -1.2439422607421875, -1.1773681640625, -1.1107940673828125, -1.044219970703125, -0.9776458740234375, -0.91107177734375, -0.8444976806640625, -0.777923583984375, -0.7113494873046875, -0.644775390625, -0.5782012939453125, -0.511627197265625, -0.4450531005859375, -0.37847900390625, -0.3119049072265625, -0.245330810546875, -0.1787567138671875, -0.1121826171875, -0.0456085205078125, 0.020965576171875, 0.0875396728515625, 0.15411376953125, 0.2206878662109375, 0.287261962890625, 0.3538360595703125, 0.42041015625, 0.4869842529296875, 0.553558349609375, 0.6201324462890625, 0.68670654296875, 0.7532806396484375, 0.819854736328125, 0.8864288330078125, 0.9530029296875, 1.0195770263671875, 1.086151123046875, 1.1527252197265625, 1.21929931640625, 1.2858734130859375, 1.352447509765625, 1.4190216064453125, 1.485595703125, 1.5521697998046875, 1.618743896484375, 1.6853179931640625, 1.75189208984375, 1.8184661865234375, 1.885040283203125, 1.9516143798828125, 2.0181884765625, 2.0847625732421875, 2.151336669921875, 2.2179107666015625, 2.28448486328125, 2.3510589599609375, 2.417633056640625, 2.4842071533203125, 2.55078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 10.0, 9.0, 37.0, 88.0, 379.0, 3272.0, 133.0, 52.0, 29.0, 15.0, 7.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8064422607421875, -0.778900146484375, -0.7513580322265625, -0.72381591796875, -0.6962738037109375, -0.668731689453125, -0.6411895751953125, -0.6136474609375, -0.5861053466796875, -0.558563232421875, -0.5310211181640625, -0.50347900390625, -0.4759368896484375, -0.448394775390625, -0.4208526611328125, -0.393310546875, -0.3657684326171875, -0.338226318359375, -0.3106842041015625, -0.28314208984375, -0.2555999755859375, -0.228057861328125, -0.2005157470703125, -0.1729736328125, -0.1454315185546875, -0.117889404296875, -0.0903472900390625, -0.06280517578125, -0.0352630615234375, -0.007720947265625, 0.0198211669921875, 0.04736328125, 0.0749053955078125, 0.102447509765625, 0.1299896240234375, 0.15753173828125, 0.1850738525390625, 0.212615966796875, 0.2401580810546875, 0.2677001953125, 0.2952423095703125, 0.322784423828125, 0.3503265380859375, 0.37786865234375, 0.4054107666015625, 0.432952880859375, 0.4604949951171875, 0.488037109375, 0.5155792236328125, 0.543121337890625, 0.5706634521484375, 0.59820556640625, 0.6257476806640625, 0.653289794921875, 0.6808319091796875, 0.7083740234375, 0.7359161376953125, 0.763458251953125, 0.7910003662109375, 0.81854248046875, 0.8460845947265625, 0.873626708984375, 0.9011688232421875, 0.9287109375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 20.0, 29.0, 45.0, 71.0, 120.0, 157.0, 181.0, 118.0, 81.0, 61.0, 33.0, 22.0, 15.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3088436126708984, -3.1937520503997803, -3.078660726547241, -2.963569164276123, -2.848477602005005, -2.7333860397338867, -2.6182947158813477, -2.5032031536102295, -2.3881115913391113, -2.273020029067993, -2.157928705215454, -2.042837142944336, -1.9277455806732178, -1.8126541376113892, -1.6975626945495605, -1.5824711322784424, -1.4673796892166138, -1.3522882461547852, -1.237196683883667, -1.1221052408218384, -1.0070136785507202, -0.8919222354888916, -0.7768307328224182, -0.6617392301559448, -0.5466477274894714, -0.43155622482299805, -0.31646472215652466, -0.20137324929237366, -0.08628174662590027, 0.028809726238250732, 0.14390122890472412, 0.2589927315711975, 0.3740842342376709, 0.4891757369041443, 0.6042672395706177, 0.7193586826324463, 0.8344502449035645, 0.9495416879653931, 1.0646331310272217, 1.1797246932983398, 1.294816255569458, 1.4099076986312866, 1.5249992609024048, 1.6400907039642334, 1.7551822662353516, 1.8702737092971802, 1.9853651523590088, 2.100456714630127, 2.215548038482666, 2.330639600753784, 2.4457309246063232, 2.5608224868774414, 2.6759140491485596, 2.7910056114196777, 2.906096935272217, 3.021188497543335, 3.136280059814453, 3.2513716220855713, 3.3664629459381104, 3.4815545082092285, 3.5966460704803467, 3.711737632751465, 3.826828956604004, 3.941920518875122, 4.05701208114624]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 9.0, 9.0, 7.0, 14.0, 17.0, 16.0, 22.0, 19.0, 24.0, 25.0, 27.0, 27.0, 40.0, 34.0, 32.0, 29.0, 42.0, 33.0, 42.0, 40.0, 37.0, 40.0, 47.0, 32.0, 23.0, 39.0, 40.0, 25.0, 24.0, 33.0, 14.0, 17.0, 18.0, 19.0, 12.0, 15.0, 10.0, 10.0, 6.0, 5.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.5749783515930176, -1.5290923118591309, -1.4832062721252441, -1.4373202323913574, -1.3914341926574707, -1.345548152923584, -1.2996621131896973, -1.2537760734558105, -1.2078900337219238, -1.162003993988037, -1.1161179542541504, -1.0702319145202637, -1.024345874786377, -0.9784598350524902, -0.9325737357139587, -0.886687695980072, -0.8408015966415405, -0.7949155569076538, -0.7490295171737671, -0.7031434774398804, -0.6572574377059937, -0.6113713979721069, -0.5654852986335754, -0.5195992588996887, -0.473713219165802, -0.4278271794319153, -0.38194113969802856, -0.33605507016181946, -0.29016903042793274, -0.24428299069404602, -0.19839692115783691, -0.1525108814239502, -0.10662472248077393, -0.06073867529630661, -0.014852628111839294, 0.031033426523208618, 0.07691946625709534, 0.12280550599098206, 0.16869157552719116, 0.21457761526107788, 0.2604636549949646, 0.3063496947288513, 0.35223573446273804, 0.39812180399894714, 0.44400784373283386, 0.4898938834667206, 0.5357799530029297, 0.5816659927368164, 0.6275520324707031, 0.6734380722045898, 0.7193241119384766, 0.7652101516723633, 0.81109619140625, 0.8569822311401367, 0.9028683304786682, 0.9487543702125549, 0.9946404099464417, 1.0405265092849731, 1.0864125490188599, 1.1322985887527466, 1.1781846284866333, 1.22407066822052, 1.2699567079544067, 1.3158427476882935, 1.3617287874221802]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 12.0, 21.0, 20.0, 47.0, 59.0, 85.0, 159.0, 261.0, 422.0, 818.0, 1510.0, 3088.0, 6839.0, 17834.0, 51216.0, 164229.0, 479146.0, 217777.0, 66544.0, 22282.0, 8525.0, 3654.0, 1825.0, 872.0, 522.0, 285.0, 162.0, 107.0, 73.0, 46.0, 29.0, 21.0, 12.0, 15.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8274688720703125, -1.773101806640625, -1.7187347412109375, -1.66436767578125, -1.6100006103515625, -1.555633544921875, -1.5012664794921875, -1.4468994140625, -1.3925323486328125, -1.338165283203125, -1.2837982177734375, -1.22943115234375, -1.1750640869140625, -1.120697021484375, -1.0663299560546875, -1.011962890625, -0.9575958251953125, -0.903228759765625, -0.8488616943359375, -0.79449462890625, -0.7401275634765625, -0.685760498046875, -0.6313934326171875, -0.5770263671875, -0.5226593017578125, -0.468292236328125, -0.4139251708984375, -0.35955810546875, -0.3051910400390625, -0.250823974609375, -0.1964569091796875, -0.14208984375, -0.0877227783203125, -0.033355712890625, 0.0210113525390625, 0.07537841796875, 0.1297454833984375, 0.184112548828125, 0.2384796142578125, 0.2928466796875, 0.3472137451171875, 0.401580810546875, 0.4559478759765625, 0.51031494140625, 0.5646820068359375, 0.619049072265625, 0.6734161376953125, 0.727783203125, 0.7821502685546875, 0.836517333984375, 0.8908843994140625, 0.94525146484375, 0.9996185302734375, 1.053985595703125, 1.1083526611328125, 1.1627197265625, 1.2170867919921875, 1.271453857421875, 1.3258209228515625, 1.38018798828125, 1.4345550537109375, 1.488922119140625, 1.5432891845703125, 1.59765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 9.0, 7.0, 9.0, 7.0, 15.0, 19.0, 18.0, 31.0, 16.0, 30.0, 41.0, 44.0, 45.0, 47.0, 52.0, 55.0, 68.0, 68.0, 51.0, 56.0, 39.0, 46.0, 40.0, 31.0, 29.0, 15.0, 23.0, 20.0, 16.0, 11.0, 13.0, 6.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56396484375, -0.5484771728515625, -0.532989501953125, -0.5175018310546875, -0.50201416015625, -0.4865264892578125, -0.471038818359375, -0.4555511474609375, -0.4400634765625, -0.4245758056640625, -0.409088134765625, -0.3936004638671875, -0.37811279296875, -0.3626251220703125, -0.347137451171875, -0.3316497802734375, -0.316162109375, -0.3006744384765625, -0.285186767578125, -0.2696990966796875, -0.25421142578125, -0.2387237548828125, -0.223236083984375, -0.2077484130859375, -0.1922607421875, -0.1767730712890625, -0.161285400390625, -0.1457977294921875, -0.13031005859375, -0.1148223876953125, -0.099334716796875, -0.0838470458984375, -0.068359375, -0.0528717041015625, -0.037384033203125, -0.0218963623046875, -0.00640869140625, 0.0090789794921875, 0.024566650390625, 0.0400543212890625, 0.0555419921875, 0.0710296630859375, 0.086517333984375, 0.1020050048828125, 0.11749267578125, 0.1329803466796875, 0.148468017578125, 0.1639556884765625, 0.179443359375, 0.1949310302734375, 0.210418701171875, 0.2259063720703125, 0.24139404296875, 0.2568817138671875, 0.272369384765625, 0.2878570556640625, 0.3033447265625, 0.3188323974609375, 0.334320068359375, 0.3498077392578125, 0.36529541015625, 0.3807830810546875, 0.396270751953125, 0.4117584228515625, 0.42724609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 9.0, 9.0, 6.0, 19.0, 21.0, 25.0, 24.0, 41.0, 53.0, 65.0, 109.0, 128.0, 199.0, 300.0, 438.0, 729.0, 1344.0, 3069.0, 9652.0, 51360.0, 523328.0, 399770.0, 43291.0, 8540.0, 2694.0, 1241.0, 677.0, 443.0, 271.0, 183.0, 143.0, 96.0, 67.0, 54.0, 33.0, 26.0, 27.0, 18.0, 11.0, 5.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-2.59375, -2.5216064453125, -2.449462890625, -2.3773193359375, -2.30517578125, -2.2330322265625, -2.160888671875, -2.0887451171875, -2.0166015625, -1.9444580078125, -1.872314453125, -1.8001708984375, -1.72802734375, -1.6558837890625, -1.583740234375, -1.5115966796875, -1.439453125, -1.3673095703125, -1.295166015625, -1.2230224609375, -1.15087890625, -1.0787353515625, -1.006591796875, -0.9344482421875, -0.8623046875, -0.7901611328125, -0.718017578125, -0.6458740234375, -0.57373046875, -0.5015869140625, -0.429443359375, -0.3572998046875, -0.28515625, -0.2130126953125, -0.140869140625, -0.0687255859375, 0.00341796875, 0.0755615234375, 0.147705078125, 0.2198486328125, 0.2919921875, 0.3641357421875, 0.436279296875, 0.5084228515625, 0.58056640625, 0.6527099609375, 0.724853515625, 0.7969970703125, 0.869140625, 0.9412841796875, 1.013427734375, 1.0855712890625, 1.15771484375, 1.2298583984375, 1.302001953125, 1.3741455078125, 1.4462890625, 1.5184326171875, 1.590576171875, 1.6627197265625, 1.73486328125, 1.8070068359375, 1.879150390625, 1.9512939453125, 2.0234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 7.0, 7.0, 9.0, 14.0, 14.0, 20.0, 18.0, 23.0, 31.0, 26.0, 38.0, 37.0, 54.0, 48.0, 53.0, 58.0, 47.0, 52.0, 66.0, 55.0, 55.0, 45.0, 36.0, 25.0, 30.0, 28.0, 18.0, 23.0, 16.0, 11.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.7918243408203125, -1.723297119140625, -1.6547698974609375, -1.58624267578125, -1.5177154541015625, -1.449188232421875, -1.3806610107421875, -1.3121337890625, -1.2436065673828125, -1.175079345703125, -1.1065521240234375, -1.03802490234375, -0.9694976806640625, -0.900970458984375, -0.8324432373046875, -0.763916015625, -0.6953887939453125, -0.626861572265625, -0.5583343505859375, -0.48980712890625, -0.4212799072265625, -0.352752685546875, -0.2842254638671875, -0.2156982421875, -0.1471710205078125, -0.078643798828125, -0.0101165771484375, 0.05841064453125, 0.1269378662109375, 0.195465087890625, 0.2639923095703125, 0.33251953125, 0.4010467529296875, 0.469573974609375, 0.5381011962890625, 0.60662841796875, 0.6751556396484375, 0.743682861328125, 0.8122100830078125, 0.8807373046875, 0.9492645263671875, 1.017791748046875, 1.0863189697265625, 1.15484619140625, 1.2233734130859375, 1.291900634765625, 1.3604278564453125, 1.428955078125, 1.4974822998046875, 1.566009521484375, 1.6345367431640625, 1.70306396484375, 1.7715911865234375, 1.840118408203125, 1.9086456298828125, 1.9771728515625, 2.0457000732421875, 2.114227294921875, 2.1827545166015625, 2.25128173828125, 2.3198089599609375, 2.388336181640625, 2.4568634033203125, 2.525390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 8.0, 9.0, 13.0, 17.0, 30.0, 42.0, 64.0, 83.0, 124.0, 212.0, 398.0, 771.0, 1898.0, 5313.0, 21271.0, 152943.0, 737730.0, 103951.0, 16080.0, 4401.0, 1527.0, 681.0, 382.0, 208.0, 124.0, 94.0, 42.0, 41.0, 28.0, 13.0, 9.0, 11.0, 4.0, 7.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0712890625, -1.0401611328125, -1.009033203125, -0.9779052734375, -0.94677734375, -0.9156494140625, -0.884521484375, -0.8533935546875, -0.822265625, -0.7911376953125, -0.760009765625, -0.7288818359375, -0.69775390625, -0.6666259765625, -0.635498046875, -0.6043701171875, -0.5732421875, -0.5421142578125, -0.510986328125, -0.4798583984375, -0.44873046875, -0.4176025390625, -0.386474609375, -0.3553466796875, -0.32421875, -0.2930908203125, -0.261962890625, -0.2308349609375, -0.19970703125, -0.1685791015625, -0.137451171875, -0.1063232421875, -0.0751953125, -0.0440673828125, -0.012939453125, 0.0181884765625, 0.04931640625, 0.0804443359375, 0.111572265625, 0.1427001953125, 0.173828125, 0.2049560546875, 0.236083984375, 0.2672119140625, 0.29833984375, 0.3294677734375, 0.360595703125, 0.3917236328125, 0.4228515625, 0.4539794921875, 0.485107421875, 0.5162353515625, 0.54736328125, 0.5784912109375, 0.609619140625, 0.6407470703125, 0.671875, 0.7030029296875, 0.734130859375, 0.7652587890625, 0.79638671875, 0.8275146484375, 0.858642578125, 0.8897705078125, 0.9208984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 11.0, 5.0, 11.0, 12.0, 16.0, 24.0, 30.0, 42.0, 41.0, 53.0, 74.0, 97.0, 121.0, 110.0, 73.0, 58.0, 48.0, 30.0, 35.0, 19.0, 14.0, 15.0, 15.0, 7.0, 6.0, 10.0, 7.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011587142944335938, -0.0001102052628993988, -0.00010453909635543823, -9.887292981147766e-05, -9.320676326751709e-05, -8.754059672355652e-05, -8.187443017959595e-05, -7.620826363563538e-05, -7.05420970916748e-05, -6.487593054771423e-05, -5.920976400375366e-05, -5.354359745979309e-05, -4.787743091583252e-05, -4.221126437187195e-05, -3.654509782791138e-05, -3.0878931283950806e-05, -2.5212764739990234e-05, -1.9546598196029663e-05, -1.3880431652069092e-05, -8.21426510810852e-06, -2.5480985641479492e-06, 3.118067979812622e-06, 8.784234523773193e-06, 1.4450401067733765e-05, 2.0116567611694336e-05, 2.5782734155654907e-05, 3.144890069961548e-05, 3.711506724357605e-05, 4.278123378753662e-05, 4.844740033149719e-05, 5.4113566875457764e-05, 5.9779733419418335e-05, 6.54458999633789e-05, 7.111206650733948e-05, 7.677823305130005e-05, 8.244439959526062e-05, 8.811056613922119e-05, 9.377673268318176e-05, 9.944289922714233e-05, 0.0001051090657711029, 0.00011077523231506348, 0.00011644139885902405, 0.00012210756540298462, 0.0001277737319469452, 0.00013343989849090576, 0.00013910606503486633, 0.0001447722315788269, 0.00015043839812278748, 0.00015610456466674805, 0.00016177073121070862, 0.0001674368977546692, 0.00017310306429862976, 0.00017876923084259033, 0.0001844353973865509, 0.00019010156393051147, 0.00019576773047447205, 0.00020143389701843262, 0.0002071000635623932, 0.00021276623010635376, 0.00021843239665031433, 0.0002240985631942749, 0.00022976472973823547, 0.00023543089628219604, 0.00024109706282615662, 0.0002467632293701172]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 11.0, 20.0, 19.0, 25.0, 54.0, 79.0, 123.0, 228.0, 438.0, 905.0, 2638.0, 10306.0, 92324.0, 844685.0, 82734.0, 9594.0, 2440.0, 896.0, 414.0, 229.0, 110.0, 61.0, 54.0, 44.0, 34.0, 21.0, 11.0, 5.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.775390625, -1.7325897216796875, -1.689788818359375, -1.6469879150390625, -1.60418701171875, -1.5613861083984375, -1.518585205078125, -1.4757843017578125, -1.4329833984375, -1.3901824951171875, -1.347381591796875, -1.3045806884765625, -1.26177978515625, -1.2189788818359375, -1.176177978515625, -1.1333770751953125, -1.090576171875, -1.0477752685546875, -1.004974365234375, -0.9621734619140625, -0.91937255859375, -0.8765716552734375, -0.833770751953125, -0.7909698486328125, -0.7481689453125, -0.7053680419921875, -0.662567138671875, -0.6197662353515625, -0.57696533203125, -0.5341644287109375, -0.491363525390625, -0.4485626220703125, -0.40576171875, -0.3629608154296875, -0.320159912109375, -0.2773590087890625, -0.23455810546875, -0.1917572021484375, -0.148956298828125, -0.1061553955078125, -0.0633544921875, -0.0205535888671875, 0.022247314453125, 0.0650482177734375, 0.10784912109375, 0.1506500244140625, 0.193450927734375, 0.2362518310546875, 0.279052734375, 0.3218536376953125, 0.364654541015625, 0.4074554443359375, 0.45025634765625, 0.4930572509765625, 0.535858154296875, 0.5786590576171875, 0.6214599609375, 0.6642608642578125, 0.707061767578125, 0.7498626708984375, 0.79266357421875, 0.8354644775390625, 0.878265380859375, 0.9210662841796875, 0.9638671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 9.0, 10.0, 28.0, 41.0, 39.0, 58.0, 69.0, 84.0, 108.0, 102.0, 97.0, 85.0, 80.0, 42.0, 39.0, 27.0, 25.0, 18.0, 4.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6640625, -0.6343994140625, -0.604736328125, -0.5750732421875, -0.54541015625, -0.5157470703125, -0.486083984375, -0.4564208984375, -0.4267578125, -0.3970947265625, -0.367431640625, -0.3377685546875, -0.30810546875, -0.2784423828125, -0.248779296875, -0.2191162109375, -0.189453125, -0.1597900390625, -0.130126953125, -0.1004638671875, -0.07080078125, -0.0411376953125, -0.011474609375, 0.0181884765625, 0.0478515625, 0.0775146484375, 0.107177734375, 0.1368408203125, 0.16650390625, 0.1961669921875, 0.225830078125, 0.2554931640625, 0.28515625, 0.3148193359375, 0.344482421875, 0.3741455078125, 0.40380859375, 0.4334716796875, 0.463134765625, 0.4927978515625, 0.5224609375, 0.5521240234375, 0.581787109375, 0.6114501953125, 0.64111328125, 0.6707763671875, 0.700439453125, 0.7301025390625, 0.759765625, 0.7894287109375, 0.819091796875, 0.8487548828125, 0.87841796875, 0.9080810546875, 0.937744140625, 0.9674072265625, 0.9970703125, 1.0267333984375, 1.056396484375, 1.0860595703125, 1.11572265625, 1.1453857421875, 1.175048828125, 1.2047119140625, 1.234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 9.0, 22.0, 46.0, 120.0, 253.0, 258.0, 164.0, 76.0, 24.0, 12.0, 10.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.5809326171875, -34.79084396362305, -34.000755310058594, -33.21066665649414, -32.42057800292969, -31.630491256713867, -30.840402603149414, -30.05031394958496, -29.260225296020508, -28.470136642456055, -27.6800479888916, -26.88995933532715, -26.099872589111328, -25.309783935546875, -24.519695281982422, -23.72960662841797, -22.939517974853516, -22.149429321289062, -21.35934066772461, -20.569252014160156, -19.779163360595703, -18.989076614379883, -18.19898796081543, -17.408899307250977, -16.618810653686523, -15.82872200012207, -15.038633346557617, -14.24854564666748, -13.458456993103027, -12.668368339538574, -11.878280639648438, -11.088191986083984, -10.298104286193848, -9.508015632629395, -8.717927932739258, -7.927839279174805, -7.137750625610352, -6.347661972045898, -5.5575737953186035, -4.767485618591309, -3.9773969650268555, -3.1873085498809814, -2.3972201347351074, -1.6071317195892334, -0.8170433044433594, -0.02695488929748535, 0.7631335258483887, 1.5532217025756836, 2.3433103561401367, 3.1333987712860107, 3.9234871864318848, 4.71357536315918, 5.503664016723633, 6.293752670288086, 7.083840847015381, 7.873929023742676, 8.664017677307129, 9.454106330871582, 10.244194030761719, 11.034282684326172, 11.824371337890625, 12.614459991455078, 13.404548645019531, 14.194636344909668, 14.984724998474121]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 7.0, 8.0, 10.0, 21.0, 24.0, 31.0, 34.0, 44.0, 43.0, 51.0, 57.0, 50.0, 68.0, 72.0, 68.0, 56.0, 58.0, 53.0, 45.0, 31.0, 31.0, 28.0, 24.0, 23.0, 13.0, 20.0, 8.0, 6.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.903568267822266, -9.546171188354492, -9.188774108886719, -8.831377029418945, -8.473979949951172, -8.116582870483398, -7.759186267852783, -7.40178918838501, -7.044392108917236, -6.686995029449463, -6.3295979499816895, -5.972201347351074, -5.614804267883301, -5.257407188415527, -4.900010108947754, -4.5426130294799805, -4.185215950012207, -3.8278188705444336, -3.47042179107666, -3.113024950027466, -2.7556278705596924, -2.398230791091919, -2.0408339500427246, -1.6834368705749512, -1.3260397911071777, -0.9686427712440491, -0.6112457513809204, -0.2538487911224365, 0.10354828834533691, 0.46094536781311035, 0.8183422088623047, 1.1757392883300781, 1.5331363677978516, 1.890533447265625, 2.2479305267333984, 2.6053273677825928, 2.962724447250366, 3.3201215267181396, 3.677518367767334, 4.034915447235107, 4.392312526702881, 4.749709606170654, 5.107106685638428, 5.464503288269043, 5.821900367736816, 6.17929744720459, 6.536694526672363, 6.894091606140137, 7.25148868560791, 7.608885765075684, 7.966282844543457, 8.32367992401123, 8.681077003479004, 9.038474082946777, 9.395870208740234, 9.753267288208008, 10.110664367675781, 10.468061447143555, 10.825458526611328, 11.182855606079102, 11.540252685546875, 11.897649765014648, 12.255046844482422, 12.612443923950195, 12.969841003417969]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 14.0, 19.0, 25.0, 54.0, 95.0, 145.0, 322.0, 623.0, 1360.0, 3049.0, 8689.0, 30838.0, 211425.0, 3746863.0, 151664.0, 25933.0, 7779.0, 2921.0, 1194.0, 566.0, 305.0, 160.0, 73.0, 53.0, 27.0, 16.0, 16.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.1875, -2.1290740966796875, -2.070648193359375, -2.0122222900390625, -1.95379638671875, -1.8953704833984375, -1.836944580078125, -1.7785186767578125, -1.7200927734375, -1.6616668701171875, -1.603240966796875, -1.5448150634765625, -1.48638916015625, -1.4279632568359375, -1.369537353515625, -1.3111114501953125, -1.252685546875, -1.1942596435546875, -1.135833740234375, -1.0774078369140625, -1.01898193359375, -0.9605560302734375, -0.902130126953125, -0.8437042236328125, -0.7852783203125, -0.7268524169921875, -0.668426513671875, -0.6100006103515625, -0.55157470703125, -0.4931488037109375, -0.434722900390625, -0.3762969970703125, -0.31787109375, -0.2594451904296875, -0.201019287109375, -0.1425933837890625, -0.08416748046875, -0.0257415771484375, 0.032684326171875, 0.0911102294921875, 0.1495361328125, 0.2079620361328125, 0.266387939453125, 0.3248138427734375, 0.38323974609375, 0.4416656494140625, 0.500091552734375, 0.5585174560546875, 0.616943359375, 0.6753692626953125, 0.733795166015625, 0.7922210693359375, 0.85064697265625, 0.9090728759765625, 0.967498779296875, 1.0259246826171875, 1.0843505859375, 1.1427764892578125, 1.201202392578125, 1.2596282958984375, 1.31805419921875, 1.3764801025390625, 1.434906005859375, 1.4933319091796875, 1.5517578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 7.0, 8.0, 11.0, 10.0, 22.0, 34.0, 26.0, 45.0, 46.0, 66.0, 55.0, 50.0, 72.0, 61.0, 70.0, 62.0, 47.0, 56.0, 39.0, 35.0, 33.0, 28.0, 26.0, 25.0, 15.0, 10.0, 5.0, 18.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46240234375, -0.44628143310546875, -0.4301605224609375, -0.41403961181640625, -0.397918701171875, -0.38179779052734375, -0.3656768798828125, -0.34955596923828125, -0.33343505859375, -0.31731414794921875, -0.3011932373046875, -0.28507232666015625, -0.268951416015625, -0.25283050537109375, -0.2367095947265625, -0.22058868408203125, -0.2044677734375, -0.18834686279296875, -0.1722259521484375, -0.15610504150390625, -0.139984130859375, -0.12386322021484375, -0.1077423095703125, -0.09162139892578125, -0.07550048828125, -0.05937957763671875, -0.0432586669921875, -0.02713775634765625, -0.011016845703125, 0.00510406494140625, 0.0212249755859375, 0.03734588623046875, 0.053466796875, 0.06958770751953125, 0.0857086181640625, 0.10182952880859375, 0.117950439453125, 0.13407135009765625, 0.1501922607421875, 0.16631317138671875, 0.18243408203125, 0.19855499267578125, 0.2146759033203125, 0.23079681396484375, 0.246917724609375, 0.26303863525390625, 0.2791595458984375, 0.29528045654296875, 0.3114013671875, 0.32752227783203125, 0.3436431884765625, 0.35976409912109375, 0.375885009765625, 0.39200592041015625, 0.4081268310546875, 0.42424774169921875, 0.44036865234375, 0.45648956298828125, 0.4726104736328125, 0.48873138427734375, 0.504852294921875, 0.5209732055664062, 0.5370941162109375, 0.5532150268554688, 0.5693359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 9.0, 14.0, 14.0, 35.0, 55.0, 62.0, 118.0, 277.0, 568.0, 1252.0, 3381.0, 9882.0, 33772.0, 175833.0, 3632599.0, 273635.0, 43767.0, 12091.0, 4073.0, 1499.0, 640.0, 292.0, 156.0, 83.0, 51.0, 26.0, 22.0, 12.0, 12.0, 7.0, 9.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9111328125, -1.8589019775390625, -1.806671142578125, -1.7544403076171875, -1.70220947265625, -1.6499786376953125, -1.597747802734375, -1.5455169677734375, -1.4932861328125, -1.4410552978515625, -1.388824462890625, -1.3365936279296875, -1.28436279296875, -1.2321319580078125, -1.179901123046875, -1.1276702880859375, -1.075439453125, -1.0232086181640625, -0.970977783203125, -0.9187469482421875, -0.86651611328125, -0.8142852783203125, -0.762054443359375, -0.7098236083984375, -0.6575927734375, -0.6053619384765625, -0.553131103515625, -0.5009002685546875, -0.44866943359375, -0.3964385986328125, -0.344207763671875, -0.2919769287109375, -0.23974609375, -0.1875152587890625, -0.135284423828125, -0.0830535888671875, -0.03082275390625, 0.0214080810546875, 0.073638916015625, 0.1258697509765625, 0.1781005859375, 0.2303314208984375, 0.282562255859375, 0.3347930908203125, 0.38702392578125, 0.4392547607421875, 0.491485595703125, 0.5437164306640625, 0.595947265625, 0.6481781005859375, 0.700408935546875, 0.7526397705078125, 0.80487060546875, 0.8571014404296875, 0.909332275390625, 0.9615631103515625, 1.0137939453125, 1.0660247802734375, 1.118255615234375, 1.1704864501953125, 1.22271728515625, 1.2749481201171875, 1.327178955078125, 1.3794097900390625, 1.431640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 7.0, 7.0, 13.0, 8.0, 18.0, 22.0, 24.0, 32.0, 40.0, 58.0, 79.0, 134.0, 312.0, 784.0, 1231.0, 613.0, 237.0, 126.0, 86.0, 51.0, 46.0, 32.0, 14.0, 15.0, 10.0, 10.0, 8.0, 8.0, 7.0, 4.0, 3.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2621307373046875, -1.220550537109375, -1.1789703369140625, -1.13739013671875, -1.0958099365234375, -1.054229736328125, -1.0126495361328125, -0.9710693359375, -0.9294891357421875, -0.887908935546875, -0.8463287353515625, -0.80474853515625, -0.7631683349609375, -0.721588134765625, -0.6800079345703125, -0.638427734375, -0.5968475341796875, -0.555267333984375, -0.5136871337890625, -0.47210693359375, -0.4305267333984375, -0.388946533203125, -0.3473663330078125, -0.3057861328125, -0.2642059326171875, -0.222625732421875, -0.1810455322265625, -0.13946533203125, -0.0978851318359375, -0.056304931640625, -0.0147247314453125, 0.02685546875, 0.0684356689453125, 0.110015869140625, 0.1515960693359375, 0.19317626953125, 0.2347564697265625, 0.276336669921875, 0.3179168701171875, 0.3594970703125, 0.4010772705078125, 0.442657470703125, 0.4842376708984375, 0.52581787109375, 0.5673980712890625, 0.608978271484375, 0.6505584716796875, 0.692138671875, 0.7337188720703125, 0.775299072265625, 0.8168792724609375, 0.85845947265625, 0.9000396728515625, 0.941619873046875, 0.9832000732421875, 1.0247802734375, 1.0663604736328125, 1.107940673828125, 1.1495208740234375, 1.19110107421875, 1.2326812744140625, 1.274261474609375, 1.3158416748046875, 1.357421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 16.0, 67.0, 108.0, 240.0, 275.0, 156.0, 66.0, 35.0, 11.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.50558090209961, -21.88620376586914, -21.266828536987305, -20.64745330810547, -20.028076171875, -19.40869903564453, -18.789323806762695, -18.16994857788086, -17.55057144165039, -16.931194305419922, -16.311819076538086, -15.692442893981934, -15.073066711425781, -14.453690528869629, -13.834314346313477, -13.214938163757324, -12.595561981201172, -11.97618579864502, -11.356809616088867, -10.737433433532715, -10.118057250976562, -9.49868106842041, -8.879304885864258, -8.259928703308105, -7.640552520751953, -7.021176338195801, -6.401800155639648, -5.782423973083496, -5.163047790527344, -4.543671607971191, -3.924295425415039, -3.3049192428588867, -2.6855430603027344, -2.066166877746582, -1.4467906951904297, -0.8274145126342773, -0.208038330078125, 0.41133785247802734, 1.0307140350341797, 1.650090217590332, 2.2694664001464844, 2.8888425827026367, 3.508218765258789, 4.127594947814941, 4.746971130371094, 5.366347312927246, 5.985723495483398, 6.605099678039551, 7.224475860595703, 7.8438520431518555, 8.463228225708008, 9.08260440826416, 9.701980590820312, 10.321356773376465, 10.940732955932617, 11.56010913848877, 12.179485321044922, 12.798861503601074, 13.418237686157227, 14.037613868713379, 14.656990051269531, 15.276366233825684, 15.895742416381836, 16.515117645263672, 17.13449478149414]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 10.0, 12.0, 10.0, 19.0, 15.0, 15.0, 32.0, 30.0, 34.0, 40.0, 50.0, 45.0, 53.0, 68.0, 56.0, 54.0, 55.0, 51.0, 56.0, 51.0, 30.0, 36.0, 29.0, 28.0, 29.0, 22.0, 17.0, 9.0, 7.0, 5.0, 4.0, 9.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.204517364501953, -6.986541271209717, -6.768564701080322, -6.550588607788086, -6.332612037658691, -6.114635944366455, -5.896659851074219, -5.678683280944824, -5.46070671081543, -5.242730617523193, -5.024754047393799, -4.8067779541015625, -4.588801383972168, -4.370825290679932, -4.152849197387695, -3.934872627258301, -3.7168965339660645, -3.498920202255249, -3.2809438705444336, -3.0629677772521973, -2.8449912071228027, -2.6270151138305664, -2.409038782119751, -2.1910624504089355, -1.9730861186981201, -1.7551097869873047, -1.5371334552764893, -1.3191572427749634, -1.101180911064148, -0.8832045793533325, -0.6652283668518066, -0.4472520351409912, -0.22927570343017578, -0.01129940152168274, 0.2066769003868103, 0.42465317249298096, 0.6426295042037964, 0.8606058359146118, 1.0785820484161377, 1.2965583801269531, 1.5145347118377686, 1.732511043548584, 1.9504873752593994, 2.168463706970215, 2.386439800262451, 2.6044163703918457, 2.822392463684082, 3.0403687953948975, 3.258345127105713, 3.4763214588165283, 3.6942977905273438, 3.91227388381958, 4.130250453948975, 4.348226547241211, 4.5662031173706055, 4.784179210662842, 5.002155303955078, 5.2201313972473145, 5.438107967376709, 5.656084060668945, 5.87406063079834, 6.092036724090576, 6.3100128173828125, 6.527989387512207, 6.745965957641602]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 8.0, 7.0, 11.0, 19.0, 22.0, 48.0, 56.0, 69.0, 148.0, 216.0, 356.0, 679.0, 1224.0, 2440.0, 4926.0, 10787.0, 26132.0, 71746.0, 303483.0, 462908.0, 102306.0, 34492.0, 13929.0, 6154.0, 2928.0, 1509.0, 801.0, 433.0, 262.0, 159.0, 110.0, 49.0, 50.0, 22.0, 21.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.35205078125, -1.3056640625, -1.25927734375, -1.212890625, -1.16650390625, -1.1201171875, -1.07373046875, -1.02734375, -0.98095703125, -0.9345703125, -0.88818359375, -0.841796875, -0.79541015625, -0.7490234375, -0.70263671875, -0.65625, -0.60986328125, -0.5634765625, -0.51708984375, -0.470703125, -0.42431640625, -0.3779296875, -0.33154296875, -0.28515625, -0.23876953125, -0.1923828125, -0.14599609375, -0.099609375, -0.05322265625, -0.0068359375, 0.03955078125, 0.0859375, 0.13232421875, 0.1787109375, 0.22509765625, 0.271484375, 0.31787109375, 0.3642578125, 0.41064453125, 0.45703125, 0.50341796875, 0.5498046875, 0.59619140625, 0.642578125, 0.68896484375, 0.7353515625, 0.78173828125, 0.828125, 0.87451171875, 0.9208984375, 0.96728515625, 1.013671875, 1.06005859375, 1.1064453125, 1.15283203125, 1.19921875, 1.24560546875, 1.2919921875, 1.33837890625, 1.384765625, 1.43115234375, 1.4775390625, 1.52392578125, 1.5703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 9.0, 6.0, 5.0, 11.0, 11.0, 10.0, 18.0, 29.0, 32.0, 31.0, 35.0, 43.0, 45.0, 62.0, 58.0, 55.0, 61.0, 67.0, 63.0, 50.0, 38.0, 27.0, 53.0, 28.0, 28.0, 22.0, 22.0, 20.0, 19.0, 15.0, 10.0, 3.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.503082275390625, -0.48809814453125, -0.473114013671875, -0.4581298828125, -0.443145751953125, -0.42816162109375, -0.413177490234375, -0.398193359375, -0.383209228515625, -0.36822509765625, -0.353240966796875, -0.3382568359375, -0.323272705078125, -0.30828857421875, -0.293304443359375, -0.2783203125, -0.263336181640625, -0.24835205078125, -0.233367919921875, -0.2183837890625, -0.203399658203125, -0.18841552734375, -0.173431396484375, -0.158447265625, -0.143463134765625, -0.12847900390625, -0.113494873046875, -0.0985107421875, -0.083526611328125, -0.06854248046875, -0.053558349609375, -0.03857421875, -0.023590087890625, -0.00860595703125, 0.006378173828125, 0.0213623046875, 0.036346435546875, 0.05133056640625, 0.066314697265625, 0.081298828125, 0.096282958984375, 0.11126708984375, 0.126251220703125, 0.1412353515625, 0.156219482421875, 0.17120361328125, 0.186187744140625, 0.201171875, 0.216156005859375, 0.23114013671875, 0.246124267578125, 0.2611083984375, 0.276092529296875, 0.29107666015625, 0.306060791015625, 0.321044921875, 0.336029052734375, 0.35101318359375, 0.365997314453125, 0.3809814453125, 0.395965576171875, 0.41094970703125, 0.425933837890625, 0.44091796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 7.0, 15.0, 17.0, 20.0, 23.0, 36.0, 61.0, 74.0, 96.0, 145.0, 239.0, 341.0, 600.0, 1148.0, 2643.0, 8840.0, 53291.0, 774319.0, 178691.0, 19613.0, 4551.0, 1709.0, 772.0, 423.0, 271.0, 167.0, 122.0, 94.0, 51.0, 45.0, 30.0, 14.0, 18.0, 16.0, 11.0, 8.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.623046875, -2.542938232421875, -2.46282958984375, -2.382720947265625, -2.3026123046875, -2.222503662109375, -2.14239501953125, -2.062286376953125, -1.982177734375, -1.902069091796875, -1.82196044921875, -1.741851806640625, -1.6617431640625, -1.581634521484375, -1.50152587890625, -1.421417236328125, -1.34130859375, -1.261199951171875, -1.18109130859375, -1.100982666015625, -1.0208740234375, -0.940765380859375, -0.86065673828125, -0.780548095703125, -0.700439453125, -0.620330810546875, -0.54022216796875, -0.460113525390625, -0.3800048828125, -0.299896240234375, -0.21978759765625, -0.139678955078125, -0.0595703125, 0.020538330078125, 0.10064697265625, 0.180755615234375, 0.2608642578125, 0.340972900390625, 0.42108154296875, 0.501190185546875, 0.581298828125, 0.661407470703125, 0.74151611328125, 0.821624755859375, 0.9017333984375, 0.981842041015625, 1.06195068359375, 1.142059326171875, 1.22216796875, 1.302276611328125, 1.38238525390625, 1.462493896484375, 1.5426025390625, 1.622711181640625, 1.70281982421875, 1.782928466796875, 1.863037109375, 1.943145751953125, 2.02325439453125, 2.103363037109375, 2.1834716796875, 2.263580322265625, 2.34368896484375, 2.423797607421875, 2.50390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 5.0, 7.0, 10.0, 14.0, 9.0, 17.0, 25.0, 27.0, 29.0, 35.0, 36.0, 48.0, 53.0, 63.0, 60.0, 49.0, 66.0, 59.0, 53.0, 43.0, 46.0, 51.0, 33.0, 32.0, 30.0, 24.0, 17.0, 21.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.933868408203125, -1.86187744140625, -1.789886474609375, -1.7178955078125, -1.645904541015625, -1.57391357421875, -1.501922607421875, -1.429931640625, -1.357940673828125, -1.28594970703125, -1.213958740234375, -1.1419677734375, -1.069976806640625, -0.99798583984375, -0.925994873046875, -0.85400390625, -0.782012939453125, -0.71002197265625, -0.638031005859375, -0.5660400390625, -0.494049072265625, -0.42205810546875, -0.350067138671875, -0.278076171875, -0.206085205078125, -0.13409423828125, -0.062103271484375, 0.0098876953125, 0.081878662109375, 0.15386962890625, 0.225860595703125, 0.2978515625, 0.369842529296875, 0.44183349609375, 0.513824462890625, 0.5858154296875, 0.657806396484375, 0.72979736328125, 0.801788330078125, 0.873779296875, 0.945770263671875, 1.01776123046875, 1.089752197265625, 1.1617431640625, 1.233734130859375, 1.30572509765625, 1.377716064453125, 1.44970703125, 1.521697998046875, 1.59368896484375, 1.665679931640625, 1.7376708984375, 1.809661865234375, 1.88165283203125, 1.953643798828125, 2.025634765625, 2.097625732421875, 2.16961669921875, 2.241607666015625, 2.3135986328125, 2.385589599609375, 2.45758056640625, 2.529571533203125, 2.6015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 7.0, 15.0, 22.0, 31.0, 54.0, 104.0, 164.0, 380.0, 984.0, 3311.0, 17774.0, 297261.0, 693946.0, 27822.0, 4499.0, 1240.0, 483.0, 210.0, 83.0, 53.0, 29.0, 22.0, 10.0, 16.0, 7.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6435546875, -1.5992584228515625, -1.554962158203125, -1.5106658935546875, -1.46636962890625, -1.4220733642578125, -1.377777099609375, -1.3334808349609375, -1.2891845703125, -1.2448883056640625, -1.200592041015625, -1.1562957763671875, -1.11199951171875, -1.0677032470703125, -1.023406982421875, -0.9791107177734375, -0.934814453125, -0.8905181884765625, -0.846221923828125, -0.8019256591796875, -0.75762939453125, -0.7133331298828125, -0.669036865234375, -0.6247406005859375, -0.5804443359375, -0.5361480712890625, -0.491851806640625, -0.4475555419921875, -0.40325927734375, -0.3589630126953125, -0.314666748046875, -0.2703704833984375, -0.22607421875, -0.1817779541015625, -0.137481689453125, -0.0931854248046875, -0.04888916015625, -0.0045928955078125, 0.039703369140625, 0.0839996337890625, 0.1282958984375, 0.1725921630859375, 0.216888427734375, 0.2611846923828125, 0.30548095703125, 0.3497772216796875, 0.394073486328125, 0.4383697509765625, 0.482666015625, 0.5269622802734375, 0.571258544921875, 0.6155548095703125, 0.65985107421875, 0.7041473388671875, 0.748443603515625, 0.7927398681640625, 0.8370361328125, 0.8813323974609375, 0.925628662109375, 0.9699249267578125, 1.01422119140625, 1.0585174560546875, 1.102813720703125, 1.1471099853515625, 1.19140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 15.0, 10.0, 12.0, 26.0, 52.0, 77.0, 128.0, 222.0, 166.0, 100.0, 57.0, 37.0, 28.0, 16.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027942657470703125, -0.0002706162631511688, -0.0002618059515953064, -0.00025299564003944397, -0.00024418532848358154, -0.00023537501692771912, -0.0002265647053718567, -0.00021775439381599426, -0.00020894408226013184, -0.0002001337707042694, -0.00019132345914840698, -0.00018251314759254456, -0.00017370283603668213, -0.0001648925244808197, -0.00015608221292495728, -0.00014727190136909485, -0.00013846158981323242, -0.00012965127825737, -0.00012084096670150757, -0.00011203065514564514, -0.00010322034358978271, -9.441003203392029e-05, -8.559972047805786e-05, -7.678940892219543e-05, -6.797909736633301e-05, -5.916878581047058e-05, -5.0358474254608154e-05, -4.154816269874573e-05, -3.27378511428833e-05, -2.3927539587020874e-05, -1.5117228031158447e-05, -6.3069164752960205e-06, 2.5033950805664062e-06, 1.1313706636428833e-05, 2.012401819229126e-05, 2.8934329748153687e-05, 3.774464130401611e-05, 4.655495285987854e-05, 5.536526441574097e-05, 6.41755759716034e-05, 7.298588752746582e-05, 8.179619908332825e-05, 9.060651063919067e-05, 9.94168221950531e-05, 0.00010822713375091553, 0.00011703744530677795, 0.00012584775686264038, 0.0001346580684185028, 0.00014346837997436523, 0.00015227869153022766, 0.0001610890030860901, 0.00016989931464195251, 0.00017870962619781494, 0.00018751993775367737, 0.0001963302493095398, 0.00020514056086540222, 0.00021395087242126465, 0.00022276118397712708, 0.0002315714955329895, 0.00024038180708885193, 0.00024919211864471436, 0.0002580024302005768, 0.0002668127417564392, 0.00027562305331230164, 0.00028443336486816406]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 11.0, 19.0, 24.0, 29.0, 51.0, 83.0, 168.0, 277.0, 613.0, 1600.0, 5654.0, 43997.0, 864835.0, 117593.0, 9738.0, 2183.0, 825.0, 368.0, 178.0, 117.0, 60.0, 46.0, 30.0, 15.0, 12.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.537109375, -1.488555908203125, -1.44000244140625, -1.391448974609375, -1.3428955078125, -1.294342041015625, -1.24578857421875, -1.197235107421875, -1.148681640625, -1.100128173828125, -1.05157470703125, -1.003021240234375, -0.9544677734375, -0.905914306640625, -0.85736083984375, -0.808807373046875, -0.76025390625, -0.711700439453125, -0.66314697265625, -0.614593505859375, -0.5660400390625, -0.517486572265625, -0.46893310546875, -0.420379638671875, -0.371826171875, -0.323272705078125, -0.27471923828125, -0.226165771484375, -0.1776123046875, -0.129058837890625, -0.08050537109375, -0.031951904296875, 0.0166015625, 0.065155029296875, 0.11370849609375, 0.162261962890625, 0.2108154296875, 0.259368896484375, 0.30792236328125, 0.356475830078125, 0.405029296875, 0.453582763671875, 0.50213623046875, 0.550689697265625, 0.5992431640625, 0.647796630859375, 0.69635009765625, 0.744903564453125, 0.79345703125, 0.842010498046875, 0.89056396484375, 0.939117431640625, 0.9876708984375, 1.036224365234375, 1.08477783203125, 1.133331298828125, 1.181884765625, 1.230438232421875, 1.27899169921875, 1.327545166015625, 1.3760986328125, 1.424652099609375, 1.47320556640625, 1.521759033203125, 1.5703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 7.0, 9.0, 21.0, 12.0, 19.0, 25.0, 27.0, 29.0, 39.0, 48.0, 59.0, 78.0, 83.0, 70.0, 60.0, 71.0, 58.0, 53.0, 39.0, 32.0, 39.0, 20.0, 20.0, 18.0, 13.0, 5.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.58935546875, -0.569366455078125, -0.54937744140625, -0.529388427734375, -0.5093994140625, -0.489410400390625, -0.46942138671875, -0.449432373046875, -0.429443359375, -0.409454345703125, -0.38946533203125, -0.369476318359375, -0.3494873046875, -0.329498291015625, -0.30950927734375, -0.289520263671875, -0.26953125, -0.249542236328125, -0.22955322265625, -0.209564208984375, -0.1895751953125, -0.169586181640625, -0.14959716796875, -0.129608154296875, -0.109619140625, -0.089630126953125, -0.06964111328125, -0.049652099609375, -0.0296630859375, -0.009674072265625, 0.01031494140625, 0.030303955078125, 0.05029296875, 0.070281982421875, 0.09027099609375, 0.110260009765625, 0.1302490234375, 0.150238037109375, 0.17022705078125, 0.190216064453125, 0.210205078125, 0.230194091796875, 0.25018310546875, 0.270172119140625, 0.2901611328125, 0.310150146484375, 0.33013916015625, 0.350128173828125, 0.3701171875, 0.390106201171875, 0.41009521484375, 0.430084228515625, 0.4500732421875, 0.470062255859375, 0.49005126953125, 0.510040283203125, 0.530029296875, 0.550018310546875, 0.57000732421875, 0.589996337890625, 0.6099853515625, 0.629974365234375, 0.64996337890625, 0.669952392578125, 0.68994140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 32.0, 75.0, 143.0, 237.0, 250.0, 129.0, 67.0, 24.0, 12.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.929275512695312, -24.216503143310547, -23.503732681274414, -22.79096031188965, -22.078189849853516, -21.36541748046875, -20.652645111083984, -19.93987274169922, -19.227102279663086, -18.51432991027832, -17.801559448242188, -17.088787078857422, -16.376014709472656, -15.663244247436523, -14.950471878051758, -14.237700462341309, -13.52492904663086, -12.81215763092041, -12.099386215209961, -11.386613845825195, -10.673842430114746, -9.961071014404297, -9.248298645019531, -8.535527229309082, -7.822755813598633, -7.109984397888184, -6.397212505340576, -5.684440612792969, -4.9716691970825195, -4.25889778137207, -3.546125888824463, -2.8333539962768555, -2.1205825805664062, -1.407810926437378, -0.6950392723083496, 0.01773238182067871, 0.730504035949707, 1.4432756900787354, 2.1560473442077637, 2.868819236755371, 3.5815906524658203, 4.2943620681762695, 5.007133960723877, 5.719905853271484, 6.432677268981934, 7.145448684692383, 7.85822057723999, 8.570992469787598, 9.283763885498047, 9.996535301208496, 10.709306716918945, 11.422079086303711, 12.13485050201416, 12.84762191772461, 13.560394287109375, 14.273165702819824, 14.985937118530273, 15.698708534240723, 16.411479949951172, 17.124252319335938, 17.837024688720703, 18.549795150756836, 19.2625675201416, 19.975337982177734, 20.6881103515625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 8.0, 15.0, 13.0, 21.0, 14.0, 15.0, 27.0, 30.0, 27.0, 27.0, 41.0, 45.0, 50.0, 51.0, 56.0, 60.0, 46.0, 54.0, 65.0, 37.0, 38.0, 33.0, 33.0, 31.0, 25.0, 20.0, 24.0, 10.0, 18.0, 13.0, 11.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.304425239562988, -7.067749500274658, -6.831073760986328, -6.594398021697998, -6.357722282409668, -6.121046543121338, -5.884370803833008, -5.647695541381836, -5.411019325256348, -5.174343585968018, -4.9376678466796875, -4.700992107391357, -4.464316368103027, -4.227640628814697, -3.9909651279449463, -3.754289388656616, -3.5176138877868652, -3.280938148498535, -3.044262409210205, -2.807586669921875, -2.570910930633545, -2.334235191345215, -2.097559690475464, -1.8608839511871338, -1.6242082118988037, -1.3875324726104736, -1.1508567333221436, -0.914181113243103, -0.677505373954773, -0.44082963466644287, -0.20415401458740234, 0.032521724700927734, 0.2691974639892578, 0.5058732032775879, 0.7425488829612732, 0.9792245626449585, 1.2159003019332886, 1.4525760412216187, 1.6892516613006592, 1.9259274005889893, 2.1626031398773193, 2.3992788791656494, 2.6359546184539795, 2.8726301193237305, 3.1093058586120605, 3.3459815979003906, 3.5826573371887207, 3.819333076477051, 4.056008815765381, 4.292684555053711, 4.529360294342041, 4.766036033630371, 5.002711772918701, 5.239387512207031, 5.476062774658203, 5.712738990783691, 5.949414253234863, 6.186089992523193, 6.422765731811523, 6.6594414710998535, 6.896117210388184, 7.132792949676514, 7.369468688964844, 7.606143951416016, 7.842820167541504]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 4.0, 7.0, 6.0, 16.0, 15.0, 27.0, 20.0, 21.0, 45.0, 57.0, 53.0, 82.0, 149.0, 211.0, 400.0, 745.0, 2109.0, 7880.0, 55370.0, 3860492.0, 242659.0, 17678.0, 3728.0, 1157.0, 494.0, 252.0, 156.0, 99.0, 83.0, 62.0, 34.0, 30.0, 26.0, 21.0, 20.0, 16.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.572265625, -2.488555908203125, -2.40484619140625, -2.321136474609375, -2.2374267578125, -2.153717041015625, -2.07000732421875, -1.986297607421875, -1.902587890625, -1.818878173828125, -1.73516845703125, -1.651458740234375, -1.5677490234375, -1.484039306640625, -1.40032958984375, -1.316619873046875, -1.23291015625, -1.149200439453125, -1.06549072265625, -0.981781005859375, -0.8980712890625, -0.814361572265625, -0.73065185546875, -0.646942138671875, -0.563232421875, -0.479522705078125, -0.39581298828125, -0.312103271484375, -0.2283935546875, -0.144683837890625, -0.06097412109375, 0.022735595703125, 0.1064453125, 0.190155029296875, 0.27386474609375, 0.357574462890625, 0.4412841796875, 0.524993896484375, 0.60870361328125, 0.692413330078125, 0.776123046875, 0.859832763671875, 0.94354248046875, 1.027252197265625, 1.1109619140625, 1.194671630859375, 1.27838134765625, 1.362091064453125, 1.44580078125, 1.529510498046875, 1.61322021484375, 1.696929931640625, 1.7806396484375, 1.864349365234375, 1.94805908203125, 2.031768798828125, 2.115478515625, 2.199188232421875, 2.28289794921875, 2.366607666015625, 2.4503173828125, 2.534027099609375, 2.61773681640625, 2.701446533203125, 2.78515625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 4.0, 7.0, 8.0, 8.0, 17.0, 9.0, 17.0, 20.0, 26.0, 34.0, 30.0, 35.0, 47.0, 39.0, 43.0, 52.0, 58.0, 39.0, 62.0, 43.0, 38.0, 56.0, 36.0, 27.0, 37.0, 32.0, 33.0, 27.0, 18.0, 20.0, 17.0, 13.0, 13.0, 11.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.452392578125, -0.4397850036621094, -0.42717742919921875, -0.4145698547363281, -0.4019622802734375, -0.3893547058105469, -0.37674713134765625, -0.3641395568847656, -0.351531982421875, -0.3389244079589844, -0.32631683349609375, -0.3137092590332031, -0.3011016845703125, -0.2884941101074219, -0.27588653564453125, -0.2632789611816406, -0.25067138671875, -0.23806381225585938, -0.22545623779296875, -0.21284866333007812, -0.2002410888671875, -0.18763351440429688, -0.17502593994140625, -0.16241836547851562, -0.149810791015625, -0.13720321655273438, -0.12459564208984375, -0.11198806762695312, -0.0993804931640625, -0.08677291870117188, -0.07416534423828125, -0.061557769775390625, -0.0489501953125, -0.036342620849609375, -0.02373504638671875, -0.011127471923828125, 0.0014801025390625, 0.014087677001953125, 0.02669525146484375, 0.039302825927734375, 0.051910400390625, 0.06451797485351562, 0.07712554931640625, 0.08973312377929688, 0.1023406982421875, 0.11494827270507812, 0.12755584716796875, 0.14016342163085938, 0.15277099609375, 0.16537857055664062, 0.17798614501953125, 0.19059371948242188, 0.2032012939453125, 0.21580886840820312, 0.22841644287109375, 0.24102401733398438, 0.253631591796875, 0.2662391662597656, 0.27884674072265625, 0.2914543151855469, 0.3040618896484375, 0.3166694641113281, 0.32927703857421875, 0.3418846130371094, 0.3544921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 8.0, 5.0, 9.0, 14.0, 10.0, 11.0, 21.0, 29.0, 44.0, 64.0, 96.0, 151.0, 254.0, 368.0, 677.0, 1179.0, 2089.0, 4442.0, 9337.0, 22322.0, 64269.0, 340131.0, 3334298.0, 310294.0, 62777.0, 22269.0, 9419.0, 4310.0, 2319.0, 1227.0, 683.0, 400.0, 241.0, 160.0, 90.0, 82.0, 56.0, 26.0, 25.0, 19.0, 22.0, 15.0, 9.0, 4.0, 7.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92822265625, -0.8917922973632812, -0.8553619384765625, -0.8189315795898438, -0.782501220703125, -0.7460708618164062, -0.7096405029296875, -0.6732101440429688, -0.63677978515625, -0.6003494262695312, -0.5639190673828125, -0.5274887084960938, -0.491058349609375, -0.45462799072265625, -0.4181976318359375, -0.38176727294921875, -0.3453369140625, -0.30890655517578125, -0.2724761962890625, -0.23604583740234375, -0.199615478515625, -0.16318511962890625, -0.1267547607421875, -0.09032440185546875, -0.05389404296875, -0.01746368408203125, 0.0189666748046875, 0.05539703369140625, 0.091827392578125, 0.12825775146484375, 0.1646881103515625, 0.20111846923828125, 0.237548828125, 0.27397918701171875, 0.3104095458984375, 0.34683990478515625, 0.383270263671875, 0.41970062255859375, 0.4561309814453125, 0.49256134033203125, 0.52899169921875, 0.5654220581054688, 0.6018524169921875, 0.6382827758789062, 0.674713134765625, 0.7111434936523438, 0.7475738525390625, 0.7840042114257812, 0.8204345703125, 0.8568649291992188, 0.8932952880859375, 0.9297256469726562, 0.966156005859375, 1.0025863647460938, 1.0390167236328125, 1.0754470825195312, 1.11187744140625, 1.1483078002929688, 1.1847381591796875, 1.2211685180664062, 1.257598876953125, 1.2940292358398438, 1.3304595947265625, 1.3668899536132812, 1.4033203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 10.0, 15.0, 20.0, 16.0, 28.0, 40.0, 72.0, 98.0, 216.0, 516.0, 1289.0, 876.0, 361.0, 163.0, 78.0, 68.0, 44.0, 31.0, 21.0, 14.0, 19.0, 14.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.24609375, -1.19964599609375, -1.1531982421875, -1.10675048828125, -1.060302734375, -1.01385498046875, -0.9674072265625, -0.92095947265625, -0.87451171875, -0.82806396484375, -0.7816162109375, -0.73516845703125, -0.688720703125, -0.64227294921875, -0.5958251953125, -0.54937744140625, -0.5029296875, -0.45648193359375, -0.4100341796875, -0.36358642578125, -0.317138671875, -0.27069091796875, -0.2242431640625, -0.17779541015625, -0.13134765625, -0.08489990234375, -0.0384521484375, 0.00799560546875, 0.054443359375, 0.10089111328125, 0.1473388671875, 0.19378662109375, 0.240234375, 0.28668212890625, 0.3331298828125, 0.37957763671875, 0.426025390625, 0.47247314453125, 0.5189208984375, 0.56536865234375, 0.61181640625, 0.65826416015625, 0.7047119140625, 0.75115966796875, 0.797607421875, 0.84405517578125, 0.8905029296875, 0.93695068359375, 0.9833984375, 1.02984619140625, 1.0762939453125, 1.12274169921875, 1.169189453125, 1.21563720703125, 1.2620849609375, 1.30853271484375, 1.35498046875, 1.40142822265625, 1.4478759765625, 1.49432373046875, 1.540771484375, 1.58721923828125, 1.6336669921875, 1.68011474609375, 1.7265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 12.0, 39.0, 97.0, 222.0, 311.0, 186.0, 71.0, 34.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.68231201171875, -9.05036449432373, -8.418416976928711, -7.786470413208008, -7.154522895812988, -6.522575378417969, -5.890628337860107, -5.258681297302246, -4.626733779907227, -3.994786500930786, -3.3628392219543457, -2.7308919429779053, -2.098944664001465, -1.4669973850250244, -0.835050106048584, -0.20310306549072266, 0.4288444519042969, 1.0607917308807373, 1.6927390098571777, 2.324686288833618, 2.9566335678100586, 3.588580846786499, 4.2205281257629395, 4.852475166320801, 5.48442268371582, 6.11637020111084, 6.748317241668701, 7.3802642822265625, 8.012211799621582, 8.644159317016602, 9.276105880737305, 9.908053398132324, 10.540002822875977, 11.171950340270996, 11.803897857666016, 12.435844421386719, 13.067791938781738, 13.699739456176758, 14.331686019897461, 14.96363353729248, 15.5955810546875, 16.227527618408203, 16.85947608947754, 17.491422653198242, 18.123371124267578, 18.75531768798828, 19.387264251708984, 20.019210815429688, 20.651159286499023, 21.283105850219727, 21.915054321289062, 22.547000885009766, 23.17894744873047, 23.810895919799805, 24.442842483520508, 25.074790954589844, 25.706737518310547, 26.33868408203125, 26.970632553100586, 27.60257911682129, 28.234527587890625, 28.866474151611328, 29.49842071533203, 30.130367279052734, 30.76231575012207]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 8.0, 12.0, 17.0, 15.0, 22.0, 26.0, 27.0, 33.0, 35.0, 43.0, 38.0, 38.0, 49.0, 46.0, 56.0, 51.0, 55.0, 58.0, 48.0, 48.0, 42.0, 37.0, 35.0, 28.0, 27.0, 16.0, 13.0, 12.0, 9.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.846559524536133, -6.65513277053833, -6.4637064933776855, -6.272279739379883, -6.080853462219238, -5.8894267082214355, -5.697999954223633, -5.506573677062988, -5.315147399902344, -5.123720645904541, -4.9322943687438965, -4.740867614746094, -4.549441337585449, -4.3580145835876465, -4.166587829589844, -3.975161552429199, -3.7837347984313965, -3.592308282852173, -3.400881767272949, -3.2094550132751465, -3.018028736114502, -2.826601982116699, -2.6351754665374756, -2.443748950958252, -2.2523224353790283, -2.0608959197998047, -1.869469404220581, -1.6780427694320679, -1.4866162538528442, -1.2951897382736206, -1.1037631034851074, -0.9123365879058838, -0.7209100723266602, -0.5294835567474365, -0.3380569815635681, -0.1466304063796997, 0.044796109199523926, 0.23622262477874756, 0.42764925956726074, 0.6190757751464844, 0.810502290725708, 1.0019288063049316, 1.1933553218841553, 1.3847819566726685, 1.576208472251892, 1.7676349878311157, 1.959061622619629, 2.1504881381988525, 2.341914653778076, 2.5333411693573, 2.7247676849365234, 2.916194438934326, 3.1076207160949707, 3.2990474700927734, 3.490473985671997, 3.6819005012512207, 3.8733270168304443, 4.064753532409668, 4.256180286407471, 4.447606563568115, 4.639033317565918, 4.8304595947265625, 5.021886348724365, 5.213313102722168, 5.4047393798828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 9.0, 23.0, 25.0, 34.0, 54.0, 89.0, 134.0, 232.0, 353.0, 674.0, 1142.0, 2273.0, 4501.0, 10153.0, 27148.0, 94496.0, 468676.0, 333001.0, 67954.0, 21144.0, 8215.0, 3886.0, 1863.0, 1022.0, 587.0, 339.0, 170.0, 125.0, 74.0, 46.0, 35.0, 20.0, 18.0, 8.0, 5.0, 9.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.4873504638671875, -1.443450927734375, -1.3995513916015625, -1.35565185546875, -1.3117523193359375, -1.267852783203125, -1.2239532470703125, -1.1800537109375, -1.1361541748046875, -1.092254638671875, -1.0483551025390625, -1.00445556640625, -0.9605560302734375, -0.916656494140625, -0.8727569580078125, -0.828857421875, -0.7849578857421875, -0.741058349609375, -0.6971588134765625, -0.65325927734375, -0.6093597412109375, -0.565460205078125, -0.5215606689453125, -0.4776611328125, -0.4337615966796875, -0.389862060546875, -0.3459625244140625, -0.30206298828125, -0.2581634521484375, -0.214263916015625, -0.1703643798828125, -0.12646484375, -0.0825653076171875, -0.038665771484375, 0.0052337646484375, 0.04913330078125, 0.0930328369140625, 0.136932373046875, 0.1808319091796875, 0.2247314453125, 0.2686309814453125, 0.312530517578125, 0.3564300537109375, 0.40032958984375, 0.4442291259765625, 0.488128662109375, 0.5320281982421875, 0.575927734375, 0.6198272705078125, 0.663726806640625, 0.7076263427734375, 0.75152587890625, 0.7954254150390625, 0.839324951171875, 0.8832244873046875, 0.9271240234375, 0.9710235595703125, 1.014923095703125, 1.0588226318359375, 1.10272216796875, 1.1466217041015625, 1.190521240234375, 1.2344207763671875, 1.2783203125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 4.0, 13.0, 15.0, 16.0, 23.0, 14.0, 25.0, 29.0, 43.0, 39.0, 41.0, 46.0, 56.0, 54.0, 47.0, 55.0, 46.0, 43.0, 52.0, 45.0, 36.0, 34.0, 40.0, 29.0, 30.0, 29.0, 17.0, 16.0, 16.0, 9.0, 7.0, 12.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.54736328125, -0.5327873229980469, -0.5182113647460938, -0.5036354064941406, -0.4890594482421875, -0.4744834899902344, -0.45990753173828125, -0.4453315734863281, -0.430755615234375, -0.4161796569824219, -0.40160369873046875, -0.3870277404785156, -0.3724517822265625, -0.3578758239746094, -0.34329986572265625, -0.3287239074707031, -0.31414794921875, -0.2995719909667969, -0.28499603271484375, -0.2704200744628906, -0.2558441162109375, -0.24126815795898438, -0.22669219970703125, -0.21211624145507812, -0.197540283203125, -0.18296432495117188, -0.16838836669921875, -0.15381240844726562, -0.1392364501953125, -0.12466049194335938, -0.11008453369140625, -0.09550857543945312, -0.0809326171875, -0.06635665893554688, -0.05178070068359375, -0.037204742431640625, -0.0226287841796875, -0.008052825927734375, 0.00652313232421875, 0.021099090576171875, 0.035675048828125, 0.050251007080078125, 0.06482696533203125, 0.07940292358398438, 0.0939788818359375, 0.10855484008789062, 0.12313079833984375, 0.13770675659179688, 0.15228271484375, 0.16685867309570312, 0.18143463134765625, 0.19601058959960938, 0.2105865478515625, 0.22516250610351562, 0.23973846435546875, 0.2543144226074219, 0.268890380859375, 0.2834663391113281, 0.29804229736328125, 0.3126182556152344, 0.3271942138671875, 0.3417701721191406, 0.35634613037109375, 0.3709220886230469, 0.385498046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 16.0, 13.0, 21.0, 25.0, 47.0, 47.0, 82.0, 118.0, 215.0, 345.0, 762.0, 1710.0, 5288.0, 25441.0, 297594.0, 665959.0, 39486.0, 7181.0, 2188.0, 859.0, 453.0, 234.0, 146.0, 98.0, 55.0, 48.0, 31.0, 28.0, 18.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.376739501953125, -2.30035400390625, -2.223968505859375, -2.1475830078125, -2.071197509765625, -1.99481201171875, -1.918426513671875, -1.842041015625, -1.765655517578125, -1.68927001953125, -1.612884521484375, -1.5364990234375, -1.460113525390625, -1.38372802734375, -1.307342529296875, -1.23095703125, -1.154571533203125, -1.07818603515625, -1.001800537109375, -0.9254150390625, -0.849029541015625, -0.77264404296875, -0.696258544921875, -0.619873046875, -0.543487548828125, -0.46710205078125, -0.390716552734375, -0.3143310546875, -0.237945556640625, -0.16156005859375, -0.085174560546875, -0.0087890625, 0.067596435546875, 0.14398193359375, 0.220367431640625, 0.2967529296875, 0.373138427734375, 0.44952392578125, 0.525909423828125, 0.602294921875, 0.678680419921875, 0.75506591796875, 0.831451416015625, 0.9078369140625, 0.984222412109375, 1.06060791015625, 1.136993408203125, 1.21337890625, 1.289764404296875, 1.36614990234375, 1.442535400390625, 1.5189208984375, 1.595306396484375, 1.67169189453125, 1.748077392578125, 1.824462890625, 1.900848388671875, 1.97723388671875, 2.053619384765625, 2.1300048828125, 2.206390380859375, 2.28277587890625, 2.359161376953125, 2.435546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 4.0, 7.0, 10.0, 14.0, 21.0, 19.0, 24.0, 28.0, 31.0, 37.0, 30.0, 39.0, 43.0, 70.0, 54.0, 74.0, 57.0, 61.0, 53.0, 48.0, 46.0, 44.0, 34.0, 24.0, 31.0, 22.0, 18.0, 15.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.012237548828125, -1.94244384765625, -1.872650146484375, -1.8028564453125, -1.733062744140625, -1.66326904296875, -1.593475341796875, -1.523681640625, -1.453887939453125, -1.38409423828125, -1.314300537109375, -1.2445068359375, -1.174713134765625, -1.10491943359375, -1.035125732421875, -0.96533203125, -0.895538330078125, -0.82574462890625, -0.755950927734375, -0.6861572265625, -0.616363525390625, -0.54656982421875, -0.476776123046875, -0.406982421875, -0.337188720703125, -0.26739501953125, -0.197601318359375, -0.1278076171875, -0.058013916015625, 0.01177978515625, 0.081573486328125, 0.1513671875, 0.221160888671875, 0.29095458984375, 0.360748291015625, 0.4305419921875, 0.500335693359375, 0.57012939453125, 0.639923095703125, 0.709716796875, 0.779510498046875, 0.84930419921875, 0.919097900390625, 0.9888916015625, 1.058685302734375, 1.12847900390625, 1.198272705078125, 1.26806640625, 1.337860107421875, 1.40765380859375, 1.477447509765625, 1.5472412109375, 1.617034912109375, 1.68682861328125, 1.756622314453125, 1.826416015625, 1.896209716796875, 1.96600341796875, 2.035797119140625, 2.1055908203125, 2.175384521484375, 2.24517822265625, 2.314971923828125, 2.384765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 9.0, 3.0, 9.0, 15.0, 21.0, 32.0, 71.0, 168.0, 717.0, 5135.0, 396493.0, 638772.0, 5966.0, 760.0, 204.0, 79.0, 48.0, 21.0, 11.0, 12.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.776580810546875, -2.68988037109375, -2.603179931640625, -2.5164794921875, -2.429779052734375, -2.34307861328125, -2.256378173828125, -2.169677734375, -2.082977294921875, -1.99627685546875, -1.909576416015625, -1.8228759765625, -1.736175537109375, -1.64947509765625, -1.562774658203125, -1.47607421875, -1.389373779296875, -1.30267333984375, -1.215972900390625, -1.1292724609375, -1.042572021484375, -0.95587158203125, -0.869171142578125, -0.782470703125, -0.695770263671875, -0.60906982421875, -0.522369384765625, -0.4356689453125, -0.348968505859375, -0.26226806640625, -0.175567626953125, -0.0888671875, -0.002166748046875, 0.08453369140625, 0.171234130859375, 0.2579345703125, 0.344635009765625, 0.43133544921875, 0.518035888671875, 0.604736328125, 0.691436767578125, 0.77813720703125, 0.864837646484375, 0.9515380859375, 1.038238525390625, 1.12493896484375, 1.211639404296875, 1.29833984375, 1.385040283203125, 1.47174072265625, 1.558441162109375, 1.6451416015625, 1.731842041015625, 1.81854248046875, 1.905242919921875, 1.991943359375, 2.078643798828125, 2.16534423828125, 2.252044677734375, 2.3387451171875, 2.425445556640625, 2.51214599609375, 2.598846435546875, 2.685546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 8.0, 12.0, 10.0, 12.0, 17.0, 24.0, 48.0, 72.0, 96.0, 140.0, 155.0, 121.0, 68.0, 60.0, 24.0, 29.0, 14.0, 18.0, 14.0, 9.0, 9.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00020754337310791016, -0.00020165927708148956, -0.00019577518105506897, -0.00018989108502864838, -0.00018400698900222778, -0.0001781228929758072, -0.0001722387969493866, -0.000166354700922966, -0.0001604706048965454, -0.00015458650887012482, -0.00014870241284370422, -0.00014281831681728363, -0.00013693422079086304, -0.00013105012476444244, -0.00012516602873802185, -0.00011928193271160126, -0.00011339783668518066, -0.00010751374065876007, -0.00010162964463233948, -9.574554860591888e-05, -8.986145257949829e-05, -8.39773565530777e-05, -7.80932605266571e-05, -7.220916450023651e-05, -6.632506847381592e-05, -6.0440972447395325e-05, -5.455687642097473e-05, -4.867278039455414e-05, -4.2788684368133545e-05, -3.690458834171295e-05, -3.102049231529236e-05, -2.5136396288871765e-05, -1.9252300262451172e-05, -1.3368204236030579e-05, -7.484108209609985e-06, -1.600012183189392e-06, 4.284083843231201e-06, 1.0168179869651794e-05, 1.6052275896072388e-05, 2.193637192249298e-05, 2.7820467948913574e-05, 3.370456397533417e-05, 3.958866000175476e-05, 4.5472756028175354e-05, 5.135685205459595e-05, 5.724094808101654e-05, 6.312504410743713e-05, 6.900914013385773e-05, 7.489323616027832e-05, 8.077733218669891e-05, 8.666142821311951e-05, 9.25455242395401e-05, 9.84296202659607e-05, 0.00010431371629238129, 0.00011019781231880188, 0.00011608190834522247, 0.00012196600437164307, 0.00012785010039806366, 0.00013373419642448425, 0.00013961829245090485, 0.00014550238847732544, 0.00015138648450374603, 0.00015727058053016663, 0.00016315467655658722, 0.0001690387725830078]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 12.0, 11.0, 37.0, 39.0, 81.0, 127.0, 226.0, 519.0, 1403.0, 6024.0, 68075.0, 914594.0, 49901.0, 5158.0, 1321.0, 487.0, 233.0, 122.0, 69.0, 37.0, 30.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.904296875, -1.85345458984375, -1.8026123046875, -1.75177001953125, -1.700927734375, -1.65008544921875, -1.5992431640625, -1.54840087890625, -1.49755859375, -1.44671630859375, -1.3958740234375, -1.34503173828125, -1.294189453125, -1.24334716796875, -1.1925048828125, -1.14166259765625, -1.0908203125, -1.03997802734375, -0.9891357421875, -0.93829345703125, -0.887451171875, -0.83660888671875, -0.7857666015625, -0.73492431640625, -0.68408203125, -0.63323974609375, -0.5823974609375, -0.53155517578125, -0.480712890625, -0.42987060546875, -0.3790283203125, -0.32818603515625, -0.27734375, -0.22650146484375, -0.1756591796875, -0.12481689453125, -0.073974609375, -0.02313232421875, 0.0277099609375, 0.07855224609375, 0.12939453125, 0.18023681640625, 0.2310791015625, 0.28192138671875, 0.332763671875, 0.38360595703125, 0.4344482421875, 0.48529052734375, 0.5361328125, 0.58697509765625, 0.6378173828125, 0.68865966796875, 0.739501953125, 0.79034423828125, 0.8411865234375, 0.89202880859375, 0.94287109375, 0.99371337890625, 1.0445556640625, 1.09539794921875, 1.146240234375, 1.19708251953125, 1.2479248046875, 1.29876708984375, 1.349609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 1.0, 5.0, 16.0, 7.0, 9.0, 12.0, 23.0, 23.0, 19.0, 31.0, 42.0, 65.0, 52.0, 69.0, 85.0, 66.0, 69.0, 81.0, 47.0, 49.0, 33.0, 29.0, 32.0, 25.0, 17.0, 11.0, 14.0, 6.0, 9.0, 5.0, 9.0, 7.0, 2.0, 4.0, 2.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5776824951171875, -0.558197021484375, -0.5387115478515625, -0.51922607421875, -0.4997406005859375, -0.480255126953125, -0.4607696533203125, -0.4412841796875, -0.4217987060546875, -0.402313232421875, -0.3828277587890625, -0.36334228515625, -0.3438568115234375, -0.324371337890625, -0.3048858642578125, -0.285400390625, -0.2659149169921875, -0.246429443359375, -0.2269439697265625, -0.20745849609375, -0.1879730224609375, -0.168487548828125, -0.1490020751953125, -0.1295166015625, -0.1100311279296875, -0.090545654296875, -0.0710601806640625, -0.05157470703125, -0.0320892333984375, -0.012603759765625, 0.0068817138671875, 0.0263671875, 0.0458526611328125, 0.065338134765625, 0.0848236083984375, 0.10430908203125, 0.1237945556640625, 0.143280029296875, 0.1627655029296875, 0.1822509765625, 0.2017364501953125, 0.221221923828125, 0.2407073974609375, 0.26019287109375, 0.2796783447265625, 0.299163818359375, 0.3186492919921875, 0.338134765625, 0.3576202392578125, 0.377105712890625, 0.3965911865234375, 0.41607666015625, 0.4355621337890625, 0.455047607421875, 0.4745330810546875, 0.4940185546875, 0.5135040283203125, 0.532989501953125, 0.5524749755859375, 0.57196044921875, 0.5914459228515625, 0.610931396484375, 0.6304168701171875, 0.64990234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 16.0, 18.0, 57.0, 134.0, 242.0, 312.0, 135.0, 43.0, 19.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.01019287109375, -37.2553825378418, -36.500572204589844, -35.74576187133789, -34.99095153808594, -34.23614501953125, -33.48133087158203, -32.726524353027344, -31.97171401977539, -31.216903686523438, -30.462093353271484, -29.70728302001953, -28.95247459411621, -28.197664260864258, -27.442853927612305, -26.68804359436035, -25.9332332611084, -25.178422927856445, -24.423612594604492, -23.668804168701172, -22.91399383544922, -22.159183502197266, -21.404373168945312, -20.64956283569336, -19.894752502441406, -19.139942169189453, -18.3851318359375, -17.630321502685547, -16.875513076782227, -16.120702743530273, -15.36589241027832, -14.611082077026367, -13.856271743774414, -13.101461410522461, -12.346652030944824, -11.591841697692871, -10.837032318115234, -10.082221984863281, -9.327411651611328, -8.572601318359375, -7.817791938781738, -7.062982082366943, -6.308172225952148, -5.553361892700195, -4.7985520362854, -4.0437421798706055, -3.2889318466186523, -2.5341219902038574, -1.7793121337890625, -1.024502158164978, -0.26969218254089355, 0.48511791229248047, 1.2399277687072754, 1.9947376251220703, 2.7495479583740234, 3.5043578147888184, 4.259167671203613, 5.013977527618408, 5.768787384033203, 6.523597717285156, 7.278407573699951, 8.033217430114746, 8.7880277633667, 9.542837142944336, 10.297647476196289]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 16.0, 17.0, 27.0, 19.0, 30.0, 23.0, 31.0, 29.0, 48.0, 64.0, 51.0, 59.0, 54.0, 61.0, 53.0, 43.0, 37.0, 39.0, 52.0, 27.0, 26.0, 22.0, 24.0, 23.0, 19.0, 12.0, 9.0, 5.0, 6.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.124910354614258, -8.862466812133789, -8.600022315979004, -8.337578773498535, -8.07513427734375, -7.812690734863281, -7.5502471923828125, -7.2878031730651855, -7.025359153747559, -6.762915134429932, -6.500471115112305, -6.238027572631836, -5.975583553314209, -5.713139533996582, -5.450695991516113, -5.188251972198486, -4.925807952880859, -4.663363933563232, -4.4009199142456055, -4.138476371765137, -3.8760323524475098, -3.613588333129883, -3.351144552230835, -3.088700771331787, -2.82625675201416, -2.563812732696533, -2.3013689517974854, -2.0389251708984375, -1.7764811515808105, -1.5140372514724731, -1.2515933513641357, -0.9891494512557983, -0.7267045974731445, -0.46426069736480713, -0.20181679725646973, 0.060627102851867676, 0.3230710029602051, 0.5855149030685425, 0.8479588031768799, 1.1104027032852173, 1.3728466033935547, 1.635290503501892, 1.8977344036102295, 2.1601781845092773, 2.4226222038269043, 2.6850662231445312, 2.947510004043579, 3.209953784942627, 3.472397804260254, 3.734841823577881, 3.9972856044769287, 4.259729385375977, 4.5221734046936035, 4.7846174240112305, 5.047060966491699, 5.309504985809326, 5.571949005126953, 5.83439302444458, 6.096837043762207, 6.359280586242676, 6.621724605560303, 6.88416862487793, 7.146612167358398, 7.409056186676025, 7.671500205993652]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 13.0, 12.0, 16.0, 28.0, 34.0, 52.0, 81.0, 112.0, 161.0, 263.0, 421.0, 664.0, 1029.0, 1929.0, 3536.0, 6724.0, 13892.0, 31428.0, 83120.0, 345183.0, 2297672.0, 1133898.0, 175549.0, 53989.0, 22237.0, 10200.0, 5256.0, 2707.0, 1557.0, 916.0, 531.0, 339.0, 226.0, 157.0, 95.0, 93.0, 41.0, 34.0, 20.0, 13.0, 10.0, 6.0, 9.0, 5.0, 7.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.70654296875, -0.68499755859375, -0.6634521484375, -0.64190673828125, -0.620361328125, -0.59881591796875, -0.5772705078125, -0.55572509765625, -0.5341796875, -0.51263427734375, -0.4910888671875, -0.46954345703125, -0.447998046875, -0.42645263671875, -0.4049072265625, -0.38336181640625, -0.36181640625, -0.34027099609375, -0.3187255859375, -0.29718017578125, -0.275634765625, -0.25408935546875, -0.2325439453125, -0.21099853515625, -0.189453125, -0.16790771484375, -0.1463623046875, -0.12481689453125, -0.103271484375, -0.08172607421875, -0.0601806640625, -0.03863525390625, -0.01708984375, 0.00445556640625, 0.0260009765625, 0.04754638671875, 0.069091796875, 0.09063720703125, 0.1121826171875, 0.13372802734375, 0.1552734375, 0.17681884765625, 0.1983642578125, 0.21990966796875, 0.241455078125, 0.26300048828125, 0.2845458984375, 0.30609130859375, 0.32763671875, 0.34918212890625, 0.3707275390625, 0.39227294921875, 0.413818359375, 0.43536376953125, 0.4569091796875, 0.47845458984375, 0.5, 0.52154541015625, 0.5430908203125, 0.56463623046875, 0.586181640625, 0.60772705078125, 0.6292724609375, 0.65081787109375, 0.67236328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 9.0, 16.0, 9.0, 16.0, 16.0, 20.0, 13.0, 33.0, 35.0, 28.0, 37.0, 51.0, 48.0, 30.0, 47.0, 52.0, 60.0, 64.0, 48.0, 44.0, 49.0, 34.0, 44.0, 25.0, 30.0, 26.0, 21.0, 10.0, 15.0, 7.0, 13.0, 11.0, 14.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466064453125, -0.4527702331542969, -0.43947601318359375, -0.4261817932128906, -0.4128875732421875, -0.3995933532714844, -0.38629913330078125, -0.3730049133300781, -0.359710693359375, -0.3464164733886719, -0.33312225341796875, -0.3198280334472656, -0.3065338134765625, -0.2932395935058594, -0.27994537353515625, -0.2666511535644531, -0.25335693359375, -0.24006271362304688, -0.22676849365234375, -0.21347427368164062, -0.2001800537109375, -0.18688583374023438, -0.17359161376953125, -0.16029739379882812, -0.147003173828125, -0.13370895385742188, -0.12041473388671875, -0.10712051391601562, -0.0938262939453125, -0.08053207397460938, -0.06723785400390625, -0.053943634033203125, -0.0406494140625, -0.027355194091796875, -0.01406097412109375, -0.000766754150390625, 0.0125274658203125, 0.025821685791015625, 0.03911590576171875, 0.052410125732421875, 0.065704345703125, 0.07899856567382812, 0.09229278564453125, 0.10558700561523438, 0.1188812255859375, 0.13217544555664062, 0.14546966552734375, 0.15876388549804688, 0.17205810546875, 0.18535232543945312, 0.19864654541015625, 0.21194076538085938, 0.2252349853515625, 0.23852920532226562, 0.25182342529296875, 0.2651176452636719, 0.278411865234375, 0.2917060852050781, 0.30500030517578125, 0.3182945251464844, 0.3315887451171875, 0.3448829650878906, 0.35817718505859375, 0.3714714050292969, 0.384765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 16.0, 26.0, 40.0, 44.0, 84.0, 139.0, 207.0, 395.0, 551.0, 1145.0, 2083.0, 4696.0, 12749.0, 44664.0, 274375.0, 3416512.0, 357839.0, 52541.0, 15035.0, 5666.0, 2508.0, 1275.0, 647.0, 380.0, 227.0, 157.0, 82.0, 57.0, 32.0, 28.0, 21.0, 6.0, 10.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4851531982421875, -1.438079833984375, -1.3910064697265625, -1.34393310546875, -1.2968597412109375, -1.249786376953125, -1.2027130126953125, -1.1556396484375, -1.1085662841796875, -1.061492919921875, -1.0144195556640625, -0.96734619140625, -0.9202728271484375, -0.873199462890625, -0.8261260986328125, -0.779052734375, -0.7319793701171875, -0.684906005859375, -0.6378326416015625, -0.59075927734375, -0.5436859130859375, -0.496612548828125, -0.4495391845703125, -0.4024658203125, -0.3553924560546875, -0.308319091796875, -0.2612457275390625, -0.21417236328125, -0.1670989990234375, -0.120025634765625, -0.0729522705078125, -0.02587890625, 0.0211944580078125, 0.068267822265625, 0.1153411865234375, 0.16241455078125, 0.2094879150390625, 0.256561279296875, 0.3036346435546875, 0.3507080078125, 0.3977813720703125, 0.444854736328125, 0.4919281005859375, 0.53900146484375, 0.5860748291015625, 0.633148193359375, 0.6802215576171875, 0.727294921875, 0.7743682861328125, 0.821441650390625, 0.8685150146484375, 0.91558837890625, 0.9626617431640625, 1.009735107421875, 1.0568084716796875, 1.1038818359375, 1.1509552001953125, 1.198028564453125, 1.2451019287109375, 1.29217529296875, 1.3392486572265625, 1.386322021484375, 1.4333953857421875, 1.48046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 9.0, 8.0, 14.0, 18.0, 16.0, 41.0, 62.0, 78.0, 128.0, 188.0, 335.0, 634.0, 956.0, 639.0, 318.0, 184.0, 112.0, 86.0, 49.0, 27.0, 36.0, 24.0, 17.0, 15.0, 13.0, 10.0, 6.0, 3.0, 3.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4310302734375, -1.382568359375, -1.3341064453125, -1.28564453125, -1.2371826171875, -1.188720703125, -1.1402587890625, -1.091796875, -1.0433349609375, -0.994873046875, -0.9464111328125, -0.89794921875, -0.8494873046875, -0.801025390625, -0.7525634765625, -0.7041015625, -0.6556396484375, -0.607177734375, -0.5587158203125, -0.51025390625, -0.4617919921875, -0.413330078125, -0.3648681640625, -0.31640625, -0.2679443359375, -0.219482421875, -0.1710205078125, -0.12255859375, -0.0740966796875, -0.025634765625, 0.0228271484375, 0.0712890625, 0.1197509765625, 0.168212890625, 0.2166748046875, 0.26513671875, 0.3135986328125, 0.362060546875, 0.4105224609375, 0.458984375, 0.5074462890625, 0.555908203125, 0.6043701171875, 0.65283203125, 0.7012939453125, 0.749755859375, 0.7982177734375, 0.8466796875, 0.8951416015625, 0.943603515625, 0.9920654296875, 1.04052734375, 1.0889892578125, 1.137451171875, 1.1859130859375, 1.234375, 1.2828369140625, 1.331298828125, 1.3797607421875, 1.42822265625, 1.4766845703125, 1.525146484375, 1.5736083984375, 1.6220703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 8.0, 23.0, 46.0, 234.0, 410.0, 193.0, 49.0, 20.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-51.32756805419922, -50.32958984375, -49.33161163330078, -48.33363342285156, -47.335655212402344, -46.337677001953125, -45.339698791503906, -44.34172058105469, -43.34374237060547, -42.34576416015625, -41.34778594970703, -40.34980773925781, -39.351829528808594, -38.353851318359375, -37.355873107910156, -36.35789489746094, -35.35991668701172, -34.3619384765625, -33.36396026611328, -32.36598205566406, -31.368003845214844, -30.370025634765625, -29.372047424316406, -28.374069213867188, -27.376087188720703, -26.378108978271484, -25.380130767822266, -24.382152557373047, -23.384174346923828, -22.38619613647461, -21.38821792602539, -20.390239715576172, -19.392263412475586, -18.394285202026367, -17.39630699157715, -16.39832878112793, -15.400350570678711, -14.402372360229492, -13.404393196105957, -12.406414985656738, -11.40843677520752, -10.4104585647583, -9.412480354309082, -8.414501190185547, -7.416523456573486, -6.418545246124268, -5.420566558837891, -4.422588348388672, -3.424610137939453, -2.4266319274902344, -1.4286534786224365, -0.43067502975463867, 0.5673031806945801, 1.5652813911437988, 2.563260078430176, 3.5612382888793945, 4.559216499328613, 5.557194709777832, 6.555172920227051, 7.553151607513428, 8.551130294799805, 9.549108505249023, 10.547086715698242, 11.545064926147461, 12.54304313659668]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 4.0, 9.0, 2.0, 14.0, 16.0, 8.0, 16.0, 17.0, 19.0, 30.0, 32.0, 41.0, 38.0, 32.0, 35.0, 43.0, 46.0, 57.0, 47.0, 52.0, 51.0, 52.0, 41.0, 41.0, 35.0, 28.0, 27.0, 20.0, 28.0, 20.0, 12.0, 23.0, 14.0, 10.0, 8.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.792963027954102, -5.57534646987915, -5.357730388641357, -5.140113830566406, -4.922497749328613, -4.704881191253662, -4.487264633178711, -4.269648551940918, -4.052031993865967, -3.8344156742095947, -3.6167993545532227, -3.3991827964782715, -3.1815664768218994, -2.9639501571655273, -2.746333599090576, -2.528717279434204, -2.311100959777832, -2.09348464012146, -1.8758682012557983, -1.6582517623901367, -1.4406354427337646, -1.2230191230773926, -1.005402684211731, -0.7877862453460693, -0.5701699256896973, -0.3525535464286804, -0.13493716716766357, 0.08267921209335327, 0.3002955913543701, 0.5179119110107422, 0.7355283498764038, 0.9531447887420654, 1.1707611083984375, 1.3883774280548096, 1.6059938669204712, 1.8236103057861328, 2.041226625442505, 2.258842945098877, 2.476459503173828, 2.6940758228302, 2.9116921424865723, 3.1293084621429443, 3.3469247817993164, 3.5645413398742676, 3.7821576595306396, 3.9997739791870117, 4.217390537261963, 4.435007095336914, 4.652623176574707, 4.870239734649658, 5.087855815887451, 5.305472373962402, 5.523088455200195, 5.7407050132751465, 5.958321571350098, 6.175937652587891, 6.393554210662842, 6.611170768737793, 6.828786849975586, 7.046403408050537, 7.264019966125488, 7.481636047363281, 7.699252605438232, 7.916869163513184, 8.134485244750977]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 12.0, 10.0, 19.0, 24.0, 23.0, 33.0, 65.0, 93.0, 129.0, 245.0, 392.0, 626.0, 1088.0, 1991.0, 3843.0, 8134.0, 19718.0, 51498.0, 147030.0, 431825.0, 249180.0, 79418.0, 29508.0, 12009.0, 5387.0, 2770.0, 1453.0, 766.0, 501.0, 274.0, 172.0, 107.0, 69.0, 48.0, 36.0, 21.0, 6.0, 10.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3408203125, -1.3022003173828125, -1.263580322265625, -1.2249603271484375, -1.18634033203125, -1.1477203369140625, -1.109100341796875, -1.0704803466796875, -1.0318603515625, -0.9932403564453125, -0.954620361328125, -0.9160003662109375, -0.87738037109375, -0.8387603759765625, -0.800140380859375, -0.7615203857421875, -0.722900390625, -0.6842803955078125, -0.645660400390625, -0.6070404052734375, -0.56842041015625, -0.5298004150390625, -0.491180419921875, -0.4525604248046875, -0.4139404296875, -0.3753204345703125, -0.336700439453125, -0.2980804443359375, -0.25946044921875, -0.2208404541015625, -0.182220458984375, -0.1436004638671875, -0.10498046875, -0.0663604736328125, -0.027740478515625, 0.0108795166015625, 0.04949951171875, 0.0881195068359375, 0.126739501953125, 0.1653594970703125, 0.2039794921875, 0.2425994873046875, 0.281219482421875, 0.3198394775390625, 0.35845947265625, 0.3970794677734375, 0.435699462890625, 0.4743194580078125, 0.512939453125, 0.5515594482421875, 0.590179443359375, 0.6287994384765625, 0.66741943359375, 0.7060394287109375, 0.744659423828125, 0.7832794189453125, 0.8218994140625, 0.8605194091796875, 0.899139404296875, 0.9377593994140625, 0.97637939453125, 1.0149993896484375, 1.053619384765625, 1.0922393798828125, 1.130859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 7.0, 14.0, 8.0, 17.0, 15.0, 17.0, 29.0, 21.0, 32.0, 38.0, 33.0, 46.0, 50.0, 41.0, 51.0, 44.0, 46.0, 48.0, 64.0, 52.0, 45.0, 30.0, 41.0, 28.0, 27.0, 28.0, 24.0, 20.0, 13.0, 12.0, 9.0, 12.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.47292327880859375, -0.4590301513671875, -0.44513702392578125, -0.431243896484375, -0.41735076904296875, -0.4034576416015625, -0.38956451416015625, -0.37567138671875, -0.36177825927734375, -0.3478851318359375, -0.33399200439453125, -0.320098876953125, -0.30620574951171875, -0.2923126220703125, -0.27841949462890625, -0.2645263671875, -0.25063323974609375, -0.2367401123046875, -0.22284698486328125, -0.208953857421875, -0.19506072998046875, -0.1811676025390625, -0.16727447509765625, -0.15338134765625, -0.13948822021484375, -0.1255950927734375, -0.11170196533203125, -0.097808837890625, -0.08391571044921875, -0.0700225830078125, -0.05612945556640625, -0.042236328125, -0.02834320068359375, -0.0144500732421875, -0.00055694580078125, 0.013336181640625, 0.02722930908203125, 0.0411224365234375, 0.05501556396484375, 0.06890869140625, 0.08280181884765625, 0.0966949462890625, 0.11058807373046875, 0.124481201171875, 0.13837432861328125, 0.1522674560546875, 0.16616058349609375, 0.1800537109375, 0.19394683837890625, 0.2078399658203125, 0.22173309326171875, 0.235626220703125, 0.24951934814453125, 0.2634124755859375, 0.27730560302734375, 0.29119873046875, 0.30509185791015625, 0.3189849853515625, 0.33287811279296875, 0.346771240234375, 0.36066436767578125, 0.3745574951171875, 0.38845062255859375, 0.40234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 16.0, 18.0, 26.0, 27.0, 52.0, 78.0, 109.0, 169.0, 290.0, 546.0, 1120.0, 2896.0, 12504.0, 215766.0, 782167.0, 25295.0, 4315.0, 1565.0, 665.0, 340.0, 201.0, 112.0, 73.0, 61.0, 33.0, 20.0, 24.0, 14.0, 14.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2421875, -4.1248779296875, -4.007568359375, -3.8902587890625, -3.77294921875, -3.6556396484375, -3.538330078125, -3.4210205078125, -3.3037109375, -3.1864013671875, -3.069091796875, -2.9517822265625, -2.83447265625, -2.7171630859375, -2.599853515625, -2.4825439453125, -2.365234375, -2.2479248046875, -2.130615234375, -2.0133056640625, -1.89599609375, -1.7786865234375, -1.661376953125, -1.5440673828125, -1.4267578125, -1.3094482421875, -1.192138671875, -1.0748291015625, -0.95751953125, -0.8402099609375, -0.722900390625, -0.6055908203125, -0.48828125, -0.3709716796875, -0.253662109375, -0.1363525390625, -0.01904296875, 0.0982666015625, 0.215576171875, 0.3328857421875, 0.4501953125, 0.5675048828125, 0.684814453125, 0.8021240234375, 0.91943359375, 1.0367431640625, 1.154052734375, 1.2713623046875, 1.388671875, 1.5059814453125, 1.623291015625, 1.7406005859375, 1.85791015625, 1.9752197265625, 2.092529296875, 2.2098388671875, 2.3271484375, 2.4444580078125, 2.561767578125, 2.6790771484375, 2.79638671875, 2.9136962890625, 3.031005859375, 3.1483154296875, 3.265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 12.0, 21.0, 24.0, 26.0, 31.0, 33.0, 39.0, 47.0, 44.0, 55.0, 69.0, 67.0, 62.0, 45.0, 57.0, 52.0, 61.0, 42.0, 25.0, 40.0, 22.0, 24.0, 17.0, 17.0, 19.0, 8.0, 10.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.951171875, -2.87005615234375, -2.7889404296875, -2.70782470703125, -2.626708984375, -2.54559326171875, -2.4644775390625, -2.38336181640625, -2.30224609375, -2.22113037109375, -2.1400146484375, -2.05889892578125, -1.977783203125, -1.89666748046875, -1.8155517578125, -1.73443603515625, -1.6533203125, -1.57220458984375, -1.4910888671875, -1.40997314453125, -1.328857421875, -1.24774169921875, -1.1666259765625, -1.08551025390625, -1.00439453125, -0.92327880859375, -0.8421630859375, -0.76104736328125, -0.679931640625, -0.59881591796875, -0.5177001953125, -0.43658447265625, -0.35546875, -0.27435302734375, -0.1932373046875, -0.11212158203125, -0.031005859375, 0.05010986328125, 0.1312255859375, 0.21234130859375, 0.29345703125, 0.37457275390625, 0.4556884765625, 0.53680419921875, 0.617919921875, 0.69903564453125, 0.7801513671875, 0.86126708984375, 0.9423828125, 1.02349853515625, 1.1046142578125, 1.18572998046875, 1.266845703125, 1.34796142578125, 1.4290771484375, 1.51019287109375, 1.59130859375, 1.67242431640625, 1.7535400390625, 1.83465576171875, 1.915771484375, 1.99688720703125, 2.0780029296875, 2.15911865234375, 2.240234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 10.0, 6.0, 8.0, 11.0, 15.0, 20.0, 21.0, 30.0, 58.0, 73.0, 120.0, 216.0, 367.0, 738.0, 1976.0, 7134.0, 48832.0, 730592.0, 231436.0, 20232.0, 3990.0, 1293.0, 560.0, 298.0, 150.0, 119.0, 72.0, 41.0, 24.0, 31.0, 12.0, 12.0, 7.0, 5.0, 11.0, 1.0, 8.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9228515625, -0.893829345703125, -0.86480712890625, -0.835784912109375, -0.8067626953125, -0.777740478515625, -0.74871826171875, -0.719696044921875, -0.690673828125, -0.661651611328125, -0.63262939453125, -0.603607177734375, -0.5745849609375, -0.545562744140625, -0.51654052734375, -0.487518310546875, -0.45849609375, -0.429473876953125, -0.40045166015625, -0.371429443359375, -0.3424072265625, -0.313385009765625, -0.28436279296875, -0.255340576171875, -0.226318359375, -0.197296142578125, -0.16827392578125, -0.139251708984375, -0.1102294921875, -0.081207275390625, -0.05218505859375, -0.023162841796875, 0.005859375, 0.034881591796875, 0.06390380859375, 0.092926025390625, 0.1219482421875, 0.150970458984375, 0.17999267578125, 0.209014892578125, 0.238037109375, 0.267059326171875, 0.29608154296875, 0.325103759765625, 0.3541259765625, 0.383148193359375, 0.41217041015625, 0.441192626953125, 0.47021484375, 0.499237060546875, 0.52825927734375, 0.557281494140625, 0.5863037109375, 0.615325927734375, 0.64434814453125, 0.673370361328125, 0.702392578125, 0.731414794921875, 0.76043701171875, 0.789459228515625, 0.8184814453125, 0.847503662109375, 0.87652587890625, 0.905548095703125, 0.9345703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 7.0, 14.0, 17.0, 20.0, 23.0, 26.0, 31.0, 42.0, 33.0, 48.0, 70.0, 106.0, 130.0, 100.0, 57.0, 50.0, 35.0, 27.0, 31.0, 30.0, 20.0, 15.0, 13.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019621849060058594, -0.00019081681966781616, -0.0001854151487350464, -0.0001800134778022766, -0.00017461180686950684, -0.00016921013593673706, -0.00016380846500396729, -0.0001584067940711975, -0.00015300512313842773, -0.00014760345220565796, -0.00014220178127288818, -0.0001368001103401184, -0.00013139843940734863, -0.00012599676847457886, -0.00012059509754180908, -0.0001151934266090393, -0.00010979175567626953, -0.00010439008474349976, -9.898841381072998e-05, -9.35867428779602e-05, -8.818507194519043e-05, -8.278340101242065e-05, -7.738173007965088e-05, -7.19800591468811e-05, -6.657838821411133e-05, -6.117671728134155e-05, -5.577504634857178e-05, -5.0373375415802e-05, -4.4971704483032227e-05, -3.957003355026245e-05, -3.4168362617492676e-05, -2.87666916847229e-05, -2.3365020751953125e-05, -1.796334981918335e-05, -1.2561678886413574e-05, -7.160007953643799e-06, -1.7583370208740234e-06, 3.643333911895752e-06, 9.045004844665527e-06, 1.4446675777435303e-05, 1.9848346710205078e-05, 2.5250017642974854e-05, 3.065168857574463e-05, 3.6053359508514404e-05, 4.145503044128418e-05, 4.6856701374053955e-05, 5.225837230682373e-05, 5.7660043239593506e-05, 6.306171417236328e-05, 6.846338510513306e-05, 7.386505603790283e-05, 7.926672697067261e-05, 8.466839790344238e-05, 9.007006883621216e-05, 9.547173976898193e-05, 0.00010087341070175171, 0.00010627508163452148, 0.00011167675256729126, 0.00011707842350006104, 0.0001224800944328308, 0.00012788176536560059, 0.00013328343629837036, 0.00013868510723114014, 0.0001440867781639099, 0.0001494884490966797]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 14.0, 19.0, 14.0, 39.0, 49.0, 104.0, 161.0, 323.0, 687.0, 2015.0, 7302.0, 79792.0, 897205.0, 51779.0, 5957.0, 1744.0, 662.0, 321.0, 137.0, 70.0, 48.0, 36.0, 27.0, 12.0, 5.0, 11.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1586151123046875, -1.122894287109375, -1.0871734619140625, -1.05145263671875, -1.0157318115234375, -0.980010986328125, -0.9442901611328125, -0.9085693359375, -0.8728485107421875, -0.837127685546875, -0.8014068603515625, -0.76568603515625, -0.7299652099609375, -0.694244384765625, -0.6585235595703125, -0.622802734375, -0.5870819091796875, -0.551361083984375, -0.5156402587890625, -0.47991943359375, -0.4441986083984375, -0.408477783203125, -0.3727569580078125, -0.3370361328125, -0.3013153076171875, -0.265594482421875, -0.2298736572265625, -0.19415283203125, -0.1584320068359375, -0.122711181640625, -0.0869903564453125, -0.05126953125, -0.0155487060546875, 0.020172119140625, 0.0558929443359375, 0.09161376953125, 0.1273345947265625, 0.163055419921875, 0.1987762451171875, 0.2344970703125, 0.2702178955078125, 0.305938720703125, 0.3416595458984375, 0.37738037109375, 0.4131011962890625, 0.448822021484375, 0.4845428466796875, 0.520263671875, 0.5559844970703125, 0.591705322265625, 0.6274261474609375, 0.66314697265625, 0.6988677978515625, 0.734588623046875, 0.7703094482421875, 0.8060302734375, 0.8417510986328125, 0.877471923828125, 0.9131927490234375, 0.94891357421875, 0.9846343994140625, 1.020355224609375, 1.0560760498046875, 1.091796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 12.0, 10.0, 10.0, 10.0, 11.0, 27.0, 28.0, 36.0, 51.0, 74.0, 82.0, 92.0, 83.0, 73.0, 85.0, 66.0, 64.0, 50.0, 32.0, 23.0, 19.0, 12.0, 11.0, 3.0, 6.0, 8.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.84912109375, -0.8287086486816406, -0.8082962036132812, -0.7878837585449219, -0.7674713134765625, -0.7470588684082031, -0.7266464233398438, -0.7062339782714844, -0.685821533203125, -0.6654090881347656, -0.6449966430664062, -0.6245841979980469, -0.6041717529296875, -0.5837593078613281, -0.5633468627929688, -0.5429344177246094, -0.52252197265625, -0.5021095275878906, -0.48169708251953125, -0.4612846374511719, -0.4408721923828125, -0.4204597473144531, -0.40004730224609375, -0.3796348571777344, -0.359222412109375, -0.3388099670410156, -0.31839752197265625, -0.2979850769042969, -0.2775726318359375, -0.2571601867675781, -0.23674774169921875, -0.21633529663085938, -0.1959228515625, -0.17551040649414062, -0.15509796142578125, -0.13468551635742188, -0.1142730712890625, -0.09386062622070312, -0.07344818115234375, -0.053035736083984375, -0.032623291015625, -0.012210845947265625, 0.00820159912109375, 0.028614044189453125, 0.0490264892578125, 0.06943893432617188, 0.08985137939453125, 0.11026382446289062, 0.13067626953125, 0.15108871459960938, 0.17150115966796875, 0.19191360473632812, 0.2123260498046875, 0.23273849487304688, 0.25315093994140625, 0.2735633850097656, 0.293975830078125, 0.3143882751464844, 0.33480072021484375, 0.3552131652832031, 0.3756256103515625, 0.3960380554199219, 0.41645050048828125, 0.4368629455566406, 0.457275390625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 19.0, 36.0, 70.0, 154.0, 264.0, 217.0, 118.0, 59.0, 21.0, 13.0, 6.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.8823184967041, -27.300050735473633, -26.717784881591797, -26.135517120361328, -25.55324935913086, -24.970983505249023, -24.388715744018555, -23.80644989013672, -23.22418212890625, -22.64191436767578, -22.059648513793945, -21.477380752563477, -20.895112991333008, -20.312847137451172, -19.730579376220703, -19.148311614990234, -18.566043853759766, -17.983776092529297, -17.40151023864746, -16.819242477416992, -16.236974716186523, -15.654708862304688, -15.072441101074219, -14.490174293518066, -13.907907485961914, -13.325640678405762, -12.743372917175293, -12.16110610961914, -11.578839302062988, -10.996572494506836, -10.414304733276367, -9.832037925720215, -9.249772071838379, -8.667505264282227, -8.085237503051758, -7.5029706954956055, -6.920703887939453, -6.338436603546143, -5.756169319152832, -5.17390251159668, -4.591635227203369, -4.009367942810059, -3.4271011352539062, -2.8448338508605957, -2.2625668048858643, -1.6802997589111328, -1.0980324745178223, -0.5157656669616699, 0.06650161743164062, 0.6487687230110168, 1.231035828590393, 1.813302993774414, 2.3955700397491455, 2.977837085723877, 3.5601043701171875, 4.14237117767334, 4.72463846206665, 5.306905746459961, 5.889172554016113, 6.471439838409424, 7.053707122802734, 7.635973930358887, 8.218240737915039, 8.800508499145508, 9.38277530670166]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 5.0, 5.0, 4.0, 9.0, 9.0, 13.0, 14.0, 16.0, 19.0, 15.0, 27.0, 22.0, 28.0, 27.0, 24.0, 34.0, 37.0, 44.0, 59.0, 57.0, 62.0, 56.0, 47.0, 41.0, 35.0, 37.0, 27.0, 22.0, 19.0, 22.0, 18.0, 22.0, 17.0, 14.0, 15.0, 4.0, 7.0, 9.0, 9.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.732526779174805, -6.518301486968994, -6.304076194763184, -6.089851379394531, -5.875626087188721, -5.66140079498291, -5.447175979614258, -5.232950687408447, -5.018725395202637, -4.804500102996826, -4.590274810791016, -4.376049995422363, -4.161824703216553, -3.947599411010742, -3.7333743572235107, -3.5191493034362793, -3.3049240112304688, -3.090698719024658, -2.8764736652374268, -2.6622486114501953, -2.4480233192443848, -2.233798027038574, -2.0195729732513428, -1.8053478002548218, -1.5911226272583008, -1.3768974542617798, -1.1626722812652588, -0.9484471082687378, -0.7342219352722168, -0.5199967622756958, -0.3057715892791748, -0.09154641628265381, 0.12267875671386719, 0.3369039297103882, 0.5511291027069092, 0.7653542757034302, 0.9795794486999512, 1.1938046216964722, 1.4080297946929932, 1.6222549676895142, 1.8364801406860352, 2.0507054328918457, 2.264930486679077, 2.4791555404663086, 2.693380832672119, 2.9076061248779297, 3.121831178665161, 3.3360562324523926, 3.550281524658203, 3.7645068168640137, 3.978731870651245, 4.192956924438477, 4.407182216644287, 4.621407508850098, 4.83563232421875, 5.0498576164245605, 5.264082908630371, 5.478308200836182, 5.692533493041992, 5.9067583084106445, 6.120983600616455, 6.335208892822266, 6.549433708190918, 6.7636590003967285, 6.977884292602539]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 8.0, 4.0, 17.0, 9.0, 27.0, 28.0, 42.0, 77.0, 103.0, 170.0, 270.0, 506.0, 862.0, 1513.0, 2812.0, 5809.0, 12996.0, 32230.0, 108201.0, 753684.0, 2729723.0, 421838.0, 76711.0, 25375.0, 10491.0, 4924.0, 2521.0, 1310.0, 753.0, 437.0, 275.0, 190.0, 101.0, 77.0, 45.0, 46.0, 28.0, 13.0, 15.0, 4.0, 8.0, 9.0, 11.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.6111068725585938, -0.5879364013671875, -0.5647659301757812, -0.541595458984375, -0.5184249877929688, -0.4952545166015625, -0.47208404541015625, -0.44891357421875, -0.42574310302734375, -0.4025726318359375, -0.37940216064453125, -0.356231689453125, -0.33306121826171875, -0.3098907470703125, -0.28672027587890625, -0.2635498046875, -0.24037933349609375, -0.2172088623046875, -0.19403839111328125, -0.170867919921875, -0.14769744873046875, -0.1245269775390625, -0.10135650634765625, -0.07818603515625, -0.05501556396484375, -0.0318450927734375, -0.00867462158203125, 0.014495849609375, 0.03766632080078125, 0.0608367919921875, 0.08400726318359375, 0.107177734375, 0.13034820556640625, 0.1535186767578125, 0.17668914794921875, 0.199859619140625, 0.22303009033203125, 0.2462005615234375, 0.26937103271484375, 0.29254150390625, 0.31571197509765625, 0.3388824462890625, 0.36205291748046875, 0.385223388671875, 0.40839385986328125, 0.4315643310546875, 0.45473480224609375, 0.4779052734375, 0.5010757446289062, 0.5242462158203125, 0.5474166870117188, 0.570587158203125, 0.5937576293945312, 0.6169281005859375, 0.6400985717773438, 0.66326904296875, 0.6864395141601562, 0.7096099853515625, 0.7327804565429688, 0.755950927734375, 0.7791213989257812, 0.8022918701171875, 0.8254623413085938, 0.8486328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 10.0, 12.0, 7.0, 13.0, 19.0, 16.0, 32.0, 21.0, 35.0, 37.0, 43.0, 37.0, 50.0, 60.0, 47.0, 62.0, 51.0, 49.0, 52.0, 45.0, 37.0, 43.0, 29.0, 28.0, 23.0, 27.0, 17.0, 18.0, 14.0, 12.0, 8.0, 12.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.480712890625, -0.46685791015625, -0.4530029296875, -0.43914794921875, -0.42529296875, -0.41143798828125, -0.3975830078125, -0.38372802734375, -0.369873046875, -0.35601806640625, -0.3421630859375, -0.32830810546875, -0.314453125, -0.30059814453125, -0.2867431640625, -0.27288818359375, -0.259033203125, -0.24517822265625, -0.2313232421875, -0.21746826171875, -0.20361328125, -0.18975830078125, -0.1759033203125, -0.16204833984375, -0.148193359375, -0.13433837890625, -0.1204833984375, -0.10662841796875, -0.0927734375, -0.07891845703125, -0.0650634765625, -0.05120849609375, -0.037353515625, -0.02349853515625, -0.0096435546875, 0.00421142578125, 0.01806640625, 0.03192138671875, 0.0457763671875, 0.05963134765625, 0.073486328125, 0.08734130859375, 0.1011962890625, 0.11505126953125, 0.12890625, 0.14276123046875, 0.1566162109375, 0.17047119140625, 0.184326171875, 0.19818115234375, 0.2120361328125, 0.22589111328125, 0.23974609375, 0.25360107421875, 0.2674560546875, 0.28131103515625, 0.295166015625, 0.30902099609375, 0.3228759765625, 0.33673095703125, 0.3505859375, 0.36444091796875, 0.3782958984375, 0.39215087890625, 0.406005859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 15.0, 20.0, 22.0, 28.0, 54.0, 65.0, 81.0, 141.0, 218.0, 315.0, 498.0, 933.0, 1670.0, 3174.0, 7198.0, 18283.0, 60514.0, 341408.0, 3153870.0, 485610.0, 79159.0, 23508.0, 8858.0, 3808.0, 1957.0, 1078.0, 642.0, 387.0, 244.0, 151.0, 102.0, 86.0, 52.0, 36.0, 24.0, 19.0, 14.0, 6.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9011459350585938, -0.8672332763671875, -0.8333206176757812, -0.799407958984375, -0.7654953002929688, -0.7315826416015625, -0.6976699829101562, -0.66375732421875, -0.6298446655273438, -0.5959320068359375, -0.5620193481445312, -0.528106689453125, -0.49419403076171875, -0.4602813720703125, -0.42636871337890625, -0.3924560546875, -0.35854339599609375, -0.3246307373046875, -0.29071807861328125, -0.256805419921875, -0.22289276123046875, -0.1889801025390625, -0.15506744384765625, -0.12115478515625, -0.08724212646484375, -0.0533294677734375, -0.01941680908203125, 0.014495849609375, 0.04840850830078125, 0.0823211669921875, 0.11623382568359375, 0.150146484375, 0.18405914306640625, 0.2179718017578125, 0.25188446044921875, 0.285797119140625, 0.31970977783203125, 0.3536224365234375, 0.38753509521484375, 0.42144775390625, 0.45536041259765625, 0.4892730712890625, 0.5231857299804688, 0.557098388671875, 0.5910110473632812, 0.6249237060546875, 0.6588363647460938, 0.6927490234375, 0.7266616821289062, 0.7605743408203125, 0.7944869995117188, 0.828399658203125, 0.8623123168945312, 0.8962249755859375, 0.9301376342773438, 0.96405029296875, 0.9979629516601562, 1.0318756103515625, 1.0657882690429688, 1.099700927734375, 1.1336135864257812, 1.1675262451171875, 1.2014389038085938, 1.2353515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 9.0, 8.0, 6.0, 9.0, 11.0, 13.0, 20.0, 21.0, 24.0, 54.0, 86.0, 86.0, 187.0, 303.0, 525.0, 787.0, 758.0, 407.0, 241.0, 144.0, 91.0, 53.0, 46.0, 37.0, 33.0, 21.0, 25.0, 8.0, 20.0, 12.0, 1.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.328125, -1.2863922119140625, -1.244659423828125, -1.2029266357421875, -1.16119384765625, -1.1194610595703125, -1.077728271484375, -1.0359954833984375, -0.9942626953125, -0.9525299072265625, -0.910797119140625, -0.8690643310546875, -0.82733154296875, -0.7855987548828125, -0.743865966796875, -0.7021331787109375, -0.660400390625, -0.6186676025390625, -0.576934814453125, -0.5352020263671875, -0.49346923828125, -0.4517364501953125, -0.410003662109375, -0.3682708740234375, -0.3265380859375, -0.2848052978515625, -0.243072509765625, -0.2013397216796875, -0.15960693359375, -0.1178741455078125, -0.076141357421875, -0.0344085693359375, 0.00732421875, 0.0490570068359375, 0.090789794921875, 0.1325225830078125, 0.17425537109375, 0.2159881591796875, 0.257720947265625, 0.2994537353515625, 0.3411865234375, 0.3829193115234375, 0.424652099609375, 0.4663848876953125, 0.50811767578125, 0.5498504638671875, 0.591583251953125, 0.6333160400390625, 0.675048828125, 0.7167816162109375, 0.758514404296875, 0.8002471923828125, 0.84197998046875, 0.8837127685546875, 0.925445556640625, 0.9671783447265625, 1.0089111328125, 1.0506439208984375, 1.092376708984375, 1.1341094970703125, 1.17584228515625, 1.2175750732421875, 1.259307861328125, 1.3010406494140625, 1.3427734375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 12.0, 12.0, 38.0, 129.0, 222.0, 251.0, 181.0, 80.0, 31.0, 13.0, 12.0, 9.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.166604042053223, -12.61992073059082, -12.073238372802734, -11.526556015014648, -10.979872703552246, -10.433189392089844, -9.886507034301758, -9.339824676513672, -8.79314136505127, -8.246458053588867, -7.699775695800781, -7.153092861175537, -6.606410026550293, -6.059727191925049, -5.513044357299805, -4.9663615226745605, -4.419678688049316, -3.8729958534240723, -3.326313018798828, -2.779630184173584, -2.23294734954834, -1.6862645149230957, -1.1395816802978516, -0.5928988456726074, -0.04621601104736328, 0.5004668235778809, 1.047149658203125, 1.5938324928283691, 2.1405153274536133, 2.6871981620788574, 3.2338809967041016, 3.7805638313293457, 4.327247619628906, 4.87393045425415, 5.4206132888793945, 5.967296123504639, 6.513978958129883, 7.060661792755127, 7.607344627380371, 8.154027938842773, 8.70071029663086, 9.247392654418945, 9.794075965881348, 10.34075927734375, 10.887441635131836, 11.434123992919922, 11.980807304382324, 12.527490615844727, 13.074172973632812, 13.620855331420898, 14.1675386428833, 14.714221954345703, 15.260904312133789, 15.807586669921875, 16.354270935058594, 16.90095329284668, 17.447635650634766, 17.99431800842285, 18.541000366210938, 19.087684631347656, 19.634366989135742, 20.181049346923828, 20.727733612060547, 21.274415969848633, 21.82109832763672]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 4.0, 0.0, 7.0, 8.0, 10.0, 11.0, 19.0, 16.0, 21.0, 25.0, 24.0, 31.0, 44.0, 37.0, 47.0, 45.0, 47.0, 59.0, 54.0, 34.0, 50.0, 55.0, 61.0, 27.0, 30.0, 40.0, 23.0, 21.0, 28.0, 21.0, 23.0, 15.0, 12.0, 10.0, 5.0, 12.0, 9.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.385213375091553, -7.182975769042969, -6.980737686157227, -6.778500080108643, -6.576262474060059, -6.374024868011475, -6.171787261962891, -5.969549179077148, -5.7673115730285645, -5.5650739669799805, -5.362835884094238, -5.160598278045654, -4.95836067199707, -4.756123065948486, -4.553885459899902, -4.35164737701416, -4.149409770965576, -3.947172164916992, -3.744934320449829, -3.542696475982666, -3.340458869934082, -3.138221263885498, -2.935983419418335, -2.733745574951172, -2.531507968902588, -2.329270362854004, -2.127032518386841, -1.9247947931289673, -1.7225570678710938, -1.5203193426132202, -1.3180816173553467, -1.1158438920974731, -0.9136066436767578, -0.7113689184188843, -0.5091311931610107, -0.3068934679031372, -0.10465574264526367, 0.09758198261260986, 0.2998197078704834, 0.5020574331283569, 0.7042951583862305, 0.906532883644104, 1.1087706089019775, 1.311008334159851, 1.5132460594177246, 1.7154837846755981, 1.9177215099334717, 2.1199593544006348, 2.3221969604492188, 2.5244345664978027, 2.726672410964966, 2.928910255432129, 3.131147861480713, 3.333385467529297, 3.53562331199646, 3.737861156463623, 3.940098762512207, 4.142336368560791, 4.344573974609375, 4.546812057495117, 4.749049663543701, 4.951287269592285, 5.153525352478027, 5.355762958526611, 5.558000564575195]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 6.0, 4.0, 4.0, 5.0, 7.0, 16.0, 23.0, 44.0, 78.0, 108.0, 163.0, 275.0, 437.0, 754.0, 1317.0, 2418.0, 4800.0, 10384.0, 24782.0, 74809.0, 338753.0, 437383.0, 97905.0, 29981.0, 12178.0, 5635.0, 2767.0, 1441.0, 810.0, 464.0, 286.0, 174.0, 121.0, 69.0, 54.0, 26.0, 19.0, 17.0, 17.0, 5.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2314453125, -1.1918487548828125, -1.152252197265625, -1.1126556396484375, -1.07305908203125, -1.0334625244140625, -0.993865966796875, -0.9542694091796875, -0.9146728515625, -0.8750762939453125, -0.835479736328125, -0.7958831787109375, -0.75628662109375, -0.7166900634765625, -0.677093505859375, -0.6374969482421875, -0.597900390625, -0.5583038330078125, -0.518707275390625, -0.4791107177734375, -0.43951416015625, -0.3999176025390625, -0.360321044921875, -0.3207244873046875, -0.2811279296875, -0.2415313720703125, -0.201934814453125, -0.1623382568359375, -0.12274169921875, -0.0831451416015625, -0.043548583984375, -0.0039520263671875, 0.03564453125, 0.0752410888671875, 0.114837646484375, 0.1544342041015625, 0.19403076171875, 0.2336273193359375, 0.273223876953125, 0.3128204345703125, 0.3524169921875, 0.3920135498046875, 0.431610107421875, 0.4712066650390625, 0.51080322265625, 0.5503997802734375, 0.589996337890625, 0.6295928955078125, 0.669189453125, 0.7087860107421875, 0.748382568359375, 0.7879791259765625, 0.82757568359375, 0.8671722412109375, 0.906768798828125, 0.9463653564453125, 0.9859619140625, 1.0255584716796875, 1.065155029296875, 1.1047515869140625, 1.14434814453125, 1.1839447021484375, 1.223541259765625, 1.2631378173828125, 1.302734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 6.0, 14.0, 8.0, 14.0, 14.0, 18.0, 21.0, 20.0, 31.0, 32.0, 45.0, 51.0, 45.0, 35.0, 64.0, 62.0, 52.0, 51.0, 60.0, 50.0, 44.0, 36.0, 38.0, 45.0, 16.0, 39.0, 20.0, 17.0, 8.0, 11.0, 7.0, 3.0, 2.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47412109375, -0.4583740234375, -0.442626953125, -0.4268798828125, -0.4111328125, -0.3953857421875, -0.379638671875, -0.3638916015625, -0.34814453125, -0.3323974609375, -0.316650390625, -0.3009033203125, -0.28515625, -0.2694091796875, -0.253662109375, -0.2379150390625, -0.22216796875, -0.2064208984375, -0.190673828125, -0.1749267578125, -0.1591796875, -0.1434326171875, -0.127685546875, -0.1119384765625, -0.09619140625, -0.0804443359375, -0.064697265625, -0.0489501953125, -0.033203125, -0.0174560546875, -0.001708984375, 0.0140380859375, 0.02978515625, 0.0455322265625, 0.061279296875, 0.0770263671875, 0.0927734375, 0.1085205078125, 0.124267578125, 0.1400146484375, 0.15576171875, 0.1715087890625, 0.187255859375, 0.2030029296875, 0.21875, 0.2344970703125, 0.250244140625, 0.2659912109375, 0.28173828125, 0.2974853515625, 0.313232421875, 0.3289794921875, 0.3447265625, 0.3604736328125, 0.376220703125, 0.3919677734375, 0.40771484375, 0.4234619140625, 0.439208984375, 0.4549560546875, 0.470703125, 0.4864501953125, 0.502197265625, 0.5179443359375, 0.53369140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 13.0, 20.0, 21.0, 39.0, 52.0, 86.0, 136.0, 255.0, 462.0, 893.0, 2379.0, 9164.0, 83059.0, 888717.0, 52343.0, 7078.0, 2060.0, 778.0, 385.0, 213.0, 128.0, 92.0, 66.0, 35.0, 24.0, 16.0, 5.0, 5.0, 5.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.206573486328125, -2.11236572265625, -2.018157958984375, -1.9239501953125, -1.829742431640625, -1.73553466796875, -1.641326904296875, -1.547119140625, -1.452911376953125, -1.35870361328125, -1.264495849609375, -1.1702880859375, -1.076080322265625, -0.98187255859375, -0.887664794921875, -0.79345703125, -0.699249267578125, -0.60504150390625, -0.510833740234375, -0.4166259765625, -0.322418212890625, -0.22821044921875, -0.134002685546875, -0.039794921875, 0.054412841796875, 0.14862060546875, 0.242828369140625, 0.3370361328125, 0.431243896484375, 0.52545166015625, 0.619659423828125, 0.7138671875, 0.808074951171875, 0.90228271484375, 0.996490478515625, 1.0906982421875, 1.184906005859375, 1.27911376953125, 1.373321533203125, 1.467529296875, 1.561737060546875, 1.65594482421875, 1.750152587890625, 1.8443603515625, 1.938568115234375, 2.03277587890625, 2.126983642578125, 2.22119140625, 2.315399169921875, 2.40960693359375, 2.503814697265625, 2.5980224609375, 2.692230224609375, 2.78643798828125, 2.880645751953125, 2.974853515625, 3.069061279296875, 3.16326904296875, 3.257476806640625, 3.3516845703125, 3.445892333984375, 3.54010009765625, 3.634307861328125, 3.728515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 7.0, 10.0, 8.0, 10.0, 18.0, 19.0, 15.0, 37.0, 29.0, 42.0, 47.0, 45.0, 46.0, 68.0, 86.0, 67.0, 64.0, 57.0, 44.0, 26.0, 44.0, 35.0, 33.0, 38.0, 20.0, 11.0, 19.0, 16.0, 10.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.57421875, -2.50537109375, -2.4365234375, -2.36767578125, -2.298828125, -2.22998046875, -2.1611328125, -2.09228515625, -2.0234375, -1.95458984375, -1.8857421875, -1.81689453125, -1.748046875, -1.67919921875, -1.6103515625, -1.54150390625, -1.47265625, -1.40380859375, -1.3349609375, -1.26611328125, -1.197265625, -1.12841796875, -1.0595703125, -0.99072265625, -0.921875, -0.85302734375, -0.7841796875, -0.71533203125, -0.646484375, -0.57763671875, -0.5087890625, -0.43994140625, -0.37109375, -0.30224609375, -0.2333984375, -0.16455078125, -0.095703125, -0.02685546875, 0.0419921875, 0.11083984375, 0.1796875, 0.24853515625, 0.3173828125, 0.38623046875, 0.455078125, 0.52392578125, 0.5927734375, 0.66162109375, 0.73046875, 0.79931640625, 0.8681640625, 0.93701171875, 1.005859375, 1.07470703125, 1.1435546875, 1.21240234375, 1.28125, 1.35009765625, 1.4189453125, 1.48779296875, 1.556640625, 1.62548828125, 1.6943359375, 1.76318359375, 1.83203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 2.0, 5.0, 8.0, 10.0, 19.0, 28.0, 26.0, 39.0, 73.0, 101.0, 164.0, 242.0, 486.0, 1141.0, 3156.0, 11660.0, 61718.0, 693246.0, 235825.0, 29862.0, 6878.0, 2104.0, 859.0, 331.0, 189.0, 106.0, 66.0, 51.0, 45.0, 29.0, 28.0, 13.0, 13.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71533203125, -0.6953506469726562, -0.6753692626953125, -0.6553878784179688, -0.635406494140625, -0.6154251098632812, -0.5954437255859375, -0.5754623413085938, -0.55548095703125, -0.5354995727539062, -0.5155181884765625, -0.49553680419921875, -0.475555419921875, -0.45557403564453125, -0.4355926513671875, -0.41561126708984375, -0.3956298828125, -0.37564849853515625, -0.3556671142578125, -0.33568572998046875, -0.315704345703125, -0.29572296142578125, -0.2757415771484375, -0.25576019287109375, -0.23577880859375, -0.21579742431640625, -0.1958160400390625, -0.17583465576171875, -0.155853271484375, -0.13587188720703125, -0.1158905029296875, -0.09590911865234375, -0.075927734375, -0.05594635009765625, -0.0359649658203125, -0.01598358154296875, 0.003997802734375, 0.02397918701171875, 0.0439605712890625, 0.06394195556640625, 0.08392333984375, 0.10390472412109375, 0.1238861083984375, 0.14386749267578125, 0.163848876953125, 0.18383026123046875, 0.2038116455078125, 0.22379302978515625, 0.2437744140625, 0.26375579833984375, 0.2837371826171875, 0.30371856689453125, 0.323699951171875, 0.34368133544921875, 0.3636627197265625, 0.38364410400390625, 0.40362548828125, 0.42360687255859375, 0.4435882568359375, 0.46356964111328125, 0.483551025390625, 0.5035324096679688, 0.5235137939453125, 0.5434951782226562, 0.5634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 3.0, 6.0, 7.0, 10.0, 12.0, 13.0, 13.0, 20.0, 35.0, 55.0, 73.0, 103.0, 122.0, 119.0, 114.0, 70.0, 55.0, 31.0, 25.0, 18.0, 14.0, 12.0, 12.0, 3.0, 7.0, 5.0, 4.0, 0.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017642974853515625, -0.00017168186604976654, -0.00016693398356437683, -0.00016218610107898712, -0.0001574382185935974, -0.0001526903361082077, -0.000147942453622818, -0.00014319457113742828, -0.00013844668865203857, -0.00013369880616664886, -0.00012895092368125916, -0.00012420304119586945, -0.00011945515871047974, -0.00011470727622509003, -0.00010995939373970032, -0.00010521151125431061, -0.0001004636287689209, -9.571574628353119e-05, -9.096786379814148e-05, -8.621998131275177e-05, -8.147209882736206e-05, -7.672421634197235e-05, -7.197633385658264e-05, -6.722845137119293e-05, -6.248056888580322e-05, -5.773268640041351e-05, -5.2984803915023804e-05, -4.8236921429634094e-05, -4.3489038944244385e-05, -3.8741156458854675e-05, -3.3993273973464966e-05, -2.9245391488075256e-05, -2.4497509002685547e-05, -1.9749626517295837e-05, -1.5001744031906128e-05, -1.0253861546516418e-05, -5.505979061126709e-06, -7.580965757369995e-07, 3.98978590965271e-06, 8.73766839504242e-06, 1.3485550880432129e-05, 1.823343336582184e-05, 2.2981315851211548e-05, 2.7729198336601257e-05, 3.247708082199097e-05, 3.7224963307380676e-05, 4.1972845792770386e-05, 4.6720728278160095e-05, 5.1468610763549805e-05, 5.6216493248939514e-05, 6.0964375734329224e-05, 6.571225821971893e-05, 7.046014070510864e-05, 7.520802319049835e-05, 7.995590567588806e-05, 8.470378816127777e-05, 8.945167064666748e-05, 9.419955313205719e-05, 9.89474356174469e-05, 0.00010369531810283661, 0.00010844320058822632, 0.00011319108307361603, 0.00011793896555900574, 0.00012268684804439545, 0.00012743473052978516]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 21.0, 25.0, 37.0, 57.0, 112.0, 145.0, 259.0, 479.0, 957.0, 2087.0, 6143.0, 30894.0, 365745.0, 593396.0, 36665.0, 6944.0, 2297.0, 998.0, 534.0, 264.0, 174.0, 114.0, 48.0, 48.0, 21.0, 14.0, 16.0, 11.0, 5.0, 8.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.76611328125, -0.746490478515625, -0.72686767578125, -0.707244873046875, -0.6876220703125, -0.667999267578125, -0.64837646484375, -0.628753662109375, -0.609130859375, -0.589508056640625, -0.56988525390625, -0.550262451171875, -0.5306396484375, -0.511016845703125, -0.49139404296875, -0.471771240234375, -0.4521484375, -0.432525634765625, -0.41290283203125, -0.393280029296875, -0.3736572265625, -0.354034423828125, -0.33441162109375, -0.314788818359375, -0.295166015625, -0.275543212890625, -0.25592041015625, -0.236297607421875, -0.2166748046875, -0.197052001953125, -0.17742919921875, -0.157806396484375, -0.13818359375, -0.118560791015625, -0.09893798828125, -0.079315185546875, -0.0596923828125, -0.040069580078125, -0.02044677734375, -0.000823974609375, 0.018798828125, 0.038421630859375, 0.05804443359375, 0.077667236328125, 0.0972900390625, 0.116912841796875, 0.13653564453125, 0.156158447265625, 0.17578125, 0.195404052734375, 0.21502685546875, 0.234649658203125, 0.2542724609375, 0.273895263671875, 0.29351806640625, 0.313140869140625, 0.332763671875, 0.352386474609375, 0.37200927734375, 0.391632080078125, 0.4112548828125, 0.430877685546875, 0.45050048828125, 0.470123291015625, 0.48974609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 14.0, 19.0, 19.0, 32.0, 56.0, 99.0, 100.0, 144.0, 133.0, 118.0, 88.0, 55.0, 41.0, 34.0, 21.0, 8.0, 2.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7678298950195312, -0.7446441650390625, -0.7214584350585938, -0.698272705078125, -0.6750869750976562, -0.6519012451171875, -0.6287155151367188, -0.60552978515625, -0.5823440551757812, -0.5591583251953125, -0.5359725952148438, -0.512786865234375, -0.48960113525390625, -0.4664154052734375, -0.44322967529296875, -0.4200439453125, -0.39685821533203125, -0.3736724853515625, -0.35048675537109375, -0.327301025390625, -0.30411529541015625, -0.2809295654296875, -0.25774383544921875, -0.23455810546875, -0.21137237548828125, -0.1881866455078125, -0.16500091552734375, -0.141815185546875, -0.11862945556640625, -0.0954437255859375, -0.07225799560546875, -0.049072265625, -0.02588653564453125, -0.0027008056640625, 0.02048492431640625, 0.043670654296875, 0.06685638427734375, 0.0900421142578125, 0.11322784423828125, 0.13641357421875, 0.15959930419921875, 0.1827850341796875, 0.20597076416015625, 0.229156494140625, 0.25234222412109375, 0.2755279541015625, 0.29871368408203125, 0.3218994140625, 0.34508514404296875, 0.3682708740234375, 0.39145660400390625, 0.414642333984375, 0.43782806396484375, 0.4610137939453125, 0.48419952392578125, 0.50738525390625, 0.5305709838867188, 0.5537567138671875, 0.5769424438476562, 0.600128173828125, 0.6233139038085938, 0.6464996337890625, 0.6696853637695312, 0.69287109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 12.0, 9.0, 28.0, 47.0, 133.0, 201.0, 295.0, 152.0, 67.0, 25.0, 10.0, 10.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.67529296875, -20.13375473022461, -19.59221839904785, -19.05068016052246, -18.509143829345703, -17.967605590820312, -17.426069259643555, -16.884531021118164, -16.342994689941406, -15.801457405090332, -15.259920120239258, -14.718382835388184, -14.17684555053711, -13.635307312011719, -13.093770027160645, -12.55223274230957, -12.01069450378418, -11.469157218933105, -10.927619934082031, -10.386082649230957, -9.844545364379883, -9.303007125854492, -8.761469841003418, -8.219932556152344, -7.6783952713012695, -7.136857986450195, -6.595320701599121, -6.053782939910889, -5.5122456550598145, -4.97070837020874, -4.429170608520508, -3.8876333236694336, -3.3460941314697266, -2.8045568466186523, -2.263019323348999, -1.7214819192886353, -1.1799445152282715, -0.6384072303771973, -0.09686970710754395, 0.4446678161621094, 0.9862051010131836, 1.5277425050735474, 2.069279909133911, 2.6108174324035645, 3.1523547172546387, 3.693892002105713, 4.235429763793945, 4.7769670486450195, 5.318504333496094, 5.860041618347168, 6.401578903198242, 6.943116664886475, 7.484653949737549, 8.026191711425781, 8.567728996276855, 9.10926628112793, 9.650803565979004, 10.192340850830078, 10.733878135681152, 11.275415420532227, 11.816953659057617, 12.358489990234375, 12.900028228759766, 13.44156551361084, 13.983102798461914]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 8.0, 11.0, 6.0, 14.0, 21.0, 20.0, 17.0, 21.0, 34.0, 34.0, 35.0, 44.0, 55.0, 72.0, 64.0, 79.0, 61.0, 79.0, 43.0, 41.0, 43.0, 26.0, 23.0, 18.0, 23.0, 29.0, 15.0, 13.0, 8.0, 3.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.19394588470459, -7.925246238708496, -7.656546592712402, -7.38784646987915, -7.119146823883057, -6.850447177886963, -6.581747055053711, -6.313047409057617, -6.044347763061523, -5.77564811706543, -5.506948471069336, -5.238248348236084, -4.96954870223999, -4.7008490562438965, -4.4321489334106445, -4.163449287414551, -3.894749641418457, -3.6260499954223633, -3.3573501110076904, -3.0886502265930176, -2.819950580596924, -2.55125093460083, -2.2825510501861572, -2.0138511657714844, -1.7451515197753906, -1.4764517545700073, -1.207751989364624, -0.9390522241592407, -0.6703524589538574, -0.4016526937484741, -0.13295292854309082, 0.13574683666229248, 0.4044456481933594, 0.6731454133987427, 0.941845178604126, 1.2105449438095093, 1.4792447090148926, 1.7479444742202759, 2.016644239425659, 2.285344123840332, 2.554043769836426, 2.8227434158325195, 3.0914433002471924, 3.3601431846618652, 3.628842830657959, 3.8975424766540527, 4.166242599487305, 4.434942245483398, 4.703641891479492, 4.972341537475586, 5.24104118347168, 5.509741306304932, 5.778440952301025, 6.047140598297119, 6.315840721130371, 6.584540367126465, 6.853240013122559, 7.121939659118652, 7.390639305114746, 7.659339427947998, 7.928039073944092, 8.196739196777344, 8.465438842773438, 8.734138488769531, 9.002838134765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 7.0, 9.0, 8.0, 16.0, 18.0, 25.0, 37.0, 76.0, 106.0, 134.0, 244.0, 369.0, 672.0, 1297.0, 2826.0, 6734.0, 19322.0, 79790.0, 919538.0, 2871922.0, 234151.0, 37439.0, 11133.0, 4198.0, 1856.0, 962.0, 487.0, 319.0, 196.0, 132.0, 77.0, 63.0, 38.0, 20.0, 17.0, 7.0, 15.0, 8.0, 8.0, 4.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.9853515625, -0.9589004516601562, -0.9324493408203125, -0.9059982299804688, -0.879547119140625, -0.8530960083007812, -0.8266448974609375, -0.8001937866210938, -0.77374267578125, -0.7472915649414062, -0.7208404541015625, -0.6943893432617188, -0.667938232421875, -0.6414871215820312, -0.6150360107421875, -0.5885848999023438, -0.5621337890625, -0.5356826782226562, -0.5092315673828125, -0.48278045654296875, -0.456329345703125, -0.42987823486328125, -0.4034271240234375, -0.37697601318359375, -0.35052490234375, -0.32407379150390625, -0.2976226806640625, -0.27117156982421875, -0.244720458984375, -0.21826934814453125, -0.1918182373046875, -0.16536712646484375, -0.138916015625, -0.11246490478515625, -0.0860137939453125, -0.05956268310546875, -0.033111572265625, -0.00666046142578125, 0.0197906494140625, 0.04624176025390625, 0.07269287109375, 0.09914398193359375, 0.1255950927734375, 0.15204620361328125, 0.178497314453125, 0.20494842529296875, 0.2313995361328125, 0.25785064697265625, 0.2843017578125, 0.31075286865234375, 0.3372039794921875, 0.36365509033203125, 0.390106201171875, 0.41655731201171875, 0.4430084228515625, 0.46945953369140625, 0.49591064453125, 0.5223617553710938, 0.5488128662109375, 0.5752639770507812, 0.601715087890625, 0.6281661987304688, 0.6546173095703125, 0.6810684204101562, 0.70751953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 12.0, 4.0, 4.0, 15.0, 14.0, 11.0, 19.0, 15.0, 36.0, 30.0, 32.0, 33.0, 41.0, 46.0, 38.0, 45.0, 46.0, 61.0, 55.0, 43.0, 42.0, 36.0, 37.0, 34.0, 26.0, 37.0, 34.0, 21.0, 25.0, 16.0, 19.0, 14.0, 10.0, 8.0, 5.0, 10.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.463623046875, -0.4509429931640625, -0.438262939453125, -0.4255828857421875, -0.41290283203125, -0.4002227783203125, -0.387542724609375, -0.3748626708984375, -0.3621826171875, -0.3495025634765625, -0.336822509765625, -0.3241424560546875, -0.31146240234375, -0.2987823486328125, -0.286102294921875, -0.2734222412109375, -0.2607421875, -0.2480621337890625, -0.235382080078125, -0.2227020263671875, -0.21002197265625, -0.1973419189453125, -0.184661865234375, -0.1719818115234375, -0.1593017578125, -0.1466217041015625, -0.133941650390625, -0.1212615966796875, -0.10858154296875, -0.0959014892578125, -0.083221435546875, -0.0705413818359375, -0.057861328125, -0.0451812744140625, -0.032501220703125, -0.0198211669921875, -0.00714111328125, 0.0055389404296875, 0.018218994140625, 0.0308990478515625, 0.0435791015625, 0.0562591552734375, 0.068939208984375, 0.0816192626953125, 0.09429931640625, 0.1069793701171875, 0.119659423828125, 0.1323394775390625, 0.14501953125, 0.1576995849609375, 0.170379638671875, 0.1830596923828125, 0.19573974609375, 0.2084197998046875, 0.221099853515625, 0.2337799072265625, 0.2464599609375, 0.2591400146484375, 0.271820068359375, 0.2845001220703125, 0.29718017578125, 0.3098602294921875, 0.322540283203125, 0.3352203369140625, 0.347900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 14.0, 23.0, 22.0, 56.0, 68.0, 136.0, 296.0, 630.0, 1482.0, 4811.0, 21131.0, 222214.0, 3782306.0, 137751.0, 16960.0, 4112.0, 1289.0, 464.0, 195.0, 96.0, 63.0, 40.0, 28.0, 14.0, 12.0, 3.0, 8.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.942596435546875, -1.88616943359375, -1.829742431640625, -1.7733154296875, -1.716888427734375, -1.66046142578125, -1.604034423828125, -1.547607421875, -1.491180419921875, -1.43475341796875, -1.378326416015625, -1.3218994140625, -1.265472412109375, -1.20904541015625, -1.152618408203125, -1.09619140625, -1.039764404296875, -0.98333740234375, -0.926910400390625, -0.8704833984375, -0.814056396484375, -0.75762939453125, -0.701202392578125, -0.644775390625, -0.588348388671875, -0.53192138671875, -0.475494384765625, -0.4190673828125, -0.362640380859375, -0.30621337890625, -0.249786376953125, -0.193359375, -0.136932373046875, -0.08050537109375, -0.024078369140625, 0.0323486328125, 0.088775634765625, 0.14520263671875, 0.201629638671875, 0.258056640625, 0.314483642578125, 0.37091064453125, 0.427337646484375, 0.4837646484375, 0.540191650390625, 0.59661865234375, 0.653045654296875, 0.70947265625, 0.765899658203125, 0.82232666015625, 0.878753662109375, 0.9351806640625, 0.991607666015625, 1.04803466796875, 1.104461669921875, 1.160888671875, 1.217315673828125, 1.27374267578125, 1.330169677734375, 1.3865966796875, 1.443023681640625, 1.49945068359375, 1.555877685546875, 1.6123046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 17.0, 20.0, 24.0, 35.0, 45.0, 77.0, 96.0, 170.0, 319.0, 682.0, 1058.0, 641.0, 325.0, 183.0, 109.0, 65.0, 44.0, 21.0, 26.0, 21.0, 17.0, 5.0, 5.0, 9.0, 2.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.5625, -1.52191162109375, -1.4813232421875, -1.44073486328125, -1.400146484375, -1.35955810546875, -1.3189697265625, -1.27838134765625, -1.23779296875, -1.19720458984375, -1.1566162109375, -1.11602783203125, -1.075439453125, -1.03485107421875, -0.9942626953125, -0.95367431640625, -0.9130859375, -0.87249755859375, -0.8319091796875, -0.79132080078125, -0.750732421875, -0.71014404296875, -0.6695556640625, -0.62896728515625, -0.58837890625, -0.54779052734375, -0.5072021484375, -0.46661376953125, -0.426025390625, -0.38543701171875, -0.3448486328125, -0.30426025390625, -0.263671875, -0.22308349609375, -0.1824951171875, -0.14190673828125, -0.101318359375, -0.06072998046875, -0.0201416015625, 0.02044677734375, 0.06103515625, 0.10162353515625, 0.1422119140625, 0.18280029296875, 0.223388671875, 0.26397705078125, 0.3045654296875, 0.34515380859375, 0.3857421875, 0.42633056640625, 0.4669189453125, 0.50750732421875, 0.548095703125, 0.58868408203125, 0.6292724609375, 0.66986083984375, 0.71044921875, 0.75103759765625, 0.7916259765625, 0.83221435546875, 0.872802734375, 0.91339111328125, 0.9539794921875, 0.99456787109375, 1.03515625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 4.0, 7.0, 10.0, 24.0, 70.0, 155.0, 295.0, 255.0, 107.0, 36.0, 18.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.349207878112793, -9.82542896270752, -9.301650047302246, -8.777871131896973, -8.2540922164917, -7.730313301086426, -7.2065348625183105, -6.682755947113037, -6.158977031707764, -5.63519811630249, -5.111419200897217, -4.587640762329102, -4.063861846923828, -3.5400826930999756, -3.0163040161132812, -2.492525100708008, -1.9687461853027344, -1.444967269897461, -0.921188473701477, -0.39740967750549316, 0.12636923789978027, 0.6501481533050537, 1.173926830291748, 1.6977057456970215, 2.221484661102295, 2.7452635765075684, 3.269042491912842, 3.792821168899536, 4.3165998458862305, 4.840378761291504, 5.364157676696777, 5.887936592102051, 6.411714553833008, 6.935493469238281, 7.459272384643555, 7.983051300048828, 8.506830215454102, 9.030609130859375, 9.554388046264648, 10.078166961669922, 10.601945877075195, 11.125724792480469, 11.649503707885742, 12.173282623291016, 12.697061538696289, 13.220840454101562, 13.744619369506836, 14.26839828491211, 14.792176246643066, 15.31595516204834, 15.839734077453613, 16.36351203918457, 16.887290954589844, 17.411069869995117, 17.93484878540039, 18.458627700805664, 18.982406616210938, 19.50618553161621, 20.029964447021484, 20.553743362426758, 21.07752227783203, 21.601301193237305, 22.125080108642578, 22.64885902404785, 23.172637939453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 12.0, 13.0, 16.0, 26.0, 27.0, 46.0, 26.0, 26.0, 54.0, 47.0, 39.0, 51.0, 45.0, 61.0, 53.0, 45.0, 50.0, 54.0, 48.0, 47.0, 34.0, 36.0, 17.0, 21.0, 13.0, 21.0, 20.0, 8.0, 13.0, 8.0, 3.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.016751289367676, -5.81986665725708, -5.622981548309326, -5.4260969161987305, -5.229211807250977, -5.032327175140381, -4.835442543029785, -4.638557434082031, -4.441672325134277, -4.244787693023682, -4.047902584075928, -3.851017951965332, -3.654132843017578, -3.4572482109069824, -3.2603633403778076, -3.063478469848633, -2.866593837738037, -2.6697089672088623, -2.4728240966796875, -2.275939464569092, -2.079054355621338, -1.8821696043014526, -1.6852848529815674, -1.4883999824523926, -1.2915151119232178, -1.094630241394043, -0.8977454304695129, -0.7008606195449829, -0.5039757490158081, -0.3070908784866333, -0.11020612716674805, 0.08667874336242676, 0.28356409072875977, 0.4804489314556122, 0.6773337721824646, 0.8742185831069946, 1.0711034536361694, 1.2679883241653442, 1.4648730754852295, 1.6617579460144043, 1.858642816543579, 2.055527687072754, 2.2524125576019287, 2.4492974281311035, 2.646182060241699, 2.843067169189453, 3.039951801300049, 3.2368366718292236, 3.4337215423583984, 3.6306064128875732, 3.827491283416748, 4.024375915527344, 4.221261024475098, 4.418145656585693, 4.615030288696289, 4.811915397644043, 5.008800506591797, 5.205685138702393, 5.4025702476501465, 5.599454879760742, 5.796339988708496, 5.993224620819092, 6.1901092529296875, 6.386994361877441, 6.583878993988037]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 16.0, 17.0, 16.0, 42.0, 58.0, 125.0, 192.0, 339.0, 568.0, 1046.0, 2022.0, 4236.0, 10061.0, 30176.0, 122090.0, 462449.0, 313100.0, 69012.0, 19130.0, 6908.0, 3289.0, 1606.0, 869.0, 468.0, 270.0, 136.0, 97.0, 69.0, 48.0, 29.0, 13.0, 7.0, 4.0, 6.0, 8.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.87890625, -0.8521194458007812, -0.8253326416015625, -0.7985458374023438, -0.771759033203125, -0.7449722290039062, -0.7181854248046875, -0.6913986206054688, -0.66461181640625, -0.6378250122070312, -0.6110382080078125, -0.5842514038085938, -0.557464599609375, -0.5306777954101562, -0.5038909912109375, -0.47710418701171875, -0.4503173828125, -0.42353057861328125, -0.3967437744140625, -0.36995697021484375, -0.343170166015625, -0.31638336181640625, -0.2895965576171875, -0.26280975341796875, -0.23602294921875, -0.20923614501953125, -0.1824493408203125, -0.15566253662109375, -0.128875732421875, -0.10208892822265625, -0.0753021240234375, -0.04851531982421875, -0.021728515625, 0.00505828857421875, 0.0318450927734375, 0.05863189697265625, 0.085418701171875, 0.11220550537109375, 0.1389923095703125, 0.16577911376953125, 0.19256591796875, 0.21935272216796875, 0.2461395263671875, 0.27292633056640625, 0.299713134765625, 0.32649993896484375, 0.3532867431640625, 0.38007354736328125, 0.4068603515625, 0.43364715576171875, 0.4604339599609375, 0.48722076416015625, 0.514007568359375, 0.5407943725585938, 0.5675811767578125, 0.5943679809570312, 0.62115478515625, 0.6479415893554688, 0.6747283935546875, 0.7015151977539062, 0.728302001953125, 0.7550888061523438, 0.7818756103515625, 0.8086624145507812, 0.83544921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 2.0, 7.0, 6.0, 4.0, 7.0, 8.0, 9.0, 5.0, 12.0, 15.0, 19.0, 26.0, 15.0, 33.0, 35.0, 21.0, 29.0, 46.0, 39.0, 36.0, 43.0, 31.0, 39.0, 44.0, 51.0, 47.0, 37.0, 34.0, 35.0, 30.0, 30.0, 24.0, 28.0, 25.0, 15.0, 18.0, 14.0, 18.0, 14.0, 8.0, 10.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.45361328125, -0.4409675598144531, -0.42832183837890625, -0.4156761169433594, -0.4030303955078125, -0.3903846740722656, -0.37773895263671875, -0.3650932312011719, -0.352447509765625, -0.3398017883300781, -0.32715606689453125, -0.3145103454589844, -0.3018646240234375, -0.2892189025878906, -0.27657318115234375, -0.2639274597167969, -0.25128173828125, -0.23863601684570312, -0.22599029541015625, -0.21334457397460938, -0.2006988525390625, -0.18805313110351562, -0.17540740966796875, -0.16276168823242188, -0.150115966796875, -0.13747024536132812, -0.12482452392578125, -0.11217880249023438, -0.0995330810546875, -0.08688735961914062, -0.07424163818359375, -0.061595916748046875, -0.0489501953125, -0.036304473876953125, -0.02365875244140625, -0.011013031005859375, 0.0016326904296875, 0.014278411865234375, 0.02692413330078125, 0.039569854736328125, 0.052215576171875, 0.06486129760742188, 0.07750701904296875, 0.09015274047851562, 0.1027984619140625, 0.11544418334960938, 0.12808990478515625, 0.14073562622070312, 0.15338134765625, 0.16602706909179688, 0.17867279052734375, 0.19131851196289062, 0.2039642333984375, 0.21660995483398438, 0.22925567626953125, 0.24190139770507812, 0.254547119140625, 0.2671928405761719, 0.27983856201171875, 0.2924842834472656, 0.3051300048828125, 0.3177757263183594, 0.33042144775390625, 0.3430671691894531, 0.355712890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 2.0, 4.0, 4.0, 7.0, 16.0, 15.0, 32.0, 17.0, 45.0, 59.0, 96.0, 159.0, 270.0, 651.0, 1534.0, 5247.0, 28987.0, 391856.0, 578524.0, 32287.0, 5648.0, 1706.0, 631.0, 284.0, 145.0, 110.0, 70.0, 30.0, 33.0, 19.0, 15.0, 15.0, 11.0, 5.0, 5.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.5113983154296875, -1.464202880859375, -1.4170074462890625, -1.36981201171875, -1.3226165771484375, -1.275421142578125, -1.2282257080078125, -1.1810302734375, -1.1338348388671875, -1.086639404296875, -1.0394439697265625, -0.99224853515625, -0.9450531005859375, -0.897857666015625, -0.8506622314453125, -0.803466796875, -0.7562713623046875, -0.709075927734375, -0.6618804931640625, -0.61468505859375, -0.5674896240234375, -0.520294189453125, -0.4730987548828125, -0.4259033203125, -0.3787078857421875, -0.331512451171875, -0.2843170166015625, -0.23712158203125, -0.1899261474609375, -0.142730712890625, -0.0955352783203125, -0.04833984375, -0.0011444091796875, 0.046051025390625, 0.0932464599609375, 0.14044189453125, 0.1876373291015625, 0.234832763671875, 0.2820281982421875, 0.3292236328125, 0.3764190673828125, 0.423614501953125, 0.4708099365234375, 0.51800537109375, 0.5652008056640625, 0.612396240234375, 0.6595916748046875, 0.706787109375, 0.7539825439453125, 0.801177978515625, 0.8483734130859375, 0.89556884765625, 0.9427642822265625, 0.989959716796875, 1.0371551513671875, 1.0843505859375, 1.1315460205078125, 1.178741455078125, 1.2259368896484375, 1.27313232421875, 1.3203277587890625, 1.367523193359375, 1.4147186279296875, 1.4619140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 4.0, 8.0, 14.0, 18.0, 19.0, 27.0, 29.0, 39.0, 49.0, 41.0, 45.0, 47.0, 47.0, 52.0, 61.0, 57.0, 49.0, 63.0, 44.0, 51.0, 36.0, 26.0, 38.0, 20.0, 13.0, 15.0, 17.0, 11.0, 10.0, 7.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-2.302734375, -2.244232177734375, -2.18572998046875, -2.127227783203125, -2.0687255859375, -2.010223388671875, -1.95172119140625, -1.893218994140625, -1.834716796875, -1.776214599609375, -1.71771240234375, -1.659210205078125, -1.6007080078125, -1.542205810546875, -1.48370361328125, -1.425201416015625, -1.36669921875, -1.308197021484375, -1.24969482421875, -1.191192626953125, -1.1326904296875, -1.074188232421875, -1.01568603515625, -0.957183837890625, -0.898681640625, -0.840179443359375, -0.78167724609375, -0.723175048828125, -0.6646728515625, -0.606170654296875, -0.54766845703125, -0.489166259765625, -0.4306640625, -0.372161865234375, -0.31365966796875, -0.255157470703125, -0.1966552734375, -0.138153076171875, -0.07965087890625, -0.021148681640625, 0.037353515625, 0.095855712890625, 0.15435791015625, 0.212860107421875, 0.2713623046875, 0.329864501953125, 0.38836669921875, 0.446868896484375, 0.50537109375, 0.563873291015625, 0.62237548828125, 0.680877685546875, 0.7393798828125, 0.797882080078125, 0.85638427734375, 0.914886474609375, 0.973388671875, 1.031890869140625, 1.09039306640625, 1.148895263671875, 1.2073974609375, 1.265899658203125, 1.32440185546875, 1.382904052734375, 1.44140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 15.0, 18.0, 23.0, 36.0, 39.0, 65.0, 138.0, 212.0, 384.0, 810.0, 1984.0, 6048.0, 21775.0, 116993.0, 697295.0, 162694.0, 28382.0, 7249.0, 2418.0, 976.0, 430.0, 199.0, 130.0, 73.0, 48.0, 24.0, 31.0, 19.0, 7.0, 12.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380126953125, -0.3680915832519531, -0.35605621337890625, -0.3440208435058594, -0.3319854736328125, -0.3199501037597656, -0.30791473388671875, -0.2958793640136719, -0.283843994140625, -0.2718086242675781, -0.25977325439453125, -0.24773788452148438, -0.2357025146484375, -0.22366714477539062, -0.21163177490234375, -0.19959640502929688, -0.18756103515625, -0.17552566528320312, -0.16349029541015625, -0.15145492553710938, -0.1394195556640625, -0.12738418579101562, -0.11534881591796875, -0.10331344604492188, -0.091278076171875, -0.07924270629882812, -0.06720733642578125, -0.055171966552734375, -0.0431365966796875, -0.031101226806640625, -0.01906585693359375, -0.007030487060546875, 0.0050048828125, 0.017040252685546875, 0.02907562255859375, 0.041110992431640625, 0.0531463623046875, 0.06518173217773438, 0.07721710205078125, 0.08925247192382812, 0.101287841796875, 0.11332321166992188, 0.12535858154296875, 0.13739395141601562, 0.1494293212890625, 0.16146469116210938, 0.17350006103515625, 0.18553543090820312, 0.19757080078125, 0.20960617065429688, 0.22164154052734375, 0.23367691040039062, 0.2457122802734375, 0.2577476501464844, 0.26978302001953125, 0.2818183898925781, 0.293853759765625, 0.3058891296386719, 0.31792449951171875, 0.3299598693847656, 0.3419952392578125, 0.3540306091308594, 0.36606597900390625, 0.3781013488769531, 0.39013671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 13.0, 7.0, 13.0, 12.0, 13.0, 24.0, 52.0, 63.0, 72.0, 99.0, 115.0, 108.0, 109.0, 75.0, 80.0, 43.0, 32.0, 20.0, 14.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.445978164672852e-05, -8.157268166542053e-05, -7.868558168411255e-05, -7.579848170280457e-05, -7.291138172149658e-05, -7.00242817401886e-05, -6.713718175888062e-05, -6.425008177757263e-05, -6.136298179626465e-05, -5.8475881814956665e-05, -5.558878183364868e-05, -5.27016818523407e-05, -4.9814581871032715e-05, -4.692748188972473e-05, -4.404038190841675e-05, -4.1153281927108765e-05, -3.826618194580078e-05, -3.53790819644928e-05, -3.2491981983184814e-05, -2.960488200187683e-05, -2.6717782020568848e-05, -2.3830682039260864e-05, -2.094358205795288e-05, -1.8056482076644897e-05, -1.5169382095336914e-05, -1.228228211402893e-05, -9.395182132720947e-06, -6.508082151412964e-06, -3.6209821701049805e-06, -7.338821887969971e-07, 2.1532177925109863e-06, 5.04031777381897e-06, 7.927417755126953e-06, 1.0814517736434937e-05, 1.370161771774292e-05, 1.6588717699050903e-05, 1.9475817680358887e-05, 2.236291766166687e-05, 2.5250017642974854e-05, 2.8137117624282837e-05, 3.102421760559082e-05, 3.3911317586898804e-05, 3.679841756820679e-05, 3.968551754951477e-05, 4.2572617530822754e-05, 4.545971751213074e-05, 4.834681749343872e-05, 5.1233917474746704e-05, 5.412101745605469e-05, 5.700811743736267e-05, 5.9895217418670654e-05, 6.278231739997864e-05, 6.566941738128662e-05, 6.85565173625946e-05, 7.144361734390259e-05, 7.433071732521057e-05, 7.721781730651855e-05, 8.010491728782654e-05, 8.299201726913452e-05, 8.58791172504425e-05, 8.876621723175049e-05, 9.165331721305847e-05, 9.454041719436646e-05, 9.742751717567444e-05, 0.00010031461715698242]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 9.0, 7.0, 15.0, 22.0, 24.0, 31.0, 54.0, 74.0, 152.0, 216.0, 375.0, 699.0, 1491.0, 3510.0, 11101.0, 47846.0, 291922.0, 596330.0, 70999.0, 15331.0, 4530.0, 1875.0, 853.0, 416.0, 233.0, 140.0, 82.0, 65.0, 44.0, 22.0, 17.0, 21.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37109375, -0.35916900634765625, -0.3472442626953125, -0.33531951904296875, -0.323394775390625, -0.31147003173828125, -0.2995452880859375, -0.28762054443359375, -0.27569580078125, -0.26377105712890625, -0.2518463134765625, -0.23992156982421875, -0.227996826171875, -0.21607208251953125, -0.2041473388671875, -0.19222259521484375, -0.1802978515625, -0.16837310791015625, -0.1564483642578125, -0.14452362060546875, -0.132598876953125, -0.12067413330078125, -0.1087493896484375, -0.09682464599609375, -0.08489990234375, -0.07297515869140625, -0.0610504150390625, -0.04912567138671875, -0.037200927734375, -0.02527618408203125, -0.0133514404296875, -0.00142669677734375, 0.010498046875, 0.02242279052734375, 0.0343475341796875, 0.04627227783203125, 0.058197021484375, 0.07012176513671875, 0.0820465087890625, 0.09397125244140625, 0.10589599609375, 0.11782073974609375, 0.1297454833984375, 0.14167022705078125, 0.153594970703125, 0.16551971435546875, 0.1774444580078125, 0.18936920166015625, 0.2012939453125, 0.21321868896484375, 0.2251434326171875, 0.23706817626953125, 0.248992919921875, 0.26091766357421875, 0.2728424072265625, 0.28476715087890625, 0.29669189453125, 0.30861663818359375, 0.3205413818359375, 0.33246612548828125, 0.344390869140625, 0.35631561279296875, 0.3682403564453125, 0.38016510009765625, 0.39208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 15.0, 14.0, 24.0, 27.0, 39.0, 46.0, 64.0, 120.0, 110.0, 133.0, 107.0, 97.0, 65.0, 47.0, 29.0, 23.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.6134109497070312, -0.5969390869140625, -0.5804672241210938, -0.563995361328125, -0.5475234985351562, -0.5310516357421875, -0.5145797729492188, -0.49810791015625, -0.48163604736328125, -0.4651641845703125, -0.44869232177734375, -0.432220458984375, -0.41574859619140625, -0.3992767333984375, -0.38280487060546875, -0.3663330078125, -0.34986114501953125, -0.3333892822265625, -0.31691741943359375, -0.300445556640625, -0.28397369384765625, -0.2675018310546875, -0.25102996826171875, -0.23455810546875, -0.21808624267578125, -0.2016143798828125, -0.18514251708984375, -0.168670654296875, -0.15219879150390625, -0.1357269287109375, -0.11925506591796875, -0.102783203125, -0.08631134033203125, -0.0698394775390625, -0.05336761474609375, -0.036895751953125, -0.02042388916015625, -0.0039520263671875, 0.01251983642578125, 0.02899169921875, 0.04546356201171875, 0.0619354248046875, 0.07840728759765625, 0.094879150390625, 0.11135101318359375, 0.1278228759765625, 0.14429473876953125, 0.1607666015625, 0.17723846435546875, 0.1937103271484375, 0.21018218994140625, 0.226654052734375, 0.24312591552734375, 0.2595977783203125, 0.27606964111328125, 0.29254150390625, 0.30901336669921875, 0.3254852294921875, 0.34195709228515625, 0.358428955078125, 0.37490081787109375, 0.3913726806640625, 0.40784454345703125, 0.42431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 8.0, 11.0, 14.0, 33.0, 87.0, 229.0, 360.0, 173.0, 52.0, 20.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.79146385192871, -17.33894920349121, -16.886436462402344, -16.433921813964844, -15.981407165527344, -15.528892517089844, -15.07637882232666, -14.623865127563477, -14.171350479125977, -13.718835830688477, -13.266322135925293, -12.81380844116211, -12.36129379272461, -11.90877914428711, -11.456265449523926, -11.003751754760742, -10.551237106323242, -10.098722457885742, -9.646208763122559, -9.193695068359375, -8.741180419921875, -8.288665771484375, -7.836152076721191, -7.38363790512085, -6.931123733520508, -6.478609561920166, -6.026095390319824, -5.573581218719482, -5.121067047119141, -4.668552875518799, -4.216038703918457, -3.7635245323181152, -3.3110103607177734, -2.8584961891174316, -2.40598201751709, -1.953467845916748, -1.5009536743164062, -1.0484395027160645, -0.5959253311157227, -0.14341115951538086, 0.30910301208496094, 0.7616171836853027, 1.2141313552856445, 1.6666455268859863, 2.119159698486328, 2.57167387008667, 3.0241880416870117, 3.4767022132873535, 3.9292163848876953, 4.381730556488037, 4.834244728088379, 5.286758899688721, 5.7392730712890625, 6.191787242889404, 6.644301414489746, 7.096815586090088, 7.54932975769043, 8.00184440612793, 8.454358100891113, 8.906871795654297, 9.359386444091797, 9.811901092529297, 10.26441478729248, 10.716928482055664, 11.169443130493164]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 12.0, 9.0, 4.0, 19.0, 27.0, 39.0, 22.0, 26.0, 43.0, 32.0, 35.0, 40.0, 77.0, 81.0, 75.0, 84.0, 52.0, 38.0, 35.0, 27.0, 39.0, 24.0, 20.0, 19.0, 17.0, 15.0, 11.0, 12.0, 13.0, 11.0, 4.0, 3.0, 5.0, 3.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.619002342224121, -7.3963117599487305, -7.17362117767334, -6.950930595397949, -6.728240489959717, -6.505549907684326, -6.2828593254089355, -6.060168743133545, -5.837478160858154, -5.614787578582764, -5.392096996307373, -5.169406890869141, -4.94671630859375, -4.724025726318359, -4.501335144042969, -4.278644561767578, -4.0559539794921875, -3.833263397216797, -3.6105730533599854, -3.3878824710845947, -3.165191888809204, -2.9425015449523926, -2.719810962677002, -2.4971203804016113, -2.274430274963379, -2.0517396926879883, -1.8290492296218872, -1.6063587665557861, -1.3836681842803955, -1.1609777212142944, -0.9382872581481934, -0.7155966758728027, -0.4929060935974121, -0.27021557092666626, -0.0475250780582428, 0.17516541481018066, 0.3978559374809265, 0.6205464601516724, 0.8432369232177734, 1.065927505493164, 1.2886179685592651, 1.5113084316253662, 1.7339990139007568, 1.956689476966858, 2.179379940032959, 2.4020705223083496, 2.6247611045837402, 2.847451686859131, 3.0701420307159424, 3.292832612991333, 3.5155229568481445, 3.738213539123535, 3.960904121398926, 4.183594703674316, 4.406285285949707, 4.628975868225098, 4.85166597366333, 5.074356555938721, 5.297047138214111, 5.519737243652344, 5.742427825927734, 5.965118408203125, 6.187808990478516, 6.410499572753906, 6.633190155029297]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 11.0, 10.0, 26.0, 35.0, 55.0, 72.0, 112.0, 200.0, 301.0, 560.0, 982.0, 2006.0, 4290.0, 10731.0, 36004.0, 206206.0, 1948770.0, 1742716.0, 187040.0, 35277.0, 10342.0, 4127.0, 1945.0, 996.0, 558.0, 328.0, 179.0, 130.0, 88.0, 46.0, 38.0, 25.0, 14.0, 19.0, 8.0, 8.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.671875, -0.652099609375, -0.63232421875, -0.612548828125, -0.5927734375, -0.572998046875, -0.55322265625, -0.533447265625, -0.513671875, -0.493896484375, -0.47412109375, -0.454345703125, -0.4345703125, -0.414794921875, -0.39501953125, -0.375244140625, -0.35546875, -0.335693359375, -0.31591796875, -0.296142578125, -0.2763671875, -0.256591796875, -0.23681640625, -0.217041015625, -0.197265625, -0.177490234375, -0.15771484375, -0.137939453125, -0.1181640625, -0.098388671875, -0.07861328125, -0.058837890625, -0.0390625, -0.019287109375, 0.00048828125, 0.020263671875, 0.0400390625, 0.059814453125, 0.07958984375, 0.099365234375, 0.119140625, 0.138916015625, 0.15869140625, 0.178466796875, 0.1982421875, 0.218017578125, 0.23779296875, 0.257568359375, 0.27734375, 0.297119140625, 0.31689453125, 0.336669921875, 0.3564453125, 0.376220703125, 0.39599609375, 0.415771484375, 0.435546875, 0.455322265625, 0.47509765625, 0.494873046875, 0.5146484375, 0.534423828125, 0.55419921875, 0.573974609375, 0.59375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 5.0, 6.0, 11.0, 14.0, 18.0, 25.0, 26.0, 26.0, 29.0, 34.0, 49.0, 43.0, 49.0, 52.0, 33.0, 41.0, 44.0, 44.0, 44.0, 44.0, 45.0, 43.0, 37.0, 31.0, 26.0, 21.0, 18.0, 24.0, 20.0, 12.0, 14.0, 6.0, 15.0, 10.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.46630859375, -0.4533538818359375, -0.440399169921875, -0.4274444580078125, -0.41448974609375, -0.4015350341796875, -0.388580322265625, -0.3756256103515625, -0.3626708984375, -0.3497161865234375, -0.336761474609375, -0.3238067626953125, -0.31085205078125, -0.2978973388671875, -0.284942626953125, -0.2719879150390625, -0.259033203125, -0.2460784912109375, -0.233123779296875, -0.2201690673828125, -0.20721435546875, -0.1942596435546875, -0.181304931640625, -0.1683502197265625, -0.1553955078125, -0.1424407958984375, -0.129486083984375, -0.1165313720703125, -0.10357666015625, -0.0906219482421875, -0.077667236328125, -0.0647125244140625, -0.0517578125, -0.0388031005859375, -0.025848388671875, -0.0128936767578125, 6.103515625e-05, 0.0130157470703125, 0.025970458984375, 0.0389251708984375, 0.0518798828125, 0.0648345947265625, 0.077789306640625, 0.0907440185546875, 0.10369873046875, 0.1166534423828125, 0.129608154296875, 0.1425628662109375, 0.155517578125, 0.1684722900390625, 0.181427001953125, 0.1943817138671875, 0.20733642578125, 0.2202911376953125, 0.233245849609375, 0.2462005615234375, 0.2591552734375, 0.2721099853515625, 0.285064697265625, 0.2980194091796875, 0.31097412109375, 0.3239288330078125, 0.336883544921875, 0.3498382568359375, 0.36279296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 11.0, 11.0, 12.0, 28.0, 31.0, 53.0, 61.0, 139.0, 330.0, 860.0, 2872.0, 16304.0, 264314.0, 3808545.0, 88371.0, 9187.0, 1912.0, 653.0, 236.0, 130.0, 68.0, 41.0, 25.0, 18.0, 15.0, 13.0, 4.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.9140625, -1.8614044189453125, -1.808746337890625, -1.7560882568359375, -1.70343017578125, -1.6507720947265625, -1.598114013671875, -1.5454559326171875, -1.4927978515625, -1.4401397705078125, -1.387481689453125, -1.3348236083984375, -1.28216552734375, -1.2295074462890625, -1.176849365234375, -1.1241912841796875, -1.071533203125, -1.0188751220703125, -0.966217041015625, -0.9135589599609375, -0.86090087890625, -0.8082427978515625, -0.755584716796875, -0.7029266357421875, -0.6502685546875, -0.5976104736328125, -0.544952392578125, -0.4922943115234375, -0.43963623046875, -0.3869781494140625, -0.334320068359375, -0.2816619873046875, -0.22900390625, -0.1763458251953125, -0.123687744140625, -0.0710296630859375, -0.01837158203125, 0.0342864990234375, 0.086944580078125, 0.1396026611328125, 0.1922607421875, 0.2449188232421875, 0.297576904296875, 0.3502349853515625, 0.40289306640625, 0.4555511474609375, 0.508209228515625, 0.5608673095703125, 0.613525390625, 0.6661834716796875, 0.718841552734375, 0.7714996337890625, 0.82415771484375, 0.8768157958984375, 0.929473876953125, 0.9821319580078125, 1.0347900390625, 1.0874481201171875, 1.140106201171875, 1.1927642822265625, 1.24542236328125, 1.2980804443359375, 1.350738525390625, 1.4033966064453125, 1.4560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 22.0, 23.0, 28.0, 52.0, 85.0, 128.0, 276.0, 518.0, 981.0, 858.0, 458.0, 233.0, 143.0, 72.0, 49.0, 33.0, 20.0, 18.0, 8.0, 2.0, 10.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23828125, -1.200653076171875, -1.16302490234375, -1.125396728515625, -1.0877685546875, -1.050140380859375, -1.01251220703125, -0.974884033203125, -0.937255859375, -0.899627685546875, -0.86199951171875, -0.824371337890625, -0.7867431640625, -0.749114990234375, -0.71148681640625, -0.673858642578125, -0.63623046875, -0.598602294921875, -0.56097412109375, -0.523345947265625, -0.4857177734375, -0.448089599609375, -0.41046142578125, -0.372833251953125, -0.335205078125, -0.297576904296875, -0.25994873046875, -0.222320556640625, -0.1846923828125, -0.147064208984375, -0.10943603515625, -0.071807861328125, -0.0341796875, 0.003448486328125, 0.04107666015625, 0.078704833984375, 0.1163330078125, 0.153961181640625, 0.19158935546875, 0.229217529296875, 0.266845703125, 0.304473876953125, 0.34210205078125, 0.379730224609375, 0.4173583984375, 0.454986572265625, 0.49261474609375, 0.530242919921875, 0.56787109375, 0.605499267578125, 0.64312744140625, 0.680755615234375, 0.7183837890625, 0.756011962890625, 0.79364013671875, 0.831268310546875, 0.868896484375, 0.906524658203125, 0.94415283203125, 0.981781005859375, 1.0194091796875, 1.057037353515625, 1.09466552734375, 1.132293701171875, 1.169921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 8.0, 7.0, 9.0, 32.0, 56.0, 110.0, 227.0, 200.0, 165.0, 93.0, 44.0, 20.0, 12.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3206787109375, -11.00843620300293, -10.69619369506836, -10.383952140808105, -10.071709632873535, -9.759467124938965, -9.447224617004395, -9.13498306274414, -8.82274055480957, -8.510498046875, -8.19825553894043, -7.886013507843018, -7.5737714767456055, -7.261528968811035, -6.949286460876465, -6.637044429779053, -6.324801921844482, -6.012559413909912, -5.7003173828125, -5.38807487487793, -5.075832843780518, -4.763590335845947, -4.451348304748535, -4.139105796813965, -3.8268635272979736, -3.5146212577819824, -3.202378988265991, -2.89013671875, -2.5778942108154297, -2.2656521797180176, -1.9534096717834473, -1.641167402267456, -1.3289251327514648, -1.0166828632354736, -0.7044405341148376, -0.39219820499420166, -0.07995593547821045, 0.23228633403778076, 0.5445287227630615, 0.8567709922790527, 1.169013261795044, 1.4812555313110352, 1.7934978008270264, 2.1057400703430176, 2.417982578277588, 2.730224609375, 3.0424671173095703, 3.3547093868255615, 3.6669516563415527, 3.979193925857544, 4.291436195373535, 4.6036787033081055, 4.915920734405518, 5.228163242340088, 5.5404052734375, 5.85264778137207, 6.164890289306641, 6.477132797241211, 6.789374828338623, 7.101617336273193, 7.4138593673706055, 7.726101875305176, 8.038344383239746, 8.3505859375, 8.66282844543457]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 14.0, 14.0, 16.0, 23.0, 25.0, 30.0, 34.0, 33.0, 39.0, 52.0, 46.0, 51.0, 58.0, 64.0, 52.0, 38.0, 47.0, 38.0, 40.0, 38.0, 34.0, 31.0, 32.0, 31.0, 9.0, 15.0, 9.0, 12.0, 8.0, 8.0, 5.0, 9.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.476782321929932, -4.343027114868164, -4.2092719078063965, -4.075516700744629, -3.9417614936828613, -3.8080062866210938, -3.6742513179779053, -3.5404961109161377, -3.40674090385437, -3.2729856967926025, -3.139230489730835, -3.0054752826690674, -2.871720314025879, -2.7379651069641113, -2.6042098999023438, -2.470454692840576, -2.3366994857788086, -2.202944278717041, -2.0691890716552734, -1.9354339838027954, -1.8016787767410278, -1.6679235696792603, -1.5341684818267822, -1.4004132747650146, -1.266658067703247, -1.1329028606414795, -0.9991477131843567, -0.8653925657272339, -0.7316373586654663, -0.5978821516036987, -0.4641270041465759, -0.3303718566894531, -0.19661712646484375, -0.06286194920539856, 0.07089322805404663, 0.20464840531349182, 0.338403582572937, 0.4721587896347046, 0.6059139370918274, 0.7396690845489502, 0.8734242916107178, 1.0071794986724854, 1.140934705734253, 1.274689793586731, 1.4084450006484985, 1.5422002077102661, 1.6759552955627441, 1.8097105026245117, 1.9434657096862793, 2.077220916748047, 2.2109761238098145, 2.344731330871582, 2.4784865379333496, 2.612241744995117, 2.7459967136383057, 2.8797519207000732, 3.013507127761841, 3.1472623348236084, 3.281017541885376, 3.4147727489471436, 3.548527717590332, 3.6822829246520996, 3.816038131713867, 3.9497933387756348, 4.083548545837402]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 12.0, 17.0, 20.0, 24.0, 50.0, 54.0, 77.0, 122.0, 229.0, 487.0, 1055.0, 2604.0, 7967.0, 35012.0, 256030.0, 619783.0, 99932.0, 17097.0, 4731.0, 1661.0, 709.0, 348.0, 175.0, 101.0, 74.0, 55.0, 39.0, 21.0, 11.0, 14.0, 9.0, 6.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1201171875, -1.0843048095703125, -1.048492431640625, -1.0126800537109375, -0.97686767578125, -0.9410552978515625, -0.905242919921875, -0.8694305419921875, -0.8336181640625, -0.7978057861328125, -0.761993408203125, -0.7261810302734375, -0.69036865234375, -0.6545562744140625, -0.618743896484375, -0.5829315185546875, -0.547119140625, -0.5113067626953125, -0.475494384765625, -0.4396820068359375, -0.40386962890625, -0.3680572509765625, -0.332244873046875, -0.2964324951171875, -0.2606201171875, -0.2248077392578125, -0.188995361328125, -0.1531829833984375, -0.11737060546875, -0.0815582275390625, -0.045745849609375, -0.0099334716796875, 0.02587890625, 0.0616912841796875, 0.097503662109375, 0.1333160400390625, 0.16912841796875, 0.2049407958984375, 0.240753173828125, 0.2765655517578125, 0.3123779296875, 0.3481903076171875, 0.384002685546875, 0.4198150634765625, 0.45562744140625, 0.4914398193359375, 0.527252197265625, 0.5630645751953125, 0.598876953125, 0.6346893310546875, 0.670501708984375, 0.7063140869140625, 0.74212646484375, 0.7779388427734375, 0.813751220703125, 0.8495635986328125, 0.8853759765625, 0.9211883544921875, 0.957000732421875, 0.9928131103515625, 1.02862548828125, 1.0644378662109375, 1.100250244140625, 1.1360626220703125, 1.171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 9.0, 8.0, 8.0, 11.0, 21.0, 19.0, 28.0, 28.0, 26.0, 40.0, 49.0, 49.0, 52.0, 44.0, 45.0, 50.0, 58.0, 46.0, 47.0, 51.0, 34.0, 25.0, 50.0, 37.0, 29.0, 21.0, 14.0, 23.0, 14.0, 12.0, 7.0, 9.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4532470703125, -0.43896484375, -0.4246826171875, -0.410400390625, -0.3961181640625, -0.3818359375, -0.3675537109375, -0.353271484375, -0.3389892578125, -0.32470703125, -0.3104248046875, -0.296142578125, -0.2818603515625, -0.267578125, -0.2532958984375, -0.239013671875, -0.2247314453125, -0.21044921875, -0.1961669921875, -0.181884765625, -0.1676025390625, -0.1533203125, -0.1390380859375, -0.124755859375, -0.1104736328125, -0.09619140625, -0.0819091796875, -0.067626953125, -0.0533447265625, -0.0390625, -0.0247802734375, -0.010498046875, 0.0037841796875, 0.01806640625, 0.0323486328125, 0.046630859375, 0.0609130859375, 0.0751953125, 0.0894775390625, 0.103759765625, 0.1180419921875, 0.13232421875, 0.1466064453125, 0.160888671875, 0.1751708984375, 0.189453125, 0.2037353515625, 0.218017578125, 0.2322998046875, 0.24658203125, 0.2608642578125, 0.275146484375, 0.2894287109375, 0.3037109375, 0.3179931640625, 0.332275390625, 0.3465576171875, 0.36083984375, 0.3751220703125, 0.389404296875, 0.4036865234375, 0.41796875, 0.4322509765625, 0.446533203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 10.0, 8.0, 10.0, 13.0, 28.0, 33.0, 38.0, 55.0, 87.0, 112.0, 155.0, 330.0, 580.0, 1349.0, 5020.0, 36442.0, 741783.0, 239690.0, 17487.0, 3135.0, 1004.0, 440.0, 254.0, 147.0, 126.0, 62.0, 43.0, 34.0, 18.0, 20.0, 9.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.31640625, -1.2691192626953125, -1.221832275390625, -1.1745452880859375, -1.12725830078125, -1.0799713134765625, -1.032684326171875, -0.9853973388671875, -0.9381103515625, -0.8908233642578125, -0.843536376953125, -0.7962493896484375, -0.74896240234375, -0.7016754150390625, -0.654388427734375, -0.6071014404296875, -0.559814453125, -0.5125274658203125, -0.465240478515625, -0.4179534912109375, -0.37066650390625, -0.3233795166015625, -0.276092529296875, -0.2288055419921875, -0.1815185546875, -0.1342315673828125, -0.086944580078125, -0.0396575927734375, 0.00762939453125, 0.0549163818359375, 0.102203369140625, 0.1494903564453125, 0.19677734375, 0.2440643310546875, 0.291351318359375, 0.3386383056640625, 0.38592529296875, 0.4332122802734375, 0.480499267578125, 0.5277862548828125, 0.5750732421875, 0.6223602294921875, 0.669647216796875, 0.7169342041015625, 0.76422119140625, 0.8115081787109375, 0.858795166015625, 0.9060821533203125, 0.953369140625, 1.0006561279296875, 1.047943115234375, 1.0952301025390625, 1.14251708984375, 1.1898040771484375, 1.237091064453125, 1.2843780517578125, 1.3316650390625, 1.3789520263671875, 1.426239013671875, 1.4735260009765625, 1.52081298828125, 1.5680999755859375, 1.615386962890625, 1.6626739501953125, 1.7099609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 9.0, 3.0, 6.0, 10.0, 9.0, 10.0, 18.0, 17.0, 15.0, 20.0, 26.0, 26.0, 38.0, 28.0, 38.0, 46.0, 42.0, 64.0, 63.0, 62.0, 77.0, 52.0, 40.0, 45.0, 33.0, 28.0, 28.0, 34.0, 13.0, 26.0, 13.0, 10.0, 11.0, 12.0, 5.0, 7.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.589202880859375, -1.53778076171875, -1.486358642578125, -1.4349365234375, -1.383514404296875, -1.33209228515625, -1.280670166015625, -1.229248046875, -1.177825927734375, -1.12640380859375, -1.074981689453125, -1.0235595703125, -0.972137451171875, -0.92071533203125, -0.869293212890625, -0.81787109375, -0.766448974609375, -0.71502685546875, -0.663604736328125, -0.6121826171875, -0.560760498046875, -0.50933837890625, -0.457916259765625, -0.406494140625, -0.355072021484375, -0.30364990234375, -0.252227783203125, -0.2008056640625, -0.149383544921875, -0.09796142578125, -0.046539306640625, 0.0048828125, 0.056304931640625, 0.10772705078125, 0.159149169921875, 0.2105712890625, 0.261993408203125, 0.31341552734375, 0.364837646484375, 0.416259765625, 0.467681884765625, 0.51910400390625, 0.570526123046875, 0.6219482421875, 0.673370361328125, 0.72479248046875, 0.776214599609375, 0.82763671875, 0.879058837890625, 0.93048095703125, 0.981903076171875, 1.0333251953125, 1.084747314453125, 1.13616943359375, 1.187591552734375, 1.239013671875, 1.290435791015625, 1.34185791015625, 1.393280029296875, 1.4447021484375, 1.496124267578125, 1.54754638671875, 1.598968505859375, 1.650390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 12.0, 11.0, 8.0, 31.0, 51.0, 72.0, 145.0, 240.0, 504.0, 1297.0, 3811.0, 15017.0, 106761.0, 827105.0, 76079.0, 12064.0, 3205.0, 1167.0, 438.0, 208.0, 117.0, 73.0, 42.0, 27.0, 21.0, 11.0, 11.0, 2.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.52685546875, -0.5127792358398438, -0.4987030029296875, -0.48462677001953125, -0.470550537109375, -0.45647430419921875, -0.4423980712890625, -0.42832183837890625, -0.41424560546875, -0.40016937255859375, -0.3860931396484375, -0.37201690673828125, -0.357940673828125, -0.34386444091796875, -0.3297882080078125, -0.31571197509765625, -0.3016357421875, -0.28755950927734375, -0.2734832763671875, -0.25940704345703125, -0.245330810546875, -0.23125457763671875, -0.2171783447265625, -0.20310211181640625, -0.18902587890625, -0.17494964599609375, -0.1608734130859375, -0.14679718017578125, -0.132720947265625, -0.11864471435546875, -0.1045684814453125, -0.09049224853515625, -0.076416015625, -0.06233978271484375, -0.0482635498046875, -0.03418731689453125, -0.020111083984375, -0.00603485107421875, 0.0080413818359375, 0.02211761474609375, 0.03619384765625, 0.05027008056640625, 0.0643463134765625, 0.07842254638671875, 0.092498779296875, 0.10657501220703125, 0.1206512451171875, 0.13472747802734375, 0.1488037109375, 0.16287994384765625, 0.1769561767578125, 0.19103240966796875, 0.205108642578125, 0.21918487548828125, 0.2332611083984375, 0.24733734130859375, 0.26141357421875, 0.27548980712890625, 0.2895660400390625, 0.30364227294921875, 0.317718505859375, 0.33179473876953125, 0.3458709716796875, 0.35994720458984375, 0.3740234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 4.0, 10.0, 4.0, 4.0, 15.0, 10.0, 19.0, 17.0, 36.0, 58.0, 80.0, 124.0, 151.0, 135.0, 87.0, 77.0, 46.0, 25.0, 27.0, 18.0, 14.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.96453857421875e-05, -8.664093911647797e-05, -8.363649249076843e-05, -8.06320458650589e-05, -7.762759923934937e-05, -7.462315261363983e-05, -7.16187059879303e-05, -6.861425936222076e-05, -6.560981273651123e-05, -6.26053661108017e-05, -5.960091948509216e-05, -5.659647285938263e-05, -5.3592026233673096e-05, -5.058757960796356e-05, -4.758313298225403e-05, -4.4578686356544495e-05, -4.157423973083496e-05, -3.856979310512543e-05, -3.5565346479415894e-05, -3.256089985370636e-05, -2.9556453227996826e-05, -2.6552006602287292e-05, -2.354755997657776e-05, -2.0543113350868225e-05, -1.753866672515869e-05, -1.4534220099449158e-05, -1.1529773473739624e-05, -8.52532684803009e-06, -5.520880222320557e-06, -2.516433596611023e-06, 4.880130290985107e-07, 3.4924596548080444e-06, 6.496906280517578e-06, 9.501352906227112e-06, 1.2505799531936646e-05, 1.551024615764618e-05, 1.8514692783355713e-05, 2.1519139409065247e-05, 2.452358603477478e-05, 2.7528032660484314e-05, 3.053247928619385e-05, 3.353692591190338e-05, 3.6541372537612915e-05, 3.954581916332245e-05, 4.255026578903198e-05, 4.5554712414741516e-05, 4.855915904045105e-05, 5.1563605666160583e-05, 5.456805229187012e-05, 5.757249891757965e-05, 6.0576945543289185e-05, 6.358139216899872e-05, 6.658583879470825e-05, 6.959028542041779e-05, 7.259473204612732e-05, 7.559917867183685e-05, 7.860362529754639e-05, 8.160807192325592e-05, 8.461251854896545e-05, 8.761696517467499e-05, 9.062141180038452e-05, 9.362585842609406e-05, 9.663030505180359e-05, 9.963475167751312e-05, 0.00010263919830322266]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 8.0, 9.0, 13.0, 20.0, 16.0, 32.0, 45.0, 63.0, 95.0, 137.0, 168.0, 342.0, 558.0, 1105.0, 2222.0, 5029.0, 14395.0, 52375.0, 312468.0, 572485.0, 60123.0, 16122.0, 5622.0, 2357.0, 1094.0, 589.0, 338.0, 214.0, 148.0, 100.0, 66.0, 46.0, 28.0, 25.0, 20.0, 9.0, 11.0, 6.0, 4.0, 5.0, 7.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.268798828125, -0.25954437255859375, -0.2502899169921875, -0.24103546142578125, -0.231781005859375, -0.22252655029296875, -0.2132720947265625, -0.20401763916015625, -0.19476318359375, -0.18550872802734375, -0.1762542724609375, -0.16699981689453125, -0.157745361328125, -0.14849090576171875, -0.1392364501953125, -0.12998199462890625, -0.1207275390625, -0.11147308349609375, -0.1022186279296875, -0.09296417236328125, -0.083709716796875, -0.07445526123046875, -0.0652008056640625, -0.05594635009765625, -0.04669189453125, -0.03743743896484375, -0.0281829833984375, -0.01892852783203125, -0.009674072265625, -0.00041961669921875, 0.0088348388671875, 0.01808929443359375, 0.02734375, 0.03659820556640625, 0.0458526611328125, 0.05510711669921875, 0.064361572265625, 0.07361602783203125, 0.0828704833984375, 0.09212493896484375, 0.10137939453125, 0.11063385009765625, 0.1198883056640625, 0.12914276123046875, 0.138397216796875, 0.14765167236328125, 0.1569061279296875, 0.16616058349609375, 0.1754150390625, 0.18466949462890625, 0.1939239501953125, 0.20317840576171875, 0.212432861328125, 0.22168731689453125, 0.2309417724609375, 0.24019622802734375, 0.24945068359375, 0.25870513916015625, 0.2679595947265625, 0.27721405029296875, 0.286468505859375, 0.29572296142578125, 0.3049774169921875, 0.31423187255859375, 0.323486328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 7.0, 11.0, 11.0, 19.0, 17.0, 28.0, 22.0, 42.0, 53.0, 70.0, 118.0, 121.0, 138.0, 92.0, 70.0, 38.0, 38.0, 25.0, 15.0, 17.0, 14.0, 6.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.472900390625, -0.4603614807128906, -0.44782257080078125, -0.4352836608886719, -0.4227447509765625, -0.4102058410644531, -0.39766693115234375, -0.3851280212402344, -0.372589111328125, -0.3600502014160156, -0.34751129150390625, -0.3349723815917969, -0.3224334716796875, -0.3098945617675781, -0.29735565185546875, -0.2848167419433594, -0.27227783203125, -0.2597389221191406, -0.24720001220703125, -0.23466110229492188, -0.2221221923828125, -0.20958328247070312, -0.19704437255859375, -0.18450546264648438, -0.171966552734375, -0.15942764282226562, -0.14688873291015625, -0.13434982299804688, -0.1218109130859375, -0.10927200317382812, -0.09673309326171875, -0.08419418334960938, -0.0716552734375, -0.059116363525390625, -0.04657745361328125, -0.034038543701171875, -0.0214996337890625, -0.008960723876953125, 0.00357818603515625, 0.016117095947265625, 0.028656005859375, 0.041194915771484375, 0.05373382568359375, 0.06627273559570312, 0.0788116455078125, 0.09135055541992188, 0.10388946533203125, 0.11642837524414062, 0.12896728515625, 0.14150619506835938, 0.15404510498046875, 0.16658401489257812, 0.1791229248046875, 0.19166183471679688, 0.20420074462890625, 0.21673965454101562, 0.229278564453125, 0.24181747436523438, 0.25435638427734375, 0.2668952941894531, 0.2794342041015625, 0.2919731140136719, 0.30451202392578125, 0.3170509338378906, 0.32958984375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 13.0, 24.0, 75.0, 168.0, 378.0, 171.0, 98.0, 39.0, 15.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9643964767456055, -5.602572441101074, -5.240747928619385, -4.8789238929748535, -4.517099380493164, -4.155275344848633, -3.7934513092041016, -3.431627035140991, -3.069802761077881, -2.7079784870147705, -2.34615421295166, -1.984330177307129, -1.6225059032440186, -1.2606816291809082, -0.898857593536377, -0.5370333194732666, -0.17520904541015625, 0.18661516904830933, 0.5484393835067749, 0.9102635383605957, 1.272087812423706, 1.6339120864868164, 1.9957361221313477, 2.357560396194458, 2.7193846702575684, 3.0812089443206787, 3.443033218383789, 3.8048572540283203, 4.166681289672852, 4.528505802154541, 4.890329837799072, 5.252154350280762, 5.613977432250977, 5.975801467895508, 6.337625980377197, 6.6994500160217285, 7.061274528503418, 7.423098564147949, 7.7849225997924805, 8.146746635437012, 8.50857162475586, 8.87039566040039, 9.232219696044922, 9.594043731689453, 9.9558687210083, 10.317692756652832, 10.679516792297363, 11.041340827941895, 11.403164863586426, 11.764988899230957, 12.126812934875488, 12.488637924194336, 12.850461959838867, 13.212285995483398, 13.57411003112793, 13.935934066772461, 14.297758102416992, 14.659582138061523, 15.021406173706055, 15.383230209350586, 15.745055198669434, 16.10688018798828, 16.468704223632812, 16.830528259277344, 17.192352294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 11.0, 13.0, 11.0, 14.0, 27.0, 26.0, 23.0, 35.0, 33.0, 48.0, 53.0, 72.0, 112.0, 115.0, 79.0, 51.0, 48.0, 40.0, 30.0, 32.0, 22.0, 14.0, 19.0, 11.0, 19.0, 7.0, 3.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.125114440917969, -8.891151428222656, -8.657188415527344, -8.423224449157715, -8.189261436462402, -7.95529842376709, -7.721334934234619, -7.487371921539307, -7.253408432006836, -7.019445419311523, -6.785481929779053, -6.55151891708374, -6.3175554275512695, -6.083592414855957, -5.849628925323486, -5.615665912628174, -5.381702423095703, -5.147739410400391, -4.91377592086792, -4.679812908172607, -4.445849418640137, -4.211886405944824, -3.9779229164123535, -3.743959903717041, -3.5099968910217285, -3.276033639907837, -3.0420703887939453, -2.8081071376800537, -2.574143886566162, -2.3401808738708496, -2.106217384338379, -1.8722542524337769, -1.6382908821105957, -1.404327630996704, -1.1703643798828125, -0.9364011883735657, -0.7024379372596741, -0.46847474575042725, -0.23451149463653564, -0.000548243522644043, 0.23341500759124756, 0.46737825870513916, 0.7013415098190308, 0.9353047013282776, 1.1692678928375244, 1.403231143951416, 1.6371943950653076, 1.8711576461791992, 2.105120897293091, 2.3390841484069824, 2.573047399520874, 2.8070106506347656, 3.0409739017486572, 3.274937152862549, 3.5089001655578613, 3.742863655090332, 3.9768266677856445, 4.210789680480957, 4.444753170013428, 4.67871618270874, 4.912679672241211, 5.146642684936523, 5.380606174468994, 5.614569187164307, 5.848532676696777]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 2.0, 15.0, 18.0, 29.0, 45.0, 70.0, 118.0, 176.0, 352.0, 651.0, 1305.0, 2768.0, 7276.0, 24530.0, 150907.0, 2031981.0, 1799901.0, 138030.0, 23696.0, 7012.0, 2659.0, 1211.0, 640.0, 332.0, 196.0, 115.0, 81.0, 61.0, 33.0, 16.0, 11.0, 9.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.828125, -0.8051071166992188, -0.7820892333984375, -0.7590713500976562, -0.736053466796875, -0.7130355834960938, -0.6900177001953125, -0.6669998168945312, -0.64398193359375, -0.6209640502929688, -0.5979461669921875, -0.5749282836914062, -0.551910400390625, -0.5288925170898438, -0.5058746337890625, -0.48285675048828125, -0.4598388671875, -0.43682098388671875, -0.4138031005859375, -0.39078521728515625, -0.367767333984375, -0.34474945068359375, -0.3217315673828125, -0.29871368408203125, -0.27569580078125, -0.25267791748046875, -0.2296600341796875, -0.20664215087890625, -0.183624267578125, -0.16060638427734375, -0.1375885009765625, -0.11457061767578125, -0.091552734375, -0.06853485107421875, -0.0455169677734375, -0.02249908447265625, 0.000518798828125, 0.02353668212890625, 0.0465545654296875, 0.06957244873046875, 0.09259033203125, 0.11560821533203125, 0.1386260986328125, 0.16164398193359375, 0.184661865234375, 0.20767974853515625, 0.2306976318359375, 0.25371551513671875, 0.2767333984375, 0.29975128173828125, 0.3227691650390625, 0.34578704833984375, 0.368804931640625, 0.39182281494140625, 0.4148406982421875, 0.43785858154296875, 0.46087646484375, 0.48389434814453125, 0.5069122314453125, 0.5299301147460938, 0.552947998046875, 0.5759658813476562, 0.5989837646484375, 0.6220016479492188, 0.64501953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 8.0, 12.0, 12.0, 21.0, 11.0, 21.0, 30.0, 38.0, 43.0, 50.0, 43.0, 46.0, 48.0, 57.0, 59.0, 50.0, 62.0, 48.0, 53.0, 36.0, 31.0, 40.0, 30.0, 24.0, 23.0, 26.0, 13.0, 7.0, 9.0, 8.0, 2.0, 6.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.45258331298828125, -0.4386138916015625, -0.42464447021484375, -0.410675048828125, -0.39670562744140625, -0.3827362060546875, -0.36876678466796875, -0.35479736328125, -0.34082794189453125, -0.3268585205078125, -0.31288909912109375, -0.298919677734375, -0.28495025634765625, -0.2709808349609375, -0.25701141357421875, -0.2430419921875, -0.22907257080078125, -0.2151031494140625, -0.20113372802734375, -0.187164306640625, -0.17319488525390625, -0.1592254638671875, -0.14525604248046875, -0.13128662109375, -0.11731719970703125, -0.1033477783203125, -0.08937835693359375, -0.075408935546875, -0.06143951416015625, -0.0474700927734375, -0.03350067138671875, -0.01953125, -0.00556182861328125, 0.0084075927734375, 0.02237701416015625, 0.036346435546875, 0.05031585693359375, 0.0642852783203125, 0.07825469970703125, 0.09222412109375, 0.10619354248046875, 0.1201629638671875, 0.13413238525390625, 0.148101806640625, 0.16207122802734375, 0.1760406494140625, 0.19001007080078125, 0.2039794921875, 0.21794891357421875, 0.2319183349609375, 0.24588775634765625, 0.259857177734375, 0.27382659912109375, 0.2877960205078125, 0.30176544189453125, 0.31573486328125, 0.32970428466796875, 0.3436737060546875, 0.35764312744140625, 0.371612548828125, 0.38558197021484375, 0.3995513916015625, 0.41352081298828125, 0.427490234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 7.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 18.0, 13.0, 17.0, 36.0, 63.0, 98.0, 171.0, 443.0, 1306.0, 5223.0, 35743.0, 2852114.0, 1267904.0, 25102.0, 4178.0, 1083.0, 347.0, 158.0, 87.0, 57.0, 20.0, 19.0, 12.0, 12.0, 9.0, 2.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.6226043701171875, -1.573333740234375, -1.5240631103515625, -1.47479248046875, -1.4255218505859375, -1.376251220703125, -1.3269805908203125, -1.2777099609375, -1.2284393310546875, -1.179168701171875, -1.1298980712890625, -1.08062744140625, -1.0313568115234375, -0.982086181640625, -0.9328155517578125, -0.883544921875, -0.8342742919921875, -0.785003662109375, -0.7357330322265625, -0.68646240234375, -0.6371917724609375, -0.587921142578125, -0.5386505126953125, -0.4893798828125, -0.4401092529296875, -0.390838623046875, -0.3415679931640625, -0.29229736328125, -0.2430267333984375, -0.193756103515625, -0.1444854736328125, -0.09521484375, -0.0459442138671875, 0.003326416015625, 0.0525970458984375, 0.10186767578125, 0.1511383056640625, 0.200408935546875, 0.2496795654296875, 0.2989501953125, 0.3482208251953125, 0.397491455078125, 0.4467620849609375, 0.49603271484375, 0.5453033447265625, 0.594573974609375, 0.6438446044921875, 0.693115234375, 0.7423858642578125, 0.791656494140625, 0.8409271240234375, 0.89019775390625, 0.9394683837890625, 0.988739013671875, 1.0380096435546875, 1.0872802734375, 1.1365509033203125, 1.185821533203125, 1.2350921630859375, 1.28436279296875, 1.3336334228515625, 1.382904052734375, 1.4321746826171875, 1.4814453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 8.0, 6.0, 11.0, 17.0, 10.0, 31.0, 51.0, 52.0, 92.0, 139.0, 229.0, 427.0, 759.0, 890.0, 565.0, 319.0, 164.0, 86.0, 65.0, 37.0, 26.0, 21.0, 21.0, 10.0, 4.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.011566162109375, -0.98016357421875, -0.948760986328125, -0.9173583984375, -0.885955810546875, -0.85455322265625, -0.823150634765625, -0.791748046875, -0.760345458984375, -0.72894287109375, -0.697540283203125, -0.6661376953125, -0.634735107421875, -0.60333251953125, -0.571929931640625, -0.54052734375, -0.509124755859375, -0.47772216796875, -0.446319580078125, -0.4149169921875, -0.383514404296875, -0.35211181640625, -0.320709228515625, -0.289306640625, -0.257904052734375, -0.22650146484375, -0.195098876953125, -0.1636962890625, -0.132293701171875, -0.10089111328125, -0.069488525390625, -0.0380859375, -0.006683349609375, 0.02471923828125, 0.056121826171875, 0.0875244140625, 0.118927001953125, 0.15032958984375, 0.181732177734375, 0.213134765625, 0.244537353515625, 0.27593994140625, 0.307342529296875, 0.3387451171875, 0.370147705078125, 0.40155029296875, 0.432952880859375, 0.46435546875, 0.495758056640625, 0.52716064453125, 0.558563232421875, 0.5899658203125, 0.621368408203125, 0.65277099609375, 0.684173583984375, 0.715576171875, 0.746978759765625, 0.77838134765625, 0.809783935546875, 0.8411865234375, 0.872589111328125, 0.90399169921875, 0.935394287109375, 0.966796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 12.0, 17.0, 43.0, 112.0, 288.0, 281.0, 152.0, 58.0, 19.0, 12.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.318859100341797, -14.918415069580078, -14.517971992492676, -14.117527961730957, -13.717084884643555, -13.316640853881836, -12.916196823120117, -12.515752792358398, -12.115309715270996, -11.714865684509277, -11.314422607421875, -10.913978576660156, -10.513534545898438, -10.113091468811035, -9.712647438049316, -9.312204360961914, -8.911760330200195, -8.511316299438477, -8.110873222351074, -7.7104291915893555, -7.309985637664795, -6.909542083740234, -6.509098052978516, -6.108654499053955, -5.7082109451293945, -5.307767391204834, -4.907323837280273, -4.506879806518555, -4.106436252593994, -3.7059926986694336, -3.305548906326294, -2.9051051139831543, -2.5046606063842773, -2.104217052459717, -1.7037732601165771, -1.303329586982727, -0.902885913848877, -0.5024423599243164, -0.10199856758117676, 0.2984452247619629, 0.6988887786865234, 1.0993324518203735, 1.4997761249542236, 1.9002197980880737, 2.300663471221924, 2.7011070251464844, 3.101550817489624, 3.5019946098327637, 3.902438163757324, 4.302881717681885, 4.703325271606445, 5.103769302368164, 5.504212856292725, 5.904656410217285, 6.305100440979004, 6.7055439949035645, 7.105987548828125, 7.5064311027526855, 7.906874656677246, 8.307318687438965, 8.707761764526367, 9.108205795288086, 9.508649826049805, 9.909093856811523, 10.309536933898926]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 13.0, 13.0, 19.0, 6.0, 6.0, 20.0, 17.0, 20.0, 17.0, 33.0, 43.0, 33.0, 31.0, 37.0, 43.0, 46.0, 31.0, 40.0, 33.0, 46.0, 37.0, 40.0, 37.0, 27.0, 28.0, 43.0, 42.0, 34.0, 22.0, 21.0, 22.0, 15.0, 11.0, 12.0, 9.0, 9.0, 9.0, 5.0, 8.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.717419385910034, -3.6078617572784424, -3.4983038902282715, -3.3887462615966797, -3.279188394546509, -3.169630765914917, -3.060072898864746, -2.9505152702331543, -2.8409576416015625, -2.7314000129699707, -2.6218421459198, -2.512284517288208, -2.402726650238037, -2.2931690216064453, -2.1836113929748535, -2.0740535259246826, -1.9644956588745117, -1.8549379110336304, -1.745380163192749, -1.6358225345611572, -1.5262646675109863, -1.4167070388793945, -1.3071492910385132, -1.1975915431976318, -1.0880337953567505, -0.9784760475158691, -0.8689182996749878, -0.7593606114387512, -0.6498028635978699, -0.5402451157569885, -0.43068742752075195, -0.3211296796798706, -0.21157217025756836, -0.1020144373178482, 0.007543295621871948, 0.11710101366043091, 0.22665876150131226, 0.3362165093421936, 0.4457741975784302, 0.5553319454193115, 0.6648896932601929, 0.7744474411010742, 0.8840051889419556, 0.9935628771781921, 1.1031205654144287, 1.2126784324645996, 1.3222360610961914, 1.4317938089370728, 1.541351556777954, 1.6509093046188354, 1.7604670524597168, 1.8700246810913086, 1.9795825481414795, 2.0891401767730713, 2.198698043823242, 2.308255672454834, 2.417813301086426, 2.5273709297180176, 2.6369287967681885, 2.7464864253997803, 2.856044292449951, 2.965601921081543, 3.0751595497131348, 3.1847174167633057, 3.2942752838134766]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 7.0, 9.0, 23.0, 36.0, 37.0, 66.0, 99.0, 172.0, 322.0, 649.0, 1477.0, 3982.0, 14082.0, 75124.0, 634031.0, 271709.0, 34190.0, 7879.0, 2507.0, 1021.0, 481.0, 254.0, 149.0, 76.0, 51.0, 35.0, 23.0, 17.0, 15.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2372894287109375, -1.194305419921875, -1.1513214111328125, -1.10833740234375, -1.0653533935546875, -1.022369384765625, -0.9793853759765625, -0.9364013671875, -0.8934173583984375, -0.850433349609375, -0.8074493408203125, -0.76446533203125, -0.7214813232421875, -0.678497314453125, -0.6355133056640625, -0.592529296875, -0.5495452880859375, -0.506561279296875, -0.4635772705078125, -0.42059326171875, -0.3776092529296875, -0.334625244140625, -0.2916412353515625, -0.2486572265625, -0.2056732177734375, -0.162689208984375, -0.1197052001953125, -0.07672119140625, -0.0337371826171875, 0.009246826171875, 0.0522308349609375, 0.09521484375, 0.1381988525390625, 0.181182861328125, 0.2241668701171875, 0.26715087890625, 0.3101348876953125, 0.353118896484375, 0.3961029052734375, 0.4390869140625, 0.4820709228515625, 0.525054931640625, 0.5680389404296875, 0.61102294921875, 0.6540069580078125, 0.696990966796875, 0.7399749755859375, 0.782958984375, 0.8259429931640625, 0.868927001953125, 0.9119110107421875, 0.95489501953125, 0.9978790283203125, 1.040863037109375, 1.0838470458984375, 1.1268310546875, 1.1698150634765625, 1.212799072265625, 1.2557830810546875, 1.29876708984375, 1.3417510986328125, 1.384735107421875, 1.4277191162109375, 1.470703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 6.0, 10.0, 18.0, 12.0, 27.0, 29.0, 35.0, 36.0, 34.0, 49.0, 47.0, 55.0, 43.0, 53.0, 55.0, 59.0, 51.0, 53.0, 41.0, 45.0, 33.0, 36.0, 29.0, 30.0, 22.0, 16.0, 11.0, 10.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.544921875, -0.5302352905273438, -0.5155487060546875, -0.5008621215820312, -0.486175537109375, -0.47148895263671875, -0.4568023681640625, -0.44211578369140625, -0.42742919921875, -0.41274261474609375, -0.3980560302734375, -0.38336944580078125, -0.368682861328125, -0.35399627685546875, -0.3393096923828125, -0.32462310791015625, -0.3099365234375, -0.29524993896484375, -0.2805633544921875, -0.26587677001953125, -0.251190185546875, -0.23650360107421875, -0.2218170166015625, -0.20713043212890625, -0.19244384765625, -0.17775726318359375, -0.1630706787109375, -0.14838409423828125, -0.133697509765625, -0.11901092529296875, -0.1043243408203125, -0.08963775634765625, -0.074951171875, -0.06026458740234375, -0.0455780029296875, -0.03089141845703125, -0.016204833984375, -0.00151824951171875, 0.0131683349609375, 0.02785491943359375, 0.04254150390625, 0.05722808837890625, 0.0719146728515625, 0.08660125732421875, 0.101287841796875, 0.11597442626953125, 0.1306610107421875, 0.14534759521484375, 0.1600341796875, 0.17472076416015625, 0.1894073486328125, 0.20409393310546875, 0.218780517578125, 0.23346710205078125, 0.2481536865234375, 0.26284027099609375, 0.27752685546875, 0.29221343994140625, 0.3069000244140625, 0.32158660888671875, 0.336273193359375, 0.35095977783203125, 0.3656463623046875, 0.38033294677734375, 0.39501953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 13.0, 5.0, 10.0, 11.0, 14.0, 41.0, 32.0, 62.0, 94.0, 150.0, 242.0, 392.0, 815.0, 1683.0, 4497.0, 19294.0, 222770.0, 752175.0, 35357.0, 6408.0, 2194.0, 972.0, 470.0, 304.0, 179.0, 117.0, 80.0, 49.0, 30.0, 25.0, 15.0, 11.0, 9.0, 2.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5294342041015625, -1.484649658203125, -1.4398651123046875, -1.39508056640625, -1.3502960205078125, -1.305511474609375, -1.2607269287109375, -1.2159423828125, -1.1711578369140625, -1.126373291015625, -1.0815887451171875, -1.03680419921875, -0.9920196533203125, -0.947235107421875, -0.9024505615234375, -0.857666015625, -0.8128814697265625, -0.768096923828125, -0.7233123779296875, -0.67852783203125, -0.6337432861328125, -0.588958740234375, -0.5441741943359375, -0.4993896484375, -0.4546051025390625, -0.409820556640625, -0.3650360107421875, -0.32025146484375, -0.2754669189453125, -0.230682373046875, -0.1858978271484375, -0.14111328125, -0.0963287353515625, -0.051544189453125, -0.0067596435546875, 0.03802490234375, 0.0828094482421875, 0.127593994140625, 0.1723785400390625, 0.2171630859375, 0.2619476318359375, 0.306732177734375, 0.3515167236328125, 0.39630126953125, 0.4410858154296875, 0.485870361328125, 0.5306549072265625, 0.575439453125, 0.6202239990234375, 0.665008544921875, 0.7097930908203125, 0.75457763671875, 0.7993621826171875, 0.844146728515625, 0.8889312744140625, 0.9337158203125, 0.9785003662109375, 1.023284912109375, 1.0680694580078125, 1.11285400390625, 1.1576385498046875, 1.202423095703125, 1.2472076416015625, 1.2919921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 8.0, 3.0, 12.0, 12.0, 14.0, 12.0, 26.0, 22.0, 19.0, 23.0, 34.0, 43.0, 41.0, 46.0, 43.0, 45.0, 48.0, 56.0, 47.0, 54.0, 43.0, 55.0, 32.0, 42.0, 22.0, 25.0, 31.0, 20.0, 24.0, 12.0, 9.0, 12.0, 6.0, 8.0, 6.0, 8.0, 4.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.490234375, -1.4468994140625, -1.403564453125, -1.3602294921875, -1.31689453125, -1.2735595703125, -1.230224609375, -1.1868896484375, -1.1435546875, -1.1002197265625, -1.056884765625, -1.0135498046875, -0.97021484375, -0.9268798828125, -0.883544921875, -0.8402099609375, -0.796875, -0.7535400390625, -0.710205078125, -0.6668701171875, -0.62353515625, -0.5802001953125, -0.536865234375, -0.4935302734375, -0.4501953125, -0.4068603515625, -0.363525390625, -0.3201904296875, -0.27685546875, -0.2335205078125, -0.190185546875, -0.1468505859375, -0.103515625, -0.0601806640625, -0.016845703125, 0.0264892578125, 0.06982421875, 0.1131591796875, 0.156494140625, 0.1998291015625, 0.2431640625, 0.2864990234375, 0.329833984375, 0.3731689453125, 0.41650390625, 0.4598388671875, 0.503173828125, 0.5465087890625, 0.58984375, 0.6331787109375, 0.676513671875, 0.7198486328125, 0.76318359375, 0.8065185546875, 0.849853515625, 0.8931884765625, 0.9365234375, 0.9798583984375, 1.023193359375, 1.0665283203125, 1.10986328125, 1.1531982421875, 1.196533203125, 1.2398681640625, 1.283203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 9.0, 15.0, 14.0, 20.0, 34.0, 35.0, 50.0, 83.0, 149.0, 203.0, 452.0, 830.0, 2126.0, 6723.0, 32087.0, 653931.0, 313239.0, 28605.0, 6146.0, 1935.0, 788.0, 399.0, 226.0, 144.0, 86.0, 61.0, 38.0, 22.0, 19.0, 23.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.33282470703125, -0.3209228515625, -0.30902099609375, -0.297119140625, -0.28521728515625, -0.2733154296875, -0.26141357421875, -0.24951171875, -0.23760986328125, -0.2257080078125, -0.21380615234375, -0.201904296875, -0.19000244140625, -0.1781005859375, -0.16619873046875, -0.154296875, -0.14239501953125, -0.1304931640625, -0.11859130859375, -0.106689453125, -0.09478759765625, -0.0828857421875, -0.07098388671875, -0.05908203125, -0.04718017578125, -0.0352783203125, -0.02337646484375, -0.011474609375, 0.00042724609375, 0.0123291015625, 0.02423095703125, 0.0361328125, 0.04803466796875, 0.0599365234375, 0.07183837890625, 0.083740234375, 0.09564208984375, 0.1075439453125, 0.11944580078125, 0.13134765625, 0.14324951171875, 0.1551513671875, 0.16705322265625, 0.178955078125, 0.19085693359375, 0.2027587890625, 0.21466064453125, 0.2265625, 0.23846435546875, 0.2503662109375, 0.26226806640625, 0.274169921875, 0.28607177734375, 0.2979736328125, 0.30987548828125, 0.32177734375, 0.33367919921875, 0.3455810546875, 0.35748291015625, 0.369384765625, 0.38128662109375, 0.3931884765625, 0.40509033203125, 0.4169921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 7.0, 9.0, 8.0, 16.0, 13.0, 23.0, 33.0, 50.0, 60.0, 101.0, 136.0, 143.0, 118.0, 72.0, 55.0, 27.0, 28.0, 24.0, 14.0, 17.0, 6.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.912252426147461e-05, -9.637046605348587e-05, -9.361840784549713e-05, -9.086634963750839e-05, -8.811429142951965e-05, -8.536223322153091e-05, -8.261017501354218e-05, -7.985811680555344e-05, -7.71060585975647e-05, -7.435400038957596e-05, -7.160194218158722e-05, -6.884988397359848e-05, -6.609782576560974e-05, -6.3345767557621e-05, -6.059370934963226e-05, -5.7841651141643524e-05, -5.5089592933654785e-05, -5.2337534725666046e-05, -4.958547651767731e-05, -4.683341830968857e-05, -4.408136010169983e-05, -4.132930189371109e-05, -3.857724368572235e-05, -3.582518547773361e-05, -3.307312726974487e-05, -3.0321069061756134e-05, -2.7569010853767395e-05, -2.4816952645778656e-05, -2.2064894437789917e-05, -1.9312836229801178e-05, -1.656077802181244e-05, -1.38087198138237e-05, -1.1056661605834961e-05, -8.304603397846222e-06, -5.552545189857483e-06, -2.800486981868744e-06, -4.842877388000488e-08, 2.703629434108734e-06, 5.455687642097473e-06, 8.207745850086212e-06, 1.0959804058074951e-05, 1.371186226606369e-05, 1.646392047405243e-05, 1.9215978682041168e-05, 2.1968036890029907e-05, 2.4720095098018646e-05, 2.7472153306007385e-05, 3.0224211513996124e-05, 3.297626972198486e-05, 3.57283279299736e-05, 3.848038613796234e-05, 4.123244434595108e-05, 4.398450255393982e-05, 4.673656076192856e-05, 4.94886189699173e-05, 5.2240677177906036e-05, 5.4992735385894775e-05, 5.7744793593883514e-05, 6.0496851801872253e-05, 6.324891000986099e-05, 6.600096821784973e-05, 6.875302642583847e-05, 7.150508463382721e-05, 7.425714284181595e-05, 7.700920104980469e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 1.0, 7.0, 5.0, 12.0, 11.0, 14.0, 29.0, 16.0, 29.0, 57.0, 55.0, 84.0, 120.0, 189.0, 282.0, 477.0, 864.0, 1519.0, 3160.0, 7976.0, 24649.0, 118890.0, 743170.0, 108813.0, 23690.0, 7619.0, 3149.0, 1508.0, 783.0, 476.0, 291.0, 180.0, 119.0, 80.0, 50.0, 45.0, 32.0, 32.0, 16.0, 21.0, 13.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.258056640625, -0.24985885620117188, -0.24166107177734375, -0.23346328735351562, -0.2252655029296875, -0.21706771850585938, -0.20886993408203125, -0.20067214965820312, -0.192474365234375, -0.18427658081054688, -0.17607879638671875, -0.16788101196289062, -0.1596832275390625, -0.15148544311523438, -0.14328765869140625, -0.13508987426757812, -0.12689208984375, -0.11869430541992188, -0.11049652099609375, -0.10229873657226562, -0.0941009521484375, -0.08590316772460938, -0.07770538330078125, -0.06950759887695312, -0.061309814453125, -0.053112030029296875, -0.04491424560546875, -0.036716461181640625, -0.0285186767578125, -0.020320892333984375, -0.01212310791015625, -0.003925323486328125, 0.0042724609375, 0.012470245361328125, 0.02066802978515625, 0.028865814208984375, 0.0370635986328125, 0.045261383056640625, 0.05345916748046875, 0.061656951904296875, 0.069854736328125, 0.07805252075195312, 0.08625030517578125, 0.09444808959960938, 0.1026458740234375, 0.11084365844726562, 0.11904144287109375, 0.12723922729492188, 0.13543701171875, 0.14363479614257812, 0.15183258056640625, 0.16003036499023438, 0.1682281494140625, 0.17642593383789062, 0.18462371826171875, 0.19282150268554688, 0.201019287109375, 0.20921707153320312, 0.21741485595703125, 0.22561264038085938, 0.2338104248046875, 0.24200820922851562, 0.25020599365234375, 0.2584037780761719, 0.2666015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 8.0, 10.0, 10.0, 16.0, 20.0, 27.0, 28.0, 40.0, 42.0, 68.0, 59.0, 78.0, 84.0, 78.0, 75.0, 60.0, 51.0, 35.0, 37.0, 25.0, 26.0, 18.0, 14.0, 17.0, 14.0, 4.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.241455078125, -0.23395538330078125, -0.2264556884765625, -0.21895599365234375, -0.211456298828125, -0.20395660400390625, -0.1964569091796875, -0.18895721435546875, -0.18145751953125, -0.17395782470703125, -0.1664581298828125, -0.15895843505859375, -0.151458740234375, -0.14395904541015625, -0.1364593505859375, -0.12895965576171875, -0.1214599609375, -0.11396026611328125, -0.1064605712890625, -0.09896087646484375, -0.091461181640625, -0.08396148681640625, -0.0764617919921875, -0.06896209716796875, -0.06146240234375, -0.05396270751953125, -0.0464630126953125, -0.03896331787109375, -0.031463623046875, -0.02396392822265625, -0.0164642333984375, -0.00896453857421875, -0.00146484375, 0.00603485107421875, 0.0135345458984375, 0.02103424072265625, 0.028533935546875, 0.03603363037109375, 0.0435333251953125, 0.05103302001953125, 0.05853271484375, 0.06603240966796875, 0.0735321044921875, 0.08103179931640625, 0.088531494140625, 0.09603118896484375, 0.1035308837890625, 0.11103057861328125, 0.1185302734375, 0.12602996826171875, 0.1335296630859375, 0.14102935791015625, 0.148529052734375, 0.15602874755859375, 0.1635284423828125, 0.17102813720703125, 0.17852783203125, 0.18602752685546875, 0.1935272216796875, 0.20102691650390625, 0.208526611328125, 0.21602630615234375, 0.2235260009765625, 0.23102569580078125, 0.238525390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 30.0, 119.0, 466.0, 230.0, 78.0, 30.0, 12.0, 7.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.86053466796875, -14.360454559326172, -13.86037540435791, -13.360295295715332, -12.860215187072754, -12.360136032104492, -11.860055923461914, -11.359975814819336, -10.859895706176758, -10.35981559753418, -9.859736442565918, -9.35965633392334, -8.859576225280762, -8.3594970703125, -7.859416961669922, -7.359336853027344, -6.859257698059082, -6.359178066253662, -5.859097957611084, -5.359018325805664, -4.858938217163086, -4.358858585357666, -3.858778953552246, -3.358699083328247, -2.858619213104248, -2.358539342880249, -1.8584595918655396, -1.35837984085083, -0.858299970626831, -0.35822010040283203, 0.1418595314025879, 0.6419394016265869, 1.142019271850586, 1.642099142074585, 2.142179012298584, 2.642258644104004, 3.142338514328003, 3.642418384552002, 4.142498016357422, 4.642578125, 5.14265775680542, 5.64273738861084, 6.142817497253418, 6.642897129058838, 7.142976760864258, 7.643056869506836, 8.143136978149414, 8.643216133117676, 9.143296241760254, 9.643376350402832, 10.143455505371094, 10.643535614013672, 11.14361572265625, 11.643695831298828, 12.14377498626709, 12.643855094909668, 13.14393424987793, 13.644014358520508, 14.14409351348877, 14.644173622131348, 15.144253730773926, 15.644332885742188, 16.144412994384766, 16.644493103027344, 17.144573211669922]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 16.0, 12.0, 13.0, 25.0, 25.0, 28.0, 24.0, 30.0, 28.0, 31.0, 33.0, 57.0, 99.0, 98.0, 90.0, 67.0, 41.0, 29.0, 30.0, 37.0, 33.0, 17.0, 20.0, 16.0, 17.0, 12.0, 9.0, 11.0, 5.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9609527587890625, -5.777299404144287, -5.593646049499512, -5.409992218017578, -5.226338863372803, -5.042685508728027, -4.859031677246094, -4.675378322601318, -4.491724967956543, -4.308071613311768, -4.124418258666992, -3.9407644271850586, -3.757111072540283, -3.573457717895508, -3.3898041248321533, -3.206150531768799, -3.0224971771240234, -2.838843822479248, -2.6551902294158936, -2.471536636352539, -2.2878832817077637, -2.1042299270629883, -1.9205763339996338, -1.7369228601455688, -1.553269386291504, -1.369615912437439, -1.185962438583374, -1.002308964729309, -0.8186554908752441, -0.6350020170211792, -0.45134854316711426, -0.2676950693130493, -0.08404159545898438, 0.09961187839508057, 0.2832653522491455, 0.46691882610321045, 0.6505722999572754, 0.8342257738113403, 1.0178792476654053, 1.2015327215194702, 1.3851861953735352, 1.5688396692276, 1.752493143081665, 1.93614661693573, 2.119800090789795, 2.3034534454345703, 2.487107038497925, 2.6707606315612793, 2.8544139862060547, 3.03806734085083, 3.2217209339141846, 3.405374526977539, 3.5890278816223145, 3.77268123626709, 3.9563348293304443, 4.139988422393799, 4.323641777038574, 4.50729513168335, 4.690948486328125, 4.874602317810059, 5.058255672454834, 5.241909027099609, 5.425562858581543, 5.609216213226318, 5.792869567871094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 3.0, 13.0, 11.0, 18.0, 21.0, 22.0, 75.0, 93.0, 129.0, 254.0, 445.0, 719.0, 1395.0, 2778.0, 6956.0, 21170.0, 113135.0, 1247985.0, 2471781.0, 270334.0, 38934.0, 10155.0, 3826.0, 1825.0, 908.0, 473.0, 323.0, 184.0, 125.0, 68.0, 46.0, 25.0, 15.0, 13.0, 6.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.2002334594726562, -1.1670684814453125, -1.1339035034179688, -1.100738525390625, -1.0675735473632812, -1.0344085693359375, -1.0012435913085938, -0.96807861328125, -0.9349136352539062, -0.9017486572265625, -0.8685836791992188, -0.835418701171875, -0.8022537231445312, -0.7690887451171875, -0.7359237670898438, -0.7027587890625, -0.6695938110351562, -0.6364288330078125, -0.6032638549804688, -0.570098876953125, -0.5369338989257812, -0.5037689208984375, -0.47060394287109375, -0.43743896484375, -0.40427398681640625, -0.3711090087890625, -0.33794403076171875, -0.304779052734375, -0.27161407470703125, -0.2384490966796875, -0.20528411865234375, -0.172119140625, -0.13895416259765625, -0.1057891845703125, -0.07262420654296875, -0.039459228515625, -0.00629425048828125, 0.0268707275390625, 0.06003570556640625, 0.09320068359375, 0.12636566162109375, 0.1595306396484375, 0.19269561767578125, 0.225860595703125, 0.25902557373046875, 0.2921905517578125, 0.32535552978515625, 0.3585205078125, 0.39168548583984375, 0.4248504638671875, 0.45801544189453125, 0.491180419921875, 0.5243453979492188, 0.5575103759765625, 0.5906753540039062, 0.62384033203125, 0.6570053100585938, 0.6901702880859375, 0.7233352661132812, 0.756500244140625, 0.7896652221679688, 0.8228302001953125, 0.8559951782226562, 0.88916015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 8.0, 14.0, 18.0, 19.0, 32.0, 26.0, 37.0, 46.0, 53.0, 44.0, 55.0, 44.0, 62.0, 50.0, 63.0, 55.0, 45.0, 40.0, 41.0, 33.0, 22.0, 39.0, 20.0, 20.0, 22.0, 14.0, 13.0, 8.0, 8.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.548828125, -0.5344467163085938, -0.5200653076171875, -0.5056838989257812, -0.491302490234375, -0.47692108154296875, -0.4625396728515625, -0.44815826416015625, -0.43377685546875, -0.41939544677734375, -0.4050140380859375, -0.39063262939453125, -0.376251220703125, -0.36186981201171875, -0.3474884033203125, -0.33310699462890625, -0.3187255859375, -0.30434417724609375, -0.2899627685546875, -0.27558135986328125, -0.261199951171875, -0.24681854248046875, -0.2324371337890625, -0.21805572509765625, -0.20367431640625, -0.18929290771484375, -0.1749114990234375, -0.16053009033203125, -0.146148681640625, -0.13176727294921875, -0.1173858642578125, -0.10300445556640625, -0.088623046875, -0.07424163818359375, -0.0598602294921875, -0.04547882080078125, -0.031097412109375, -0.01671600341796875, -0.0023345947265625, 0.01204681396484375, 0.02642822265625, 0.04080963134765625, 0.0551910400390625, 0.06957244873046875, 0.083953857421875, 0.09833526611328125, 0.1127166748046875, 0.12709808349609375, 0.1414794921875, 0.15586090087890625, 0.1702423095703125, 0.18462371826171875, 0.199005126953125, 0.21338653564453125, 0.2277679443359375, 0.24214935302734375, 0.25653076171875, 0.27091217041015625, 0.2852935791015625, 0.29967498779296875, 0.314056396484375, 0.32843780517578125, 0.3428192138671875, 0.35720062255859375, 0.37158203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 7.0, 9.0, 17.0, 16.0, 21.0, 33.0, 49.0, 73.0, 77.0, 148.0, 213.0, 454.0, 923.0, 2560.0, 14025.0, 795307.0, 3353481.0, 21346.0, 3200.0, 1079.0, 463.0, 275.0, 157.0, 122.0, 52.0, 41.0, 29.0, 29.0, 14.0, 10.0, 14.0, 7.0, 7.0, 5.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.11328125, -3.013153076171875, -2.91302490234375, -2.812896728515625, -2.7127685546875, -2.612640380859375, -2.51251220703125, -2.412384033203125, -2.312255859375, -2.212127685546875, -2.11199951171875, -2.011871337890625, -1.9117431640625, -1.811614990234375, -1.71148681640625, -1.611358642578125, -1.51123046875, -1.411102294921875, -1.31097412109375, -1.210845947265625, -1.1107177734375, -1.010589599609375, -0.91046142578125, -0.810333251953125, -0.710205078125, -0.610076904296875, -0.50994873046875, -0.409820556640625, -0.3096923828125, -0.209564208984375, -0.10943603515625, -0.009307861328125, 0.0908203125, 0.190948486328125, 0.29107666015625, 0.391204833984375, 0.4913330078125, 0.591461181640625, 0.69158935546875, 0.791717529296875, 0.891845703125, 0.991973876953125, 1.09210205078125, 1.192230224609375, 1.2923583984375, 1.392486572265625, 1.49261474609375, 1.592742919921875, 1.69287109375, 1.792999267578125, 1.89312744140625, 1.993255615234375, 2.0933837890625, 2.193511962890625, 2.29364013671875, 2.393768310546875, 2.493896484375, 2.594024658203125, 2.69415283203125, 2.794281005859375, 2.8944091796875, 2.994537353515625, 3.09466552734375, 3.194793701171875, 3.294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 12.0, 8.0, 10.0, 14.0, 12.0, 18.0, 18.0, 40.0, 48.0, 65.0, 104.0, 125.0, 167.0, 247.0, 348.0, 519.0, 610.0, 497.0, 346.0, 215.0, 173.0, 103.0, 94.0, 62.0, 45.0, 38.0, 29.0, 20.0, 16.0, 11.0, 11.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4501953125, -1.408355712890625, -1.36651611328125, -1.324676513671875, -1.2828369140625, -1.240997314453125, -1.19915771484375, -1.157318115234375, -1.115478515625, -1.073638916015625, -1.03179931640625, -0.989959716796875, -0.9481201171875, -0.906280517578125, -0.86444091796875, -0.822601318359375, -0.78076171875, -0.738922119140625, -0.69708251953125, -0.655242919921875, -0.6134033203125, -0.571563720703125, -0.52972412109375, -0.487884521484375, -0.446044921875, -0.404205322265625, -0.36236572265625, -0.320526123046875, -0.2786865234375, -0.236846923828125, -0.19500732421875, -0.153167724609375, -0.111328125, -0.069488525390625, -0.02764892578125, 0.014190673828125, 0.0560302734375, 0.097869873046875, 0.13970947265625, 0.181549072265625, 0.223388671875, 0.265228271484375, 0.30706787109375, 0.348907470703125, 0.3907470703125, 0.432586669921875, 0.47442626953125, 0.516265869140625, 0.55810546875, 0.599945068359375, 0.64178466796875, 0.683624267578125, 0.7254638671875, 0.767303466796875, 0.80914306640625, 0.850982666015625, 0.892822265625, 0.934661865234375, 0.97650146484375, 1.018341064453125, 1.0601806640625, 1.102020263671875, 1.14385986328125, 1.185699462890625, 1.2275390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 12.0, 31.0, 89.0, 296.0, 354.0, 141.0, 41.0, 14.0, 5.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.294099807739258, -30.147010803222656, -28.999923706054688, -27.852834701538086, -26.705745697021484, -25.558658599853516, -24.411569595336914, -23.264480590820312, -22.117393493652344, -20.970304489135742, -19.823217391967773, -18.676128387451172, -17.52903938293457, -16.38195037841797, -15.23486328125, -14.087774276733398, -12.940685272216797, -11.793597221374512, -10.64650821685791, -9.499420166015625, -8.352331161499023, -7.205243110656738, -6.058155059814453, -4.911066055297852, -3.7639780044555664, -2.616889476776123, -1.4698011875152588, -0.32271289825439453, 0.8243756294250488, 1.9714641571044922, 3.1185522079467773, 4.265641212463379, 5.412727355957031, 6.559815883636475, 7.706904411315918, 8.853992462158203, 10.001081466674805, 11.14816951751709, 12.295257568359375, 13.442346572875977, 14.589434623718262, 15.736522674560547, 16.88361167907715, 18.03070068359375, 19.17778778076172, 20.32487678527832, 21.471965789794922, 22.61905288696289, 23.766141891479492, 24.913230895996094, 26.060317993164062, 27.207406997680664, 28.354496002197266, 29.501583099365234, 30.648672103881836, 31.795761108398438, 32.942848205566406, 34.089935302734375, 35.23702621459961, 36.38411331176758, 37.53120040893555, 38.67829132080078, 39.82537841796875, 40.97246551513672, 42.11955642700195]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 6.0, 11.0, 18.0, 16.0, 12.0, 18.0, 15.0, 32.0, 33.0, 41.0, 54.0, 54.0, 49.0, 66.0, 81.0, 57.0, 60.0, 43.0, 54.0, 44.0, 44.0, 23.0, 31.0, 25.0, 15.0, 22.0, 20.0, 10.0, 9.0, 11.0, 5.0, 1.0, 2.0, 1.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.74195384979248, -8.4307279586792, -8.119501113891602, -7.808274745941162, -7.497048377990723, -7.185822486877441, -6.874596118927002, -6.5633697509765625, -6.252143383026123, -5.940917015075684, -5.629690647125244, -5.318464279174805, -5.007238388061523, -4.696011543273926, -4.3847856521606445, -4.073559284210205, -3.7623329162597656, -3.451106548309326, -3.1398801803588867, -2.8286540508270264, -2.517427682876587, -2.2062013149261475, -1.8949750661849976, -1.5837488174438477, -1.2725224494934082, -0.9612961411476135, -0.6500698328018188, -0.33884352445602417, -0.027617216110229492, 0.28360915184020996, 0.5948354005813599, 0.9060616493225098, 1.2172889709472656, 1.528515338897705, 1.839741587638855, 2.150967836380005, 2.4621942043304443, 2.773420572280884, 3.084646701812744, 3.3958730697631836, 3.707099437713623, 4.0183258056640625, 4.329552173614502, 4.640778541564941, 4.952004432678223, 5.26323127746582, 5.574457168579102, 5.885683536529541, 6.1969099044799805, 6.50813627243042, 6.819362640380859, 7.130589008331299, 7.441815376281738, 7.7530412673950195, 8.064268112182617, 8.375494003295898, 8.68671989440918, 8.997945785522461, 9.309172630310059, 9.62039852142334, 9.931625366210938, 10.242851257324219, 10.554078102111816, 10.865303993225098, 11.176530838012695]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 14.0, 9.0, 12.0, 14.0, 31.0, 39.0, 61.0, 99.0, 136.0, 264.0, 464.0, 942.0, 2143.0, 5660.0, 19333.0, 102041.0, 753669.0, 129383.0, 23140.0, 6455.0, 2368.0, 1022.0, 520.0, 264.0, 185.0, 95.0, 58.0, 47.0, 21.0, 9.0, 13.0, 13.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1181640625, -1.082733154296875, -1.04730224609375, -1.011871337890625, -0.9764404296875, -0.941009521484375, -0.90557861328125, -0.870147705078125, -0.834716796875, -0.799285888671875, -0.76385498046875, -0.728424072265625, -0.6929931640625, -0.657562255859375, -0.62213134765625, -0.586700439453125, -0.55126953125, -0.515838623046875, -0.48040771484375, -0.444976806640625, -0.4095458984375, -0.374114990234375, -0.33868408203125, -0.303253173828125, -0.267822265625, -0.232391357421875, -0.19696044921875, -0.161529541015625, -0.1260986328125, -0.090667724609375, -0.05523681640625, -0.019805908203125, 0.015625, 0.051055908203125, 0.08648681640625, 0.121917724609375, 0.1573486328125, 0.192779541015625, 0.22821044921875, 0.263641357421875, 0.299072265625, 0.334503173828125, 0.36993408203125, 0.405364990234375, 0.4407958984375, 0.476226806640625, 0.51165771484375, 0.547088623046875, 0.58251953125, 0.617950439453125, 0.65338134765625, 0.688812255859375, 0.7242431640625, 0.759674072265625, 0.79510498046875, 0.830535888671875, 0.865966796875, 0.901397705078125, 0.93682861328125, 0.972259521484375, 1.0076904296875, 1.043121337890625, 1.07855224609375, 1.113983154296875, 1.1494140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 9.0, 10.0, 8.0, 22.0, 25.0, 31.0, 43.0, 67.0, 75.0, 72.0, 94.0, 73.0, 74.0, 72.0, 70.0, 54.0, 48.0, 38.0, 40.0, 23.0, 16.0, 21.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8488006591796875, -0.822113037109375, -0.7954254150390625, -0.76873779296875, -0.7420501708984375, -0.715362548828125, -0.6886749267578125, -0.6619873046875, -0.6352996826171875, -0.608612060546875, -0.5819244384765625, -0.55523681640625, -0.5285491943359375, -0.501861572265625, -0.4751739501953125, -0.448486328125, -0.4217987060546875, -0.395111083984375, -0.3684234619140625, -0.34173583984375, -0.3150482177734375, -0.288360595703125, -0.2616729736328125, -0.2349853515625, -0.2082977294921875, -0.181610107421875, -0.1549224853515625, -0.12823486328125, -0.1015472412109375, -0.074859619140625, -0.0481719970703125, -0.021484375, 0.0052032470703125, 0.031890869140625, 0.0585784912109375, 0.08526611328125, 0.1119537353515625, 0.138641357421875, 0.1653289794921875, 0.1920166015625, 0.2187042236328125, 0.245391845703125, 0.2720794677734375, 0.29876708984375, 0.3254547119140625, 0.352142333984375, 0.3788299560546875, 0.405517578125, 0.4322052001953125, 0.458892822265625, 0.4855804443359375, 0.51226806640625, 0.5389556884765625, 0.565643310546875, 0.5923309326171875, 0.6190185546875, 0.6457061767578125, 0.672393798828125, 0.6990814208984375, 0.72576904296875, 0.7524566650390625, 0.779144287109375, 0.8058319091796875, 0.83251953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 9.0, 13.0, 20.0, 28.0, 44.0, 101.0, 122.0, 223.0, 417.0, 1034.0, 3320.0, 25992.0, 935629.0, 72577.0, 6167.0, 1542.0, 550.0, 302.0, 162.0, 92.0, 62.0, 36.0, 23.0, 23.0, 16.0, 7.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7958984375, -1.74822998046875, -1.7005615234375, -1.65289306640625, -1.605224609375, -1.55755615234375, -1.5098876953125, -1.46221923828125, -1.41455078125, -1.36688232421875, -1.3192138671875, -1.27154541015625, -1.223876953125, -1.17620849609375, -1.1285400390625, -1.08087158203125, -1.033203125, -0.98553466796875, -0.9378662109375, -0.89019775390625, -0.842529296875, -0.79486083984375, -0.7471923828125, -0.69952392578125, -0.65185546875, -0.60418701171875, -0.5565185546875, -0.50885009765625, -0.461181640625, -0.41351318359375, -0.3658447265625, -0.31817626953125, -0.2705078125, -0.22283935546875, -0.1751708984375, -0.12750244140625, -0.079833984375, -0.03216552734375, 0.0155029296875, 0.06317138671875, 0.11083984375, 0.15850830078125, 0.2061767578125, 0.25384521484375, 0.301513671875, 0.34918212890625, 0.3968505859375, 0.44451904296875, 0.4921875, 0.53985595703125, 0.5875244140625, 0.63519287109375, 0.682861328125, 0.73052978515625, 0.7781982421875, 0.82586669921875, 0.87353515625, 0.92120361328125, 0.9688720703125, 1.01654052734375, 1.064208984375, 1.11187744140625, 1.1595458984375, 1.20721435546875, 1.2548828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 9.0, 15.0, 11.0, 18.0, 9.0, 18.0, 22.0, 24.0, 32.0, 43.0, 43.0, 58.0, 68.0, 67.0, 72.0, 68.0, 63.0, 58.0, 35.0, 34.0, 35.0, 25.0, 19.0, 18.0, 18.0, 13.0, 10.0, 10.0, 9.0, 7.0, 11.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7783203125, -1.7154083251953125, -1.652496337890625, -1.5895843505859375, -1.52667236328125, -1.4637603759765625, -1.400848388671875, -1.3379364013671875, -1.2750244140625, -1.2121124267578125, -1.149200439453125, -1.0862884521484375, -1.02337646484375, -0.9604644775390625, -0.897552490234375, -0.8346405029296875, -0.771728515625, -0.7088165283203125, -0.645904541015625, -0.5829925537109375, -0.52008056640625, -0.4571685791015625, -0.394256591796875, -0.3313446044921875, -0.2684326171875, -0.2055206298828125, -0.142608642578125, -0.0796966552734375, -0.01678466796875, 0.0461273193359375, 0.109039306640625, 0.1719512939453125, 0.23486328125, 0.2977752685546875, 0.360687255859375, 0.4235992431640625, 0.48651123046875, 0.5494232177734375, 0.612335205078125, 0.6752471923828125, 0.7381591796875, 0.8010711669921875, 0.863983154296875, 0.9268951416015625, 0.98980712890625, 1.0527191162109375, 1.115631103515625, 1.1785430908203125, 1.241455078125, 1.3043670654296875, 1.367279052734375, 1.4301910400390625, 1.49310302734375, 1.5560150146484375, 1.618927001953125, 1.6818389892578125, 1.7447509765625, 1.8076629638671875, 1.870574951171875, 1.9334869384765625, 1.99639892578125, 2.0593109130859375, 2.122222900390625, 2.1851348876953125, 2.248046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 7.0, 16.0, 25.0, 35.0, 71.0, 124.0, 172.0, 329.0, 608.0, 1282.0, 3447.0, 11791.0, 64422.0, 888140.0, 60562.0, 11483.0, 3406.0, 1262.0, 589.0, 329.0, 163.0, 104.0, 56.0, 28.0, 25.0, 18.0, 15.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.213134765625, -0.20744895935058594, -0.20176315307617188, -0.1960773468017578, -0.19039154052734375, -0.1847057342529297, -0.17901992797851562, -0.17333412170410156, -0.1676483154296875, -0.16196250915527344, -0.15627670288085938, -0.1505908966064453, -0.14490509033203125, -0.1392192840576172, -0.13353347778320312, -0.12784767150878906, -0.122161865234375, -0.11647605895996094, -0.11079025268554688, -0.10510444641113281, -0.09941864013671875, -0.09373283386230469, -0.08804702758789062, -0.08236122131347656, -0.0766754150390625, -0.07098960876464844, -0.06530380249023438, -0.05961799621582031, -0.05393218994140625, -0.04824638366699219, -0.042560577392578125, -0.03687477111816406, -0.03118896484375, -0.025503158569335938, -0.019817352294921875, -0.014131546020507812, -0.00844573974609375, -0.0027599334716796875, 0.002925872802734375, 0.008611679077148438, 0.0142974853515625, 0.019983291625976562, 0.025669097900390625, 0.03135490417480469, 0.03704071044921875, 0.04272651672363281, 0.048412322998046875, 0.05409812927246094, 0.059783935546875, 0.06546974182128906, 0.07115554809570312, 0.07684135437011719, 0.08252716064453125, 0.08821296691894531, 0.09389877319335938, 0.09958457946777344, 0.1052703857421875, 0.11095619201660156, 0.11664199829101562, 0.12232780456542969, 0.12801361083984375, 0.1336994171142578, 0.13938522338867188, 0.14507102966308594, 0.1507568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 8.0, 7.0, 14.0, 15.0, 19.0, 27.0, 31.0, 49.0, 61.0, 78.0, 127.0, 132.0, 109.0, 88.0, 63.0, 48.0, 38.0, 27.0, 16.0, 13.0, 6.0, 1.0, 7.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4717063903808594e-05, -5.271565169095993e-05, -5.071423947811127e-05, -4.8712827265262604e-05, -4.671141505241394e-05, -4.471000283956528e-05, -4.2708590626716614e-05, -4.070717841386795e-05, -3.870576620101929e-05, -3.6704353988170624e-05, -3.470294177532196e-05, -3.27015295624733e-05, -3.0700117349624634e-05, -2.869870513677597e-05, -2.6697292923927307e-05, -2.4695880711078644e-05, -2.269446849822998e-05, -2.0693056285381317e-05, -1.8691644072532654e-05, -1.669023185968399e-05, -1.4688819646835327e-05, -1.2687407433986664e-05, -1.0685995221138e-05, -8.684583008289337e-06, -6.683170795440674e-06, -4.6817585825920105e-06, -2.680346369743347e-06, -6.789341568946838e-07, 1.3224780559539795e-06, 3.323890268802643e-06, 5.325302481651306e-06, 7.3267146944999695e-06, 9.328126907348633e-06, 1.1329539120197296e-05, 1.333095133304596e-05, 1.5332363545894623e-05, 1.7333775758743286e-05, 1.933518797159195e-05, 2.1336600184440613e-05, 2.3338012397289276e-05, 2.533942461013794e-05, 2.7340836822986603e-05, 2.9342249035835266e-05, 3.134366124868393e-05, 3.334507346153259e-05, 3.5346485674381256e-05, 3.734789788722992e-05, 3.934931010007858e-05, 4.1350722312927246e-05, 4.335213452577591e-05, 4.535354673862457e-05, 4.7354958951473236e-05, 4.93563711643219e-05, 5.135778337717056e-05, 5.3359195590019226e-05, 5.536060780286789e-05, 5.736202001571655e-05, 5.9363432228565216e-05, 6.136484444141388e-05, 6.336625665426254e-05, 6.53676688671112e-05, 6.736908107995987e-05, 6.937049329280853e-05, 7.13719055056572e-05, 7.337331771850586e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 2.0, 7.0, 6.0, 9.0, 19.0, 27.0, 44.0, 55.0, 86.0, 138.0, 229.0, 414.0, 850.0, 1686.0, 3781.0, 10006.0, 34482.0, 712464.0, 236832.0, 31236.0, 9182.0, 3666.0, 1619.0, 706.0, 394.0, 211.0, 151.0, 95.0, 59.0, 31.0, 21.0, 14.0, 9.0, 6.0, 0.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.139404296875, -0.13441848754882812, -0.12943267822265625, -0.12444686889648438, -0.1194610595703125, -0.11447525024414062, -0.10948944091796875, -0.10450363159179688, -0.099517822265625, -0.09453201293945312, -0.08954620361328125, -0.08456039428710938, -0.0795745849609375, -0.07458877563476562, -0.06960296630859375, -0.06461715698242188, -0.05963134765625, -0.054645538330078125, -0.04965972900390625, -0.044673919677734375, -0.0396881103515625, -0.034702301025390625, -0.02971649169921875, -0.024730682373046875, -0.019744873046875, -0.014759063720703125, -0.00977325439453125, -0.004787445068359375, 0.0001983642578125, 0.005184173583984375, 0.01016998291015625, 0.015155792236328125, 0.0201416015625, 0.025127410888671875, 0.03011322021484375, 0.035099029541015625, 0.0400848388671875, 0.045070648193359375, 0.05005645751953125, 0.055042266845703125, 0.060028076171875, 0.06501388549804688, 0.06999969482421875, 0.07498550415039062, 0.0799713134765625, 0.08495712280273438, 0.08994293212890625, 0.09492874145507812, 0.09991455078125, 0.10490036010742188, 0.10988616943359375, 0.11487197875976562, 0.1198577880859375, 0.12484359741210938, 0.12982940673828125, 0.13481521606445312, 0.139801025390625, 0.14478683471679688, 0.14977264404296875, 0.15475845336914062, 0.1597442626953125, 0.16473007202148438, 0.16971588134765625, 0.17470169067382812, 0.1796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 5.0, 5.0, 17.0, 12.0, 10.0, 11.0, 19.0, 25.0, 28.0, 41.0, 84.0, 110.0, 124.0, 147.0, 92.0, 54.0, 41.0, 32.0, 24.0, 17.0, 13.0, 16.0, 13.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1572265625, -0.15213775634765625, -0.1470489501953125, -0.14196014404296875, -0.136871337890625, -0.13178253173828125, -0.1266937255859375, -0.12160491943359375, -0.11651611328125, -0.11142730712890625, -0.1063385009765625, -0.10124969482421875, -0.096160888671875, -0.09107208251953125, -0.0859832763671875, -0.08089447021484375, -0.0758056640625, -0.07071685791015625, -0.0656280517578125, -0.06053924560546875, -0.055450439453125, -0.05036163330078125, -0.0452728271484375, -0.04018402099609375, -0.03509521484375, -0.03000640869140625, -0.0249176025390625, -0.01982879638671875, -0.014739990234375, -0.00965118408203125, -0.0045623779296875, 0.00052642822265625, 0.005615234375, 0.01070404052734375, 0.0157928466796875, 0.02088165283203125, 0.025970458984375, 0.03105926513671875, 0.0361480712890625, 0.04123687744140625, 0.04632568359375, 0.05141448974609375, 0.0565032958984375, 0.06159210205078125, 0.066680908203125, 0.07176971435546875, 0.0768585205078125, 0.08194732666015625, 0.0870361328125, 0.09212493896484375, 0.0972137451171875, 0.10230255126953125, 0.107391357421875, 0.11248016357421875, 0.1175689697265625, 0.12265777587890625, 0.12774658203125, 0.13283538818359375, 0.1379241943359375, 0.14301300048828125, 0.148101806640625, 0.15319061279296875, 0.1582794189453125, 0.16336822509765625, 0.16845703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 9.0, 18.0, 18.0, 39.0, 57.0, 166.0, 404.0, 157.0, 47.0, 32.0, 22.0, 12.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.465400695800781, -12.202834129333496, -11.940266609191895, -11.67770004272461, -11.415133476257324, -11.152566909790039, -10.889999389648438, -10.627432823181152, -10.364866256713867, -10.102299690246582, -9.83973217010498, -9.577165603637695, -9.31459903717041, -9.052032470703125, -8.789464950561523, -8.526898384094238, -8.264330863952637, -8.001764297485352, -7.739197254180908, -7.476630210876465, -7.21406364440918, -6.951496601104736, -6.688929557800293, -6.426362991333008, -6.1637959480285645, -5.901228904724121, -5.638662338256836, -5.376095294952393, -5.113528251647949, -4.850961685180664, -4.588394641876221, -4.325827598571777, -4.06326150894165, -3.800694704055786, -3.538127899169922, -3.2755608558654785, -3.0129940509796143, -2.75042724609375, -2.4878602027893066, -2.2252933979034424, -1.9627265930175781, -1.7001597881317139, -1.43759286403656, -1.1750259399414062, -0.912459135055542, -0.6498923301696777, -0.3873254060745239, -0.12475848197937012, 0.13780832290649414, 0.4003751873970032, 0.6629420518875122, 0.9255089163780212, 1.1880757808685303, 1.4506425857543945, 1.7132095098495483, 1.9757764339447021, 2.2383432388305664, 2.5009100437164307, 2.763476848602295, 3.0260438919067383, 3.2886106967926025, 3.551177501678467, 3.81374454498291, 4.076311111450195, 4.338878154754639]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 9.0, 5.0, 13.0, 8.0, 11.0, 11.0, 21.0, 31.0, 29.0, 30.0, 75.0, 84.0, 116.0, 126.0, 120.0, 70.0, 51.0, 29.0, 15.0, 14.0, 15.0, 20.0, 9.0, 13.0, 17.0, 15.0, 8.0, 5.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.255499839782715, -7.05584716796875, -6.856194019317627, -6.656541347503662, -6.456888675689697, -6.257235527038574, -6.057582855224609, -5.8579301834106445, -5.65827751159668, -5.458624839782715, -5.258971691131592, -5.059319019317627, -4.859666347503662, -4.660013198852539, -4.460360527038574, -4.260707855224609, -4.061054706573486, -3.8614017963409424, -3.6617491245269775, -3.4620962142944336, -3.2624435424804688, -3.062790632247925, -2.863137722015381, -2.663485050201416, -2.463832139968872, -2.264179229736328, -2.0645265579223633, -1.8648736476898193, -1.665220856666565, -1.4655680656433105, -1.2659151554107666, -1.0662623643875122, -0.8666090965270996, -0.6669563055038452, -0.46730345487594604, -0.2676506042480469, -0.06799781322479248, 0.13165497779846191, 0.33130788803100586, 0.5309606790542603, 0.7306134700775146, 0.930266261100769, 1.1299190521240234, 1.3295719623565674, 1.5292247533798218, 1.7288775444030762, 1.9285304546356201, 2.128183364868164, 2.327836036682129, 2.527488946914673, 2.7271416187286377, 2.9267945289611816, 3.1264472007751465, 3.3261001110076904, 3.5257530212402344, 3.725405693054199, 3.925058603286743, 4.124711513519287, 4.324364185333252, 4.524017333984375, 4.72367000579834, 4.923322677612305, 5.1229753494262695, 5.322628498077393, 5.522281169891357]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 5.0, 5.0, 4.0, 8.0, 17.0, 18.0, 25.0, 19.0, 40.0, 35.0, 41.0, 52.0, 93.0, 295.0, 81.0, 43.0, 38.0, 33.0, 29.0, 25.0, 18.0, 20.0, 14.0, 7.0, 13.0, 9.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5737838745117188, -0.5543060302734375, -0.5348281860351562, -0.515350341796875, -0.49587249755859375, -0.4763946533203125, -0.45691680908203125, -0.43743896484375, -0.41796112060546875, -0.3984832763671875, -0.37900543212890625, -0.359527587890625, -0.34004974365234375, -0.3205718994140625, -0.30109405517578125, -0.2816162109375, -0.26213836669921875, -0.2426605224609375, -0.22318267822265625, -0.203704833984375, -0.18422698974609375, -0.1647491455078125, -0.14527130126953125, -0.12579345703125, -0.10631561279296875, -0.0868377685546875, -0.06735992431640625, -0.047882080078125, -0.02840423583984375, -0.0089263916015625, 0.01055145263671875, 0.030029296875, 0.04950714111328125, 0.0689849853515625, 0.08846282958984375, 0.107940673828125, 0.12741851806640625, 0.1468963623046875, 0.16637420654296875, 0.18585205078125, 0.20532989501953125, 0.2248077392578125, 0.24428558349609375, 0.263763427734375, 0.28324127197265625, 0.3027191162109375, 0.32219696044921875, 0.3416748046875, 0.36115264892578125, 0.3806304931640625, 0.40010833740234375, 0.419586181640625, 0.43906402587890625, 0.4585418701171875, 0.47801971435546875, 0.49749755859375, 0.5169754028320312, 0.5364532470703125, 0.5559310913085938, 0.575408935546875, 0.5948867797851562, 0.6143646240234375, 0.6338424682617188, 0.6533203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 8.0, 10.0, 19.0, 14.0, 41.0, 54.0, 119.0, 212.0, 463.0, 1378.0, 6292.0, 8182443.0, 190200.0, 5182.0, 1239.0, 459.0, 147.0, 107.0, 59.0, 45.0, 25.0, 16.0, 17.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0], "bins": [-7.8193769454956055, -7.61326265335083, -7.407148838043213, -7.2010345458984375, -6.994920253753662, -6.788805961608887, -6.5826921463012695, -6.376577854156494, -6.170463562011719, -5.964349269866943, -5.758235454559326, -5.552121162414551, -5.346006870269775, -5.139892578125, -4.933778762817383, -4.727664470672607, -4.521550178527832, -4.315435886383057, -4.1093220710754395, -3.903207778930664, -3.6970934867858887, -3.4909794330596924, -3.284865379333496, -3.0787510871887207, -2.8726372718811035, -2.6665232181549072, -2.460408926010132, -2.2542948722839355, -2.04818058013916, -1.8420665264129639, -1.635952353477478, -1.4298381805419922, -1.2237238883972168, -1.017609715461731, -0.8114955425262451, -0.605381429195404, -0.3992672562599182, -0.19315314292907715, 0.012961030006408691, 0.21907520294189453, 0.42518937587738037, 0.6313035488128662, 0.837417721748352, 1.043531894683838, 1.2496459484100342, 1.45576012134552, 1.6618742942810059, 1.8679884672164917, 2.0741026401519775, 2.280216693878174, 2.486330986022949, 2.6924450397491455, 2.898559331893921, 3.104673385620117, 3.3107876777648926, 3.516901731491089, 3.723015785217285, 3.9291298389434814, 4.135243892669678, 4.341358184814453, 4.5474724769592285, 4.753586769104004, 4.959700584411621, 5.1658148765563965, 5.371929168701172]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 5.0, 7.0, 2.0, 2.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.537432670593262, -6.272882461547852, -6.008332252502441, -5.7437825202941895, -5.479232311248779, -5.214682102203369, -4.950132369995117, -4.685582160949707, -4.421031951904297, -4.156481742858887, -3.8919317722320557, -3.6273818016052246, -3.3628315925598145, -3.0982813835144043, -2.8337314128875732, -2.569181442260742, -2.304631233215332, -2.040081024169922, -1.7755310535430908, -1.5109809637069702, -1.2464308738708496, -0.981880784034729, -0.7173306941986084, -0.4527806043624878, -0.1882305145263672, 0.07631957530975342, 0.340869665145874, 0.6054197549819946, 0.8699698448181152, 1.1345199346542358, 1.3990700244903564, 1.663620114326477, 1.9281692504882812, 2.1927194595336914, 2.4572694301605225, 2.7218194007873535, 2.9863696098327637, 3.250919818878174, 3.515469789505005, 3.780019760131836, 4.044569969177246, 4.309120178222656, 4.573670387268066, 4.838220119476318, 5.1027703285217285, 5.367320537567139, 5.631870269775391, 5.896420478820801, 6.160970687866211, 6.425520896911621, 6.690071105957031, 6.954620838165283, 7.219171047210693, 7.4837212562561035, 7.7482709884643555, 8.012821197509766, 8.277371406555176, 8.541921615600586, 8.806471824645996, 9.071022033691406, 9.3355712890625, 9.60012149810791, 9.86467170715332, 10.12922191619873, 10.39377212524414]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 18.0, 21.0, 31.0, 52.0, 82.0, 133.0, 282.0, 580.0, 1460.0, 5276.0, 22792.0, 118057.0, 277276.0, 76612.0, 15561.0, 3814.0, 1143.0, 441.0, 209.0, 114.0, 83.0, 44.0, 51.0, 29.0, 20.0, 15.0, 13.0, 7.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.63275146484375, -4.4256591796875, -4.21856689453125, -4.011474609375, -3.80438232421875, -3.5972900390625, -3.39019775390625, -3.18310546875, -2.97601318359375, -2.7689208984375, -2.56182861328125, -2.354736328125, -2.14764404296875, -1.9405517578125, -1.73345947265625, -1.5263671875, -1.31927490234375, -1.1121826171875, -0.90509033203125, -0.697998046875, -0.49090576171875, -0.2838134765625, -0.07672119140625, 0.13037109375, 0.33746337890625, 0.5445556640625, 0.75164794921875, 0.958740234375, 1.16583251953125, 1.3729248046875, 1.58001708984375, 1.787109375, 1.99420166015625, 2.2012939453125, 2.40838623046875, 2.615478515625, 2.82257080078125, 3.0296630859375, 3.23675537109375, 3.44384765625, 3.65093994140625, 3.8580322265625, 4.06512451171875, 4.272216796875, 4.47930908203125, 4.6864013671875, 4.89349365234375, 5.1005859375, 5.30767822265625, 5.5147705078125, 5.72186279296875, 5.928955078125, 6.13604736328125, 6.3431396484375, 6.55023193359375, 6.75732421875, 6.96441650390625, 7.1715087890625, 7.37860107421875, 7.585693359375, 7.79278564453125, 7.9998779296875, 8.20697021484375, 8.4140625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 10.0, 5.0, 11.0, 23.0, 24.0, 35.0, 49.0, 40.0, 82.0, 72.0, 85.0, 83.0, 96.0, 84.0, 70.0, 45.0, 51.0, 37.0, 29.0, 14.0, 13.0, 14.0, 5.0, 2.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.7406005859375, -0.714599609375, -0.6885986328125, -0.66259765625, -0.6365966796875, -0.610595703125, -0.5845947265625, -0.55859375, -0.5325927734375, -0.506591796875, -0.4805908203125, -0.45458984375, -0.4285888671875, -0.402587890625, -0.3765869140625, -0.3505859375, -0.3245849609375, -0.298583984375, -0.2725830078125, -0.24658203125, -0.2205810546875, -0.194580078125, -0.1685791015625, -0.142578125, -0.1165771484375, -0.090576171875, -0.0645751953125, -0.03857421875, -0.0125732421875, 0.013427734375, 0.0394287109375, 0.0654296875, 0.0914306640625, 0.117431640625, 0.1434326171875, 0.16943359375, 0.1954345703125, 0.221435546875, 0.2474365234375, 0.2734375, 0.2994384765625, 0.325439453125, 0.3514404296875, 0.37744140625, 0.4034423828125, 0.429443359375, 0.4554443359375, 0.4814453125, 0.5074462890625, 0.533447265625, 0.5594482421875, 0.58544921875, 0.6114501953125, 0.637451171875, 0.6634521484375, 0.689453125, 0.7154541015625, 0.741455078125, 0.7674560546875, 0.79345703125, 0.8194580078125, 0.845458984375, 0.8714599609375, 0.8974609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 15.0, 57.0, 84.0, 103.0, 79.0, 58.0, 20.0, 9.0, 7.0, 4.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.105530261993408, -6.916867733001709, -6.728205680847168, -6.539543151855469, -6.3508806228637695, -6.1622185707092285, -5.973556041717529, -5.784893989562988, -5.596231460571289, -5.40756893157959, -5.218906879425049, -5.03024435043335, -4.841582298278809, -4.652919769287109, -4.46425724029541, -4.275594711303711, -4.08693265914917, -3.89827036857605, -3.7096080780029297, -3.5209455490112305, -3.3322832584381104, -3.1436209678649902, -2.954958438873291, -2.766296148300171, -2.577633857727051, -2.3889715671539307, -2.2003092765808105, -2.0116467475891113, -1.8229844570159912, -1.634322166442871, -1.4456597566604614, -1.2569973468780518, -1.0683345794677734, -0.8796722292900085, -0.6910098791122437, -0.5023475289344788, -0.31368517875671387, -0.12502282857894897, 0.06363952159881592, 0.2523019313812256, 0.4409642219543457, 0.6296265721321106, 0.8182889223098755, 1.0069513320922852, 1.1956136226654053, 1.3842759132385254, 1.572938323020935, 1.7616007328033447, 1.9502630233764648, 2.138925313949585, 2.327587604522705, 2.5162501335144043, 2.7049124240875244, 2.8935747146606445, 3.0822372436523438, 3.270899534225464, 3.459561824798584, 3.648224115371704, 3.836886405944824, 4.025548934936523, 4.214211463928223, 4.402873516082764, 4.591536045074463, 4.780198097229004, 4.968860626220703]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 7.0, 0.0, 3.0, 8.0, 8.0, 25.0, 58.0, 73.0, 104.0, 83.0, 38.0, 12.0, 16.0, 5.0, 9.0, 5.0, 6.0, 6.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36710262298584, -3.250770092010498, -3.134437322616577, -3.0181047916412354, -2.9017722606658936, -2.7854394912719727, -2.669106960296631, -2.552774429321289, -2.4364418983459473, -2.3201093673706055, -2.2037765979766846, -2.0874440670013428, -1.971111536026001, -1.8547788858413696, -1.7384462356567383, -1.6221137046813965, -1.5057810544967651, -1.3894484043121338, -1.273115873336792, -1.1567832231521606, -1.0404506921768188, -0.9241180419921875, -0.8077854514122009, -0.6914528608322144, -0.5751202702522278, -0.4587876796722412, -0.34245508909225464, -0.22612246870994568, -0.1097898781299591, 0.0065427422523498535, 0.12287533283233643, 0.239207923412323, 0.35554051399230957, 0.47187310457229614, 0.5882056951522827, 0.7045383453369141, 0.8208708763122559, 0.9372035264968872, 1.0535361766815186, 1.1698687076568604, 1.2862012386322021, 1.4025338888168335, 1.5188664197921753, 1.6351990699768066, 1.7515316009521484, 1.8678642511367798, 1.9841969013214111, 2.100529432296753, 2.216862201690674, 2.3331947326660156, 2.4495275020599365, 2.5658600330352783, 2.68219256401062, 2.798525333404541, 2.914857864379883, 3.0311903953552246, 3.1475229263305664, 3.263855457305908, 3.380188226699829, 3.496520757675171, 3.6128532886505127, 3.7291860580444336, 3.8455185890197754, 3.961851119995117, 4.078183650970459]}, "eval/loss": 1.7713568210601807, "eval/wer": 1.0580126933756446, "eval/runtime": 1261.7903, "eval/samples_per_second": 2.094, "eval/steps_per_second": 0.262} \ No newline at end of file